diff --git a/.gitignore b/.gitignore new file mode 100644 index 000000000..8623fa076 --- /dev/null +++ b/.gitignore @@ -0,0 +1,20 @@ +/*.bam +/*.bai +/*.bed +*.idx +*~ +/*.vcf +/*.txt +/*.csh +/.* +/*.pdf +/*.eval +*.ipr +*.iws +*.iml +.DS_Store +queueScatterGather +/foo* +/bar* +integrationtests/ +public/testdata/onTheFlyOutputTest.vcf diff --git a/build.xml b/build.xml index babf31506..232b074f6 100644 --- a/build.xml +++ b/build.xml @@ -28,6 +28,8 @@ + + @@ -35,18 +37,26 @@ + + + + + + + - + - + @@ -60,7 +70,7 @@ - + @@ -82,7 +92,7 @@ - + @@ -113,7 +123,7 @@ - + @@ -154,16 +164,18 @@ - + + + @@ -209,11 +221,11 @@ - + - + @@ -222,11 +234,11 @@ - + - + @@ -264,7 +276,7 @@ - + @@ -310,13 +322,13 @@ - + - + @@ -325,11 +337,11 @@ - + - @@ -339,9 +351,9 @@ - + - + @@ -360,14 +372,14 @@ - + - + - - + @@ -411,9 +423,9 @@ - + - + @@ -422,12 +434,12 @@ - + - + @@ -530,6 +542,11 @@ + + + + + @@ -537,7 +554,7 @@ - + @@ -549,6 +566,15 @@ + + + + + + + + + @@ -577,6 +603,14 @@ + + + + + + + + @@ -591,6 +625,14 @@ + + + + + + + + @@ -603,28 +645,7 @@ - @@ -641,6 +662,12 @@ + + + + + + @@ -680,20 +707,7 @@ - + @@ -778,10 +792,6 @@ - @@ -798,10 +808,6 @@ - @@ -849,6 +855,9 @@ + + + @@ -1185,19 +1194,18 @@ - - + - + - + diff --git a/public/R/plot_residualError_OtherCovariate.R b/public/R/scripts/org/broadinstitute/sting/analyzecovariates/plot_residualError_OtherCovariate.R similarity index 96% rename from public/R/plot_residualError_OtherCovariate.R rename to public/R/scripts/org/broadinstitute/sting/analyzecovariates/plot_residualError_OtherCovariate.R index a1385ff3f..15c6fc8f0 100644 --- a/public/R/plot_residualError_OtherCovariate.R +++ b/public/R/scripts/org/broadinstitute/sting/analyzecovariates/plot_residualError_OtherCovariate.R @@ -1,5 +1,7 @@ #!/bin/env Rscript +library(tools) + args <- commandArgs(TRUE) verbose = TRUE @@ -47,6 +49,9 @@ if( is.numeric(c$Covariate) ) { } dev.off() +if (exists('compactPDF')) { + compactPDF(outfile) +} # # Plot mean quality versus the 
covariate @@ -69,6 +74,10 @@ if( is.numeric(c$Covariate) ) { } dev.off() +if (exists('compactPDF')) { + compactPDF(outfile) +} + # # Plot histogram of the covariate # @@ -106,3 +115,7 @@ if( is.numeric(c$Covariate) ) { axis(2,axTicks(2), format(axTicks(2), scientific=F)) } dev.off() + +if (exists('compactPDF')) { + compactPDF(outfile) +} diff --git a/public/R/plot_residualError_QualityScoreCovariate.R b/public/R/scripts/org/broadinstitute/sting/analyzecovariates/plot_residualError_QualityScoreCovariate.R similarity index 94% rename from public/R/plot_residualError_QualityScoreCovariate.R rename to public/R/scripts/org/broadinstitute/sting/analyzecovariates/plot_residualError_QualityScoreCovariate.R index 81bc9460d..33eeb1f16 100644 --- a/public/R/plot_residualError_QualityScoreCovariate.R +++ b/public/R/scripts/org/broadinstitute/sting/analyzecovariates/plot_residualError_QualityScoreCovariate.R @@ -1,5 +1,7 @@ #!/bin/env Rscript +library(tools) + args <- commandArgs(TRUE) input = args[1] @@ -33,6 +35,10 @@ points(f$Qreported, f$Qempirical, type="p", col="maroon1", pch=16) abline(0,1, lty=2) dev.off() +if (exists('compactPDF')) { + compactPDF(outfile) +} + # # Plot Q empirical histogram # @@ -52,6 +58,10 @@ points(hst2$f.Qempirical, hst2$f.nBases, type="h", lwd=4, col="maroon1") axis(2,axTicks(2), format(axTicks(2), scientific=F)) dev.off() +if (exists('compactPDF')) { + compactPDF(outfile) +} + # # Plot Q reported histogram # @@ -68,3 +78,7 @@ plot(hst$e.Qreported, hst$e.nBases, type="h", lwd=4, xlim=c(0,maxQ), ylim=c(0,yM points(hst2$f.Qreported, hst2$f.nBases, type="h", lwd=4, col="maroon1") axis(2,axTicks(2), format(axTicks(2), scientific=F)) dev.off() + +if (exists('compactPDF')) { + compactPDF(outfile) +} diff --git a/public/R/plot_Tranches.R b/public/R/scripts/org/broadinstitute/sting/gatk/walkers/variantrecalibration/plot_Tranches.R similarity index 98% rename from public/R/plot_Tranches.R rename to 
public/R/scripts/org/broadinstitute/sting/gatk/walkers/variantrecalibration/plot_Tranches.R index a79ddd3ab..d96add768 100755 --- a/public/R/plot_Tranches.R +++ b/public/R/scripts/org/broadinstitute/sting/gatk/walkers/variantrecalibration/plot_Tranches.R @@ -1,5 +1,7 @@ #!/bin/env Rscript +library(tools) + args <- commandArgs(TRUE) verbose = TRUE @@ -85,3 +87,7 @@ if ( ! is.null(sensitivity) ) { } dev.off() + +if (exists('compactPDF')) { + compactPDF(outfile) +} diff --git a/public/R/queueJobReport.R b/public/R/scripts/org/broadinstitute/sting/queue/util/queueJobReport.R similarity index 83% rename from public/R/queueJobReport.R rename to public/R/scripts/org/broadinstitute/sting/queue/util/queueJobReport.R index 31916361e..866766c2c 100644 --- a/public/R/queueJobReport.R +++ b/public/R/scripts/org/broadinstitute/sting/queue/util/queueJobReport.R @@ -12,20 +12,20 @@ if ( onCMDLine ) { inputFileName = args[1] outputPDF = args[2] } else { - #inputFileName = "~/Desktop/broadLocal/GATK/unstable/report.txt" - inputFileName = "/humgen/gsa-hpprojects/dev/depristo/oneOffProjects/Q-25718@node1149.jobreport.txt" + inputFileName = "~/Desktop/broadLocal/GATK/unstable/wgs.jobreport.txt" + #inputFileName = "/humgen/gsa-hpprojects/dev/depristo/oneOffProjects/Q-25718@node1149.jobreport.txt" #inputFileName = "/humgen/gsa-hpprojects/dev/depristo/oneOffProjects/rodPerformanceGoals/history/report.082711.txt" outputPDF = NA } -RUNTIME_UNITS = "(sec)" -ORIGINAL_UNITS_TO_SECONDS = 1/1000 +RUNTIME_UNITS = "(hours)" +ORIGINAL_UNITS_TO_RUNTIME_UNITS = 1/1000/60/60 # # Helper function to aggregate all of the jobs in the report across all tables # allJobsFromReport <- function(report) { - names <- c("jobName", "startTime", "analysisName", "doneTime", "exechosts") + names <- c("jobName", "startTime", "analysisName", "doneTime", "exechosts", "runtime") sub <- lapply(report, function(table) table[,names]) do.call("rbind", sub) } @@ -33,7 +33,7 @@ allJobsFromReport <- function(report) { # # 
Creates segmentation plots of time (x) vs. job (y) with segments for the duration of the job # -plotJobsGantt <- function(gatkReport, sortOverall) { +plotJobsGantt <- function(gatkReport, sortOverall, includeText) { allJobs = allJobsFromReport(gatkReport) if ( sortOverall ) { title = "All jobs, by analysis, by start time" @@ -44,16 +44,18 @@ plotJobsGantt <- function(gatkReport, sortOverall) { } allJobs$index = 1:nrow(allJobs) minTime = min(allJobs$startTime) - allJobs$relStartTime = allJobs$startTime - minTime + allJobs$relStartTime = allJobs$startTime - minTime allJobs$relDoneTime = allJobs$doneTime - minTime allJobs$ganttName = paste(allJobs$jobName, "@", allJobs$exechosts) maxRelTime = max(allJobs$relDoneTime) p <- ggplot(data=allJobs, aes(x=relStartTime, y=index, color=analysisName)) - p <- p + geom_segment(aes(xend=relDoneTime, yend=index), size=2, arrow=arrow(length = unit(0.1, "cm"))) - p <- p + geom_text(aes(x=relDoneTime, label=ganttName, hjust=-0.2), size=2) + p <- p + theme_bw() + p <- p + geom_segment(aes(xend=relDoneTime, yend=index), size=1, arrow=arrow(length = unit(0.1, "cm"))) + if ( includeText ) + p <- p + geom_text(aes(x=relDoneTime, label=ganttName, hjust=-0.2), size=2) p <- p + xlim(0, maxRelTime * 1.1) - p <- p + xlab(paste("Start time (relative to first job)", RUNTIME_UNITS)) - p <- p + ylab("Job") + p <- p + xlab(paste("Start time, relative to first job", RUNTIME_UNITS)) + p <- p + ylab("Job number") p <- p + opts(title=title) print(p) } @@ -119,7 +121,7 @@ plotGroup <- function(groupTable) { if ( length(groupAnnotations) == 1 && dim(sub)[1] > 1 ) { # todo -- how do we group by annotations? p <- ggplot(data=sub, aes(x=runtime)) + geom_histogram() - p <- p + xlab("runtime in seconds") + ylab("No. of jobs") + p <- p + xlab(paste("runtime", RUNTIME_UNITS)) + ylab("No. 
of jobs") p <- p + opts(title=paste("Job runtime histogram for", name)) print(p) } @@ -139,9 +141,9 @@ print(paste("Project :", inputFileName)) convertUnits <- function(gatkReportData) { convertGroup <- function(g) { - g$runtime = g$runtime * ORIGINAL_UNITS_TO_SECONDS - g$startTime = g$startTime * ORIGINAL_UNITS_TO_SECONDS - g$doneTime = g$doneTime * ORIGINAL_UNITS_TO_SECONDS + g$runtime = g$runtime * ORIGINAL_UNITS_TO_RUNTIME_UNITS + g$startTime = g$startTime * ORIGINAL_UNITS_TO_RUNTIME_UNITS + g$doneTime = g$doneTime * ORIGINAL_UNITS_TO_RUNTIME_UNITS g } lapply(gatkReportData, convertGroup) @@ -157,8 +159,8 @@ if ( ! is.na(outputPDF) ) { pdf(outputPDF, height=8.5, width=11) } -plotJobsGantt(gatkReportData, T) -plotJobsGantt(gatkReportData, F) +plotJobsGantt(gatkReportData, T, F) +plotJobsGantt(gatkReportData, F, F) plotProgressByTime(gatkReportData) for ( group in gatkReportData ) { plotGroup(group) diff --git a/public/R/src/gsalib/DESCRIPTION b/public/R/src/org/broadinstitute/sting/utils/R/gsalib/DESCRIPTION similarity index 100% rename from public/R/src/gsalib/DESCRIPTION rename to public/R/src/org/broadinstitute/sting/utils/R/gsalib/DESCRIPTION diff --git a/public/R/src/gsalib/R/gsa.error.R b/public/R/src/org/broadinstitute/sting/utils/R/gsalib/R/gsa.error.R similarity index 100% rename from public/R/src/gsalib/R/gsa.error.R rename to public/R/src/org/broadinstitute/sting/utils/R/gsalib/R/gsa.error.R diff --git a/public/R/src/gsalib/R/gsa.getargs.R b/public/R/src/org/broadinstitute/sting/utils/R/gsalib/R/gsa.getargs.R similarity index 100% rename from public/R/src/gsalib/R/gsa.getargs.R rename to public/R/src/org/broadinstitute/sting/utils/R/gsalib/R/gsa.getargs.R diff --git a/public/R/src/gsalib/R/gsa.message.R b/public/R/src/org/broadinstitute/sting/utils/R/gsalib/R/gsa.message.R similarity index 100% rename from public/R/src/gsalib/R/gsa.message.R rename to public/R/src/org/broadinstitute/sting/utils/R/gsalib/R/gsa.message.R diff --git 
a/public/R/src/gsalib/R/gsa.plot.venn.R b/public/R/src/org/broadinstitute/sting/utils/R/gsalib/R/gsa.plot.venn.R similarity index 100% rename from public/R/src/gsalib/R/gsa.plot.venn.R rename to public/R/src/org/broadinstitute/sting/utils/R/gsalib/R/gsa.plot.venn.R diff --git a/public/R/src/gsalib/R/gsa.read.eval.R b/public/R/src/org/broadinstitute/sting/utils/R/gsalib/R/gsa.read.eval.R similarity index 100% rename from public/R/src/gsalib/R/gsa.read.eval.R rename to public/R/src/org/broadinstitute/sting/utils/R/gsalib/R/gsa.read.eval.R diff --git a/public/R/src/gsalib/R/gsa.read.gatkreport.R b/public/R/src/org/broadinstitute/sting/utils/R/gsalib/R/gsa.read.gatkreport.R similarity index 98% rename from public/R/src/gsalib/R/gsa.read.gatkreport.R rename to public/R/src/org/broadinstitute/sting/utils/R/gsalib/R/gsa.read.gatkreport.R index 011b5240d..46bbf7eda 100644 --- a/public/R/src/gsalib/R/gsa.read.gatkreport.R +++ b/public/R/src/org/broadinstitute/sting/utils/R/gsalib/R/gsa.read.gatkreport.R @@ -99,5 +99,5 @@ gsa.read.gatkreport <- function(filename) { .gsa.assignGATKTableToEnvironment(tableName, tableHeader, tableRows, tableEnv); } - gatkreport = as.list(tableEnv); + gatkreport = as.list(tableEnv, all.names=TRUE); } diff --git a/public/R/src/gsalib/R/gsa.read.squidmetrics.R b/public/R/src/org/broadinstitute/sting/utils/R/gsalib/R/gsa.read.squidmetrics.R similarity index 100% rename from public/R/src/gsalib/R/gsa.read.squidmetrics.R rename to public/R/src/org/broadinstitute/sting/utils/R/gsalib/R/gsa.read.squidmetrics.R diff --git a/public/R/src/gsalib/R/gsa.read.vcf.R b/public/R/src/org/broadinstitute/sting/utils/R/gsalib/R/gsa.read.vcf.R similarity index 100% rename from public/R/src/gsalib/R/gsa.read.vcf.R rename to public/R/src/org/broadinstitute/sting/utils/R/gsalib/R/gsa.read.vcf.R diff --git a/public/R/src/gsalib/R/gsa.warn.R b/public/R/src/org/broadinstitute/sting/utils/R/gsalib/R/gsa.warn.R similarity index 100% rename from 
public/R/src/gsalib/R/gsa.warn.R rename to public/R/src/org/broadinstitute/sting/utils/R/gsalib/R/gsa.warn.R diff --git a/public/R/src/gsalib/Read-and-delete-me b/public/R/src/org/broadinstitute/sting/utils/R/gsalib/Read-and-delete-me similarity index 100% rename from public/R/src/gsalib/Read-and-delete-me rename to public/R/src/org/broadinstitute/sting/utils/R/gsalib/Read-and-delete-me diff --git a/public/R/src/gsalib/data/tearsheetdrop.jpg b/public/R/src/org/broadinstitute/sting/utils/R/gsalib/data/tearsheetdrop.jpg similarity index 100% rename from public/R/src/gsalib/data/tearsheetdrop.jpg rename to public/R/src/org/broadinstitute/sting/utils/R/gsalib/data/tearsheetdrop.jpg diff --git a/public/R/src/gsalib/man/gsa.error.Rd b/public/R/src/org/broadinstitute/sting/utils/R/gsalib/man/gsa.error.Rd similarity index 100% rename from public/R/src/gsalib/man/gsa.error.Rd rename to public/R/src/org/broadinstitute/sting/utils/R/gsalib/man/gsa.error.Rd diff --git a/public/R/src/gsalib/man/gsa.getargs.Rd b/public/R/src/org/broadinstitute/sting/utils/R/gsalib/man/gsa.getargs.Rd similarity index 100% rename from public/R/src/gsalib/man/gsa.getargs.Rd rename to public/R/src/org/broadinstitute/sting/utils/R/gsalib/man/gsa.getargs.Rd diff --git a/public/R/src/gsalib/man/gsa.message.Rd b/public/R/src/org/broadinstitute/sting/utils/R/gsalib/man/gsa.message.Rd similarity index 100% rename from public/R/src/gsalib/man/gsa.message.Rd rename to public/R/src/org/broadinstitute/sting/utils/R/gsalib/man/gsa.message.Rd diff --git a/public/R/src/gsalib/man/gsa.plot.venn.Rd b/public/R/src/org/broadinstitute/sting/utils/R/gsalib/man/gsa.plot.venn.Rd similarity index 100% rename from public/R/src/gsalib/man/gsa.plot.venn.Rd rename to public/R/src/org/broadinstitute/sting/utils/R/gsalib/man/gsa.plot.venn.Rd diff --git a/public/R/src/gsalib/man/gsa.read.eval.Rd b/public/R/src/org/broadinstitute/sting/utils/R/gsalib/man/gsa.read.eval.Rd similarity index 100% rename from 
public/R/src/gsalib/man/gsa.read.eval.Rd rename to public/R/src/org/broadinstitute/sting/utils/R/gsalib/man/gsa.read.eval.Rd diff --git a/public/R/src/gsalib/man/gsa.read.gatkreport.Rd b/public/R/src/org/broadinstitute/sting/utils/R/gsalib/man/gsa.read.gatkreport.Rd similarity index 100% rename from public/R/src/gsalib/man/gsa.read.gatkreport.Rd rename to public/R/src/org/broadinstitute/sting/utils/R/gsalib/man/gsa.read.gatkreport.Rd diff --git a/public/R/src/gsalib/man/gsa.read.squidmetrics.Rd b/public/R/src/org/broadinstitute/sting/utils/R/gsalib/man/gsa.read.squidmetrics.Rd similarity index 100% rename from public/R/src/gsalib/man/gsa.read.squidmetrics.Rd rename to public/R/src/org/broadinstitute/sting/utils/R/gsalib/man/gsa.read.squidmetrics.Rd diff --git a/public/R/src/gsalib/man/gsa.read.vcf.Rd b/public/R/src/org/broadinstitute/sting/utils/R/gsalib/man/gsa.read.vcf.Rd similarity index 100% rename from public/R/src/gsalib/man/gsa.read.vcf.Rd rename to public/R/src/org/broadinstitute/sting/utils/R/gsalib/man/gsa.read.vcf.Rd diff --git a/public/R/src/gsalib/man/gsa.warn.Rd b/public/R/src/org/broadinstitute/sting/utils/R/gsalib/man/gsa.warn.Rd similarity index 100% rename from public/R/src/gsalib/man/gsa.warn.Rd rename to public/R/src/org/broadinstitute/sting/utils/R/gsalib/man/gsa.warn.Rd diff --git a/public/R/src/gsalib/man/gsalib-package.Rd b/public/R/src/org/broadinstitute/sting/utils/R/gsalib/man/gsalib-package.Rd similarity index 100% rename from public/R/src/gsalib/man/gsalib-package.Rd rename to public/R/src/org/broadinstitute/sting/utils/R/gsalib/man/gsalib-package.Rd diff --git a/public/java/src/org/broadinstitute/sting/alignment/AlignmentValidationWalker.java b/public/java/src/org/broadinstitute/sting/alignment/AlignmentValidationWalker.java index c6755e878..a342cf932 100644 --- a/public/java/src/org/broadinstitute/sting/alignment/AlignmentValidationWalker.java +++ b/public/java/src/org/broadinstitute/sting/alignment/AlignmentValidationWalker.java @@ 
-25,7 +25,6 @@ package org.broadinstitute.sting.alignment; -import net.sf.samtools.SAMRecord; import org.broadinstitute.sting.alignment.bwa.BWAConfiguration; import org.broadinstitute.sting.alignment.bwa.BWTFiles; import org.broadinstitute.sting.alignment.bwa.c.BWACAligner; @@ -35,6 +34,7 @@ import org.broadinstitute.sting.gatk.refdata.ReadMetaDataTracker; import org.broadinstitute.sting.gatk.walkers.ReadWalker; import org.broadinstitute.sting.utils.BaseUtils; import org.broadinstitute.sting.utils.exceptions.ReviewedStingException; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; import java.util.Iterator; @@ -72,12 +72,13 @@ public class AlignmentValidationWalker extends ReadWalker { /** * Aligns a read to the given reference. + * * @param ref Reference over the read. Read will most likely be unmapped, so ref will be null. * @param read Read to align. * @return Number of reads aligned by this map (aka 1). */ @Override - public Integer map(ReferenceContext ref, SAMRecord read, ReadMetaDataTracker metaDataTracker) { + public Integer map(ReferenceContext ref, GATKSAMRecord read, ReadMetaDataTracker metaDataTracker) { //logger.info(String.format("examining read %s", read.getReadName())); byte[] bases = read.getReadBases(); diff --git a/public/java/src/org/broadinstitute/sting/alignment/AlignmentWalker.java b/public/java/src/org/broadinstitute/sting/alignment/AlignmentWalker.java index 7064e637f..c8554573b 100644 --- a/public/java/src/org/broadinstitute/sting/alignment/AlignmentWalker.java +++ b/public/java/src/org/broadinstitute/sting/alignment/AlignmentWalker.java @@ -39,6 +39,7 @@ import org.broadinstitute.sting.gatk.io.StingSAMFileWriter; import org.broadinstitute.sting.gatk.refdata.ReadMetaDataTracker; import org.broadinstitute.sting.gatk.walkers.ReadWalker; import org.broadinstitute.sting.gatk.walkers.WalkerName; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; import java.io.File; @@ -92,12 +93,13 @@ public class AlignmentWalker extends 
ReadWalker { /** * Aligns a read to the given reference. + * * @param ref Reference over the read. Read will most likely be unmapped, so ref will be null. * @param read Read to align. * @return Number of alignments found for this read. */ @Override - public Integer map(ReferenceContext ref, SAMRecord read, ReadMetaDataTracker metaDataTracker) { + public Integer map(ReferenceContext ref, GATKSAMRecord read, ReadMetaDataTracker metaDataTracker) { SAMRecord alignedRead = aligner.align(read,header); out.addAlignment(alignedRead); return 1; diff --git a/public/java/src/org/broadinstitute/sting/alignment/CountBestAlignmentsWalker.java b/public/java/src/org/broadinstitute/sting/alignment/CountBestAlignmentsWalker.java index 57d92319f..d91b83e7a 100644 --- a/public/java/src/org/broadinstitute/sting/alignment/CountBestAlignmentsWalker.java +++ b/public/java/src/org/broadinstitute/sting/alignment/CountBestAlignmentsWalker.java @@ -25,7 +25,6 @@ package org.broadinstitute.sting.alignment; -import net.sf.samtools.SAMRecord; import org.broadinstitute.sting.alignment.bwa.BWAConfiguration; import org.broadinstitute.sting.alignment.bwa.BWTFiles; import org.broadinstitute.sting.alignment.bwa.c.BWACAligner; @@ -34,6 +33,7 @@ import org.broadinstitute.sting.commandline.Output; import org.broadinstitute.sting.gatk.contexts.ReferenceContext; import org.broadinstitute.sting.gatk.refdata.ReadMetaDataTracker; import org.broadinstitute.sting.gatk.walkers.ReadWalker; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; import java.io.PrintStream; import java.util.Iterator; @@ -79,12 +79,13 @@ public class CountBestAlignmentsWalker extends ReadWalker { /** * Aligns a read to the given reference. + * * @param ref Reference over the read. Read will most likely be unmapped, so ref will be null. * @param read Read to align. * @return Number of alignments found for this read. 
*/ @Override - public Integer map(ReferenceContext ref, SAMRecord read, ReadMetaDataTracker metaDataTracker) { + public Integer map(ReferenceContext ref, GATKSAMRecord read, ReadMetaDataTracker metaDataTracker) { Iterator alignmentIterator = aligner.getAllAlignments(read.getReadBases()).iterator(); if(alignmentIterator.hasNext()) { int numAlignments = alignmentIterator.next().length; diff --git a/public/java/src/org/broadinstitute/sting/analyzecovariates/AnalyzeCovariates.java b/public/java/src/org/broadinstitute/sting/analyzecovariates/AnalyzeCovariates.java index 98f2a9b5c..a399867fa 100755 --- a/public/java/src/org/broadinstitute/sting/analyzecovariates/AnalyzeCovariates.java +++ b/public/java/src/org/broadinstitute/sting/analyzecovariates/AnalyzeCovariates.java @@ -25,6 +25,9 @@ package org.broadinstitute.sting.analyzecovariates; +import org.apache.commons.io.FileUtils; +import org.apache.commons.io.IOUtils; +import org.apache.log4j.Logger; import org.broadinstitute.sting.commandline.Argument; import org.broadinstitute.sting.commandline.Hidden; import org.broadinstitute.sting.commandline.CommandLineProgram; @@ -33,14 +36,16 @@ import org.broadinstitute.sting.gatk.walkers.recalibration.Covariate; import org.broadinstitute.sting.gatk.walkers.recalibration.RecalDatum; import org.broadinstitute.sting.gatk.walkers.recalibration.RecalibrationArgumentCollection; import org.broadinstitute.sting.utils.R.RScriptExecutor; +import org.broadinstitute.sting.utils.Utils; import org.broadinstitute.sting.utils.classloader.PluginManager; import org.broadinstitute.sting.utils.exceptions.DynamicClassResolutionException; +import org.broadinstitute.sting.utils.exceptions.UserException; import org.broadinstitute.sting.utils.help.DocumentedGATKFeature; +import org.broadinstitute.sting.utils.io.Resource; import org.broadinstitute.sting.utils.text.XReadLines; import java.io.*; import java.util.ArrayList; -import java.util.Arrays; import java.util.Collection; import java.util.Map; import 
java.util.regex.Pattern; @@ -71,15 +76,13 @@ import java.util.regex.Pattern; * * *

- * NOTE: For those running this tool externally from the Broad, it is crucial to note that both the -Rscript and -resources options - * must be changed from the default. -Rscript needs to point to your installation of Rscript (this is the scripting version of R, - * not the interactive version) while -resources needs to point to the folder holding the R scripts that are used. For those using - * this tool as part of the Binary Distribution the -resources should point to the resources folder that is part of the tarball. - * For those using this tool by building from the git repository the -resources should point to the R/ subdirectory of the Sting checkout. + * NOTE: Rscript needs to be in your environment PATH (this is the scripting version of R, not the interactive version). + * See http://www.r-project.org for more info on how to download and install R. * *

* See the GATK wiki for a tutorial and example recalibration accuracy plots. - * http://www.broadinstitute.org/gsa/wiki/index.php/Base_quality_score_recalibration + * http://www.broadinstitute.org/gsa/wiki/index.php/Base_quality_score_recalibration * *

Input

*

@@ -91,7 +94,6 @@ import java.util.regex.Pattern; * java -Xmx4g -jar AnalyzeCovariates.jar \ * -recalFile /path/to/recal.table.csv \ * -outputDir /path/to/output_dir/ \ - * -resources resources/ \ * -ignoreQ 5 * * @@ -101,6 +103,11 @@ import java.util.regex.Pattern; groupName = "AnalyzeCovariates", summary = "Package to plot residual accuracy versus error covariates for the base quality score recalibrator") public class AnalyzeCovariates extends CommandLineProgram { + final private static Logger logger = Logger.getLogger(AnalyzeCovariates.class); + + private static final String PLOT_RESDIUAL_ERROR_QUALITY_SCORE_COVARIATE = "plot_residualError_QualityScoreCovariate.R"; + private static final String PLOT_RESDIUAL_ERROR_OTHER_COVARIATE = "plot_residualError_OtherCovariate.R"; + private static final String PLOT_INDEL_QUALITY_RSCRIPT = "plot_indelQuality.R"; ///////////////////////////// // Command Line Arguments @@ -114,11 +121,7 @@ public class AnalyzeCovariates extends CommandLineProgram { @Input(fullName = "recal_file", shortName = "recalFile", doc = "The input recal csv file to analyze", required = false) private String RECAL_FILE = "output.recal_data.csv"; @Argument(fullName = "output_dir", shortName = "outputDir", doc = "The directory in which to output all the plots and intermediate data files", required = false) - private String OUTPUT_DIR = "analyzeCovariates/"; - @Argument(fullName = "path_to_Rscript", shortName = "Rscript", doc = "The path to your implementation of Rscript. 
For Broad users this is maybe /broad/software/free/Linux/redhat_5_x86_64/pkgs/r_2.12.0/bin/Rscript", required = false) - private String PATH_TO_RSCRIPT = "Rscript"; - @Argument(fullName = "path_to_resources", shortName = "resources", doc = "Path to resources folder holding the Sting R scripts.", required = false) - private String PATH_TO_RESOURCES = "public/R/"; + private File OUTPUT_DIR = new File("analyzeCovariates"); @Argument(fullName = "ignoreQ", shortName = "ignoreQ", doc = "Ignore bases with reported quality less than this number.", required = false) private int IGNORE_QSCORES_LESS_THAN = 5; @Argument(fullName = "numRG", shortName = "numRG", doc = "Only process N read groups. Default value: -1 (process all read groups)", required = false) @@ -154,29 +157,26 @@ public class AnalyzeCovariates extends CommandLineProgram { protected int execute() { // create the output directory where all the data tables and plots will go - try { - Process p = Runtime.getRuntime().exec("mkdir " + OUTPUT_DIR); - } catch (IOException e) { - System.out.println("Couldn't create directory: " + OUTPUT_DIR); - System.out.println("User is responsible for making sure the output directory exists."); - } - if( !OUTPUT_DIR.endsWith("/") ) { OUTPUT_DIR = OUTPUT_DIR + "/"; } - if( !PATH_TO_RESOURCES.endsWith("/") ) { PATH_TO_RESOURCES = PATH_TO_RESOURCES + "/"; } + if (!OUTPUT_DIR.exists() && !OUTPUT_DIR.mkdirs()) + throw new UserException.BadArgumentValue("--output_dir/-outDir", "Unable to create output directory: " + OUTPUT_DIR); + + if (!RScriptExecutor.RSCRIPT_EXISTS) + Utils.warnUser(logger, "Rscript not found in environment path. 
Plots will not be generated."); // initialize all the data from the csv file and allocate the list of covariates - System.out.println("Reading in input csv file..."); + logger.info("Reading in input csv file..."); initializeData(); - System.out.println("...Done!"); + logger.info("...Done!"); // output data tables for Rscript to read in - System.out.println("Writing out intermediate tables for R..."); + logger.info("Writing out intermediate tables for R..."); writeDataTables(); - System.out.println("...Done!"); + logger.info("...Done!"); // perform the analysis using Rscript and output the plots - System.out.println("Calling analysis R scripts and writing out figures..."); + logger.info("Calling analysis R scripts and writing out figures..."); callRScripts(); - System.out.println("...Done!"); + logger.info("...Done!"); return 0; } @@ -287,37 +287,40 @@ public class AnalyzeCovariates extends CommandLineProgram { if(NUM_READ_GROUPS_TO_PROCESS == -1 || ++numReadGroups <= NUM_READ_GROUPS_TO_PROCESS) { String readGroup = readGroupKey.toString(); RecalDatum readGroupDatum = (RecalDatum) dataManager.getCollapsedTable(0).data.get(readGroupKey); - System.out.print("Writing out data tables for read group: " + readGroup + "\twith " + readGroupDatum.getNumObservations() + " observations" ); - System.out.println("\tand aggregate residual error = " + String.format("%.3f", readGroupDatum.empiricalQualDouble(0, MAX_QUALITY_SCORE) - readGroupDatum.getEstimatedQReported())); + logger.info(String.format( + "Writing out data tables for read group: %s\twith %s observations\tand aggregate residual error = %.3f", + readGroup, readGroupDatum.getNumObservations(), + readGroupDatum.empiricalQualDouble(0, MAX_QUALITY_SCORE) - readGroupDatum.getEstimatedQReported())); // for each covariate for( int iii = 1; iii < requestedCovariates.size(); iii++ ) { Covariate cov = requestedCovariates.get(iii); // Create a PrintStream - PrintStream output = null; + File outputFile = new File(OUTPUT_DIR, 
readGroup + "." + cov.getClass().getSimpleName()+ ".dat"); + PrintStream output; try { - output = new PrintStream(new FileOutputStream(OUTPUT_DIR + readGroup + "." + cov.getClass().getSimpleName()+ ".dat")); - - } catch (FileNotFoundException e) { - System.err.println("Can't create file: " + OUTPUT_DIR + readGroup + "." + cov.getClass().getSimpleName()+ ".dat"); - System.exit(-1); + output = new PrintStream(FileUtils.openOutputStream(outputFile)); + } catch (IOException e) { + throw new UserException.CouldNotCreateOutputFile(outputFile, e); } - // Output the header - output.println("Covariate\tQreported\tQempirical\tnMismatches\tnBases"); + try { + // Output the header + output.println("Covariate\tQreported\tQempirical\tnMismatches\tnBases"); - for( Object covariateKey : ((Map)dataManager.getCollapsedTable(iii).data.get(readGroupKey)).keySet()) { - output.print( covariateKey.toString() + "\t" ); // Covariate - RecalDatum thisDatum = (RecalDatum)((Map)dataManager.getCollapsedTable(iii).data.get(readGroupKey)).get(covariateKey); - output.print( String.format("%.3f", thisDatum.getEstimatedQReported()) + "\t" ); // Qreported - output.print( String.format("%.3f", thisDatum.empiricalQualDouble(0, MAX_QUALITY_SCORE)) + "\t" ); // Qempirical - output.print( thisDatum.getNumMismatches() + "\t" ); // nMismatches - output.println( thisDatum.getNumObservations() ); // nBases + for( Object covariateKey : ((Map)dataManager.getCollapsedTable(iii).data.get(readGroupKey)).keySet()) { + output.print( covariateKey.toString() + "\t" ); // Covariate + RecalDatum thisDatum = (RecalDatum)((Map)dataManager.getCollapsedTable(iii).data.get(readGroupKey)).get(covariateKey); + output.print( String.format("%.3f", thisDatum.getEstimatedQReported()) + "\t" ); // Qreported + output.print( String.format("%.3f", thisDatum.empiricalQualDouble(0, MAX_QUALITY_SCORE)) + "\t" ); // Qempirical + output.print( thisDatum.getNumMismatches() + "\t" ); // nMismatches + output.println( 
thisDatum.getNumObservations() ); // nBases + } + } finally { + // Close the PrintStream + IOUtils.closeQuietly(output); } - - // Close the PrintStream - output.close(); } } else { break; @@ -327,10 +330,6 @@ public class AnalyzeCovariates extends CommandLineProgram { } private void callRScripts() { - RScriptExecutor.RScriptArgumentCollection argumentCollection = - new RScriptExecutor.RScriptArgumentCollection(PATH_TO_RSCRIPT, Arrays.asList(PATH_TO_RESOURCES)); - RScriptExecutor executor = new RScriptExecutor(argumentCollection, true); - int numReadGroups = 0; // for each read group @@ -338,23 +337,32 @@ public class AnalyzeCovariates extends CommandLineProgram { if(++numReadGroups <= NUM_READ_GROUPS_TO_PROCESS || NUM_READ_GROUPS_TO_PROCESS == -1) { String readGroup = readGroupKey.toString(); - System.out.println("Analyzing read group: " + readGroup); + logger.info("Analyzing read group: " + readGroup); // for each covariate for( int iii = 1; iii < requestedCovariates.size(); iii++ ) { Covariate cov = requestedCovariates.get(iii); - final String outputFilename = OUTPUT_DIR + readGroup + "." + cov.getClass().getSimpleName()+ ".dat"; + final File outputFile = new File(OUTPUT_DIR, readGroup + "." 
+ cov.getClass().getSimpleName()+ ".dat"); if (DO_INDEL_QUALITY) { - executor.callRScripts("plot_indelQuality.R", outputFilename, - cov.getClass().getSimpleName().split("Covariate")[0]); // The third argument is the name of the covariate in order to make the plots look nice + RScriptExecutor executor = new RScriptExecutor(); + executor.addScript(new Resource(PLOT_INDEL_QUALITY_RSCRIPT, AnalyzeCovariates.class)); + // The second argument is the name of the covariate in order to make the plots look nice + executor.addArgs(outputFile, cov.getClass().getSimpleName().split("Covariate")[0]); + executor.exec(); } else { if( iii == 1 ) { // Analyze reported quality - executor.callRScripts("plot_residualError_QualityScoreCovariate.R", outputFilename, - IGNORE_QSCORES_LESS_THAN, MAX_QUALITY_SCORE, MAX_HISTOGRAM_VALUE); // The third argument is the Q scores that should be turned pink in the plot because they were ignored + RScriptExecutor executor = new RScriptExecutor(); + executor.addScript(new Resource(PLOT_RESDIUAL_ERROR_QUALITY_SCORE_COVARIATE, AnalyzeCovariates.class)); + // The second argument is the Q scores that should be turned pink in the plot because they were ignored + executor.addArgs(outputFile, IGNORE_QSCORES_LESS_THAN, MAX_QUALITY_SCORE, MAX_HISTOGRAM_VALUE); + executor.exec(); } else { // Analyze all other covariates - executor.callRScripts("plot_residualError_OtherCovariate.R", outputFilename, - cov.getClass().getSimpleName().split("Covariate")[0]); // The third argument is the name of the covariate in order to make the plots look nice + RScriptExecutor executor = new RScriptExecutor(); + executor.addScript(new Resource(PLOT_RESDIUAL_ERROR_OTHER_COVARIATE, AnalyzeCovariates.class)); + // The second argument is the name of the covariate in order to make the plots look nice + executor.addArgs(outputFile, cov.getClass().getSimpleName().split("Covariate")[0]); + executor.exec(); } } } diff --git 
a/public/java/src/org/broadinstitute/sting/commandline/ArgumentMatch.java b/public/java/src/org/broadinstitute/sting/commandline/ArgumentMatch.java index 351583c07..c0823e5c5 100755 --- a/public/java/src/org/broadinstitute/sting/commandline/ArgumentMatch.java +++ b/public/java/src/org/broadinstitute/sting/commandline/ArgumentMatch.java @@ -46,7 +46,7 @@ public class ArgumentMatch implements Iterable { /** * Maps indices of command line arguments to values paired with that argument. */ - public final SortedMap> indices = new TreeMap>(); + public final SortedMap> sites = new TreeMap>(); /** * An ordered, freeform collection of tags. @@ -72,32 +72,32 @@ public class ArgumentMatch implements Iterable { } /** - * A simple way of indicating that an argument with the given label and definition exists at this index. + * A simple way of indicating that an argument with the given label and definition exists at this site. * @param label Label of the argument match. Must not be null. * @param definition The associated definition, if one exists. May be null. - * @param index Position of the argument. Must not be null. + * @param site Position of the argument. Must not be null. * @param tags ordered freeform text tags associated with this argument. */ - public ArgumentMatch(final String label, final ArgumentDefinition definition, final int index, final Tags tags) { - this( label, definition, index, null, tags ); + public ArgumentMatch(final String label, final ArgumentDefinition definition, final ArgumentMatchSite site, final Tags tags) { + this( label, definition, site, null, tags ); } /** - * A simple way of indicating that an argument with the given label and definition exists at this index. + * A simple way of indicating that an argument with the given label and definition exists at this site. * @param label Label of the argument match. Must not be null. * @param definition The associated definition, if one exists. May be null. - * @param index Position of the argument. 
Must not be null. + * @param site Position of the argument. Must not be null. * @param value Value for the argument at this position. * @param tags ordered freeform text tags associated with this argument. */ - private ArgumentMatch(final String label, final ArgumentDefinition definition, final int index, final String value, final Tags tags) { + private ArgumentMatch(final String label, final ArgumentDefinition definition, final ArgumentMatchSite site, final String value, final Tags tags) { this.label = label; this.definition = definition; ArrayList values = new ArrayList(); if( value != null ) values.add(value); - indices.put(index,values ); + sites.put(site,values ); this.tags = tags; } @@ -117,7 +117,7 @@ public class ArgumentMatch implements Iterable { ArgumentMatch otherArgumentMatch = (ArgumentMatch)other; return this.definition.equals(otherArgumentMatch.definition) && this.label.equals(otherArgumentMatch.label) && - this.indices.equals(otherArgumentMatch.indices) && + this.sites.equals(otherArgumentMatch.sites) && this.tags.equals(otherArgumentMatch.tags); } @@ -129,16 +129,17 @@ public class ArgumentMatch implements Iterable { * @param key Key which specifies the transform. * @return A variant of this ArgumentMatch with all keys transformed. 
*/ + @SuppressWarnings("unchecked") ArgumentMatch transform(Multiplexer multiplexer, Object key) { - SortedMap> newIndices = new TreeMap>(); - for(Map.Entry> index: indices.entrySet()) { + SortedMap> newIndices = new TreeMap>(); + for(Map.Entry> site: sites.entrySet()) { List newEntries = new ArrayList(); - for(String entry: index.getValue()) + for(String entry: site.getValue()) newEntries.add(multiplexer.transformArgument(key,entry)); - newIndices.put(index.getKey(),newEntries); + newIndices.put(site.getKey(),newEntries); } ArgumentMatch newArgumentMatch = new ArgumentMatch(label,definition); - newArgumentMatch.indices.putAll(newIndices); + newArgumentMatch.sites.putAll(newIndices); return newArgumentMatch; } @@ -157,9 +158,9 @@ public class ArgumentMatch implements Iterable { public Iterator iterator() { return new Iterator() { /** - * Iterate over each the available index. + * Iterate over each the available site. */ - private Iterator indexIterator = null; + private Iterator siteIterator = null; /** * Iterate over each available token. @@ -167,9 +168,9 @@ public class ArgumentMatch implements Iterable { private Iterator tokenIterator = null; /** - * The next index to return. Null if none remain. + * The next site to return. Null if none remain. */ - Integer nextIndex = null; + ArgumentMatchSite nextSite = null; /** * The next token to return. Null if none remain. @@ -177,7 +178,7 @@ public class ArgumentMatch implements Iterable { String nextToken = null; { - indexIterator = indices.keySet().iterator(); + siteIterator = sites.keySet().iterator(); prepareNext(); } @@ -186,7 +187,7 @@ public class ArgumentMatch implements Iterable { * @return True if there's another token waiting in the wings. False otherwise. */ public boolean hasNext() { - return nextToken != null; + return nextToken != null; } /** @@ -194,32 +195,32 @@ public class ArgumentMatch implements Iterable { * @return The next ArgumentMatch in the series. Should never be null. 
*/ public ArgumentMatch next() { - if( nextIndex == null || nextToken == null ) + if( nextSite == null || nextToken == null ) throw new IllegalStateException( "No more ArgumentMatches are available" ); - ArgumentMatch match = new ArgumentMatch( label, definition, nextIndex, nextToken, tags ); + ArgumentMatch match = new ArgumentMatch( label, definition, nextSite, nextToken, tags ); prepareNext(); return match; } /** * Initialize the next ArgumentMatch to return. If no ArgumentMatches are available, - * initialize nextIndex / nextToken to null. + * initialize nextSite / nextToken to null. */ private void prepareNext() { if( tokenIterator != null && tokenIterator.hasNext() ) { nextToken = tokenIterator.next(); } else { - nextIndex = null; + nextSite = null; nextToken = null; // Do a nested loop. While more data is present in the inner loop, grab that data. // Otherwise, troll the outer iterator looking for more data. - while( indexIterator.hasNext() ) { - nextIndex = indexIterator.next(); - if( indices.get(nextIndex) != null ) { - tokenIterator = indices.get(nextIndex).iterator(); + while( siteIterator.hasNext() ) { + nextSite = siteIterator.next(); + if( sites.get(nextSite) != null ) { + tokenIterator = sites.get(nextSite).iterator(); if( tokenIterator.hasNext() ) { nextToken = tokenIterator.next(); break; @@ -245,29 +246,29 @@ public class ArgumentMatch implements Iterable { * @param other The other match to merge into. */ public void mergeInto( ArgumentMatch other ) { - indices.putAll(other.indices); + sites.putAll(other.sites); } /** * Associate a value with this merge maapping. - * @param index index of the command-line argument to which this value is mated. + * @param site site of the command-line argument to which this value is mated. * @param value Text representation of value to add. 
*/ - public void addValue( int index, String value ) { - if( !indices.containsKey(index) || indices.get(index) == null ) - indices.put(index, new ArrayList() ); - indices.get(index).add(value); + public void addValue( ArgumentMatchSite site, String value ) { + if( !sites.containsKey(site) || sites.get(site) == null ) + sites.put(site, new ArrayList() ); + sites.get(site).add(value); } /** * Does this argument already have a value at the given site? * Arguments are only allowed to be single-valued per site, and * flags aren't allowed a value at all. - * @param index Index at which to check for values. + * @param site Site at which to check for values. * @return True if the argument has a value at the given site. False otherwise. */ - public boolean hasValueAtSite( int index ) { - return (indices.get(index) != null && indices.get(index).size() >= 1) || isArgumentFlag(); + public boolean hasValueAtSite( ArgumentMatchSite site ) { + return (sites.get(site) != null && sites.get(site).size() >= 1) || isArgumentFlag(); } /** @@ -276,9 +277,9 @@ public class ArgumentMatch implements Iterable { */ public List values() { List values = new ArrayList(); - for( int index: indices.keySet() ) { - if( indices.get(index) != null ) - values.addAll(indices.get(index)); + for( ArgumentMatchSite site: sites.keySet() ) { + if( sites.get(site) != null ) + values.addAll(sites.get(site)); } return values; } diff --git a/public/java/src/org/broadinstitute/sting/commandline/ArgumentMatchSite.java b/public/java/src/org/broadinstitute/sting/commandline/ArgumentMatchSite.java new file mode 100644 index 000000000..8a4120101 --- /dev/null +++ b/public/java/src/org/broadinstitute/sting/commandline/ArgumentMatchSite.java @@ -0,0 +1,76 @@ +/* + * Copyright (c) 2011, The Broad Institute + * + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * restriction, 
including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The above copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * OTHER DEALINGS IN THE SOFTWARE. + */ + +package org.broadinstitute.sting.commandline; + +/** + * Which source and the index within the source where an argument match was found. + */ +public class ArgumentMatchSite implements Comparable { + private final ArgumentMatchSource source; + private final int index; + + public ArgumentMatchSite(ArgumentMatchSource source, int index) { + this.source = source; + this.index = index; + } + + public ArgumentMatchSource getSource() { + return source; + } + + public int getIndex() { + return index; + } + + @Override + public boolean equals(Object o) { + if (this == o) return true; + if (o == null || getClass() != o.getClass()) return false; + + ArgumentMatchSite that = (ArgumentMatchSite) o; + + return (index == that.index) && (source == null ? that.source == null : source.equals(that.source)); + } + + @Override + public int hashCode() { + int result = source != null ? source.hashCode() : 0; + // Generated by intellij. No other special reason to this implementation. 
-ks + result = 31 * result + index; + return result; + } + + @Override + public int compareTo(ArgumentMatchSite that) { + int comp = this.source.compareTo(that.source); + if (comp != 0) + return comp; + + // Both files are the same. + if (this.index == that.index) + return 0; + return this.index < that.index ? -1 : 1; + } +} diff --git a/public/java/src/org/broadinstitute/sting/commandline/ArgumentMatchSource.java b/public/java/src/org/broadinstitute/sting/commandline/ArgumentMatchSource.java new file mode 100644 index 000000000..ed2700006 --- /dev/null +++ b/public/java/src/org/broadinstitute/sting/commandline/ArgumentMatchSource.java @@ -0,0 +1,98 @@ +/* + * Copyright (c) 2011, The Broad Institute + * + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The above copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * OTHER DEALINGS IN THE SOFTWARE. + */ + +package org.broadinstitute.sting.commandline; + +import java.io.File; + +/** + * Where an argument match originated, via the commandline or a file. 
+ */ +public class ArgumentMatchSource implements Comparable { + public static final ArgumentMatchSource COMMAND_LINE = new ArgumentMatchSource(ArgumentMatchSourceType.CommandLine, null); + + private final ArgumentMatchSourceType type; + private final File file; + + /** + * Creates an argument match source from the specified file. + * @param file File specifying the arguments. Must not be null. + */ + public ArgumentMatchSource(File file) { + this(ArgumentMatchSourceType.File, file); + } + + private ArgumentMatchSource(ArgumentMatchSourceType type, File file) { + if (type == ArgumentMatchSourceType.File && file == null) + throw new IllegalArgumentException("An argument match source of type File cannot have a null file."); + this.type = type; + this.file = file; + } + + public ArgumentMatchSourceType getType() { + return type; + } + + public File getFile() { + return file; + } + + @Override + public boolean equals(Object o) { + if (this == o) return true; + if (o == null || getClass() != o.getClass()) return false; + + ArgumentMatchSource that = (ArgumentMatchSource) o; + + return (type == that.type) && (file == null ? that.file == null : file.equals(that.file)); + } + + @Override + public int hashCode() { + int result = type != null ? type.hashCode() : 0; + result = 31 * result + (file != null ? file.hashCode() : 0); + return result; + } + + /** + * Compares two sources, putting the command line first, then files. + */ + @Override + public int compareTo(ArgumentMatchSource that) { + int comp = this.type.compareTo(that.type); + if (comp != 0) + return comp; + + File f1 = this.file; + File f2 = that.file; + + if ((f1 == null) ^ (f2 == null)) { + // If one of the files is null and the other is not + // put the null file first + return f1 == null ? -1 : 1; + } + + return f1 == null ? 
0 : f1.compareTo(f2); + } +} diff --git a/public/java/src/org/broadinstitute/sting/commandline/ArgumentMatchSourceType.java b/public/java/src/org/broadinstitute/sting/commandline/ArgumentMatchSourceType.java new file mode 100644 index 000000000..3ff6e21d4 --- /dev/null +++ b/public/java/src/org/broadinstitute/sting/commandline/ArgumentMatchSourceType.java @@ -0,0 +1,32 @@ +/* + * Copyright (c) 2011, The Broad Institute + * + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The above copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * OTHER DEALINGS IN THE SOFTWARE. + */ + +package org.broadinstitute.sting.commandline; + +/** + * Type of where an argument match originated, via the commandline or a file. 
+ */ +public enum ArgumentMatchSourceType { + CommandLine, File +} diff --git a/public/java/src/org/broadinstitute/sting/commandline/ArgumentMatches.java b/public/java/src/org/broadinstitute/sting/commandline/ArgumentMatches.java index 52d3b8232..3da28c420 100755 --- a/public/java/src/org/broadinstitute/sting/commandline/ArgumentMatches.java +++ b/public/java/src/org/broadinstitute/sting/commandline/ArgumentMatches.java @@ -37,7 +37,7 @@ public class ArgumentMatches implements Iterable { * Collection matches from argument definition to argument value. * Package protected access is deliberate. */ - Map argumentMatches = new TreeMap(); + Map argumentMatches = new TreeMap(); /** * Provide a place to put command-line argument values that don't seem to belong to @@ -80,7 +80,7 @@ public class ArgumentMatches implements Iterable { * @param site Site at which to check. * @return True if the site has a match. False otherwise. */ - boolean hasMatch( int site ) { + boolean hasMatch( ArgumentMatchSite site ) { return argumentMatches.containsKey( site ); } @@ -90,7 +90,7 @@ public class ArgumentMatches implements Iterable { * @return The match present at the given site. * @throws IllegalArgumentException if site does not contain a match. */ - ArgumentMatch getMatch( int site ) { + ArgumentMatch getMatch( ArgumentMatchSite site ) { if( !argumentMatches.containsKey(site) ) throw new IllegalArgumentException( "Site does not contain an argument: " + site ); return argumentMatches.get(site); @@ -107,6 +107,7 @@ public class ArgumentMatches implements Iterable { /** * Return all argument matches of this source. + * @param parsingEngine Parsing engine. * @param argumentSource Argument source to match. * @return List of all matches. */ @@ -167,6 +168,7 @@ public class ArgumentMatches implements Iterable { * TODO: Generify this. * @param multiplexer Multiplexer that controls the transformation process. * @param key Key which specifies the transform. + * @return new argument matches. 
*/ ArgumentMatches transform(Multiplexer multiplexer, Object key) { ArgumentMatches newArgumentMatches = new ArgumentMatches(); @@ -187,15 +189,15 @@ public class ArgumentMatches implements Iterable { for( ArgumentMatch argumentMatch: getUniqueMatches() ) { if( argumentMatch.definition == match.definition && argumentMatch.tags.equals(match.tags) ) { argumentMatch.mergeInto( match ); - for( int index: match.indices.keySet() ) - argumentMatches.put( index, argumentMatch ); + for( ArgumentMatchSite site: match.sites.keySet() ) + argumentMatches.put( site, argumentMatch ); definitionExists = true; } } if( !definitionExists ) { - for( int index: match.indices.keySet() ) - argumentMatches.put( index, match ); + for( ArgumentMatchSite site: match.sites.keySet() ) + argumentMatches.put( site, match ); } } diff --git a/public/java/src/org/broadinstitute/sting/commandline/ArgumentTypeDescriptor.java b/public/java/src/org/broadinstitute/sting/commandline/ArgumentTypeDescriptor.java index d1d9cf7fe..31212a46f 100644 --- a/public/java/src/org/broadinstitute/sting/commandline/ArgumentTypeDescriptor.java +++ b/public/java/src/org/broadinstitute/sting/commandline/ArgumentTypeDescriptor.java @@ -336,6 +336,28 @@ class RodBindingArgumentTypeDescriptor extends ArgumentTypeDescriptor { @Override public Object parse(ParsingEngine parsingEngine, ArgumentSource source, Type type, ArgumentMatches matches) { + return parse(parsingEngine, source, type, matches, false); + } + + /** + * The actual argument parsing method. + * + * IMPORTANT NOTE: the createIntervalBinding argument is a bit of a hack, but after discussions with SE we've decided + * that it's the best way to proceed for now. IntervalBindings can either be proper RodBindings (hence the use of + * this parse() method) or can be Strings (representing raw intervals or the files containing them). 
If createIntervalBinding + * is true, we do not call parsingEngine.addRodBinding() because we don't want walkers to assume that these are the + * usual set of RodBindings. It also allows us in the future to be smart about tagging rods as intervals. One other + * side point is that we want to continue to allow the usage of non-Feature intervals so that users can theoretically + * continue to input them out of order (whereas Tribble Features are ordered). + * + * @param parsingEngine parsing engine + * @param source source + * @param type type to check + * @param matches matches + * @param createIntervalBinding should we attempt to create an IntervalBinding instead of a RodBinding? + * @return the RodBinding/IntervalBinding object depending on the value of createIntervalBinding. + */ + public Object parse(ParsingEngine parsingEngine, ArgumentSource source, Type type, ArgumentMatches matches, boolean createIntervalBinding) { ArgumentDefinition defaultDefinition = createDefaultArgumentDefinition(source); String value = getArgumentValue( defaultDefinition, matches ); Class parameterType = JVMUtils.getParameterizedTypeClass(type); @@ -348,7 +370,7 @@ class RodBindingArgumentTypeDescriptor extends ArgumentTypeDescriptor { if ( tags.getPositionalTags().size() > 2 ) { throw new UserException.CommandLineException( String.format("Unexpected number of positional tags for argument %s : %s. " + - "Rod bindings only suport -X:type and -X:name,type argument styles", + "Rod bindings only support -X:type and -X:name,type argument styles", value, source.field.getName())); } if ( tags.getPositionalTags().size() == 2 ) { // -X:name,type style @@ -378,7 +400,12 @@ class RodBindingArgumentTypeDescriptor extends ArgumentTypeDescriptor { } } - if ( tribbleType == null ) + if ( tribbleType == null ) { + // IntervalBindings allow streaming conversion of Strings + if ( createIntervalBinding ) { + return new IntervalBinding(value); + } + if ( ! 
file.exists() ) { throw new UserException.CouldNotReadInputFile(file, "file does not exist"); } else if ( ! file.canRead() || ! file.isFile() ) { @@ -389,13 +416,20 @@ class RodBindingArgumentTypeDescriptor extends ArgumentTypeDescriptor { "Please add an explicit type tag :NAME listing the correct type from among the supported types:%n%s", manager.userFriendlyListOfAvailableFeatures(parameterType))); } + } } } Constructor ctor = (makeRawTypeIfNecessary(type)).getConstructor(Class.class, String.class, String.class, String.class, Tags.class); - RodBinding result = (RodBinding)ctor.newInstance(parameterType, name, value, tribbleType, tags); - parsingEngine.addTags(result,tags); - parsingEngine.addRodBinding(result); + Object result; + if ( createIntervalBinding ) { + result = ctor.newInstance(parameterType, name, value, tribbleType, tags); + } else { + RodBinding rbind = (RodBinding)ctor.newInstance(parameterType, name, value, tribbleType, tags); + parsingEngine.addTags(rbind, tags); + parsingEngine.addRodBinding(rbind); + result = rbind; + } return result; } catch (InvocationTargetException e) { throw new UserException.CommandLineException( @@ -409,6 +443,39 @@ class RodBindingArgumentTypeDescriptor extends ArgumentTypeDescriptor { } } +/** + * Parser for IntervalBinding objects + */ +class IntervalBindingArgumentTypeDescriptor extends ArgumentTypeDescriptor { + /** + * We only want IntervalBinding class objects + * @param type The type to check. + * @return true if the provided class is an IntervalBinding.class + */ + @Override + public boolean supports( Class type ) { + return isIntervalBinding(type); + } + + public static boolean isIntervalBinding( Class type ) { + return IntervalBinding.class.isAssignableFrom(type); + } + + /** + * See note from RodBindingArgumentTypeDescriptor.parse(). + * + * @param parsingEngine parsing engine + * @param source source + * @param type type to check + * @param matches matches + * @return the IntervalBinding object. 
+ */ + @Override + public Object parse(ParsingEngine parsingEngine, ArgumentSource source, Type type, ArgumentMatches matches) { + return new RodBindingArgumentTypeDescriptor().parse(parsingEngine, source, type, matches, true); + } +} + /** * Parse simple argument types: java primitives, wrapper classes, and anything that has * a simple String constructor. @@ -416,7 +483,7 @@ class RodBindingArgumentTypeDescriptor extends ArgumentTypeDescriptor { class SimpleArgumentTypeDescriptor extends ArgumentTypeDescriptor { @Override public boolean supports( Class type ) { - if ( RodBindingArgumentTypeDescriptor.isRodBinding(type) ) return false; + if ( RodBindingArgumentTypeDescriptor.isRodBinding(type) || IntervalBindingArgumentTypeDescriptor.isIntervalBinding(type) ) return false; if ( type.isPrimitive() ) return true; if ( type.isEnum() ) return true; if ( primitiveToWrapperMap.containsValue(type) ) return true; diff --git a/public/java/src/org/broadinstitute/sting/commandline/CommandLineProgram.java b/public/java/src/org/broadinstitute/sting/commandline/CommandLineProgram.java index d88e7030e..bed1e710e 100644 --- a/public/java/src/org/broadinstitute/sting/commandline/CommandLineProgram.java +++ b/public/java/src/org/broadinstitute/sting/commandline/CommandLineProgram.java @@ -35,10 +35,7 @@ import org.broadinstitute.sting.utils.help.ApplicationDetails; import org.broadinstitute.sting.utils.help.HelpFormatter; import java.io.IOException; -import java.util.Collection; -import java.util.Collections; -import java.util.EnumSet; -import java.util.Locale; +import java.util.*; public abstract class CommandLineProgram { @@ -155,6 +152,7 @@ public abstract class CommandLineProgram { * * @param clp the command line program to execute * @param args the command line arguments passed in + * @param dryRun dry run * @throws Exception when an exception occurs */ @SuppressWarnings("unchecked") @@ -176,6 +174,8 @@ public abstract class CommandLineProgram { ParsingEngine parser = 
clp.parser = new ParsingEngine(clp); parser.addArgumentSource(clp.getClass()); + Map> parsedArgs; + // process the args if (clp.canAddArgumentsDynamically()) { // if the command-line program can toss in extra args, fetch them and reparse the arguments. @@ -196,14 +196,14 @@ public abstract class CommandLineProgram { Class[] argumentSources = clp.getArgumentSources(); for (Class argumentSource : argumentSources) parser.addArgumentSource(clp.getArgumentSourceName(argumentSource), argumentSource); - parser.parse(args); + parsedArgs = parser.parse(args); if (isHelpPresent(parser)) printHelpAndExit(clp, parser); if ( ! dryRun ) parser.validate(); } else { - parser.parse(args); + parsedArgs = parser.parse(args); if ( ! dryRun ) { if (isHelpPresent(parser)) @@ -230,7 +230,7 @@ public abstract class CommandLineProgram { } // regardless of what happens next, generate the header information - HelpFormatter.generateHeaderInformation(clp.getApplicationDetails(), args); + HelpFormatter.generateHeaderInformation(clp.getApplicationDetails(), parsedArgs); // call the execute CommandLineProgram.result = clp.execute(); diff --git a/public/java/src/org/broadinstitute/sting/commandline/IntervalBinding.java b/public/java/src/org/broadinstitute/sting/commandline/IntervalBinding.java new file mode 100644 index 000000000..86ca6c2df --- /dev/null +++ b/public/java/src/org/broadinstitute/sting/commandline/IntervalBinding.java @@ -0,0 +1,108 @@ +/* + * Copyright (c) 2011, The Broad Institute + * + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The above copyright notice and 
this permission notice shall be + * included in all copies or substantial portions of the Software. + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * OTHER DEALINGS IN THE SOFTWARE. + */ + +package org.broadinstitute.sting.commandline; + +import com.google.java.contract.Requires; +import org.broad.tribble.Feature; +import org.broad.tribble.FeatureCodec; +import org.broad.tribble.readers.AsciiLineReader; +import org.broadinstitute.sting.gatk.GenomeAnalysisEngine; +import org.broadinstitute.sting.gatk.refdata.ReferenceDependentFeatureCodec; +import org.broadinstitute.sting.gatk.refdata.tracks.FeatureManager; +import org.broadinstitute.sting.utils.GenomeLoc; +import org.broadinstitute.sting.utils.exceptions.UserException; +import org.broadinstitute.sting.utils.interval.IntervalUtils; + +import java.io.File; +import java.io.FileInputStream; +import java.io.IOException; +import java.util.*; + +/** + * An IntervalBinding representing a walker argument that gets bound to either a ROD track or interval string. + * + * The IntervalBinding is a formal GATK argument that bridges between a walker and + * the engine to construct intervals for traversal at runtime. The IntervalBinding can + * either be a RodBinding, a string of one or more intervals, or a file with interval strings. + * The GATK Engine takes care of initializing the binding when appropriate and determining intervals from it. + * + * Note that this class is immutable. 
+ */ +public final class IntervalBinding { + + private RodBinding featureIntervals; + private String stringIntervals; + + @Requires({"type != null", "rawName != null", "source != null", "tribbleType != null", "tags != null"}) + public IntervalBinding(Class type, final String rawName, final String source, final String tribbleType, final Tags tags) { + featureIntervals = new RodBinding(type, rawName, source, tribbleType, tags); + } + + @Requires({"intervalArgument != null"}) + public IntervalBinding(String intervalArgument) { + stringIntervals = intervalArgument; + } + + public String getSource() { + if ( featureIntervals != null ) + return featureIntervals.getSource(); + return stringIntervals; + } + + public List getIntervals(GenomeAnalysisEngine toolkit) { + List intervals; + + if ( featureIntervals != null ) { + intervals = new ArrayList(); + + //RMDTrackBuilder builder = new RMDTrackBuilder(toolkit.getReferenceDataSource().getReference().getSequenceDictionary(), + // toolkit.getGenomeLocParser(), + // toolkit.getArguments().unsafe); + + // TODO -- after ROD system cleanup, go through the ROD system so that we can handle things like gzipped files + + FeatureCodec codec = new FeatureManager().getByName(featureIntervals.getTribbleType()).getCodec(); + if ( codec instanceof ReferenceDependentFeatureCodec ) + ((ReferenceDependentFeatureCodec)codec).setGenomeLocParser(toolkit.getGenomeLocParser()); + try { + FileInputStream fis = new FileInputStream(new File(featureIntervals.getSource())); + AsciiLineReader lineReader = new AsciiLineReader(fis); + codec.readHeader(lineReader); + String line = lineReader.readLine(); + while ( line != null ) { + intervals.add(toolkit.getGenomeLocParser().createGenomeLoc(codec.decodeLoc(line))); + line = lineReader.readLine(); + } + } catch (IOException e) { + throw new UserException("Problem reading the interval file " + featureIntervals.getSource() + "; " + e.getMessage()); + } + + } else { + intervals = 
IntervalUtils.parseIntervalArguments(toolkit.getGenomeLocParser(), stringIntervals); + } + + return intervals; + } +} diff --git a/public/java/src/org/broadinstitute/sting/commandline/ParsingEngine.java b/public/java/src/org/broadinstitute/sting/commandline/ParsingEngine.java index fbf8c6516..0fac195e1 100755 --- a/public/java/src/org/broadinstitute/sting/commandline/ParsingEngine.java +++ b/public/java/src/org/broadinstitute/sting/commandline/ParsingEngine.java @@ -26,6 +26,7 @@ package org.broadinstitute.sting.commandline; import com.google.java.contract.Requires; +import org.apache.commons.io.FileUtils; import org.apache.log4j.Logger; import org.broadinstitute.sting.utils.Utils; import org.broadinstitute.sting.utils.classloader.JVMUtils; @@ -35,6 +36,8 @@ import org.broadinstitute.sting.utils.exceptions.UserException; import org.broadinstitute.sting.utils.help.ApplicationDetails; import org.broadinstitute.sting.utils.help.HelpFormatter; +import java.io.File; +import java.io.IOException; import java.lang.reflect.Field; import java.util.*; @@ -75,6 +78,7 @@ public class ParsingEngine { * The type of set used must be ordered (but not necessarily sorted). */ private static final Set STANDARD_ARGUMENT_TYPE_DESCRIPTORS = new LinkedHashSet( Arrays.asList(new SimpleArgumentTypeDescriptor(), + new IntervalBindingArgumentTypeDescriptor(), new RodBindingArgumentTypeDescriptor(), new CompoundArgumentTypeDescriptor(), new MultiplexArgumentTypeDescriptor()) ); @@ -100,6 +104,8 @@ public class ParsingEngine { if(clp != null) argumentTypeDescriptors.addAll(clp.getArgumentTypeDescriptors()); argumentTypeDescriptors.addAll(STANDARD_ARGUMENT_TYPE_DESCRIPTORS); + + addArgumentSource(ParsingEngineArgumentFiles.class); } /** @@ -148,21 +154,43 @@ public class ParsingEngine { * command-line arguments to the arguments that are actually * required. * @param tokens Tokens passed on the command line. + * @return The parsed arguments by file. 
*/ - public void parse( String[] tokens ) { + public SortedMap> parse( String[] tokens ) { argumentMatches = new ArgumentMatches(); + SortedMap> parsedArgs = new TreeMap>(); - int lastArgumentMatchSite = -1; + List cmdLineTokens = Arrays.asList(tokens); + parse(ArgumentMatchSource.COMMAND_LINE, cmdLineTokens, argumentMatches, parsedArgs); - for( int i = 0; i < tokens.length; i++ ) { - String token = tokens[i]; + ParsingEngineArgumentFiles argumentFiles = new ParsingEngineArgumentFiles(); + + // Load the arguments ONLY into the argument files. + // Validation may optionally run on the rest of the arguments. + loadArgumentsIntoObject(argumentFiles); + + for (File file: argumentFiles.files) { + List fileTokens = getArguments(file); + parse(new ArgumentMatchSource(file), fileTokens, argumentMatches, parsedArgs); + } + + return parsedArgs; + } + + private void parse(ArgumentMatchSource matchSource, List tokens, + ArgumentMatches argumentMatches, SortedMap> parsedArgs) { + ArgumentMatchSite lastArgumentMatchSite = new ArgumentMatchSite(matchSource, -1); + + int i = 0; + for (String token: tokens) { // If the token is of argument form, parse it into its own argument match. // Otherwise, pair it with the most recently used argument discovered. 
+ ArgumentMatchSite site = new ArgumentMatchSite(matchSource, i); if( isArgumentForm(token) ) { - ArgumentMatch argumentMatch = parseArgument( token, i ); + ArgumentMatch argumentMatch = parseArgument( token, site ); if( argumentMatch != null ) { argumentMatches.mergeInto( argumentMatch ); - lastArgumentMatchSite = i; + lastArgumentMatchSite = site; } } else { @@ -170,10 +198,31 @@ public class ParsingEngine { !argumentMatches.getMatch(lastArgumentMatchSite).hasValueAtSite(lastArgumentMatchSite)) argumentMatches.getMatch(lastArgumentMatchSite).addValue( lastArgumentMatchSite, token ); else - argumentMatches.MissingArgument.addValue( i, token ); + argumentMatches.MissingArgument.addValue( site, token ); } + i++; } + + parsedArgs.put(matchSource, tokens); + } + + private List getArguments(File file) { + try { + if (file.getAbsolutePath().endsWith(".list")) { + return getListArguments(file); + } + } catch (IOException e) { + throw new UserException.CouldNotReadInputFile(file, e); + } + throw new UserException.CouldNotReadInputFile(file, "file extension is not .list"); + } + + private List getListArguments(File file) throws IOException { + ArrayList argsList = new ArrayList(); + for (String line: FileUtils.readLines(file)) + argsList.addAll(Arrays.asList(Utils.escapeExpressions(line))); + return argsList; } public enum ValidationType { MissingRequiredArgument, @@ -494,7 +543,7 @@ public class ParsingEngine { * @param position The position of the token in question. * @return ArgumentMatch associated with this token, or null if no match exists. 
*/ - private ArgumentMatch parseArgument( String token, int position ) { + private ArgumentMatch parseArgument( String token, ArgumentMatchSite position ) { if( !isArgumentForm(token) ) throw new IllegalArgumentException( "Token is not recognizable as an argument: " + token ); @@ -579,9 +628,21 @@ class UnmatchedArgumentException extends ArgumentException { private static String formatArguments( ArgumentMatch invalidValues ) { StringBuilder sb = new StringBuilder(); - for( int index: invalidValues.indices.keySet() ) - for( String value: invalidValues.indices.get(index) ) { - sb.append( String.format("%nInvalid argument value '%s' at position %d.", value, index) ); + for( ArgumentMatchSite site: invalidValues.sites.keySet() ) + for( String value: invalidValues.sites.get(site) ) { + switch (site.getSource().getType()) { + case CommandLine: + sb.append( String.format("%nInvalid argument value '%s' at position %d.", + value, site.getIndex()) ); + break; + case File: + sb.append( String.format("%nInvalid argument value '%s' in file %s at position %d.", + value, site.getSource().getFile().getAbsolutePath(), site.getIndex()) ); + break; + default: + throw new RuntimeException( String.format("Unexpected argument match source type: %s", + site.getSource().getType())); + } if(value != null && Utils.dupString(' ',value.length()).equals(value)) sb.append(" Please make sure any line continuation backslashes on your command line are not followed by whitespace."); } @@ -634,4 +695,13 @@ class UnknownEnumeratedValueException extends ArgumentException { private static String formatArguments(ArgumentDefinition definition, String argumentPassed) { return String.format("Invalid value %s specified for argument %s; valid options are (%s).", argumentPassed, definition.fullName, Utils.join(",",definition.validOptions)); } -} \ No newline at end of file +} + +/** + * Container class to store the list of argument files. + * The files will be parsed after the command line arguments. 
+ */ +class ParsingEngineArgumentFiles { + @Argument(fullName = "arg_file", shortName = "args", doc = "Reads arguments from the specified file", required = false) + public List files = new ArrayList(); +} diff --git a/public/java/src/org/broadinstitute/sting/commandline/ParsingMethod.java b/public/java/src/org/broadinstitute/sting/commandline/ParsingMethod.java index a070cb5a1..452309e89 100755 --- a/public/java/src/org/broadinstitute/sting/commandline/ParsingMethod.java +++ b/public/java/src/org/broadinstitute/sting/commandline/ParsingMethod.java @@ -68,7 +68,7 @@ public abstract class ParsingMethod { * @return An argument match. Definition field will be populated if a match was found or * empty if no appropriate definition could be found. */ - public ArgumentMatch match( ArgumentDefinitions definitions, String token, int position ) { + public ArgumentMatch match( ArgumentDefinitions definitions, String token, ArgumentMatchSite position ) { // If the argument is valid, parse out the argument. Matcher matcher = pattern.matcher(token); @@ -102,9 +102,7 @@ public abstract class ParsingMethod { // Try to find a matching argument. If found, label that as the match. If not found, add the argument // with a null definition. 
- ArgumentMatch argumentMatch = new ArgumentMatch(argument,argumentDefinition,position,tags); - - return argumentMatch; + return new ArgumentMatch(argument,argumentDefinition,position,tags); } /** diff --git a/public/java/src/org/broadinstitute/sting/gatk/GenomeAnalysisEngine.java b/public/java/src/org/broadinstitute/sting/gatk/GenomeAnalysisEngine.java index 5b9ebd99b..f8e87aa58 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/GenomeAnalysisEngine.java +++ b/public/java/src/org/broadinstitute/sting/gatk/GenomeAnalysisEngine.java @@ -28,34 +28,30 @@ import net.sf.picard.reference.IndexedFastaSequenceFile; import net.sf.picard.reference.ReferenceSequenceFile; import net.sf.samtools.*; import org.apache.log4j.Logger; +import org.broad.tribble.Feature; import org.broadinstitute.sting.commandline.*; import org.broadinstitute.sting.gatk.arguments.GATKArgumentCollection; import org.broadinstitute.sting.gatk.arguments.ValidationExclusion; import org.broadinstitute.sting.gatk.datasources.reads.*; import org.broadinstitute.sting.gatk.datasources.reference.ReferenceDataSource; import org.broadinstitute.sting.gatk.datasources.rmd.ReferenceOrderedDataSource; -import org.broadinstitute.sting.gatk.datasources.sample.Sample; -import org.broadinstitute.sting.gatk.datasources.sample.SampleDataSource; +import org.broadinstitute.sting.gatk.samples.SampleDB; import org.broadinstitute.sting.gatk.executive.MicroScheduler; import org.broadinstitute.sting.gatk.filters.FilterManager; import org.broadinstitute.sting.gatk.filters.ReadFilter; import org.broadinstitute.sting.gatk.filters.ReadGroupBlackListFilter; import org.broadinstitute.sting.gatk.io.OutputTracker; import org.broadinstitute.sting.gatk.io.stubs.Stub; -import org.broadinstitute.sting.gatk.refdata.tracks.RMDTrack; import org.broadinstitute.sting.gatk.refdata.tracks.RMDTrackBuilder; -import org.broadinstitute.sting.gatk.refdata.utils.RMDIntervalGenerator; import org.broadinstitute.sting.gatk.refdata.utils.RMDTriplet; 
+import org.broadinstitute.sting.gatk.samples.SampleDBBuilder; import org.broadinstitute.sting.gatk.walkers.*; -import org.broadinstitute.sting.utils.GenomeLoc; -import org.broadinstitute.sting.utils.GenomeLocParser; -import org.broadinstitute.sting.utils.GenomeLocSortedSet; -import org.broadinstitute.sting.utils.SequenceDictionaryUtils; +import org.broadinstitute.sting.utils.*; import org.broadinstitute.sting.utils.baq.BAQ; import org.broadinstitute.sting.utils.exceptions.ReviewedStingException; import org.broadinstitute.sting.utils.exceptions.UserException; +import org.broadinstitute.sting.utils.interval.IntervalSetRule; import org.broadinstitute.sting.utils.interval.IntervalUtils; -import org.broadinstitute.sting.utils.variantcontext.VariantContext; import java.io.File; import java.util.*; @@ -92,7 +88,7 @@ public class GenomeAnalysisEngine { /** * Accessor for sample metadata */ - private SampleDataSource sampleDataSource = null; + private SampleDB sampleDB = null; /** * Accessor for sharded reference-ordered data. @@ -206,6 +202,9 @@ public class GenomeAnalysisEngine { // Prepare the data for traversal. initializeDataSources(); + // initialize sampleDB + initializeSampleDB(); + // initialize and validate the interval list initializeIntervals(); validateSuppliedIntervals(); @@ -222,12 +221,12 @@ public class GenomeAnalysisEngine { ShardStrategy shardStrategy = getShardStrategy(readsDataSource,microScheduler.getReference(),intervals); // execute the microscheduler, storing the results - Object result = microScheduler.execute(this.walker, shardStrategy); + return microScheduler.execute(this.walker, shardStrategy); //monitor.stop(); //logger.info(String.format("Maximum heap size consumed: %d",monitor.getMaxMemoryUsed())); - return result; + //return result; } /** @@ -259,13 +258,12 @@ public class GenomeAnalysisEngine { * @return A collection of available filters. 
*/ public Collection createFilters() { - Set filters = new HashSet(); - filters.addAll(WalkerManager.getReadFilters(walker,this.getFilterManager())); + final List filters = WalkerManager.getReadFilters(walker,this.getFilterManager()); if (this.getArguments().readGroupBlackList != null && this.getArguments().readGroupBlackList.size() > 0) filters.add(new ReadGroupBlackListFilter(this.getArguments().readGroupBlackList)); - for(String filterName: this.getArguments().readFilters) + for(final String filterName: this.getArguments().readFilters) filters.add(this.getFilterManager().createByName(filterName)); - return Collections.unmodifiableSet(filters); + return Collections.unmodifiableList(filters); } /** @@ -299,10 +297,14 @@ public class GenomeAnalysisEngine { else if(WalkerManager.getDownsamplingMethod(walker) != null) method = WalkerManager.getDownsamplingMethod(walker); else - method = argCollection.getDefaultDownsamplingMethod(); + method = GATKArgumentCollection.getDefaultDownsamplingMethod(); return method; } + protected void setDownsamplingMethod(DownsamplingMethod method) { + argCollection.setDownsamplingMethod(method); + } + public BAQ.QualityMode getWalkerBAQQualityMode() { return WalkerManager.getBAQQualityMode(walker); } public BAQ.ApplicationTime getWalkerBAQApplicationTime() { return WalkerManager.getBAQApplicationTime(walker); } @@ -381,18 +383,18 @@ public class GenomeAnalysisEngine { // If intervals is non-null and empty at this point, it means that the list of intervals to process // was filtered down to an empty set (eg., the user specified something like -L chr1 -XL chr1). Since // this was very likely unintentional, the user should be informed of this. Note that this is different - // from the case where intervals == null, which indicates either that there were no interval arguments, - // or that -L all was specified. + // from the case where intervals == null, which indicates that there were no interval arguments. 
if ( intervals != null && intervals.isEmpty() ) { - throw new ArgumentException("The given combination of -L and -XL options results in an empty set. " + - "No intervals to process."); + logger.warn("The given combination of -L and -XL options results in an empty set. No intervals to process."); } } /** * Get the sharding strategy given a driving data source. * + * @param readsDataSource readsDataSource * @param drivingDataSource Data on which to shard. + * @param intervals intervals * @return the sharding strategy */ protected ShardStrategy getShardStrategy(SAMDataSource readsDataSource, ReferenceSequenceFile drivingDataSource, GenomeLocSortedSet intervals) { @@ -429,7 +431,7 @@ public class GenomeAnalysisEngine { return new MonolithicShardStrategy(getGenomeLocParser(), readsDataSource,shardType,region); } - ShardStrategy shardStrategy = null; + ShardStrategy shardStrategy; ShardStrategyFactory.SHATTER_STRATEGY shardType; long SHARD_SIZE = 100000L; @@ -438,6 +440,8 @@ public class GenomeAnalysisEngine { if (walker instanceof RodWalker) SHARD_SIZE *= 1000; if (intervals != null && !intervals.isEmpty()) { + if (readsDataSource == null) + throw new IllegalArgumentException("readsDataSource is null"); if(!readsDataSource.isEmpty() && readsDataSource.getSortOrder() != SAMFileHeader.SortOrder.coordinate) throw new UserException.MissortedBAM(SAMFileHeader.SortOrder.coordinate, "Locus walkers can only traverse coordinate-sorted data. 
Please resort your input BAM file(s) or set the Sort Order tag in the header appropriately."); @@ -501,7 +505,8 @@ public class GenomeAnalysisEngine { */ private void initializeTempDirectory() { File tempDir = new File(System.getProperty("java.io.tmpdir")); - tempDir.mkdirs(); + if (!tempDir.exists() && !tempDir.mkdirs()) + throw new UserException.BadTmpDir("Unable to create directory"); } /** @@ -566,34 +571,23 @@ public class GenomeAnalysisEngine { protected void initializeIntervals() { // return if no interval arguments at all - if ((argCollection.intervals == null) && (argCollection.excludeIntervals == null) && (argCollection.RODToInterval == null)) + if ( argCollection.intervals == null && argCollection.excludeIntervals == null ) return; - // if '-L all' was specified, verify that it was the only -L specified and return if so. - if(argCollection.intervals != null) { - for(String interval: argCollection.intervals) { - if(interval.trim().equals("all")) { - if(argCollection.intervals.size() > 1) - throw new UserException("'-L all' was specified along with other intervals or interval lists; the GATK cannot combine '-L all' with other intervals."); - - // '-L all' was specified and seems valid. Return. - return; - } - } - } + // Note that the use of '-L all' is no longer supported. // if include argument isn't given, create new set of all possible intervals - GenomeLocSortedSet includeSortedSet = (argCollection.intervals == null && argCollection.RODToInterval == null ? + GenomeLocSortedSet includeSortedSet = (argCollection.intervals == null ? 
GenomeLocSortedSet.createSetFromSequenceDictionary(this.referenceDataSource.getReference().getSequenceDictionary()) : - loadIntervals(argCollection.intervals, IntervalUtils.mergeIntervalLocations(getRODIntervals(), argCollection.intervalMerging))); + loadIntervals(argCollection.intervals, argCollection.intervalSetRule)); // if no exclude arguments, can return parseIntervalArguments directly - if (argCollection.excludeIntervals == null) + if ( argCollection.excludeIntervals == null ) intervals = includeSortedSet; - // otherwise there are exclude arguments => must merge include and exclude GenomeLocSortedSets + // otherwise there are exclude arguments => must merge include and exclude GenomeLocSortedSets else { - GenomeLocSortedSet excludeSortedSet = loadIntervals(argCollection.excludeIntervals, null); + GenomeLocSortedSet excludeSortedSet = loadIntervals(argCollection.excludeIntervals, IntervalSetRule.UNION); intervals = includeSortedSet.subtractRegions(excludeSortedSet); // logging messages only printed when exclude (-XL) arguments are given @@ -608,47 +602,26 @@ public class GenomeAnalysisEngine { /** * Loads the intervals relevant to the current execution - * @param argList String representation of arguments; might include 'all', filenames, intervals in samtools - * notation, or a combination of the above - * @param rodIntervals a list of ROD intervals to add to the returned set. Can be empty or null. + * @param argList argument bindings; might include filenames, intervals in samtools notation, or a combination of the above + * @param rule interval merging rule * @return A sorted, merged list of all intervals specified in this arg list. 
*/ - protected GenomeLocSortedSet loadIntervals( List argList, List rodIntervals ) { + protected GenomeLocSortedSet loadIntervals( List> argList, IntervalSetRule rule ) { - boolean allowEmptyIntervalList = (argCollection.unsafe == ValidationExclusion.TYPE.ALLOW_EMPTY_INTERVAL_LIST || - argCollection.unsafe == ValidationExclusion.TYPE.ALL); + List allIntervals = new ArrayList(0); + for ( IntervalBinding intervalBinding : argList ) { + List intervals = intervalBinding.getIntervals(this); - List nonRODIntervals = IntervalUtils.parseIntervalArguments(genomeLocParser, argList, allowEmptyIntervalList); - List allIntervals = IntervalUtils.mergeListsBySetOperator(rodIntervals, nonRODIntervals, argCollection.BTIMergeRule); + if ( intervals.isEmpty() ) { + logger.warn("The interval file " + intervalBinding.getSource() + " contains no intervals that could be parsed."); + } + + allIntervals = IntervalUtils.mergeListsBySetOperator(intervals, allIntervals, rule); + } return IntervalUtils.sortAndMergeIntervals(genomeLocParser, allIntervals, argCollection.intervalMerging); } - /** - * if we have a ROD specified as a 'rodToIntervalTrackName', convert its records to RODs - * @return ROD intervals as GenomeLocs - */ - private List getRODIntervals() { - Map rodNames = RMDIntervalGenerator.getRMDTrackNames(rodDataSources); - // Do we have any RODs that overloaded as interval lists with the 'rodToIntervalTrackName' flag? 
- List ret = new ArrayList(); - if (rodNames != null && argCollection.RODToInterval != null) { - String rodName = argCollection.RODToInterval; - - // check to make sure we have a rod of that name - if (!rodNames.containsKey(rodName)) - throw new UserException.CommandLineException("--rodToIntervalTrackName (-BTI) was passed the name '"+rodName+"', which wasn't given as a ROD name in the -B option"); - - for (String str : rodNames.keySet()) - if (str.equals(rodName)) { - logger.info("Adding interval list from track (ROD) named " + rodName); - RMDIntervalGenerator intervalGenerator = new RMDIntervalGenerator(rodNames.get(str)); - ret.addAll(intervalGenerator.toGenomeLocList()); - } - } - return ret; - } - /** * Add additional, externally managed IO streams for inputs. * @@ -692,12 +665,22 @@ public class GenomeAnalysisEngine { for (ReadFilter filter : filters) filter.initialize(this); - sampleDataSource = new SampleDataSource(getSAMFileHeader(), argCollection.sampleFiles); - // set the sequence dictionary of all of Tribble tracks to the sequence dictionary of our reference rodDataSources = getReferenceOrderedDataSources(referenceMetaDataFiles,referenceDataSource.getReference().getSequenceDictionary(),genomeLocParser,argCollection.unsafe); } + /** + * Entry-point function to initialize the samples database from input data and pedigree arguments + */ + private void initializeSampleDB() { + SampleDBBuilder sampleDBBuilder = new SampleDBBuilder(this, argCollection.pedigreeValidationType); + sampleDBBuilder.addSamplesFromSAMHeader(getSAMFileHeader()); + sampleDBBuilder.addSamplesFromSampleNames(SampleUtils.getUniqueSamplesFromRods(this)); + sampleDBBuilder.addSamplesFromPedigreeFiles(argCollection.pedigreeFiles); + sampleDBBuilder.addSamplesFromPedigreeStrings(argCollection.pedigreeStrings); + sampleDB = sampleDBBuilder.getFinalSampleDB(); + } + /** * Gets a unique identifier for the reader sourcing this read. * @param read Read to examine. 
@@ -716,106 +699,13 @@ public class GenomeAnalysisEngine { return getReadsDataSource().getSAMFile(id); } - /** - * Returns sets of samples present in the (merged) input SAM stream, grouped by readers (i.e. underlying - * individual bam files). For instance: if GATK is run with three input bam files (three -I arguments), then the list - * returned by this method will contain 3 elements (one for each reader), with each element being a set of sample names - * found in the corresponding bam file. - * - * @return Sets of samples in the merged input SAM stream, grouped by readers - */ - public List> getSamplesByReaders() { - Collection readers = getReadsDataSource().getReaderIDs(); - - List> sample_sets = new ArrayList>(readers.size()); - - for (SAMReaderID r : readers) { - - Set samples = new HashSet(1); - sample_sets.add(samples); - - for (SAMReadGroupRecord g : getReadsDataSource().getHeader(r).getReadGroups()) { - samples.add(g.getSample()); - } - } - - return sample_sets; - - } - - /** - * Returns sets of libraries present in the (merged) input SAM stream, grouped by readers (i.e. underlying - * individual bam files). For instance: if GATK is run with three input bam files (three -I arguments), then the list - * returned by this method will contain 3 elements (one for each reader), with each element being a set of library names - * found in the corresponding bam file. 
- * - * @return Sets of libraries present in the (merged) input SAM stream, grouped by readers - */ - public List> getLibrariesByReaders() { - - - Collection readers = getReadsDataSource().getReaderIDs(); - - List> lib_sets = new ArrayList>(readers.size()); - - for (SAMReaderID r : readers) { - - Set libs = new HashSet(2); - lib_sets.add(libs); - - for (SAMReadGroupRecord g : getReadsDataSource().getHeader(r).getReadGroups()) { - libs.add(g.getLibrary()); - } - } - - return lib_sets; - - } - - /** - * **** UNLESS YOU HAVE GOOD REASON TO, DO NOT USE THIS METHOD; USE getFileToReadGroupIdMapping() INSTEAD **** - * - * Returns sets of (remapped) read groups in input SAM stream, grouped by readers (i.e. underlying - * individual bam files). For instance: if GATK is run with three input bam files (three -I arguments), then the list - * returned by this method will contain 3 elements (one for each reader), with each element being a set of remapped read groups - * (i.e. as seen by read.getReadGroup().getReadGroupId() in the merged stream) that come from the corresponding bam file. 
- * - * @return sets of (merged) read group ids in order of input bams - */ - public List> getMergedReadGroupsByReaders() { - - - Collection readers = getReadsDataSource().getReaderIDs(); - - List> rg_sets = new ArrayList>(readers.size()); - - for (SAMReaderID r : readers) { - - Set groups = new HashSet(5); - rg_sets.add(groups); - - for (SAMReadGroupRecord g : getReadsDataSource().getHeader(r).getReadGroups()) { - if (getReadsDataSource().hasReadGroupCollisions()) { // Check if there were read group clashes with hasGroupIdDuplicates and if so: - // use HeaderMerger to translate original read group id from the reader into the read group id in the - // merged stream, and save that remapped read group id to associate it with specific reader - groups.add(getReadsDataSource().getReadGroupId(r, g.getReadGroupId())); - } else { - // otherwise, pass through the unmapped read groups since this is what Picard does as well - groups.add(g.getReadGroupId()); - } - } - } - - return rg_sets; - - } - /** * Now that all files are open, validate the sequence dictionaries of the reads vs. the reference vrs the reference ordered data (if available). * * @param reads Reads data source. * @param reference Reference data source. * @param rods a collection of the reference ordered data tracks + * @param manager manager */ private void validateSourcesAgainstReference(SAMDataSource reads, ReferenceSequenceFile reference, Collection rods, RMDTrackBuilder manager) { if ((reads.isEmpty() && (rods == null || rods.isEmpty())) || reference == null ) @@ -844,15 +734,22 @@ public class GenomeAnalysisEngine { /** * Gets a data source for the given set of reads. * + * @param argCollection arguments + * @param genomeLocParser parser + * @param refReader reader * @return A data source for the given set of reads. 
*/ private SAMDataSource createReadsDataSource(GATKArgumentCollection argCollection, GenomeLocParser genomeLocParser, IndexedFastaSequenceFile refReader) { DownsamplingMethod method = getDownsamplingMethod(); + // Synchronize the method back into the collection so that it shows up when + // interrogating for the downsample method during command line recreation. + setDownsamplingMethod(method); + if ( getWalkerBAQApplicationTime() == BAQ.ApplicationTime.FORBIDDEN && argCollection.BAQMode != BAQ.CalculationMode.OFF) throw new UserException.BadArgumentValue("baq", "Walker cannot accept BAQ'd base qualities, and yet BAQ mode " + argCollection.BAQMode + " was requested."); - SAMDataSource dataSource = new SAMDataSource( + return new SAMDataSource( samReaderIDs, genomeLocParser, argCollection.useOriginalBaseQualities, @@ -868,14 +765,12 @@ public class GenomeAnalysisEngine { refReader, argCollection.defaultBaseQualities, !argCollection.disableLowMemorySharding); - return dataSource; } /** * Opens a reference sequence file paired with an index. Only public for testing purposes * * @param refFile Handle to a reference sequence file. Non-null. - * @return A thread-safe file wrapper. */ public void setReferenceDataSource(File refFile) { this.referenceDataSource = new ReferenceDataSource(refFile); @@ -929,6 +824,26 @@ public class GenomeAnalysisEngine { return readsDataSource.getHeader(reader); } + /** + * Returns an ordered list of the unmerged SAM file headers known to this engine. 
+ * @return list of header for each input SAM file, in command line order + */ + public List getSAMFileHeaders() { + final List headers = new ArrayList(); + for ( final SAMReaderID id : getReadsDataSource().getReaderIDs() ) { + headers.add(getReadsDataSource().getHeader(id)); + } + return headers; + } + + /** + * Gets the master sequence dictionary for this GATK engine instance + * @return a never-null dictionary listing all of the contigs known to this engine instance + */ + public SAMSequenceDictionary getMasterSequenceDictionary() { + return getReferenceDataSource().getReference().getSequenceDictionary(); + } + /** * Returns data source object encapsulating all essential info and handlers used to traverse * reads; header merger, individual file readers etc can be accessed through the returned data source object. @@ -939,8 +854,6 @@ public class GenomeAnalysisEngine { return this.readsDataSource; } - - /** * Sets the collection of GATK main application arguments. * @@ -1027,140 +940,14 @@ public class GenomeAnalysisEngine { return readsDataSource == null ? 
null : readsDataSource.getCumulativeReadMetrics(); } - public SampleDataSource getSampleMetadata() { - return this.sampleDataSource; - } + // ------------------------------------------------------------------------------------- + // + // code for working with Samples database + // + // ------------------------------------------------------------------------------------- - /** - * Get a sample by its ID - * If an alias is passed in, return the main sample object - * @param id sample id - * @return sample Object with this ID - */ - public Sample getSampleById(String id) { - return sampleDataSource.getSampleById(id); - } - - /** - * Get the sample for a given read group - * Must first look up ID for read group - * @param readGroup of sample - * @return sample object with ID from the read group - */ - public Sample getSampleByReadGroup(SAMReadGroupRecord readGroup) { - return sampleDataSource.getSampleByReadGroup(readGroup); - } - - /** - * Get a sample for a given read - * Must first look up read group, and then sample ID for that read group - * @param read of sample - * @return sample object of this read - */ - public Sample getSampleByRead(SAMRecord read) { - return getSampleByReadGroup(read.getReadGroup()); - } - - /** - * Get number of sample objects - * @return size of samples map - */ - public int sampleCount() { - return sampleDataSource.sampleCount(); - } - - /** - * Return all samples with a given family ID - * Note that this isn't terribly efficient (linear) - it may be worth adding a new family ID data structure for this - * @param familyId family ID - * @return Samples with the given family ID - */ - public Set getFamily(String familyId) { - return sampleDataSource.getFamily(familyId); - } - - /** - * Returns all children of a given sample - * See note on the efficiency of getFamily() - since this depends on getFamily() it's also not efficient - * @param sample parent sample - * @return children of the given sample - */ - public Set getChildren(Sample 
sample) { - return sampleDataSource.getChildren(sample); - } - - /** - * Gets all the samples - * @return - */ - public Collection getSamples() { - return sampleDataSource.getSamples(); - } - - /** - * Takes a list of sample names and returns their corresponding sample objects - * - * @param sampleNameList List of sample names - * @return Corresponding set of samples - */ - public Set getSamples(Collection sampleNameList) { - return sampleDataSource.getSamples(sampleNameList); - } - - - /** - * Returns a set of samples that have any value (which could be null) for a given property - * @param key Property key - * @return Set of samples with the property - */ - public Set getSamplesWithProperty(String key) { - return sampleDataSource.getSamplesWithProperty(key); - } - - /** - * Returns a set of samples that have a property with a certain value - * Value must be a string for now - could add a similar method for matching any objects in the future - * - * @param key Property key - * @param value String property value - * @return Set of samples that match key and value - */ - public Set getSamplesWithProperty(String key, String value) { - return sampleDataSource.getSamplesWithProperty(key, value); - - } - - /** - * Returns a set of sample objects for the sample names in a variant context - * - * @param context Any variant context - * @return a set of the sample objects - */ - public Set getSamplesByVariantContext(VariantContext context) { - Set samples = new HashSet(); - for (String sampleName : context.getSampleNames()) { - samples.add(sampleDataSource.getOrCreateSample(sampleName)); - } - return samples; - } - - /** - * Returns all samples that were referenced in the SAM file - */ - public Set getSAMFileSamples() { - return sampleDataSource.getSAMFileSamples(); - } - - /** - * Return a subcontext restricted to samples with a given property key/value - * Gets the sample names from key/value and relies on VariantContext.subContextFromGenotypes for the filtering - * 
@param context VariantContext to filter - * @param key property key - * @param value property value (must be string) - * @return subcontext - */ - public VariantContext subContextFromSampleProperty(VariantContext context, String key, String value) { - return sampleDataSource.subContextFromSampleProperty(context, key, value); + public SampleDB getSampleDB() { + return this.sampleDB; } public Map getApproximateCommandLineArguments(Object... argumentProviders) { diff --git a/public/java/src/org/broadinstitute/sting/gatk/ReadMetrics.java b/public/java/src/org/broadinstitute/sting/gatk/ReadMetrics.java index 7cb615f7f..ceaa30f01 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/ReadMetrics.java +++ b/public/java/src/org/broadinstitute/sting/gatk/ReadMetrics.java @@ -30,6 +30,7 @@ import org.broadinstitute.sting.utils.exceptions.ReviewedStingException; import java.util.Collections; import java.util.HashMap; import java.util.Map; +import java.util.TreeMap; /** * Holds a bunch of basic information about the traversal. 
@@ -102,8 +103,12 @@ public class ReadMetrics implements Cloneable { counter.put(filter.getClass(), c + 1L); } - public Map getCountsByFilter() { - return Collections.unmodifiableMap(counter); + public Map getCountsByFilter() { + final TreeMap sortedCounts = new TreeMap(); + for(Map.Entry counterEntry: counter.entrySet()) { + sortedCounts.put(counterEntry.getKey().getSimpleName(),counterEntry.getValue()); + } + return sortedCounts; } /** diff --git a/public/java/src/org/broadinstitute/sting/gatk/arguments/DbsnpArgumentCollection.java b/public/java/src/org/broadinstitute/sting/gatk/arguments/DbsnpArgumentCollection.java index 2f4dd06e2..e0c2ce72a 100644 --- a/public/java/src/org/broadinstitute/sting/gatk/arguments/DbsnpArgumentCollection.java +++ b/public/java/src/org/broadinstitute/sting/gatk/arguments/DbsnpArgumentCollection.java @@ -29,13 +29,11 @@ package org.broadinstitute.sting.gatk.arguments; import org.broadinstitute.sting.commandline.Input; import org.broadinstitute.sting.commandline.RodBinding; import org.broadinstitute.sting.utils.variantcontext.VariantContext; -import org.simpleframework.xml.*; /** * @author ebanks * @version 1.0 */ -@Root public class DbsnpArgumentCollection { /** diff --git a/public/java/src/org/broadinstitute/sting/gatk/arguments/GATKArgumentCollection.java b/public/java/src/org/broadinstitute/sting/gatk/arguments/GATKArgumentCollection.java index fd39d46b0..8078a1ea4 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/arguments/GATKArgumentCollection.java +++ b/public/java/src/org/broadinstitute/sting/gatk/arguments/GATKArgumentCollection.java @@ -26,34 +26,26 @@ package org.broadinstitute.sting.gatk.arguments; import net.sf.samtools.SAMFileReader; +import org.broad.tribble.Feature; import org.broadinstitute.sting.commandline.Argument; import org.broadinstitute.sting.commandline.Hidden; import org.broadinstitute.sting.commandline.Input; +import org.broadinstitute.sting.commandline.IntervalBinding; import 
org.broadinstitute.sting.gatk.DownsampleType; import org.broadinstitute.sting.gatk.DownsamplingMethod; import org.broadinstitute.sting.gatk.phonehome.GATKRunReport; +import org.broadinstitute.sting.gatk.samples.PedigreeValidationType; import org.broadinstitute.sting.utils.baq.BAQ; -import org.broadinstitute.sting.utils.exceptions.ReviewedStingException; import org.broadinstitute.sting.utils.interval.IntervalMergingRule; import org.broadinstitute.sting.utils.interval.IntervalSetRule; -import org.simpleframework.xml.*; -import org.simpleframework.xml.core.Persister; -import org.simpleframework.xml.stream.Format; -import org.simpleframework.xml.stream.HyphenStyle; import java.io.File; -import java.io.InputStream; -import java.io.PrintStream; -import java.util.ArrayList; -import java.util.HashMap; -import java.util.List; -import java.util.Map; +import java.util.*; /** * @author aaron * @version 1.0 */ -@Root public class GATKArgumentCollection { /* our version number */ @@ -64,58 +56,58 @@ public class GATKArgumentCollection { public GATKArgumentCollection() { } - @ElementMap(entry = "analysis_argument", key = "key", attribute = true, inline = true, required = false) public Map walkerArgs = new HashMap(); // parameters and their defaults - @ElementList(required = false) @Input(fullName = "input_file", shortName = "I", doc = "SAM or BAM file(s)", required = false) public List samFiles = new ArrayList(); - // parameters and their defaults - @ElementList(required = false) - @Argument(fullName = "sample_metadata", shortName = "SM", doc = "Sample file(s) in JSON format", required = false) - public List sampleFiles = new ArrayList(); - - @Element(required = false) @Argument(fullName = "read_buffer_size", shortName = "rbs", doc="Number of reads per SAM file to buffer in memory", required = false) public Integer readBufferSize = null; - @Element(required = false) @Argument(fullName = "phone_home", shortName = "et", doc="What kind of GATK run report should we generate? 
Standard is the default, can be verbose or NO_ET so nothing is posted to the run repository", required = false) public GATKRunReport.PhoneHomeOption phoneHomeType = GATKRunReport.PhoneHomeOption.STANDARD; - @ElementList(required = false) - @Argument(fullName = "read_filter", shortName = "rf", doc = "Specify filtration criteria to apply to each read individually.", required = false) + @Argument(fullName = "read_filter", shortName = "rf", doc = "Specify filtration criteria to apply to each read individually", required = false) public List readFilters = new ArrayList(); - @ElementList(required = false) - @Input(fullName = "intervals", shortName = "L", doc = "A list of genomic intervals over which to operate. Can be explicitly specified on the command line or in a file.", required = false) - public List intervals = null; + /** + * Using this option one can instruct the GATK engine to traverse over only part of the genome. This argument can be specified multiple times. + * One may use samtools-style intervals either explicitly (e.g. -L chr1 or -L chr1:100-200) or listed in a file (e.g. -L myFile.intervals). + * Additionally, one may specify a rod file to traverse over the positions for which there is a record in the file (e.g. -L file.vcf). + */ + @Input(fullName = "intervals", shortName = "L", doc = "One or more genomic intervals over which to operate. Can be explicitly specified on the command line or in a file (including a rod file)", required = false) + public List> intervals = null; - @ElementList(required = false) - @Input(fullName = "excludeIntervals", shortName = "XL", doc = "A list of genomic intervals to exclude from processing. Can be explicitly specified on the command line or in a file.", required = false) - public List excludeIntervals = null; + /** + * Using this option one can instruct the GATK engine NOT to traverse over certain parts of the genome. This argument can be specified multiple times. 
+ * One may use samtools-style intervals either explicitly (e.g. -XL chr1 or -XL chr1:100-200) or listed in a file (e.g. -XL myFile.intervals). + * Additionally, one may specify a rod file to skip over the positions for which there is a record in the file (e.g. -XL file.vcf). + */ + @Input(fullName = "excludeIntervals", shortName = "XL", doc = "One or more genomic intervals to exclude from processing. Can be explicitly specified on the command line or in a file (including a rod file)", required = false) + public List> excludeIntervals = null; + + /** + * How should the intervals specified by multiple -L or -XL arguments be combined? Using this argument one can, for example, traverse over all of the positions + * for which there is a record in a VCF but just in chromosome 20 (-L chr20 -L file.vcf -isr INTERSECTION). + */ + @Argument(fullName = "interval_set_rule", shortName = "isr", doc = "Indicates the set merging approach the interval parser should use to combine the various -L or -XL inputs", required = false) + public IntervalSetRule intervalSetRule = IntervalSetRule.UNION; + + /** + * Should abutting (but not overlapping) intervals be treated as separate intervals? 
+ */ + @Argument(fullName = "interval_merging", shortName = "im", doc = "Indicates the interval merging rule we should use for abutting intervals", required = false) + public IntervalMergingRule intervalMerging = IntervalMergingRule.ALL; - @Element(required = false) @Input(fullName = "reference_sequence", shortName = "R", doc = "Reference sequence file", required = false) public File referenceFile = null; @Deprecated @Hidden - @ElementList(required = false) @Input(fullName = "rodBind", shortName = "B", doc = "Bindings for reference-ordered data, in the form :, ", required = false) public ArrayList RODBindings = new ArrayList(); - @Element(required = false) - @Argument(fullName = "rodToIntervalTrackName", shortName = "BTI", doc = "Indicates that the named track should be converted into an interval list, to drive the traversal", required = false) - public String RODToInterval = null; - - @Element(required = false) - @Argument(fullName = "BTI_merge_rule", shortName = "BTIMR", doc = "Indicates the merging approach the interval parser should use to combine the BTI track with other -L options", required = false) - public IntervalSetRule BTIMergeRule = IntervalSetRule.UNION; - - @Element(required = false) @Argument(fullName = "nonDeterministicRandomSeed", shortName = "ndrs", doc = "Makes the GATK behave non deterministically, that is, the random numbers generated will be different in every run", required = false) public boolean nonDeterministicRandomSeed = false; @@ -128,22 +120,19 @@ public class GATKArgumentCollection { private static DownsampleType DEFAULT_DOWNSAMPLING_TYPE = DownsampleType.BY_SAMPLE; private static int DEFAULT_DOWNSAMPLING_COVERAGE = 1000; - @Element(required = false) - @Argument(fullName = "downsampling_type", shortName="dt", doc="Type of reads downsampling to employ at a given locus. 
Reads will be selected randomly to be removed from the pile based on the method described here.", required = false) + @Argument(fullName = "downsampling_type", shortName="dt", doc="Type of reads downsampling to employ at a given locus. Reads will be selected randomly to be removed from the pile based on the method described here", required = false) public DownsampleType downsamplingType = null; - @Element(required = false) @Argument(fullName = "downsample_to_fraction", shortName = "dfrac", doc = "Fraction [0.0-1.0] of reads to downsample to", required = false) public Double downsampleFraction = null; - @Element(required = false) @Argument(fullName = "downsample_to_coverage", shortName = "dcov", doc = "Coverage [integer] to downsample to at any given locus; note that downsampled reads are randomly selected from all possible reads at a locus", required = false) public Integer downsampleCoverage = null; /** * Gets the downsampling method explicitly specified by the user. If the user didn't specify - * a default downsampling mechanism, return null. - * @return The explicitly specified downsampling mechanism, or null if none exists. + * a default downsampling mechanism, return the default. + * @return The explicitly specified downsampling mechanism, or the default if none exists. */ public DownsamplingMethod getDownsamplingMethod() { if(downsamplingType == null && downsampleFraction == null && downsampleCoverage == null) @@ -153,16 +142,26 @@ public class GATKArgumentCollection { return new DownsamplingMethod(downsamplingType,downsampleCoverage,downsampleFraction); } + /** + * Set the downsampling method stored in the argument collection so that it is read back out when interrogating the command line arguments. + * @param method The downsampling mechanism. 
+ */ + public void setDownsamplingMethod(DownsamplingMethod method) { + if (method == null) + throw new IllegalArgumentException("method is null"); + downsamplingType = method.type; + downsampleCoverage = method.toCoverage; + downsampleFraction = method.toFraction; + } + // -------------------------------------------------------------------------------------------------------------- // // BAQ arguments // // -------------------------------------------------------------------------------------------------------------- - @Element(required = false) @Argument(fullName = "baq", shortName="baq", doc="Type of BAQ calculation to apply in the engine", required = false) public BAQ.CalculationMode BAQMode = BAQ.CalculationMode.OFF; - @Element(required = false) @Argument(fullName = "baqGapOpenPenalty", shortName="baqGOP", doc="BAQ gap open penalty (Phred Scaled). Default value is 40. 30 is perhaps better for whole genome call sets", required = false) public double BAQGOP = BAQ.DEFAULT_GOP; @@ -171,7 +170,6 @@ public class GATKArgumentCollection { // performance log arguments // // -------------------------------------------------------------------------------------------------------------- - @Element(required = false) @Argument(fullName = "performanceLog", shortName="PF", doc="If provided, a GATK runtime performance log will be written to this file", required = false) public File performanceLog = null; @@ -184,67 +182,117 @@ public class GATKArgumentCollection { return new DownsamplingMethod(DEFAULT_DOWNSAMPLING_TYPE,DEFAULT_DOWNSAMPLING_COVERAGE,null); } - @Element(required = false) @Argument(fullName="useOriginalQualities", shortName = "OQ", doc = "If set, use the original base quality scores from the OQ tag when present instead of the standard scores", required=false) public Boolean useOriginalBaseQualities = false; @Argument(fullName="defaultBaseQualities", shortName = "DBQ", doc = "If reads are missing some or all base quality scores, this value will be used for all base 
quality scores", required=false) public byte defaultBaseQualities = -1; - @Element(required = false) @Argument(fullName = "validation_strictness", shortName = "S", doc = "How strict should we be with validation", required = false) public SAMFileReader.ValidationStringency strictnessLevel = SAMFileReader.ValidationStringency.SILENT; - @Element(required = false) @Argument(fullName = "unsafe", shortName = "U", doc = "If set, enables unsafe operations: nothing will be checked at runtime. For expert users only who know what they are doing. We do not support usage of this argument.", required = false) public ValidationExclusion.TYPE unsafe; - /** How many threads should be allocated to this analysis. */ - @Element(required = false) - @Argument(fullName = "num_threads", shortName = "nt", doc = "How many threads should be allocated to running this analysis.", required = false) + @Argument(fullName = "num_threads", shortName = "nt", doc = "How many threads should be allocated to running this analysis", required = false) public int numberOfThreads = 1; - /** What rule should we use when merging intervals */ - @Element(required = false) - @Argument(fullName = "interval_merging", shortName = "im", doc = "What interval merging rule should we use.", required = false) - public IntervalMergingRule intervalMerging = IntervalMergingRule.ALL; - - @ElementList(required = false) - @Input(fullName = "read_group_black_list", shortName="rgbl", doc="Filters out read groups matching : or a .txt file containing the filter strings one per line.", required = false) + @Input(fullName = "read_group_black_list", shortName="rgbl", doc="Filters out read groups matching : or a .txt file containing the filter strings one per line", required = false) public List readGroupBlackList = null; // -------------------------------------------------------------------------------------------------------------- // - // distributed GATK arguments + // PED (pedigree) support // // 
-------------------------------------------------------------------------------------------------------------- - @Element(required=false) - @Argument(fullName="processingTracker",shortName="C",doc="A lockable, shared file for coordinating distributed GATK runs",required=false) - @Hidden - public File processingTrackerFile = null; - @Element(required=false) - @Argument(fullName="restartProcessingTracker",shortName="RPT",doc="Should we delete the processing tracker file at startup?",required=false) - @Hidden - public boolean restartProcessingTracker = false; + /** + *

Reads PED file-formatted tabular text files describing meta-data about the samples being + * processed in the GATK.

+ * + * + * + *

The PED file is a white-space (space or tab) delimited file: the first six columns are mandatory:

+ * + *
    + *
  • Family ID
  • + *
  • Individual ID
  • + *
  • Paternal ID
  • + *
  • Maternal ID
  • + *
  • Sex (1=male; 2=female; other=unknown)
  • + *
  • Phenotype
  • + *
+ * + *

The IDs are alphanumeric: the combination of family and individual ID should uniquely identify a person. + * A PED file must have 1 and only 1 phenotype in the sixth column. The phenotype can be either a + * quantitative trait or an affection status column: GATK will automatically detect which type + * (i.e. based on whether a value other than 0, 1, 2 or the missing genotype code is observed).

+ * + *

If an individual's sex is unknown, then any character other than 1 or 2 can be used.

+ * + *

You can add a comment to a PED or MAP file by starting the line with a # character. The rest of that + * line will be ignored. Do not start any family IDs with this character therefore.

+ * + *

Affection status should be coded:

+ * + *
    + *
  • -9 missing
  • + *
  • 0 missing
  • + *
  • 1 unaffected
  • + *
  • 2 affected
  • + *
+ * + *

If any value outside of -9,0,1,2 is detected than the samples are assumed + * to phenotype values are interpreted as string phenotype values. In this case -9 uniquely + * represents the missing value.

+ * + *

Genotypes (column 7 onwards) cannot be specified to the GATK.

+ * + *

For example, here are two individuals (one row = one person):

+ * + *
+     *   FAM001  1  0 0  1  2
+     *   FAM001  2  0 0  1  2
+     * 
+ * + *

Each -ped argument can be tagged with NO_FAMILY_ID, NO_PARENTS, NO_SEX, NO_PHENOTYPE to + * tell the GATK PED parser that the corresponding fields are missing from the ped file.

+ * + *

Note that most GATK walkers do not use pedigree information. Walkers that require pedigree + * data should clearly indicate so in their arguments and will throw errors if required pedigree + * information is missing.

+ */ + @Argument(fullName="pedigree", shortName = "ped", doc="Pedigree files for samples",required=false) + public List pedigreeFiles = Collections.emptyList(); - @Element(required=false) - @Argument(fullName="processingTrackerStatusFile",shortName="CSF",doc="If provided, a detailed accounting of the state of the process tracker is written to this file. For debugging, only",required=false) - @Hidden - public File processingTrackerStatusFile = null; + /** + * Inline PED records (see -ped argument). Each -pedString STRING can contain one or more + * valid PED records (see -ped) separated by semi-colons. Supports all tags for each pedString + * as -ped supports + */ + @Argument(fullName="pedigreeString", shortName = "pedString", doc="Pedigree string for samples",required=false) + public List pedigreeStrings = Collections.emptyList(); - @Element(required=false) - @Argument(fullName="processingTrackerID",shortName="CID",doc="If provided, an integer ID (starting at 1) indicating a unique id for this process within the distributed GATK group",required=false) - @Hidden - public int processTrackerID = -1; + /** + * How strict should we be in parsing the PED files? + */ + @Argument(fullName="pedigreeValidationType", shortName = "pedValidationType", doc="How strict should we be in validating the pedigree information?",required=false) + public PedigreeValidationType pedigreeValidationType = PedigreeValidationType.STRICT; + + // -------------------------------------------------------------------------------------------------------------- + // + // BAM indexing and sharding arguments + // + // -------------------------------------------------------------------------------------------------------------- - @Element(required = false) @Argument(fullName="allow_intervals_with_unindexed_bam",doc="Allow interval processing with an unsupported BAM. NO INTEGRATION TESTS are available. 
Use at your own risk.",required=false) @Hidden public boolean allowIntervalsWithUnindexedBAM = false; - @Element(required = false) - @Argument(fullName="disable_experimental_low_memory_sharding",doc="Disable experimental low-memory sharding functionality.",required=false) + @Argument(fullName="disable_experimental_low_memory_sharding",doc="Disable experimental low-memory sharding functionality",required=false) public boolean disableLowMemorySharding = false; // -------------------------------------------------------------------------------------------------------------- @@ -253,69 +301,6 @@ public class GATKArgumentCollection { // // -------------------------------------------------------------------------------------------------------------- - /** - * marshal the data out to a object - * - * @param collection the GATKArgumentCollection to load into - * @param outputFile the file to write to - */ - public static void marshal(GATKArgumentCollection collection, String outputFile) { - Serializer serializer = new Persister(new Format(new HyphenStyle())); - File result = new File(outputFile); - try { - serializer.write(collection, result); - } catch (Exception e) { - throw new ReviewedStingException("Failed to marshal the data to the file " + outputFile, e); - } - } - - /** - * marshal the data out to a object - * - * @param collection the GATKArgumentCollection to load into - * @param outputFile the stream to write to - */ - public static void marshal(GATKArgumentCollection collection, PrintStream outputFile) { - Serializer serializer = new Persister(new Format(new HyphenStyle())); - try { - serializer.write(collection, outputFile); - } catch (Exception e) { - throw new ReviewedStingException("Failed to marshal the data to the file " + outputFile, e); - } - } - - /** - * unmashall the object from a configuration file - * - * @param filename the filename to marshal from - */ - public static GATKArgumentCollection unmarshal(String filename) { - Serializer serializer = 
new Persister(new Format(new HyphenStyle())); - File source = new File(filename); - try { - GATKArgumentCollection example = serializer.read(GATKArgumentCollection.class, source); - return example; - } catch (Exception e) { - throw new ReviewedStingException("Failed to marshal the data from file " + filename, e); - } - } - - /** - * unmashall the object from a configuration file - * - * @param file the inputstream to marshal from - */ - public static GATKArgumentCollection unmarshal(InputStream file) { - Serializer serializer = new Persister(new Format(new HyphenStyle())); - try { - GATKArgumentCollection example = serializer.read(GATKArgumentCollection.class, file); - return example; - } catch (Exception e) { - throw new ReviewedStingException("Failed to marshal the data from file " + file.toString(), e); - } - } - - /** * test equality between two arg collections. This function defines the statement: * "not fun to write" @@ -363,7 +348,7 @@ public class GATKArgumentCollection { if (!other.referenceFile.equals(this.referenceFile)) { return false; } - if (!other.intervals.equals(this.intervals)) { + if ((other.intervals == null && this.intervals != null) || !other.intervals.equals(this.intervals)) { return false; } if (!other.excludeIntervals.equals(this.excludeIntervals)) { @@ -386,39 +371,21 @@ public class GATKArgumentCollection { if (other.intervalMerging != this.intervalMerging) { return false; } - if ((other.RODToInterval == null && RODToInterval != null) || - (other.RODToInterval != null && !other.RODToInterval.equals(RODToInterval))) { - return false; - } if (other.phoneHomeType != this.phoneHomeType) { return false; } - if (BTIMergeRule != other.BTIMergeRule) + if (intervalSetRule != other.intervalSetRule) return false; - if ( BAQMode != other.BAQMode) return false; + if ( BAQMode != other.BAQMode ) return false; if ( BAQGOP != other.BAQGOP ) return false; if ((other.performanceLog == null && this.performanceLog != null) || (other.performanceLog != null && 
!other.performanceLog.equals(this.performanceLog))) return false; - if ((other.processingTrackerFile == null && this.processingTrackerFile != null) || - (other.processingTrackerFile != null && !other.processingTrackerFile.equals(this.processingTrackerFile))) - return false; - - if ((other.processingTrackerStatusFile == null && this.processingTrackerStatusFile != null) || - (other.processingTrackerStatusFile != null && !other.processingTrackerStatusFile.equals(this.processingTrackerStatusFile))) - return false; - - if ( restartProcessingTracker != other.restartProcessingTracker ) - return false; - - if ( processTrackerID != other.processTrackerID ) - return false; - if (allowIntervalsWithUnindexedBAM != other.allowIntervalsWithUnindexedBAM) return false; diff --git a/public/java/src/org/broadinstitute/sting/gatk/arguments/StandardVariantContextInputArgumentCollection.java b/public/java/src/org/broadinstitute/sting/gatk/arguments/StandardVariantContextInputArgumentCollection.java index 654770fe7..4c0257e6a 100644 --- a/public/java/src/org/broadinstitute/sting/gatk/arguments/StandardVariantContextInputArgumentCollection.java +++ b/public/java/src/org/broadinstitute/sting/gatk/arguments/StandardVariantContextInputArgumentCollection.java @@ -28,13 +28,11 @@ package org.broadinstitute.sting.gatk.arguments; import org.broadinstitute.sting.commandline.Input; import org.broadinstitute.sting.commandline.RodBinding; import org.broadinstitute.sting.utils.variantcontext.VariantContext; -import org.simpleframework.xml.Root; /** * @author ebanks * @version 1.0 */ -@Root public class StandardVariantContextInputArgumentCollection { /** diff --git a/public/java/src/org/broadinstitute/sting/gatk/arguments/ValidationExclusion.java b/public/java/src/org/broadinstitute/sting/gatk/arguments/ValidationExclusion.java index 0d5a23f1d..577f7929a 100644 --- a/public/java/src/org/broadinstitute/sting/gatk/arguments/ValidationExclusion.java +++ 
b/public/java/src/org/broadinstitute/sting/gatk/arguments/ValidationExclusion.java @@ -37,7 +37,6 @@ public class ValidationExclusion { public enum TYPE { ALLOW_UNINDEXED_BAM, // allow bam files that do not have an index; we'll traverse them using monolithic shard - ALLOW_EMPTY_INTERVAL_LIST, // allow the user to pass in an empty interval list ALLOW_UNSET_BAM_SORT_ORDER, // assume that the bam is sorted, even if the SO (sort-order) flag is not set NO_READ_ORDER_VERIFICATION, // do not validate that the reads are in order as we take them from the bam file ALLOW_SEQ_DICT_INCOMPATIBILITY, // allow dangerous, but not fatal, sequence dictionary incompabilities diff --git a/public/java/src/org/broadinstitute/sting/gatk/contexts/AlignmentContext.java b/public/java/src/org/broadinstitute/sting/gatk/contexts/AlignmentContext.java index 17e4a0743..57416d111 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/contexts/AlignmentContext.java +++ b/public/java/src/org/broadinstitute/sting/gatk/contexts/AlignmentContext.java @@ -25,12 +25,12 @@ package org.broadinstitute.sting.gatk.contexts; -import net.sf.samtools.SAMRecord; import org.broadinstitute.sting.utils.GenomeLoc; import org.broadinstitute.sting.utils.HasGenomeLocation; import org.broadinstitute.sting.utils.exceptions.ReviewedStingException; import org.broadinstitute.sting.utils.pileup.ReadBackedExtendedEventPileup; import org.broadinstitute.sting.utils.pileup.ReadBackedPileup; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; import java.util.List; @@ -130,7 +130,7 @@ public class AlignmentContext implements HasGenomeLocation { */ @Deprecated //todo: unsafe and tailored for current usage only; both pileups can be null or worse, bot can be not null in theory - public List getReads() { return ( basePileup.getReads() ); } + public List getReads() { return ( basePileup.getReads() ); } /** * Are there any reads associated with this locus? 
@@ -138,7 +138,7 @@ public class AlignmentContext implements HasGenomeLocation { * @return */ public boolean hasReads() { - return basePileup != null && basePileup.size() > 0 ; + return basePileup != null && basePileup.getNumberOfElements() > 0 ; } /** @@ -146,7 +146,7 @@ public class AlignmentContext implements HasGenomeLocation { * @return */ public int size() { - return basePileup.size(); + return basePileup.getNumberOfElements(); } /** diff --git a/public/java/src/org/broadinstitute/sting/gatk/contexts/AlignmentContextUtils.java b/public/java/src/org/broadinstitute/sting/gatk/contexts/AlignmentContextUtils.java index 1f9a7d705..4e75f3ddb 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/contexts/AlignmentContextUtils.java +++ b/public/java/src/org/broadinstitute/sting/gatk/contexts/AlignmentContextUtils.java @@ -26,7 +26,6 @@ package org.broadinstitute.sting.gatk.contexts; import net.sf.samtools.SAMReadGroupRecord; -import org.broadinstitute.sting.gatk.datasources.sample.Sample; import org.broadinstitute.sting.utils.GenomeLoc; import org.broadinstitute.sting.utils.exceptions.ReviewedStingException; import org.broadinstitute.sting.utils.exceptions.UserException; @@ -76,14 +75,6 @@ public class AlignmentContextUtils { return splitContextBySampleName(context, null); } - public static Map splitContextBySample(AlignmentContext context) { - Map m = new HashMap(); - for ( Map.Entry entry : splitContextBySampleName(context, null).entrySet() ) { - m.put(new Sample(entry.getKey()), entry.getValue()); - } - return m; - } - /** * Splits the given AlignmentContext into a StratifiedAlignmentContext per sample, but referencd by sample name instead * of sample object. 
@@ -97,11 +88,11 @@ public class AlignmentContextUtils { GenomeLoc loc = context.getLocation(); HashMap contexts = new HashMap(); - for(String sample: context.getPileup().getSampleNames()) { - ReadBackedPileup pileupBySample = context.getPileup().getPileupForSampleName(sample); + for(String sample: context.getPileup().getSamples()) { + ReadBackedPileup pileupBySample = context.getPileup().getPileupForSample(sample); // Don't add empty pileups to the split context. - if(pileupBySample.size() == 0) + if(pileupBySample.getNumberOfElements() == 0) continue; if(sample != null) diff --git a/public/java/src/org/broadinstitute/sting/gatk/datasources/providers/AllLocusView.java b/public/java/src/org/broadinstitute/sting/gatk/datasources/providers/AllLocusView.java index e92599494..a6731ee18 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/datasources/providers/AllLocusView.java +++ b/public/java/src/org/broadinstitute/sting/gatk/datasources/providers/AllLocusView.java @@ -1,10 +1,10 @@ package org.broadinstitute.sting.gatk.datasources.providers; -import net.sf.samtools.SAMRecord; import org.broadinstitute.sting.gatk.contexts.AlignmentContext; import org.broadinstitute.sting.gatk.iterators.GenomeLocusIterator; import org.broadinstitute.sting.utils.GenomeLoc; import org.broadinstitute.sting.utils.pileup.ReadBackedPileupImpl; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; import java.util.Collections; import java.util.List; @@ -132,7 +132,7 @@ public class AllLocusView extends LocusView { * @param site Site at which to create the blank locus context. * @return empty context. 
*/ - private final static List EMPTY_PILEUP_READS = Collections.emptyList(); + private final static List EMPTY_PILEUP_READS = Collections.emptyList(); private final static List EMPTY_PILEUP_OFFSETS = Collections.emptyList(); private AlignmentContext createEmptyLocus( GenomeLoc site ) { return new AlignmentContext(site,new ReadBackedPileupImpl(site, EMPTY_PILEUP_READS, EMPTY_PILEUP_OFFSETS)); diff --git a/public/java/src/org/broadinstitute/sting/gatk/datasources/reads/LowMemoryIntervalSharder.java b/public/java/src/org/broadinstitute/sting/gatk/datasources/reads/LowMemoryIntervalSharder.java index ba6321121..bf5f33dc3 100644 --- a/public/java/src/org/broadinstitute/sting/gatk/datasources/reads/LowMemoryIntervalSharder.java +++ b/public/java/src/org/broadinstitute/sting/gatk/datasources/reads/LowMemoryIntervalSharder.java @@ -59,7 +59,7 @@ public class LowMemoryIntervalSharder implements Iterator { */ public FilePointer next() { FilePointer current = wrappedIterator.next(); - while(wrappedIterator.hasNext() && current.minus(wrappedIterator.peek()) == 0) + while(wrappedIterator.hasNext() && current.isRegionUnmapped == wrappedIterator.peek().isRegionUnmapped && current.minus(wrappedIterator.peek()) == 0) current = current.combine(parser,wrappedIterator.next()); return current; } diff --git a/public/java/src/org/broadinstitute/sting/gatk/datasources/reads/SAMDataSource.java b/public/java/src/org/broadinstitute/sting/gatk/datasources/reads/SAMDataSource.java index 572970349..8452aadfd 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/datasources/reads/SAMDataSource.java +++ b/public/java/src/org/broadinstitute/sting/gatk/datasources/reads/SAMDataSource.java @@ -43,6 +43,7 @@ import org.broadinstitute.sting.utils.baq.BAQ; import org.broadinstitute.sting.utils.baq.BAQSamIterator; import org.broadinstitute.sting.utils.exceptions.ReviewedStingException; import org.broadinstitute.sting.utils.exceptions.UserException; +import 
org.broadinstitute.sting.utils.sam.GATKSamRecordFactory; import java.io.File; import java.lang.reflect.InvocationTargetException; @@ -57,6 +58,8 @@ import java.util.*; * Converts shards to SAM iterators over the specified region */ public class SAMDataSource { + final private static GATKSamRecordFactory factory = new GATKSamRecordFactory(); + /** Backing support for reads. */ protected final ReadProperties readProperties; @@ -235,6 +238,12 @@ public class SAMDataSource { for(SAMFileReader reader: readers.values()) { // Get the sort order, forcing it to coordinate if unsorted. SAMFileHeader header = reader.getFileHeader(); + + if ( header.getReadGroups().isEmpty() ) { + throw new UserException.MalformedBAM(readers.getReaderID(reader).samFile, + "SAM file doesn't have any read groups defined in the header. The GATK no longer supports SAM files without read groups"); + } + SAMFileHeader.SortOrder sortOrder = header.getSortOrder() != SAMFileHeader.SortOrder.unsorted ? header.getSortOrder() : SAMFileHeader.SortOrder.coordinate; // Validate that all input files are sorted in the same order. 
@@ -638,7 +647,9 @@ public class SAMDataSource { BAQ.QualityMode qmode, IndexedFastaSequenceFile refReader, byte defaultBaseQualities) { - wrappedIterator = new ReadFormattingIterator(wrappedIterator, useOriginalBaseQualities, defaultBaseQualities); + if ( useOriginalBaseQualities || defaultBaseQualities >= 0 ) + // only wrap if we are replacing the original qualitiies or using a default base quality + wrappedIterator = new ReadFormattingIterator(wrappedIterator, useOriginalBaseQualities, defaultBaseQualities); // NOTE: this (and other filtering) should be done before on-the-fly sorting // as there is no reason to sort something that we will end of throwing away @@ -750,6 +761,7 @@ public class SAMDataSource { public SAMReaders(Collection readerIDs, SAMFileReader.ValidationStringency validationStringency) { for(SAMReaderID readerID: readerIDs) { SAMFileReader reader = new SAMFileReader(readerID.samFile); + reader.setSAMRecordFactory(factory); reader.enableFileSource(true); reader.enableIndexMemoryMapping(false); if(!enableLowMemorySharding) diff --git a/public/java/src/org/broadinstitute/sting/gatk/datasources/reads/utilities/FindLargeShards.java b/public/java/src/org/broadinstitute/sting/gatk/datasources/reads/utilities/FindLargeShards.java index 24d8bc6c5..673df6dfa 100644 --- a/public/java/src/org/broadinstitute/sting/gatk/datasources/reads/utilities/FindLargeShards.java +++ b/public/java/src/org/broadinstitute/sting/gatk/datasources/reads/utilities/FindLargeShards.java @@ -97,7 +97,7 @@ public class FindLargeShards extends CommandLineProgram { // intervals GenomeLocSortedSet intervalSortedSet = null; if(intervals != null) - intervalSortedSet = IntervalUtils.sortAndMergeIntervals(genomeLocParser, IntervalUtils.parseIntervalArguments(genomeLocParser, intervals, true), IntervalMergingRule.ALL); + intervalSortedSet = IntervalUtils.sortAndMergeIntervals(genomeLocParser, IntervalUtils.parseIntervalArguments(genomeLocParser, intervals), IntervalMergingRule.ALL); else 
{ intervalSortedSet = new GenomeLocSortedSet(genomeLocParser); for(SAMSequenceRecord entry: refReader.getSequenceDictionary().getSequences()) diff --git a/public/java/src/org/broadinstitute/sting/gatk/datasources/sample/PropertyDefinition.java b/public/java/src/org/broadinstitute/sting/gatk/datasources/sample/PropertyDefinition.java deleted file mode 100644 index 433e0af40..000000000 --- a/public/java/src/org/broadinstitute/sting/gatk/datasources/sample/PropertyDefinition.java +++ /dev/null @@ -1,30 +0,0 @@ -package org.broadinstitute.sting.gatk.datasources.sample; - -/** - * Created by IntelliJ IDEA. - * User: brett - * Date: Aug 12, 2010 - * Time: 2:09:16 PM - */ -public class PropertyDefinition { - - String property; - - String[] values; - - public String getProperty() { - return property; - } - - public void setProperty(String property) { - this.property = property; - } - - public String[] getValues() { - return values; - } - - public void setValues(String[] values) { - this.values = values; - } -} \ No newline at end of file diff --git a/public/java/src/org/broadinstitute/sting/gatk/datasources/sample/Sample.java b/public/java/src/org/broadinstitute/sting/gatk/datasources/sample/Sample.java deleted file mode 100644 index ca8756684..000000000 --- a/public/java/src/org/broadinstitute/sting/gatk/datasources/sample/Sample.java +++ /dev/null @@ -1,203 +0,0 @@ -package org.broadinstitute.sting.gatk.datasources.sample; - - -import org.broadinstitute.sting.utils.exceptions.StingException; - -import java.util.Collections; -import java.util.HashMap; -import java.util.Map; - -/** - * Created by IntelliJ IDEA. 
- * User: brett - * Date: Jul 26, 2010 - * Time: 3:31:38 PM - */ -public class Sample implements java.io.Serializable { - - private final String id; - - private boolean hasSampleFileEntry = false; // true if this sample has an entry in a sample file - - private boolean hasSAMFileEntry = false; // true if this sample has an entry in the SAM file - - private HashMap properties = new HashMap(); - - private HashMap relationships = new HashMap(); - - public enum Gender { - MALE, - FEMALE, - UNKNOWN - } - - public Sample(String id) { -/* if (id == null) { - throw new StingException("Error creating sample: sample ID cannot be null"); - }*/ - this.id = id; - } - - public String getId() { - return this.id; - } - - public Map getProperties() { - return properties; - } - - public void setProperties(Map properties) { - this.properties = (HashMap) properties; - } - - public Map getRelationships() { - return Collections.unmodifiableMap(this.relationships); - } - - public void setSampleFileEntry(boolean value) { - this.hasSampleFileEntry = value; - } - - public boolean hasSAMFileEntry() { - return this.hasSAMFileEntry; - } - - public void setSAMFileEntry(boolean value) { - this.hasSAMFileEntry = value; - } - - public boolean hasSampleFileEntry() { - return this.hasSampleFileEntry; - } - - /** - * Get one property - * @param key key of property - * @return value of property as generic object - */ - public Object getProperty(String key) { - return properties.get(key); - } - - /** - * Set a property - * If property already exists, it is overwritten - * @param key key of property - * @param value object to be stored in properties array - */ - public void setProperty(String key, Object value) { - - if (relationships.containsKey(key)) { - throw new StingException("The same key cannot exist as a property and a relationship"); - } - - if (key.equals("gender") && value.getClass() != Gender.class) { - throw new StingException("'gender' property must be of type Sample.Gender"); - } - - if 
(key.equals("population") && value.getClass() != String.class) { - throw new StingException("'population' property must be of type String"); - } - - properties.put(key, value); - } - - /** - * Get one relationship - * @param key of relationship - * @return Sample object that this relationship points to - */ - public Sample getRelationship(String key) { - return relationships.get(key); - } - - /** - * Set one relationship - * If already set, it is overwritten - * @param key key of the relationship - * @param value Sample object this relationship points to - */ - public void setRelationship(String key, Sample value) { - if (properties.containsKey(key)) { - throw new StingException("The same key cannot exist as a property and a relationship"); - } - relationships.put(key, value); - } - - /** - * Get the sample's mother - * @return sample object with relationship mother, if exists, or null - */ - public Sample getMother() { - return getRelationship("mother"); - } - - /** - * Get the sample's father - * @return sample object with relationship father, if exists, or null - */ - public Sample getFather() { - return getRelationship("father"); - } - - /** - * Get gender of the sample - * @return property of key "gender" - must be of type Gender - */ - public Gender getGender() { - return (Gender) properties.get("gender"); - } - - public String getPopulation() { - return (String) properties.get("population"); - } - - public String getFamilyId() { - return (String) properties.get("familyId"); - } - - /** - * @return True if sample is male, false if female, unknown, or null - */ - public boolean isMale() { - return properties.get("gender") == Gender.MALE; - } - - /** - * @return True if sample is female, false if male, unknown or null - */ - public boolean isFemale() { - return properties.get("gender") == Gender.MALE; - } - - /** - * - * @param key property key - * @return true if sample has this property (even if its value is null) - */ - public boolean hasProperty(String key) 
{ - return properties.containsKey(key); - } - - @Override - public boolean equals(Object o) { - if (this == o) return true; - if (o == null || getClass() != o.getClass()) return false; - - Sample sample = (Sample) o; - - if (hasSAMFileEntry != sample.hasSAMFileEntry) return false; - if (hasSampleFileEntry != sample.hasSampleFileEntry) return false; - if (id != null ? !id.equals(sample.id) : sample.id != null) return false; - if (properties != null ? !properties.equals(sample.properties) : sample.properties != null) return false; - if (relationships != null ? !relationships.equals(sample.relationships) : sample.relationships != null) - return false; - - return true; - } - - @Override - public int hashCode() { - return id != null ? id.hashCode() : "".hashCode(); - } -} diff --git a/public/java/src/org/broadinstitute/sting/gatk/datasources/sample/SampleAlias.java b/public/java/src/org/broadinstitute/sting/gatk/datasources/sample/SampleAlias.java deleted file mode 100644 index ce749cb83..000000000 --- a/public/java/src/org/broadinstitute/sting/gatk/datasources/sample/SampleAlias.java +++ /dev/null @@ -1,31 +0,0 @@ -package org.broadinstitute.sting.gatk.datasources.sample; - -/** - * Created by IntelliJ IDEA. 
- * User: brett - * Date: Aug 13, 2010 - * Time: 5:13:46 PM - */ -public class SampleAlias { - - String mainId; - - String[] otherIds; - - public String getMainId() { - return mainId; - } - - public void setMainId(String mainId) { - this.mainId = mainId; - } - - public String[] getOtherIds() { - return otherIds; - } - - public void setOtherIds(String[] otherIds) { - this.otherIds = otherIds; - } - -} diff --git a/public/java/src/org/broadinstitute/sting/gatk/datasources/sample/SampleDataSource.java b/public/java/src/org/broadinstitute/sting/gatk/datasources/sample/SampleDataSource.java deleted file mode 100644 index 067bf3f72..000000000 --- a/public/java/src/org/broadinstitute/sting/gatk/datasources/sample/SampleDataSource.java +++ /dev/null @@ -1,590 +0,0 @@ -package org.broadinstitute.sting.gatk.datasources.sample; - -import net.sf.samtools.SAMFileHeader; -import net.sf.samtools.SAMReadGroupRecord; -import net.sf.samtools.SAMRecord; -import org.broadinstitute.sting.utils.SampleUtils; -import org.broadinstitute.sting.utils.exceptions.StingException; -import org.broadinstitute.sting.utils.variantcontext.Genotype; -import org.broadinstitute.sting.utils.variantcontext.VariantContext; -import org.yaml.snakeyaml.TypeDescription; -import org.yaml.snakeyaml.Yaml; -import org.yaml.snakeyaml.constructor.Constructor; - -import java.io.BufferedReader; -import java.io.File; -import java.io.FileReader; -import java.io.IOException; -import java.util.*; - -/** - * Created by IntelliJ IDEA. - * User: brett - * Date: Jul 26, 2010 - * Time: 3:30:09 PM - * - * This class stores and manages sample metadata. This data is encoded in a sample file, which can be included - * in the GATK by the "--samples" argument. This class reads and parses those files. - * - * Although there are a set of public methods for accessing sample data, they aren't used by walkers - they are really - * only used by GenomeAnalysisEngine. An instance of GenomeAnalysisEngine has one SampleDataSource. 
When a walker - * wants to access sample data, it asks GenomeAnalysis to fetch this data from its SampleDataSource. - * - */ -public class SampleDataSource { - - /** - * SAMFileHeader that has been created for this analysis. - */ - private SAMFileHeader header; - - /** - * This is where Sample objects are stored. Samples are usually accessed by their ID, which is unique, so - * this is stored as a HashMap. - */ - private final HashMap samples = new HashMap(); - - /** - * Samples can have "aliases", because sometimes the same sample is referenced by different IDs in different - * datasets. If this is the case, one ID is the "primary ID" and others are "aliases". - * - * This maps ID => primary ID for all samples ID strings - both primary IDs and aliases. - */ - private HashMap sampleAliases = new HashMap(); - - /** - * While loading sample files, we must be aware of "special" properties and relationships that are always allowed - */ - public static final String[] specialProperties = new String[] {"familyId", "population", "gender"}; - public static final String[] specialRelationships = new String[] {"mother", "father"}; - - /** - * Constructor takes both a SAM header and sample files because the two must be integrated. 
- * @param header SAMFileHeader that has been created for this analysis - * @param sampleFiles Sample files that were included on the command line - */ - public SampleDataSource(SAMFileHeader header, List sampleFiles) { - this(); - this.header = header; - // create empty sample object for each sample referenced in the SAM header - for (String sampleName : SampleUtils.getSAMFileSamples(header)) { - if (!hasSample(sampleName)) { - Sample newSample = new Sample(sampleName); - newSample.setSAMFileEntry(true); - samples.put(sampleName, newSample); - } - } - - // add files consecutively - if (sampleFiles != null) { - for (File file : sampleFiles) { - addFile(file); - } - } - } - - public SampleDataSource() { - samples.put(null, new Sample(null)); - } - - /** - * Hallucinates sample objects for all the samples in the SAM file and stores them - */ - public void addSamplesFromSAMHeader(SAMFileHeader header) { - for (String sampleName : SampleUtils.getSAMFileSamples(header)) { - if (!hasSample(sampleName)) { - Sample newSample = new Sample(sampleName); - newSample.setSAMFileEntry(true); - samples.put(sampleName, newSample); - } - } - } - - /** - * Parse one sample file and integrate it with samples that are already there - * Fail quickly if we find any errors in the file - */ - public void addFile(File sampleFile) { - - BufferedReader reader; - try { - reader = new BufferedReader(new FileReader(sampleFile)); - } - catch (IOException e) { - throw new StingException("Could not open sample file " + sampleFile.getAbsolutePath(), e); - } - - // set up YAML reader - a "Constructor" creates java object from YAML and "Loader" loads the file - Constructor con = new Constructor(SampleFileParser.class); - TypeDescription desc = new TypeDescription(SampleFileParser.class); - desc.putListPropertyType("propertyDefinitions", PropertyDefinition.class); - desc.putListPropertyType("sampleAliases", SampleAlias.class); - con.addTypeDescription(desc); - Yaml yaml = new Yaml(con); - - // 
SampleFileParser stores an object representation of a sample file - this is what we'll parse - SampleFileParser parser; - try { - parser = (SampleFileParser) yaml.load(reader); - } - catch (Exception e) { - throw new StingException("There was a syntactic error with the YAML in sample file " + sampleFile.getAbsolutePath(), e); - } - - // check to see which validation options were built into the file - boolean restrictProperties = parser.getAllowedProperties() != null; - boolean restrictRelationships = parser.getAllowedRelationships() != null; - boolean restrictPropertyValues = parser.getPropertyDefinitions() != null; - - // propertyValues stores the values that are allowed for a given property - HashMap propertyValues = null; - if (restrictPropertyValues) { - propertyValues = new HashMap(); - for (PropertyDefinition def : parser.getPropertyDefinitions()) { - HashSet set = new HashSet(); - for (String value : def.getValues()) { - set.add(value); - } - propertyValues.put(def.getProperty(), set); - } - } - - // make sure the aliases are valid - validateAliases(parser); - - // loop through each sample in the file - a SampleParser stores an object that will become a Sample - for (SampleParser sampleParser : parser.getSamples()) { - - try { - // step 1: add the sample if it doesn't already exist - Sample sample = getSampleById(sampleParser.getId()); - if (sample == null) { - sample = new Sample(sampleParser.getId()); - } - addSample(sample); - sample.setSampleFileEntry(true); - - // step 2: add the properties - if (sampleParser.getProperties() != null) { - for (String property : sampleParser.getProperties().keySet()) { - - // check that property is allowed - if (restrictProperties) { - if (!isPropertyValid(property, parser.getAllowedProperties())) { - throw new StingException(property + " is an invalid property. 
It is not included in the list " + - "of allowed properties."); - } - } - - // next check that the value is allowed - if (restrictPropertyValues) { - if (!isValueAllowed(property, sampleParser.getProperties().get(property), propertyValues)) { - throw new StingException("The value of property '" + property + "' is invalid. " + - "It is not included in the list of allowed values for this property."); - } - } - - // next check that there isn't already a conflicting property there - if (sample.getProperty(property) != null && - sample.getProperty(property) != sampleParser.getProperties().get(property)) - { - throw new StingException(property + " is a conflicting property!"); - } - - // checks are passed - now add the property! - saveProperty(sample, property, sampleParser.getProperties().get(property)); - } - } - - // step 3: add the relationships - if (sampleParser.getRelationships() != null) { - for (String relationship : sampleParser.getRelationships().keySet()) { - String relativeId = sampleParser.getRelationships().get(relationship); - if (relativeId == null) { - throw new StingException("The relationship cannot be null"); - } - - // first check that it's not invalid - if (restrictRelationships) { - if (!isRelationshipValid(relationship, parser.getAllowedRelationships())) { - throw new StingException(relationship + " is an invalid relationship"); - } - } - - // next check that there isn't already a conflicting property there - if (sample.getRelationship(relationship) != null) { - if (sample.getRelationship(relationship).getId() != sampleParser.getProperties().get(relationship)) { - throw new StingException(relationship + " is a conflicting relationship!"); - } - // if the relationship is already set - and consistent with what we're reading now - no need to continue - else { - continue; - } - } - - // checks are passed - now save the relationship - saveRelationship(sample, relationship, relativeId); - } - } - } catch (Exception e) { - throw new StingException("An 
error occurred while loading this sample from the sample file: " + - sampleParser.getId(), e); - } - } - - } - - private boolean isValueAllowed(String key, Object value, HashMap valuesList) { - - // if the property values weren't specified for this property, then any value is okay - if (!valuesList.containsKey(key)) { - return true; - } - - // if this property has enumerated values, it must be a string - else if (value.getClass() != String.class) - return false; - - // is the value specified or not? - else if (!valuesList.get(key).contains(value)) - return false; - - return true; - } - - /** - * Makes sure that the aliases are valid - * Checks that 1) no string is used as both a main ID and an alias; - * 2) no alias is used more than once - * @param parser - */ - private void validateAliases(SampleFileParser parser) { - - // no aliases sure validate - if (parser.getSampleAliases() == null) - return; - - HashSet mainIds = new HashSet(); - HashSet otherIds = new HashSet(); - - for (SampleAlias sampleAlias : parser.getSampleAliases()) { - mainIds.add(sampleAlias.getMainId()); - for (String otherId : sampleAlias.getOtherIds()) { - if (mainIds.contains(otherId)) - throw new StingException(String.format("The aliases in your sample file are invalid - the alias %s cannot " + - "be both a main ID and an other ID", otherId)); - - if (!otherIds.add(otherId)) - throw new StingException(String.format("The aliases in your sample file are invalid - %s is listed as an " + - "alias more than once.", otherId)); - } - } - } - - private boolean isPropertyValid(String property, String[] allowedProperties) { - - // is it a special property that is always allowed? - for (String allowedProperty : specialProperties) { - if (property.equals(allowedProperty)) - return true; - } - - // is it in the allowed properties list? 
- for (String allowedProperty : allowedProperties) { - if (property.equals(allowedProperty)) - return true; - } - - return false; - } - - private boolean isRelationshipValid(String relationship, String[] allowedRelationships) { - - // is it a special relationship that is always allowed? - for (String allowedRelationship : specialRelationships) { - if (relationship.equals(allowedRelationship)) - return true; - } - - // is it in the allowed properties list? - for (String allowedRelationship : allowedRelationships) { - if (relationship.equals(allowedRelationship)) - return true; - } - - return false; - } - - /** - * Saves a property as the correct type - * @param key property key - * @param value property value, as read from YAML parser - * @return property value to be stored - */ - private void saveProperty(Sample sample, String key, Object value) { - - // convert gender to the right type, if it was stored as a String - if (key.equals("gender")) { - if (((String) value).toLowerCase().equals("male")) { - value = Sample.Gender.MALE; - } - else if (((String) value).toLowerCase().equals("female")) { - value = Sample.Gender.FEMALE; - } - else if (((String) value).toLowerCase().equals("unknown")) { - value = Sample.Gender.UNKNOWN; - } - else if (value != null) { - throw new StingException("'gender' property must be male, female, or unknown."); - } - } - try { - sample.setProperty(key, value); - } - catch (Exception e) { - throw new StingException("Could not save property " + key, e); - } - } - - /** - * Saves a relationship as the correct type - * @param key relationship key - * @param relativeId sample ID string of the relative - * @return relationship value to be stored - */ - private void saveRelationship(Sample sample, String key, String relativeId) { - - // get the reference that we'll store as the value - Sample relative = getSampleById(relativeId); - - // create sample object for the relative, if necessary - if (relative == null) { - relative = new 
Sample(relativeId); - addSample(relative); - } - sample.setRelationship(key, relative); - } - - - - /** - * Filter a sample name in case it is an alias - * @param sampleId to be filtered - * @return ID of sample that stores data for this alias - */ - private String aliasFilter(String sampleId) { - if (!sampleAliases.containsKey(sampleId)) - return sampleId; - else - return sampleAliases.get(sampleId); - } - - /** - * Add a sample to the collection - * @param sample to be added - */ - private void addSample(Sample sample) { - samples.put(sample.getId(), sample); - } - - /** - * Check if sample with this ID exists - * Note that this will return true if name passed in is an alias - * @param id ID of sample to be checked - * @return true if sample exists; false if not - */ - public boolean hasSample(String id) { - return samples.get(aliasFilter(id)) != null; - } - - /** - * Get a sample by its ID - * If an alias is passed in, return the main sample object - * @param id - * @return sample Object with this ID - */ - public Sample getSampleById(String id) { - return samples.get(aliasFilter(id)); - } - - /** - * Get the sample for a given read group - * Must first look up ID for read group - * @param readGroup of sample - * @return sample object with ID from the read group - */ - public Sample getSampleByReadGroup(SAMReadGroupRecord readGroup) { - String nameFromReadGroup = readGroup.getSample(); - return getSampleById(nameFromReadGroup); - } - - /** - * Get a sample for a given read - * Must first look up read group, and then sample ID for that read group - * @param read of sample - * @return sample object of this read - */ - public Sample getSampleByRead(SAMRecord read) { - return getSampleByReadGroup(read.getReadGroup()); - } - - /** - * Get number of sample objects - * @return size of samples map - */ - public int sampleCount() { - return samples.size(); - } - - /** - * Return all samples with a given family ID - * Note that this isn't terribly efficient (linear) - it 
may be worth adding a new family ID data structure for this - * @param familyId - * @return - */ - public Set getFamily(String familyId) { - HashSet familyMembers = new HashSet(); - - for (Sample sample : samples.values()) { - if (sample.getFamilyId() != null) { - if (sample.getFamilyId().equals(familyId)) - familyMembers.add(sample); - } - } - return familyMembers; - } - - /** - * Returns all children of a given sample - * See note on the efficiency of getFamily() - since this depends on getFamily() it's also not efficient - * @param sample - * @return - */ - public Set getChildren(Sample sample) { - HashSet children = new HashSet(); - for (Sample familyMember : getFamily(sample.getFamilyId())) { - if (familyMember.getMother() == sample || familyMember.getFather() == sample) { - children.add(familyMember); - } - } - return children; - } - - public Set getSamples() { - HashSet set = new HashSet(); - set.addAll(samples.values()); - return set; - } - - /** - * Takes a collection of sample names and returns their corresponding sample objects - * Note that, since a set is returned, if you pass in a list with duplicates names there will not be any duplicates in the returned set - * @param sampleNameList Set of sample names - * @return Corresponding set of samples - */ - public Set getSamples(Collection sampleNameList) { - HashSet samples = new HashSet(); - for (String name : sampleNameList) { - try { - samples.add(getSampleById(name)); - } - catch (Exception e) { - throw new StingException("Could not get sample with the following ID: " + name, e); - } - } - return samples; - } - - /** - * Returns a set of samples that have any value (which could be null) for a given property - * @param key Property key - * @return Set of samples with the property - */ - public Set getSamplesWithProperty(String key) { - HashSet toReturn = new HashSet(); - for (Sample s : samples.values()) { - if (s.hasProperty(key)) - toReturn.add(s); - } - return toReturn; - } - - /** - * Returns a set 
of samples that have a property with a certain value - * Value must be a string for now - could add a similar method for matching any objects in the future - * - * @param key Property key - * @param value String property value - * @return Set of samples that match key and value - */ - public Set getSamplesWithProperty(String key, String value) { - Set toReturn = getSamplesWithProperty(key); - for (Sample s : toReturn) { - if (!s.getProperty(key).equals(value)) - toReturn.remove(s); - } - return toReturn; - } - - public Sample getOrCreateSample(String id) { - Sample sample = getSampleById(id); - if (sample == null) { - sample = new Sample(id); - addSample(sample); - } - return sample; - } - - /** - * Returns all samples that were referenced in the SAM file - */ - public Set getSAMFileSamples() { - Set toReturn = new HashSet(); - for (Sample sample : samples.values()) { - if (sample.hasSAMFileEntry()) - toReturn.add(sample); - } - return toReturn; - } - - /** - * Returns a set of sample objects for the sample names in a variant context - * - * @param context Any variant context - * @return a set of the sample objects - */ - public Set getSamplesByVariantContext(VariantContext context) { - Set samples = new HashSet(); - for (String sampleName : context.getSampleNames()) { - samples.add(getOrCreateSample(sampleName)); - } - return samples; - } - - - /** - * Return a subcontext restricted to samples with a given property key/value - * Gets the sample names from key/value and relies on VariantContext.subContextFromGenotypes for the filtering - * @param context VariantContext to filter - * @param key property key - * @param value property value (must be string) - * @return subcontext - */ - public VariantContext subContextFromSampleProperty(VariantContext context, String key, String value) { - - Set samplesWithProperty = new HashSet(); - for (String sampleName : context.getSampleNames()) { - Sample s = samples.get(sampleName); - if (s != null && s.hasProperty(key) && 
s.getProperty(key).equals(value)) - samplesWithProperty.add(sampleName); - } - Map genotypes = context.getGenotypes(samplesWithProperty); - return context.subContextFromGenotypes(genotypes.values()); - } - - public static SampleDataSource createEmptyDataSource() { - SAMFileHeader header = new SAMFileHeader(); - return new SampleDataSource(header, null); - } - -} diff --git a/public/java/src/org/broadinstitute/sting/gatk/datasources/sample/SampleFileParser.java b/public/java/src/org/broadinstitute/sting/gatk/datasources/sample/SampleFileParser.java deleted file mode 100644 index a362af663..000000000 --- a/public/java/src/org/broadinstitute/sting/gatk/datasources/sample/SampleFileParser.java +++ /dev/null @@ -1,65 +0,0 @@ -package org.broadinstitute.sting.gatk.datasources.sample; - -/** - * Created by IntelliJ IDEA. - * User: brett - * Date: Aug 12, 2010 - * Time: 1:30:44 PM - */ -public class SampleFileParser { - - private SampleAlias[] sampleAliases; - - private String[] allowedProperties; - - private String[] allowedRelationships; - - private PropertyDefinition[] propertyDefinitions; - - private SampleParser[] samples; - - public PropertyDefinition[] getPropertyDefinitions() { - return propertyDefinitions; - } - - public void setPropertyDefinitions(PropertyDefinition[] propertyDefinitions) { - this.propertyDefinitions = propertyDefinitions; - } - - public SampleFileParser() { - - } - - public String[] getAllowedProperties() { - return allowedProperties; - } - - public void setAllowedProperties(String[] allowedProperties) { - this.allowedProperties = allowedProperties; - } - - public SampleParser[] getSamples() { - return samples; - } - - public void setSamples(SampleParser[] samples) { - this.samples = samples; - } - - public String[] getAllowedRelationships() { - return allowedRelationships; - } - - public void setAllowedRelationships(String[] allowedRelationships) { - this.allowedRelationships = allowedRelationships; - } - - public SampleAlias[] 
getSampleAliases() { - return sampleAliases; - } - - public void setSampleAliases(SampleAlias[] sampleAliases) { - this.sampleAliases = sampleAliases; - } - -} \ No newline at end of file diff --git a/public/java/src/org/broadinstitute/sting/gatk/datasources/sample/SampleParser.java b/public/java/src/org/broadinstitute/sting/gatk/datasources/sample/SampleParser.java deleted file mode 100644 index f5e07ca29..000000000 --- a/public/java/src/org/broadinstitute/sting/gatk/datasources/sample/SampleParser.java +++ /dev/null @@ -1,43 +0,0 @@ -package org.broadinstitute.sting.gatk.datasources.sample; - -import java.util.HashMap; - -/** - * Created by IntelliJ IDEA. - * User: brett - * Date: Aug 13, 2010 - * Time: 2:09:43 PM - */ -public class SampleParser { - - private String id; - - private HashMap properties; - - private HashMap relationships; - - public String getId() { - return id; - } - - public void setId(String id) { - this.id = id; - } - - public HashMap getProperties() { - return properties; - } - - public void setProperties(HashMap properties) { - this.properties = properties; - } - - public HashMap getRelationships() { - return relationships; - } - - public void setRelationships(HashMap relationships) { - this.relationships = relationships; - } - -} diff --git a/public/java/src/org/broadinstitute/sting/gatk/executive/HierarchicalMicroScheduler.java b/public/java/src/org/broadinstitute/sting/gatk/executive/HierarchicalMicroScheduler.java index ae98874c1..162baed00 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/executive/HierarchicalMicroScheduler.java +++ b/public/java/src/org/broadinstitute/sting/gatk/executive/HierarchicalMicroScheduler.java @@ -85,12 +85,7 @@ public class HierarchicalMicroScheduler extends MicroScheduler implements Hierar */ protected HierarchicalMicroScheduler(GenomeAnalysisEngine engine, Walker walker, SAMDataSource reads, IndexedFastaSequenceFile reference, Collection rods, int nThreadsToUse ) { super(engine, walker, reads, 
reference, rods); - this.threadPool = Executors.newFixedThreadPool(nThreadsToUse); - - if (engine.getArguments().processingTrackerFile != null) { - throw new UserException.BadArgumentValue("-C", "Distributed GATK calculations currently not supported in multi-threaded mode. Complain to Mark depristo@broadinstitute.org to implement and test this code path"); - } } public Object execute( Walker walker, ShardStrategy shardStrategy ) { diff --git a/public/java/src/org/broadinstitute/sting/gatk/executive/LinearMicroScheduler.java b/public/java/src/org/broadinstitute/sting/gatk/executive/LinearMicroScheduler.java index 09ab4bd44..deafcd0cc 100644 --- a/public/java/src/org/broadinstitute/sting/gatk/executive/LinearMicroScheduler.java +++ b/public/java/src/org/broadinstitute/sting/gatk/executive/LinearMicroScheduler.java @@ -13,6 +13,7 @@ import org.broadinstitute.sting.gatk.io.DirectOutputTracker; import org.broadinstitute.sting.gatk.io.OutputTracker; import org.broadinstitute.sting.gatk.walkers.LocusWalker; import org.broadinstitute.sting.gatk.walkers.Walker; +import org.broadinstitute.sting.utils.SampleUtils; import java.util.Collection; @@ -56,7 +57,8 @@ public class LinearMicroScheduler extends MicroScheduler { traversalEngine.startTimersIfNecessary(); if(shard.getShardType() == Shard.ShardType.LOCUS) { LocusWalker lWalker = (LocusWalker)walker; - WindowMaker windowMaker = new WindowMaker(shard, engine.getGenomeLocParser(), getReadIterator(shard), shard.getGenomeLocs(), engine.getSampleMetadata()); + WindowMaker windowMaker = new WindowMaker(shard, engine.getGenomeLocParser(), + getReadIterator(shard), shard.getGenomeLocs(), SampleUtils.getSAMFileSamples(engine)); for(WindowMaker.WindowMakerIterator iterator: windowMaker) { ShardDataProvider dataProvider = new LocusShardDataProvider(shard,iterator.getSourceInfo(),engine.getGenomeLocParser(),iterator.getLocus(),iterator,reference,rods); Object result = traversalEngine.traverse(walker, dataProvider, 
accumulator.getReduceInit()); diff --git a/public/java/src/org/broadinstitute/sting/gatk/executive/ShardTraverser.java b/public/java/src/org/broadinstitute/sting/gatk/executive/ShardTraverser.java index 2b6488ada..badd39860 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/executive/ShardTraverser.java +++ b/public/java/src/org/broadinstitute/sting/gatk/executive/ShardTraverser.java @@ -62,16 +62,17 @@ public class ShardTraverser implements Callable { Object accumulator = walker.reduceInit(); LocusWalker lWalker = (LocusWalker)walker; - WindowMaker windowMaker = new WindowMaker(shard,microScheduler.getEngine().getGenomeLocParser(),microScheduler.getReadIterator(shard),shard.getGenomeLocs(), microScheduler.engine.getSampleMetadata()); // todo: microScheduler.engine is protected - is it okay to user it here? - ShardDataProvider dataProvider = null; + WindowMaker windowMaker = new WindowMaker(shard,microScheduler.getEngine().getGenomeLocParser(), + microScheduler.getReadIterator(shard), + shard.getGenomeLocs(), + microScheduler.engine.getSampleDB().getSampleNames()); // todo: microScheduler.engine is protected - is it okay to user it here? 
for(WindowMaker.WindowMakerIterator iterator: windowMaker) { - dataProvider = new LocusShardDataProvider(shard,iterator.getSourceInfo(),microScheduler.getEngine().getGenomeLocParser(),iterator.getLocus(),iterator,microScheduler.reference,microScheduler.rods); + final ShardDataProvider dataProvider = new LocusShardDataProvider(shard,iterator.getSourceInfo(),microScheduler.getEngine().getGenomeLocParser(),iterator.getLocus(),iterator,microScheduler.reference,microScheduler.rods); accumulator = traversalEngine.traverse( walker, dataProvider, accumulator ); dataProvider.close(); } - if (dataProvider != null) dataProvider.close(); windowMaker.close(); outputMergeTask = outputTracker.closeStorage(); diff --git a/public/java/src/org/broadinstitute/sting/gatk/executive/WindowMaker.java b/public/java/src/org/broadinstitute/sting/gatk/executive/WindowMaker.java index 43ea46002..d1f5d80da 100644 --- a/public/java/src/org/broadinstitute/sting/gatk/executive/WindowMaker.java +++ b/public/java/src/org/broadinstitute/sting/gatk/executive/WindowMaker.java @@ -4,7 +4,6 @@ import net.sf.picard.util.PeekableIterator; import org.broadinstitute.sting.gatk.ReadProperties; import org.broadinstitute.sting.gatk.contexts.AlignmentContext; import org.broadinstitute.sting.gatk.datasources.reads.Shard; -import org.broadinstitute.sting.gatk.datasources.sample.SampleDataSource; import org.broadinstitute.sting.gatk.iterators.LocusIterator; import org.broadinstitute.sting.gatk.iterators.LocusIteratorByState; import org.broadinstitute.sting.gatk.iterators.StingSAMIterator; @@ -12,6 +11,7 @@ import org.broadinstitute.sting.utils.GenomeLoc; import org.broadinstitute.sting.utils.GenomeLocParser; import org.broadinstitute.sting.utils.exceptions.ReviewedStingException; +import java.util.Collection; import java.util.Iterator; import java.util.List; import java.util.NoSuchElementException; @@ -63,17 +63,20 @@ public class WindowMaker implements Iterable, I * the given intervals. 
* @param iterator The data source for this window. * @param intervals The set of intervals over which to traverse. - * @param sampleData SampleDataSource that we can reference reads with + * @param sampleNames The complete set of sample names in the reads in shard */ - public WindowMaker(Shard shard, GenomeLocParser genomeLocParser, StingSAMIterator iterator, List intervals, SampleDataSource sampleData ) { + public WindowMaker(Shard shard, GenomeLocParser genomeLocParser, StingSAMIterator iterator, List intervals, Collection sampleNames) { this.sourceInfo = shard.getReadProperties(); this.readIterator = iterator; - - this.sourceIterator = new PeekableIterator(new LocusIteratorByState(iterator,sourceInfo,genomeLocParser,sampleData)); + this.sourceIterator = new PeekableIterator(new LocusIteratorByState(iterator,sourceInfo,genomeLocParser, sampleNames)); this.intervalIterator = intervals.size()>0 ? new PeekableIterator(intervals.iterator()) : null; } + public WindowMaker(Shard shard, GenomeLocParser genomeLocParser, StingSAMIterator iterator, List intervals ) { + this(shard, genomeLocParser, iterator, intervals, LocusIteratorByState.sampleListForSAMWithoutReadGroups()); + } + public Iterator iterator() { return this; } diff --git a/public/java/src/org/broadinstitute/sting/gatk/filters/MalformedReadFilter.java b/public/java/src/org/broadinstitute/sting/gatk/filters/MalformedReadFilter.java index 74deace9a..11bbf9e4c 100644 --- a/public/java/src/org/broadinstitute/sting/gatk/filters/MalformedReadFilter.java +++ b/public/java/src/org/broadinstitute/sting/gatk/filters/MalformedReadFilter.java @@ -27,7 +27,9 @@ package org.broadinstitute.sting.gatk.filters; import net.sf.samtools.SAMFileHeader; import net.sf.samtools.SAMRecord; import net.sf.samtools.SAMSequenceRecord; +import org.broadinstitute.sting.commandline.Argument; import org.broadinstitute.sting.gatk.GenomeAnalysisEngine; +import org.broadinstitute.sting.utils.exceptions.UserException; /** * Filter out malformed 
reads. @@ -37,14 +39,25 @@ import org.broadinstitute.sting.gatk.GenomeAnalysisEngine; */ public class MalformedReadFilter extends ReadFilter { private SAMFileHeader header; - + + @Argument(fullName = "filter_mismatching_base_and_quals", shortName = "filterMBQ", doc = "if a read has mismatching number of bases and base qualities, filter out the read instead of blowing up.", required = false) + boolean filterMismatchingBaseAndQuals = false; + @Override public void initialize(GenomeAnalysisEngine engine) { this.header = engine.getSAMFileHeader(); } public boolean filterOut(SAMRecord read) { - return !checkInvalidAlignmentStart(read) || + // slowly changing the behavior to blow up first and filtering out if a parameter is explicitly provided + if (!checkMismatchingBasesAndQuals(read)) { + if (!filterMismatchingBaseAndQuals) + throw new UserException.MalformedBAM(read, "BAM file has a read with mismatching number of bases and base qualities. Offender: " + read.getReadName() +" [" + read.getReadLength() + " bases] [" +read.getBaseQualities().length +"] quals"); + else + return true; + } + + return !checkInvalidAlignmentStart(read) || !checkInvalidAlignmentEnd(read) || !checkAlignmentDisagreesWithHeader(this.header,read) || !checkCigarDisagreesWithAlignment(read); @@ -108,4 +121,13 @@ public class MalformedReadFilter extends ReadFilter { return false; return true; } + + /** + * Check if the read has the same number of bases and base qualities + * @param read the read to validate + * @return true if they have the same number. False otherwise. 
+ */ + private static boolean checkMismatchingBasesAndQuals(SAMRecord read) { + return (read.getReadLength() == read.getBaseQualities().length); + } } diff --git a/public/java/src/org/broadinstitute/sting/gatk/filters/ReadNameFilter.java b/public/java/src/org/broadinstitute/sting/gatk/filters/ReadNameFilter.java new file mode 100755 index 000000000..a56af56d1 --- /dev/null +++ b/public/java/src/org/broadinstitute/sting/gatk/filters/ReadNameFilter.java @@ -0,0 +1,23 @@ +package org.broadinstitute.sting.gatk.filters; + +import net.sf.samtools.Cigar; +import net.sf.samtools.CigarElement; +import net.sf.samtools.CigarOperator; +import net.sf.samtools.SAMRecord; +import org.broadinstitute.sting.commandline.Argument; + +/** + * Created by IntelliJ IDEA. + * User: chartl + * Date: 9/19/11 + * Time: 4:09 PM + * To change this template use File | Settings | File Templates. + */ +public class ReadNameFilter extends ReadFilter { + @Argument(fullName = "readName", shortName = "rn", doc="Filter out all reads except those with this read name", required=true) + private String readName; + + public boolean filterOut(final SAMRecord rec) { + return ! 
rec.getReadName().equals(readName); + } +} diff --git a/public/java/src/org/broadinstitute/sting/gatk/io/storage/VCFWriterStorage.java b/public/java/src/org/broadinstitute/sting/gatk/io/storage/VCFWriterStorage.java index ebb4cbe66..4ca7b935f 100644 --- a/public/java/src/org/broadinstitute/sting/gatk/io/storage/VCFWriterStorage.java +++ b/public/java/src/org/broadinstitute/sting/gatk/io/storage/VCFWriterStorage.java @@ -46,7 +46,7 @@ public class VCFWriterStorage implements Storage, VCFWriter { else if ( stub.getOutputStream() != null ) { this.file = null; this.stream = stub.getOutputStream(); - writer = new StandardVCFWriter(stream, stub.doNotWriteGenotypes()); + writer = new StandardVCFWriter(stream, stub.getMasterSequenceDictionary(), stub.doNotWriteGenotypes()); } else throw new ReviewedStingException("Unable to create target to which to write; storage was provided with neither a file nor a stream."); @@ -71,7 +71,7 @@ public class VCFWriterStorage implements Storage, VCFWriter { } // The GATK/Tribble can't currently index block-compressed files on the fly. Disable OTF indexing even if the user explicitly asked for it. 
- return new StandardVCFWriter(file, this.stream, indexOnTheFly && !stub.isCompressed(), stub.doNotWriteGenotypes()); + return new StandardVCFWriter(file, this.stream, stub.getMasterSequenceDictionary(), indexOnTheFly && !stub.isCompressed(), stub.doNotWriteGenotypes()); } diff --git a/public/java/src/org/broadinstitute/sting/gatk/io/stubs/VCFWriterStub.java b/public/java/src/org/broadinstitute/sting/gatk/io/stubs/VCFWriterStub.java index 936243f9d..82cb43634 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/io/stubs/VCFWriterStub.java +++ b/public/java/src/org/broadinstitute/sting/gatk/io/stubs/VCFWriterStub.java @@ -25,6 +25,7 @@ package org.broadinstitute.sting.gatk.io.stubs; +import net.sf.samtools.SAMSequenceDictionary; import net.sf.samtools.SAMSequenceRecord; import org.broadinstitute.sting.gatk.CommandLineExecutable; import org.broadinstitute.sting.gatk.GenomeAnalysisEngine; @@ -150,6 +151,15 @@ public class VCFWriterStub implements Stub, VCFWriter { return isCompressed; } + /** + * Gets the master sequence dictionary from the engine associated with this stub + * @link GenomeAnalysisEngine.getMasterSequenceDictionary + * @return + */ + public SAMSequenceDictionary getMasterSequenceDictionary() { + return engine.getMasterSequenceDictionary(); + } + /** * Should we tell the VCF writer not to write genotypes? * @return true if the writer should not write genotypes. 
diff --git a/public/java/src/org/broadinstitute/sting/gatk/iterators/LocusIteratorByState.java b/public/java/src/org/broadinstitute/sting/gatk/iterators/LocusIteratorByState.java index e13c5a764..ee3ea63eb 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/iterators/LocusIteratorByState.java +++ b/public/java/src/org/broadinstitute/sting/gatk/iterators/LocusIteratorByState.java @@ -35,26 +35,23 @@ import org.broadinstitute.sting.gatk.DownsampleType; import org.broadinstitute.sting.gatk.DownsamplingMethod; import org.broadinstitute.sting.gatk.ReadProperties; import org.broadinstitute.sting.gatk.contexts.AlignmentContext; -import org.broadinstitute.sting.gatk.datasources.sample.Sample; -import org.broadinstitute.sting.gatk.datasources.sample.SampleDataSource; import org.broadinstitute.sting.utils.GenomeLoc; import org.broadinstitute.sting.utils.GenomeLocParser; import org.broadinstitute.sting.utils.MathUtils; import org.broadinstitute.sting.utils.ReservoirDownsampler; +import org.broadinstitute.sting.utils.exceptions.ReviewedStingException; import org.broadinstitute.sting.utils.exceptions.UserException; import org.broadinstitute.sting.utils.pileup.ExtendedEventPileupElement; import org.broadinstitute.sting.utils.pileup.PileupElement; import org.broadinstitute.sting.utils.pileup.ReadBackedExtendedEventPileupImpl; import org.broadinstitute.sting.utils.pileup.ReadBackedPileupImpl; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; import org.broadinstitute.sting.utils.sam.ReadUtils; import java.util.*; /** Iterator that traverses a SAM File, accumulating information on a per-locus basis */ public class LocusIteratorByState extends LocusIterator { -// private static long discarded_bases = 0L; -// private static long observed_bases = 0L; - /** our log, which we want to capture anything from this class */ private static Logger logger = Logger.getLogger(LocusIteratorByState.class); @@ -69,7 +66,7 @@ public class LocusIteratorByState extends LocusIterator { * 
Used to create new GenomeLocs. */ private final GenomeLocParser genomeLocParser; - private final ArrayList samples; + private final ArrayList samples; private final ReadStateManager readStates; static private class SAMRecordState { @@ -278,15 +275,27 @@ public class LocusIteratorByState extends LocusIterator { // // ----------------------------------------------------------------------------------------------------------------- - public LocusIteratorByState(final Iterator samIterator, ReadProperties readInformation, GenomeLocParser genomeLocParser, SampleDataSource sampleData ) { + public LocusIteratorByState(final Iterator samIterator, ReadProperties readInformation, GenomeLocParser genomeLocParser, Collection samples ) { this.readInfo = readInformation; this.genomeLocParser = genomeLocParser; + this.samples = new ArrayList(samples); + this.readStates = new ReadStateManager(samIterator,readInformation.getDownsamplingMethod()); - // get the list of samples - this.samples = new ArrayList(sampleData.getSamples()); - - readStates = new ReadStateManager(samIterator,readInformation.getDownsamplingMethod()); - + // currently the GATK expects this LocusIteratorByState to accept empty sample lists, when + // there's no read data. So we need to throw this error only when samIterator.hasNext() is true + if ( this.samples.isEmpty() && samIterator.hasNext() ) { + throw new IllegalArgumentException("samples list must not be empty"); + } + } + + /** + * For testing only. Assumes that the incoming SAMRecords have no read groups, so creates a dummy sample list + * for the system. 
+ */ + public final static Collection sampleListForSAMWithoutReadGroups() { + List samples = new ArrayList(); + samples.add(null); + return samples; } public Iterator iterator() { @@ -303,19 +312,6 @@ public class LocusIteratorByState extends LocusIterator { //if ( DEBUG ) System.out.printf("hasNext() = %b%n", r); } - public void printState() { - for(Sample sample: samples) { - Iterator iterator = readStates.iterator(sample); - while(iterator.hasNext()) { - SAMRecordState state = iterator.next(); - logger.debug(String.format("printState():")); - SAMRecord read = state.getRead(); - int offset = state.getReadOffset(); - logger.debug(String.format(" read: %s(%d)=%s, cigar=%s", read.getReadName(), offset, (char)read.getReadBases()[offset], read.getCigarString())); - } - } - } - private GenomeLoc getLocation() { return readStates.isEmpty() ? null : readStates.getFirst().getLocation(genomeLocParser); } @@ -355,14 +351,14 @@ public class LocusIteratorByState extends LocusIterator { // In this case, the subsequent call to next() will emit the normal pileup at the current base // and shift the position. 
if (readInfo.generateExtendedEvents() && hasExtendedEvents) { - Map fullExtendedEventPileup = new HashMap(); + Map fullExtendedEventPileup = new HashMap(); // get current location on the reference and decrement it by 1: the indels we just stepped over // are associated with the *previous* reference base GenomeLoc loc = genomeLocParser.incPos(getLocation(),-1); boolean hasBeenSampled = false; - for(Sample sample: samples) { + for(final String sample: samples) { Iterator iterator = readStates.iterator(sample); List indelPile = new ArrayList(readStates.size(sample)); hasBeenSampled |= loc.getStart() <= readStates.getDownsamplingExtent(sample); @@ -382,10 +378,7 @@ public class LocusIteratorByState extends LocusIterator { maxDeletionLength = Math.max(maxDeletionLength,state.getEventLength()); } else nInsertions++; - indelPile.add ( new ExtendedEventPileupElement(state.getRead(), - state.getReadEventStartOffset(), - state.getEventLength(), - state.getEventBases()) ); + indelPile.add ( new ExtendedEventPileupElement((GATKSAMRecord) state.getRead(), state.getReadEventStartOffset(), state.getEventLength(), state.getEventBases()) ); } else { // HACK: The readahead mechanism for LocusIteratorByState will effectively read past the current position @@ -407,9 +400,7 @@ public class LocusIteratorByState extends LocusIterator { // we count such reads (with a longer deletion spanning over a deletion at the previous base we are // about to report) only if includeReadsWithDeletionAtLoci is true. 
size++; - indelPile.add ( new ExtendedEventPileupElement(state.getRead(), - state.getReadOffset()-1, - -1) // length=-1 --> noevent + indelPile.add ( new ExtendedEventPileupElement((GATKSAMRecord) state.getRead(), state.getReadOffset()-1, -1) // length=-1 --> noevent ); } } @@ -426,10 +417,10 @@ public class LocusIteratorByState extends LocusIterator { nextAlignmentContext = new AlignmentContext(loc, new ReadBackedExtendedEventPileupImpl(loc, fullExtendedEventPileup), hasBeenSampled); } else { GenomeLoc location = getLocation(); - Map fullPileup = new HashMap(); + Map fullPileup = new HashMap(); boolean hasBeenSampled = false; - for(Sample sample: samples) { + for(final String sample: samples) { Iterator iterator = readStates.iterator(sample); List pile = new ArrayList(readStates.size(sample)); hasBeenSampled |= location.getStart() <= readStates.getDownsamplingExtent(sample); @@ -447,12 +438,12 @@ public class LocusIteratorByState extends LocusIterator { continue; } else { //observed_bases++; - pile.add(new PileupElement(state.getRead(), state.getReadOffset())); + pile.add(new PileupElement((GATKSAMRecord) state.getRead(), state.getReadOffset())); size++; } } else if ( readInfo.includeReadsWithDeletionAtLoci() && state.getCurrentCigarOperator() != CigarOperator.N ) { size++; - pile.add(new PileupElement(state.getRead(), -1)); + pile.add(new PileupElement((GATKSAMRecord) state.getRead(), -1)); nDeletions++; } @@ -495,7 +486,7 @@ public class LocusIteratorByState extends LocusIterator { } private void updateReadStates() { - for(Sample sample: samples) { + for(final String sample: samples) { Iterator it = readStates.iterator(sample); while ( it.hasNext() ) { SAMRecordState state = it.next(); @@ -522,7 +513,7 @@ public class LocusIteratorByState extends LocusIterator { private final PeekableIterator iterator; private final DownsamplingMethod downsamplingMethod; private final SamplePartitioner samplePartitioner; - private final Map readStatesBySample = new HashMap(); + 
private final Map readStatesBySample = new HashMap(); private final int targetCoverage; private int totalReadStates = 0; @@ -540,9 +531,9 @@ public class LocusIteratorByState extends LocusIterator { } Map readSelectors = new HashMap(); - for(Sample sample: samples) { + for(final String sample: samples) { readStatesBySample.put(sample,new PerSampleReadStateManager()); - readSelectors.put(sample.getId(),downsamplingMethod.type == DownsampleType.BY_SAMPLE ? new NRandomReadSelector(null,targetCoverage) : new AllReadsSelector()); + readSelectors.put(sample,downsamplingMethod.type == DownsampleType.BY_SAMPLE ? new NRandomReadSelector(null,targetCoverage) : new AllReadsSelector()); } samplePartitioner = new SamplePartitioner(readSelectors); @@ -554,7 +545,7 @@ public class LocusIteratorByState extends LocusIterator { * @param sample The sample. * @return Iterator over the reads associated with that sample. */ - public Iterator iterator(final Sample sample) { + public Iterator iterator(final String sample) { return new Iterator() { private Iterator wrappedIterator = readStatesBySample.get(sample).iterator(); @@ -590,7 +581,7 @@ public class LocusIteratorByState extends LocusIterator { * @param sample The sample. * @return Total number of reads in the given sample. */ - public int size(final Sample sample) { + public int size(final String sample) { return readStatesBySample.get(sample).size(); } @@ -600,12 +591,12 @@ public class LocusIteratorByState extends LocusIterator { * @param sample Sample, downsampled independently. * @return Integer stop of the furthest undownsampled region. 
*/ - public int getDownsamplingExtent(final Sample sample) { + public int getDownsamplingExtent(final String sample) { return readStatesBySample.get(sample).getDownsamplingExtent(); } public SAMRecordState getFirst() { - for(Sample sample: samples) { + for(final String sample: samples) { PerSampleReadStateManager reads = readStatesBySample.get(sample); if(!reads.isEmpty()) return reads.peek(); @@ -639,8 +630,8 @@ public class LocusIteratorByState extends LocusIterator { } samplePartitioner.complete(); - for(Sample sample: samples) { - ReadSelector aggregator = samplePartitioner.getSelectedReads(sample.getId()); + for(final String sample: samples) { + ReadSelector aggregator = samplePartitioner.getSelectedReads(sample); Collection newReads = new ArrayList(aggregator.getSelectedReads()); @@ -1072,6 +1063,3 @@ class SamplePartitioner implements ReadSelector { } } - - - diff --git a/public/java/src/org/broadinstitute/sting/gatk/iterators/ReadFormattingIterator.java b/public/java/src/org/broadinstitute/sting/gatk/iterators/ReadFormattingIterator.java index 2f30d12a8..9a89d2086 100644 --- a/public/java/src/org/broadinstitute/sting/gatk/iterators/ReadFormattingIterator.java +++ b/public/java/src/org/broadinstitute/sting/gatk/iterators/ReadFormattingIterator.java @@ -2,7 +2,6 @@ package org.broadinstitute.sting.gatk.iterators; import net.sf.samtools.SAMRecord; import org.apache.log4j.Logger; -import org.broadinstitute.sting.utils.sam.GATKSAMRecord; /** * An iterator which does post-processing of a read, including potentially wrapping @@ -78,7 +77,30 @@ public class ReadFormattingIterator implements StingSAMIterator { * no next exists. */ public SAMRecord next() { - return new GATKSAMRecord(wrappedIterator.next(), useOriginalBaseQualities, defaultBaseQualities); + SAMRecord rec = wrappedIterator.next(); + + // if we are using default quals, check if we need them, and add if necessary. + // 1. we need if reads are lacking or have incomplete quality scores + // 2. 
we add if defaultBaseQualities has a positive value + if (defaultBaseQualities >= 0) { + byte reads [] = rec.getReadBases(); + byte quals [] = rec.getBaseQualities(); + if (quals == null || quals.length < reads.length) { + byte new_quals [] = new byte [reads.length]; + for (int i=0; i entry : index.getProperties().entrySet()) { + if (entry.getKey().startsWith(SequenceDictionaryPropertyPredicate)) + dict.addSequence(new SAMSequenceRecord(entry.getKey().substring(SequenceDictionaryPropertyPredicate.length() , entry.getKey().length()), + Integer.valueOf(entry.getValue()))); + } + return dict; + } + + /** + * create the sequence dictionary with the contig list; a backup approach + * @param index the index file to use + * @param dict the sequence dictionary to add contigs to + * @return the filled-in sequence dictionary + */ + static SAMSequenceDictionary createSequenceDictionaryFromContigList(Index index, SAMSequenceDictionary dict) { + LinkedHashSet seqNames = index.getSequenceNames(); + if (seqNames == null) { + return dict; + } + for (String name : seqNames) { + SAMSequenceRecord seq = new SAMSequenceRecord(name, 0); + dict.addSequence(seq); + } + return dict; + } + + public static void setIndexSequenceDictionary(Index index, SAMSequenceDictionary dict) { + for ( SAMSequenceRecord seq : dict.getSequences() ) { + final String contig = IndexDictionaryUtils.SequenceDictionaryPropertyPredicate + seq.getSequenceName(); + final String length = String.valueOf(seq.getSequenceLength()); + index.addProperty(contig,length); + } + } + + public static void validateTrackSequenceDictionary(final String trackName, + final SAMSequenceDictionary trackDict, + final SAMSequenceDictionary referenceDict, + final ValidationExclusion.TYPE validationExclusionType ) { + // if the sequence dictionary is empty (as well as null which means it doesn't have a dictionary), skip validation + if (trackDict == null || trackDict.size() == 0) + logger.info("Track " + trackName + " doesn't have a 
sequence dictionary built in, skipping dictionary validation"); + else { + Set trackSequences = new TreeSet(); + for (SAMSequenceRecord dictionaryEntry : trackDict.getSequences()) + trackSequences.add(dictionaryEntry.getSequenceName()); + SequenceDictionaryUtils.validateDictionaries(logger, validationExclusionType, trackName, trackDict, "reference", referenceDict); + } + } +} diff --git a/public/java/src/org/broadinstitute/sting/gatk/refdata/tracks/RMDTrackBuilder.java b/public/java/src/org/broadinstitute/sting/gatk/refdata/tracks/RMDTrackBuilder.java index 06d05912a..edb514984 100644 --- a/public/java/src/org/broadinstitute/sting/gatk/refdata/tracks/RMDTrackBuilder.java +++ b/public/java/src/org/broadinstitute/sting/gatk/refdata/tracks/RMDTrackBuilder.java @@ -25,7 +25,6 @@ package org.broadinstitute.sting.gatk.refdata.tracks; import net.sf.samtools.SAMSequenceDictionary; -import net.sf.samtools.SAMSequenceRecord; import org.apache.log4j.Logger; import org.broad.tribble.FeatureCodec; import org.broad.tribble.FeatureSource; @@ -41,7 +40,6 @@ import org.broadinstitute.sting.gatk.arguments.ValidationExclusion; import org.broadinstitute.sting.gatk.refdata.utils.RMDTriplet; import org.broadinstitute.sting.gatk.refdata.utils.RMDTriplet.RMDStorageType; import org.broadinstitute.sting.utils.GenomeLocParser; -import org.broadinstitute.sting.utils.SequenceDictionaryUtils; import org.broadinstitute.sting.utils.collections.Pair; import org.broadinstitute.sting.utils.exceptions.ReviewedStingException; import org.broadinstitute.sting.utils.exceptions.UserException; @@ -52,16 +50,11 @@ import org.broadinstitute.sting.utils.instrumentation.Sizeof; import java.io.File; import java.io.FileOutputStream; import java.io.IOException; -import java.util.LinkedHashSet; -import java.util.Map; -import java.util.Set; -import java.util.TreeSet; - /** - * - * @author aaron + * + * @author aaron * ` * Class RMDTrackBuilder * @@ -76,9 +69,6 @@ public class RMDTrackBuilder { // extends 
PluginManager { private final static Logger logger = Logger.getLogger(RMDTrackBuilder.class); public final static boolean MEASURE_TRIBBLE_QUERY_PERFORMANCE = false; - // a constant we use for marking sequence dictionary entries in the Tribble index property list - public static final String SequenceDictionaryPropertyPredicate = "DICT:"; - // private sequence dictionary we use to set our tracks with private SAMSequenceDictionary dict = null; @@ -150,7 +140,7 @@ public class RMDTrackBuilder { // extends PluginManager { final FeatureManager.FeatureDescriptor descriptor = getFeatureManager().getByCodec(codecClass); if (descriptor == null) - throw new ReviewedStingException("Unable to find type name for codex class " + codecClass.getName()); + throw new ReviewedStingException("Unable to find type name for codec class " + codecClass.getName()); return createInstanceOfTrack(new RMDTriplet("anonymous",descriptor.getName(),inputFile.getAbsolutePath(),RMDStorageType.FILE,new Tags())); } @@ -210,13 +200,19 @@ public class RMDTrackBuilder { // extends PluginManager { try { logger.info(String.format(" Index for %s has size in bytes %d", inputFile, Sizeof.getObjectGraphSize(index))); } catch (ReviewedStingException e) { } - sequenceDictionary = getSequenceDictionaryFromProperties(index); + sequenceDictionary = IndexDictionaryUtils.getSequenceDictionaryFromProperties(index); // if we don't have a dictionary in the Tribble file, and we've set a dictionary for this builder, set it in the file if they match if (sequenceDictionary.size() == 0 && dict != null) { File indexFile = Tribble.indexFile(inputFile); - setIndexSequenceDictionary(inputFile,index,dict,indexFile,true); - sequenceDictionary = getSequenceDictionaryFromProperties(index); + validateAndUpdateIndexSequenceDictionary(inputFile, index, dict); + try { // re-write the index + writeIndexToDisk(index,indexFile,new FSLockWithShared(indexFile)); + } catch (IOException e) { + logger.warn("Unable to update index with the 
sequence dictionary for file " + indexFile + "; this will not effect your run of the GATK"); + } + + sequenceDictionary = IndexDictionaryUtils.getSequenceDictionaryFromProperties(index); } if ( MEASURE_TRIBBLE_QUERY_PERFORMANCE ) @@ -363,88 +359,31 @@ public class RMDTrackBuilder { // extends PluginManager { // this can take a while, let them know what we're doing logger.info("Creating Tribble index in memory for file " + inputFile); Index idx = IndexFactory.createIndex(inputFile, codec, IndexFactory.IndexBalanceApproach.FOR_SEEK_TIME); - setIndexSequenceDictionary(inputFile, idx, dict, null, false); + validateAndUpdateIndexSequenceDictionary(inputFile, idx, dict); return idx; } - - // --------------------------------------------------------------------------------------------------------- - // static functions to work with the sequence dictionaries of indexes - // --------------------------------------------------------------------------------------------------------- - - /** - * get the sequence dictionary from the track, if available. 
If not, make it from the contig list that is always in the index - * @param index the index file to use - * @return a SAMSequenceDictionary if available, null if unavailable - */ - public static SAMSequenceDictionary getSequenceDictionaryFromProperties(Index index) { - SAMSequenceDictionary dict = new SAMSequenceDictionary(); - for (Map.Entry entry : index.getProperties().entrySet()) { - if (entry.getKey().startsWith(SequenceDictionaryPropertyPredicate)) - dict.addSequence(new SAMSequenceRecord(entry.getKey().substring(SequenceDictionaryPropertyPredicate.length() , entry.getKey().length()), - Integer.valueOf(entry.getValue()))); - } - return dict; - } - - /** - * create the sequence dictionary with the contig list; a backup approach - * @param index the index file to use - * @param dict the sequence dictionary to add contigs to - * @return the filled-in sequence dictionary - */ - private static SAMSequenceDictionary createSequenceDictionaryFromContigList(Index index, SAMSequenceDictionary dict) { - LinkedHashSet seqNames = index.getSequenceNames(); - if (seqNames == null) { - return dict; - } - for (String name : seqNames) { - SAMSequenceRecord seq = new SAMSequenceRecord(name, 0); - dict.addSequence(seq); - } - return dict; - } - /** * set the sequence dictionary of the track. This function checks that the contig listing of the underlying file is compatible. * (that each contig in the index is in the sequence dictionary). * @param inputFile for proper error message formatting. * @param dict the sequence dictionary * @param index the index file - * @param indexFile the index file - * @param rewriteIndex should we rewrite the index when we're done? 
- * */ - public void setIndexSequenceDictionary(File inputFile, Index index, SAMSequenceDictionary dict, File indexFile, boolean rewriteIndex) { - if (dict == null) return; - - SAMSequenceDictionary currentDict = createSequenceDictionaryFromContigList(index, new SAMSequenceDictionary()); - validateTrackSequenceDictionary(inputFile.getAbsolutePath(),currentDict,dict); + public void validateAndUpdateIndexSequenceDictionary(final File inputFile, final Index index, final SAMSequenceDictionary dict) { + if (dict == null) throw new ReviewedStingException("BUG: dict cannot be null"); // check that every contig in the RMD contig list is at least in the sequence dictionary we're being asked to set - for (SAMSequenceRecord seq : currentDict.getSequences()) { - if (dict.getSequence(seq.getSequenceName()) == null) - continue; - index.addProperty(SequenceDictionaryPropertyPredicate + dict.getSequence(seq.getSequenceName()).getSequenceName(), String.valueOf(dict.getSequence(seq.getSequenceName()).getSequenceLength())); - } - // re-write the index - if (rewriteIndex) try { - writeIndexToDisk(index,indexFile,new FSLockWithShared(indexFile)); - } catch (IOException e) { - logger.warn("Unable to update index with the sequence dictionary for file " + indexFile + "; this will not effect your run of the GATK"); - } + final SAMSequenceDictionary currentDict = IndexDictionaryUtils.createSequenceDictionaryFromContigList(index, new SAMSequenceDictionary()); + validateTrackSequenceDictionary(inputFile.getAbsolutePath(), currentDict, dict); + + // actually update the dictionary in the index + IndexDictionaryUtils.setIndexSequenceDictionary(index, dict); } - - public void validateTrackSequenceDictionary(String trackName, SAMSequenceDictionary trackDict, SAMSequenceDictionary referenceDict) { - // if the sequence dictionary is empty (as well as null which means it doesn't have a dictionary), skip validation - if (trackDict == null || trackDict.size() == 0) - logger.info("Track " + trackName + 
" doesn't have a sequence dictionary built in, skipping dictionary validation"); - else { - Set trackSequences = new TreeSet(); - for (SAMSequenceRecord dictionaryEntry : trackDict.getSequences()) - trackSequences.add(dictionaryEntry.getSequenceName()); - SequenceDictionaryUtils.validateDictionaries(logger, validationExclusionType, trackName, trackDict, "reference", referenceDict); - } + public void validateTrackSequenceDictionary(final String trackName, + final SAMSequenceDictionary trackDict, + final SAMSequenceDictionary referenceDict ) { + IndexDictionaryUtils.validateTrackSequenceDictionary(trackName, trackDict, referenceDict, validationExclusionType); } } diff --git a/public/java/src/org/broadinstitute/sting/gatk/refdata/utils/RMDIntervalGenerator.java b/public/java/src/org/broadinstitute/sting/gatk/refdata/utils/RMDIntervalGenerator.java deleted file mode 100644 index a7666981c..000000000 --- a/public/java/src/org/broadinstitute/sting/gatk/refdata/utils/RMDIntervalGenerator.java +++ /dev/null @@ -1,57 +0,0 @@ -package org.broadinstitute.sting.gatk.refdata.utils; - -import org.broadinstitute.sting.gatk.datasources.rmd.ReferenceOrderedDataSource; -import org.broadinstitute.sting.utils.GenomeLoc; - -import java.util.*; - - -/** - * - * @author aaron - * - * Class RMDIntervalGenerator - * - * Creates an interval list, given an RMDTrack - */ -public class RMDIntervalGenerator { - public ReferenceOrderedDataSource dataSource; - - /** - * create a interval representation of a ROD track - * @param dataSource the track - */ - public RMDIntervalGenerator(ReferenceOrderedDataSource dataSource) { - if (dataSource == null) throw new IllegalArgumentException("Data source cannot be null"); - this.dataSource = dataSource; - } - - /** - * create a genome location list from the interval track - * @return a list of genome locations - */ - public List toGenomeLocList() { - Iterator iter = dataSource.seek((GenomeLoc)null); - List locations = new ArrayList(); - while 
(iter.hasNext()) { - RODRecordList feature = iter.next(); - GenomeLoc loc = feature.getLocation(); - if (loc != null) locations.add(loc); - } - return locations; - } - - /** - * return a map of reference meta data track names to RODS - * @param sources the reference ordered data sources to get the names from - * @return a map of reference meta data names to RODS - */ - public static Map getRMDTrackNames(List sources) { - // get a list of the current rod names we're working with - Map rodNames = new HashMap(); - for (ReferenceOrderedDataSource rod : sources) { - rodNames.put(rod.getName(),rod); - } - return rodNames; - } -} diff --git a/public/java/src/org/broadinstitute/sting/gatk/report/GATKReportColumns.java b/public/java/src/org/broadinstitute/sting/gatk/report/GATKReportColumns.java old mode 100644 new mode 100755 index a33631c85..a73123b6c --- a/public/java/src/org/broadinstitute/sting/gatk/report/GATKReportColumns.java +++ b/public/java/src/org/broadinstitute/sting/gatk/report/GATKReportColumns.java @@ -24,12 +24,14 @@ package org.broadinstitute.sting.gatk.report; +import org.broadinstitute.sting.utils.collections.Pair; + import java.util.*; /** * Tracks a linked list of GATKReportColumn in order by name. 
*/ -public class GATKReportColumns extends LinkedHashMap { +public class GATKReportColumns extends LinkedHashMap implements Iterable { private List columnNames = new ArrayList(); /** @@ -52,4 +54,14 @@ public class GATKReportColumns extends LinkedHashMap { columnNames.add(key); return super.put(key, value); } + + @Override + public Iterator iterator() { + return new Iterator() { + int offset = 0; + public boolean hasNext() { return offset < columnNames.size() ; } + public GATKReportColumn next() { return getByIndex(offset++); } + public void remove() { throw new UnsupportedOperationException("Cannot remove from a GATKReportColumn iterator"); } + }; + } } diff --git a/public/java/src/org/broadinstitute/sting/gatk/report/GATKReportTable.java b/public/java/src/org/broadinstitute/sting/gatk/report/GATKReportTable.java index 3e3aa29a7..2fd5ad7e3 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/report/GATKReportTable.java +++ b/public/java/src/org/broadinstitute/sting/gatk/report/GATKReportTable.java @@ -286,6 +286,10 @@ public class GATKReportTable { } } + public boolean containsKey(Object primaryKey) { + return primaryKeyColumn.contains(primaryKey); + } + /** * Set the value for a given position in the table * diff --git a/public/java/src/org/broadinstitute/sting/gatk/report/GATKReportVersion.java b/public/java/src/org/broadinstitute/sting/gatk/report/GATKReportVersion.java old mode 100644 new mode 100755 diff --git a/public/java/src/org/broadinstitute/sting/gatk/samples/Affection.java b/public/java/src/org/broadinstitute/sting/gatk/samples/Affection.java new file mode 100644 index 000000000..83e31f672 --- /dev/null +++ b/public/java/src/org/broadinstitute/sting/gatk/samples/Affection.java @@ -0,0 +1,46 @@ +/* + * Copyright (c) 2011, The Broad Institute + * + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * 
restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The above copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * OTHER DEALINGS IN THE SOFTWARE. + */ + +package org.broadinstitute.sting.gatk.samples; + +/** + * Categorical sample trait for association and analysis + * + * Samples can have unknown status, be affected or unaffected by the + * categorical trait, or they can be marked as actually having an + * other trait value (stored in an associated value in the Sample class) + * + * @author Mark DePristo + * @since Sept. 
2011 + */ +public enum Affection { + /** Status is unknown */ + UNKNOWN, + /** Suffers from the disease */ + AFFECTED, + /** Unaffected by the disease */ + UNAFFECTED, + /** An "other" trait: value of the trait is stored elsewhere and is an arbitrary string */ + OTHER +} diff --git a/public/java/src/org/broadinstitute/sting/gatk/samples/Gender.java b/public/java/src/org/broadinstitute/sting/gatk/samples/Gender.java new file mode 100644 index 000000000..6fb44804a --- /dev/null +++ b/public/java/src/org/broadinstitute/sting/gatk/samples/Gender.java @@ -0,0 +1,34 @@ +/* + * Copyright (c) 2011, The Broad Institute + * + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The above copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * OTHER DEALINGS IN THE SOFTWARE. 
+ */ + +package org.broadinstitute.sting.gatk.samples; + +/** +* ENUM of possible human genders: male, female, or unknown +*/ +public enum Gender { + MALE, + FEMALE, + UNKNOWN +} diff --git a/public/java/src/org/broadinstitute/sting/gatk/samples/PedReader.java b/public/java/src/org/broadinstitute/sting/gatk/samples/PedReader.java new file mode 100644 index 000000000..c442409fb --- /dev/null +++ b/public/java/src/org/broadinstitute/sting/gatk/samples/PedReader.java @@ -0,0 +1,310 @@ +/* + * Copyright (c) 2011, The Broad Institute + * + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The above copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * OTHER DEALINGS IN THE SOFTWARE. 
+ */ + +package org.broadinstitute.sting.gatk.samples; + +import org.apache.log4j.Logger; +import org.broadinstitute.sting.utils.MathUtils; +import org.broadinstitute.sting.utils.exceptions.ReviewedStingException; +import org.broadinstitute.sting.utils.exceptions.UserException; +import org.broadinstitute.sting.utils.text.XReadLines; + +import java.io.*; +import java.util.*; + +/** + * Reads PED file-formatted tabular text files + * + * See http://www.broadinstitute.org/mpg/tagger/faq.html + * See http://pngu.mgh.harvard.edu/~purcell/plink/data.shtml#ped + * + * The "ped" file format refers to the widely-used format for linkage pedigree data. + * Each line describes a single (diploid) individual in the following format: + * + * family_ID individual_ID father_ID mother_ID gender phenotype genotype_1 genotype_2 ... + * + * If your data lacks pedigree information (for example, unrelated case/control individuals), + * set the father_ID and mother_ID to 0. sex denotes the individual's gender with 1=male and 2=female. + * phenotype refers to the affected status (for association studies) where 0=unknown, 1=unaffected, 2=affected. + * Finally, each genotype is written as two (=diploid) integer numbers (separated by whitespace), + * where 1=A, 2=C, 3=G, 4=T. No header lines are allowed and all columns must be separated by whitespace. + * Check out the information at the PLINK website on the "ped" file format. + * + * The PED file is a white-space (space or tab) delimited file: the first six columns are mandatory: + * Family ID + * Individual ID + * Paternal ID + * Maternal ID + * Sex (1=male; 2=female; other=unknown) + * Phenotype + * + * The IDs are alphanumeric: the combination of family and individual ID should uniquely identify a person. + * A PED file must have 1 and only 1 phenotype in the sixth column. The phenotype can be either a + * quantitative trait or an affection status column: PLINK will automatically detect which type + * (i.e. 
based on whether a value other than 0, 1, 2 or the missing genotype code is observed). + * Note that the GATK actually supports arbitrary values for quantitative trait -- not just doubles -- + * and are actually representing these values as strings instead of doubles + * + * NOTE Quantitative traits with decimal points must be coded with a period/full-stop character and + * not a comma, i.e. 2.394 not 2,394 + * + * If an individual's sex is unknown, then any character other than 1 or 2 can be used. + * When new files are created (PED, FAM, or other which contain sex) then the original coding will be + * preserved. However, these individuals will be dropped from any analyses (i.e. phenotype set to missing also) + * and an error message will arise if an analysis that uses family information is requested and an + * individual of 'unknown' sex is specified as a father or mother. + * + * + * HINT You can add a comment to a PED or MAP file by starting the line with a # character. The rest of that + * line will be ignored. Do not start any family IDs with this character therefore. + * + * Affection status, by default, should be coded: + * -9 missing + * 0 missing + * 1 unaffected + * 2 affected + * + * If your file is coded 0/1 to represent unaffected/affected, then use the --1 flag: + * plink --file mydata --1 which will specify a disease phenotype coded: + * + * -9 missing + * 0 unaffected + * 1 affected + * + * The missing phenotype value for quantitative traits is, by default, -9 (this can also be used for + * disease traits as well as 0). It can be reset by including the --missing-phenotype option: + * + * Genotypes (column 7 onwards) should also be white-space delimited; they can be any character + * (e.g. 1,2,3,4 or A,C,G,T or anything else) except 0 which is, by default, the missing genotype + * character. All markers should be biallelic. All SNPs (whether haploid or not) must have two + * alleles specified. Either Both alleles should be missing (i.e. 
0) or neither. + * + * No header row should be given. For example, here are two individuals typed for 3 SNPs (one row = one person): + * + * FAM001 1 0 0 1 2 A A G G A C + * FAM001 2 0 0 1 2 A A A G 0 0 + * ... + * + * Note that the GATK does not support genotypes in a PED file. + * + * @author Mark DePristo + * @since 2011 + */ +public class PedReader { + private static Logger logger = Logger.getLogger(PedReader.class); + final static private Set CATAGORICAL_TRAIT_VALUES = new HashSet(Arrays.asList("-9", "0", "1", "2")); + final static private String commentMarker = "#"; + + /** + * An enum that specifies which, if any, of the standard PED fields are + * missing from the input records. For example, suppose we have the full record: + * + * "fam1 kid dad mom 1 2" + * + * indicating a male affected child. This can be parsed with the -ped x.ped argument + * to the GATK. Suppose we only have: + * + * "fam1 kid 1" + * + * we can parse the reduced version of this record with -ped:NO_PARENTS,NO_PHENOTYPE x.ped + */ + public enum MissingPedField { + /** + * The PED records do not have the first (FAMILY_ID) argument. The family id + * will be set to null / empty. + */ + NO_FAMILY_ID, + + /** + * The PED records do not have either the paternal or maternal IDs, so + * the corresponding IDs are set to null. + */ + NO_PARENTS, + + /** + * The PED records do not have the GENDER field, so the sex of each + * sample will be set to UNKNOWN. + */ + NO_SEX, + + /** + * The PED records do not have the PHENOTYPE field, so the phenotype + * of each sample will be set to UNKNOWN. 
+ */ + NO_PHENOTYPE + } + + protected enum Field { + FAMILY_ID, INDIVIDUAL_ID, PATERNAL_ID, MATERNAL_ID, GENDER, PHENOTYPE + } + + // phenotype + private final static String MISSING_VALUE1 = "-9"; + private final static String MISSING_VALUE2 = "0"; + private final static String PHENOTYPE_UNAFFECTED = "1"; + private final static String PHENOTYPE_AFFECTED = "2"; + + // Sex + private final static String SEX_MALE = "1"; + private final static String SEX_FEMALE = "2"; + // other=unknown + + public PedReader() { } + + public final List parse(File source, EnumSet missingFields, SampleDB sampleDB) throws FileNotFoundException { + logger.info("Reading PED file " + source + " with missing fields: " + missingFields); + return parse(new FileReader(source), missingFields, sampleDB); + } + + public final List parse(final String source, EnumSet missingFields, SampleDB sampleDB) { + logger.warn("Reading PED string: \"" + source + "\" with missing fields: " + missingFields); + return parse(new StringReader(source.replace(";", String.format("%n"))), missingFields, sampleDB); + } + + public final List parse(Reader reader, EnumSet missingFields, SampleDB sampleDB) { + final List lines = new XReadLines(reader).readLines(); + + // What are the record offsets? + final int familyPos = missingFields.contains(MissingPedField.NO_FAMILY_ID) ? -1 : 0; + final int samplePos = familyPos + 1; + final int paternalPos = missingFields.contains(MissingPedField.NO_PARENTS) ? -1 : samplePos + 1; + final int maternalPos = missingFields.contains(MissingPedField.NO_PARENTS) ? -1 : paternalPos + 1; + final int sexPos = missingFields.contains(MissingPedField.NO_SEX) ? -1 : Math.max(maternalPos, samplePos) + 1; + final int phenotypePos = missingFields.contains(MissingPedField.NO_PHENOTYPE) ? 
-1 : Math.max(sexPos, Math.max(maternalPos, samplePos)) + 1; + final int nExpectedFields = MathUtils.arrayMaxInt(Arrays.asList(samplePos, paternalPos, maternalPos, sexPos, phenotypePos)) + 1; + + // go through once and determine properties + int lineNo = 1; + boolean isQT = false; + final List splits = new ArrayList(lines.size()); + for ( final String line : lines ) { + if ( line.startsWith(commentMarker)) continue; + if ( line.trim().equals("") ) continue; + + final String[] parts = line.split("\\s+"); + + if ( parts.length != nExpectedFields ) + throw new UserException.MalformedFile(reader.toString(), "Bad PED line " + lineNo + ": wrong number of fields"); + + if ( phenotypePos != -1 ) { + isQT = isQT || ! CATAGORICAL_TRAIT_VALUES.contains(parts[phenotypePos]); + } + + splits.add(parts); + lineNo++; + } + logger.info("Phenotype is other? " + isQT); + + // now go through and parse each record + lineNo = 1; + final List samples = new ArrayList(splits.size()); + for ( final String[] parts : splits ) { + String familyID = null, individualID, paternalID = null, maternalID = null; + Gender sex = Gender.UNKNOWN; + String quantitativePhenotype = Sample.UNSET_QT; + Affection affection = Affection.UNKNOWN; + + if ( familyPos != -1 ) familyID = maybeMissing(parts[familyPos]); + individualID = parts[samplePos]; + if ( paternalPos != -1 ) paternalID = maybeMissing(parts[paternalPos]); + if ( maternalPos != -1 ) maternalID = maybeMissing(parts[maternalPos]); + + if ( sexPos != -1 ) { + if ( parts[sexPos].equals(SEX_MALE) ) sex = Gender.MALE; + else if ( parts[sexPos].equals(SEX_FEMALE) ) sex = Gender.FEMALE; + else sex = Gender.UNKNOWN; + } + + if ( phenotypePos != -1 ) { + if ( isQT ) { + if ( parts[phenotypePos].equals(MISSING_VALUE1) ) + affection = Affection.UNKNOWN; + else { + affection = Affection.OTHER; + quantitativePhenotype = parts[phenotypePos]; + } + } else { + if ( parts[phenotypePos].equals(MISSING_VALUE1) ) affection = Affection.UNKNOWN; + else if ( 
parts[phenotypePos].equals(MISSING_VALUE2) ) affection = Affection.UNKNOWN; + else if ( parts[phenotypePos].equals(PHENOTYPE_UNAFFECTED) ) affection = Affection.UNAFFECTED; + else if ( parts[phenotypePos].equals(PHENOTYPE_AFFECTED) ) affection = Affection.AFFECTED; + else throw new ReviewedStingException("Unexpected phenotype type " + parts[phenotypePos] + " at line " + lineNo); + } + } + + final Sample s = new Sample(individualID, sampleDB, familyID, paternalID, maternalID, sex, affection, quantitativePhenotype); + samples.add(s); + sampleDB.addSample(s); + lineNo++; + } + + for ( final Sample sample : new ArrayList(samples) ) { + Sample dad = maybeAddImplicitSample(sampleDB, sample.getPaternalID(), sample.getFamilyID(), Gender.MALE); + if ( dad != null ) samples.add(dad); + + Sample mom = maybeAddImplicitSample(sampleDB, sample.getMaternalID(), sample.getFamilyID(), Gender.FEMALE); + if ( mom != null ) samples.add(mom); + } + + return samples; + } + + private final static String maybeMissing(final String string) { + if ( string.equals(MISSING_VALUE1) || string.equals(MISSING_VALUE2) ) + return null; + else + return string; + } + + private final Sample maybeAddImplicitSample(SampleDB sampleDB, final String id, final String familyID, final Gender gender) { + if ( id != null && sampleDB.getSample(id) == null ) { + Sample s = new Sample(id, sampleDB, familyID, null, null, gender, Affection.UNKNOWN, Sample.UNSET_QT); + sampleDB.addSample(s); + return s; + } else + return null; + } + + /** + * Parses a list of tags from the command line, assuming it comes from the GATK Engine + * tags, and returns the corresponding EnumSet. 
+ * + * @param arg the actual engine arg, used for the UserException if there's an error + * @param tags a list of string tags that should be converted to the MissingPedField value + * @return + */ + public static final EnumSet parseMissingFieldTags(final Object arg, final List tags) { + final EnumSet missingFields = EnumSet.noneOf(MissingPedField.class); + + for ( final String tag : tags ) { + try { + missingFields.add(MissingPedField.valueOf(tag)); + } catch ( IllegalArgumentException e ) { + throw new UserException.BadArgumentValue(arg.toString(), "Unknown tag " + tag + " allowed values are " + MissingPedField.values()); + } + } + + return missingFields; + } +} \ No newline at end of file diff --git a/public/java/src/org/broadinstitute/sting/gatk/samples/PedigreeValidationType.java b/public/java/src/org/broadinstitute/sting/gatk/samples/PedigreeValidationType.java new file mode 100644 index 000000000..bbf857820 --- /dev/null +++ b/public/java/src/org/broadinstitute/sting/gatk/samples/PedigreeValidationType.java @@ -0,0 +1,41 @@ +/* + * Copyright (c) 2011, The Broad Institute + * + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The above copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. 
IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * OTHER DEALINGS IN THE SOFTWARE. + */ + +package org.broadinstitute.sting.gatk.samples; + +/** +* +*/ +public enum PedigreeValidationType { + /** + * Require if a pedigree file is provided at all samples in the VCF or BAM files have a corresponding + * entry in the pedigree file(s). + */ + STRICT, + + /** + * Do not enforce any overlap between the VCF/BAM samples and the pedigree data + * */ + SILENT +} diff --git a/public/java/src/org/broadinstitute/sting/gatk/samples/Sample.java b/public/java/src/org/broadinstitute/sting/gatk/samples/Sample.java new file mode 100644 index 000000000..b39fdd79d --- /dev/null +++ b/public/java/src/org/broadinstitute/sting/gatk/samples/Sample.java @@ -0,0 +1,222 @@ +package org.broadinstitute.sting.gatk.samples; + + +import org.broadinstitute.sting.utils.exceptions.UserException; + +import java.util.HashMap; +import java.util.Map; + +/** + * + */ +public class Sample implements Comparable { // implements java.io.Serializable { + final private String familyID, paternalID, maternalID; + final private Gender gender; + final private String otherPhenotype; + final private Affection affection; + final private String ID; + final private SampleDB infoDB; + final private Map properties = new HashMap(); + + public final static String UNSET_QT = null; + + public Sample(final String ID, final SampleDB infoDB, + final String familyID, final String paternalID, final String maternalID, + final Gender gender, final Affection affection, final String otherPhenotype) { + this.familyID = familyID; + this.paternalID = paternalID; + this.maternalID = maternalID; + this.gender = gender; + this.otherPhenotype = otherPhenotype; + this.affection = affection; + this.ID = ID; + this.infoDB = infoDB; + } + + protected 
Sample(final String ID, + final String familyID, final String paternalID, final String maternalID, + final Gender gender, final Affection affection, final String otherPhenotype) { + this(ID, null, familyID, paternalID, maternalID, gender, affection, otherPhenotype); + } + + protected Sample(final String ID, + final String familyID, final String paternalID, final String maternalID, + final Gender gender, final Affection affection) { + this(ID, null, familyID, paternalID, maternalID, gender, affection, UNSET_QT); + } + + + public Sample(final String ID, final SampleDB infoDB, + final String familyID, final String paternalID, final String maternalID, final Gender gender) { + this(ID, infoDB, familyID, paternalID, maternalID, gender, Affection.UNKNOWN, UNSET_QT); + } + + public Sample(final String ID, final SampleDB infoDB, final Affection affection, final String otherPhenotype) { + this(ID, infoDB, null, null, null, Gender.UNKNOWN, affection, otherPhenotype); + } + + public Sample(String id, SampleDB infoDB) { + this(id, infoDB, null, null, null, + Gender.UNKNOWN, Affection.UNKNOWN, UNSET_QT); + } + + // ------------------------------------------------------------------------------------- + // + // standard property getters + // + // ------------------------------------------------------------------------------------- + + public String getID() { + return ID; + } + + public String getFamilyID() { + return familyID; + } + + public String getPaternalID() { + return paternalID; + } + + public String getMaternalID() { + return maternalID; + } + + public Affection getAffection() { + return affection; + } + + public boolean hasOtherPhenotype() { + return affection == Affection.OTHER; + } + + public String getOtherPhenotype() { + return otherPhenotype; + } + + /** + * Get the sample's mother + * @return sample object with relationship mother, if exists, or null + */ + public Sample getMother() { + return infoDB.getSample(maternalID); + } + + /** + * Get the sample's father + 
* @return sample object with relationship father, if exists, or null + */ + public Sample getFather() { + return infoDB.getSample(paternalID); + } + + /** + * Get gender of the sample + * @return property of key "gender" - must be of type Gender + */ + public Gender getGender() { + return gender; + } + + @Override + public int compareTo(final Sample sample) { + return ID.compareTo(sample.getID()); + } + + @Override + public String toString() { + return String.format("Sample %s fam=%s dad=%s mom=%s gender=%s affection=%s qt=%s props=%s", + getID(), getFamilyID(), getPaternalID(), getMaternalID(), getGender(), getAffection(), + getOtherPhenotype(), properties); + } + +// // ------------------------------------------------------------------------------------- +// // +// // code for working with additional -- none standard -- properites +// // +// // ------------------------------------------------------------------------------------- +// +// public Map getExtraProperties() { +// return Collections.unmodifiableMap(properties); +// } +// +// /** +// * Get one property +// * @param key key of property +// * @return value of property as generic object +// */ +// public Object getExtraPropertyValue(final String key) { +// return properties.get(key); +// } +// +// /** +// * +// * @param key property key +// * @return true if sample has this property (even if its value is null) +// */ +// public boolean hasExtraProperty(String key) { +// return properties.containsKey(key); +// } + + @Override + public int hashCode() { + return ID.hashCode(); + } + + @Override + public boolean equals(final Object o) { + if(o == null) + return false; + if(o instanceof Sample) { + Sample otherSample = (Sample)o; + return ID.equals(otherSample.ID) && + equalOrNull(familyID, otherSample.familyID) && + equalOrNull(paternalID, otherSample.paternalID) && + equalOrNull(maternalID, otherSample.maternalID) && + equalOrNull(gender, otherSample.gender) && + equalOrNull(otherPhenotype, 
otherSample.otherPhenotype) && + equalOrNull(affection, otherSample.affection) && + equalOrNull(properties, otherSample.properties); + } + return false; + } + + private final static boolean equalOrNull(final Object o1, final Object o2) { + if ( o1 == null ) + return o2 == null; + else + return o2 == null ? false : o1.equals(o2); + } + + private final static T mergeValues(final String name, final String field, final T o1, final T o2, final T emptyValue) { + if ( o1 == null || o1.equals(emptyValue) ) { + // take o2 if both are null, otherwise keep o2 + return o2 == null ? null : o2; + } else { + if ( o2 == null || o2.equals(emptyValue) ) + return o1; // keep o1, since it's a real value + else { + // both o1 and o2 have a value + if ( o1 == o2 ) + return o1; + else + throw new UserException("Inconsistent values detected for " + name + " for field " + field + " value1 " + o1 + " value2 " + o2); + } + } + } + + public final static Sample mergeSamples(final Sample prev, final Sample next) { + if ( prev.equals(next) ) + return next; + else { + return new Sample(prev.getID(), prev.infoDB, + mergeValues(prev.getID(), "Family_ID", prev.getFamilyID(), next.getFamilyID(), null), + mergeValues(prev.getID(), "Paternal_ID", prev.getPaternalID(), next.getPaternalID(), null), + mergeValues(prev.getID(), "Material_ID", prev.getMaternalID(), next.getMaternalID(), null), + mergeValues(prev.getID(), "Gender", prev.getGender(), next.getGender(), Gender.UNKNOWN), + mergeValues(prev.getID(), "Affection", prev.getAffection(), next.getAffection(), Affection.UNKNOWN), + mergeValues(prev.getID(), "OtherPhenotype", prev.getOtherPhenotype(), next.getOtherPhenotype(), UNSET_QT)); + //mergeValues(prev.getID(), "ExtraProperties", prev.getExtraProperties(), next.getExtraProperties(), Collections.emptyMap())); + } + } +} diff --git a/public/java/src/org/broadinstitute/sting/gatk/samples/SampleDB.java b/public/java/src/org/broadinstitute/sting/gatk/samples/SampleDB.java new file mode 100644 index 
000000000..ee0873c6e --- /dev/null +++ b/public/java/src/org/broadinstitute/sting/gatk/samples/SampleDB.java @@ -0,0 +1,183 @@ +package org.broadinstitute.sting.gatk.samples; + +import net.sf.samtools.SAMReadGroupRecord; +import net.sf.samtools.SAMRecord; +import org.broadinstitute.sting.utils.exceptions.StingException; +import org.broadinstitute.sting.utils.variantcontext.Genotype; + +import java.util.*; + +/** + * + */ +public class SampleDB { + /** + * This is where Sample objects are stored. Samples are usually accessed by their ID, which is unique, so + * this is stored as a HashMap. + */ + private final HashMap samples = new HashMap(); + + /** + * Constructor takes both a SAM header and sample files because the two must be integrated. + */ + public SampleDB() { + + } + + /** + * Protected function to add a single sample to the database + * + * @param sample to be added + */ + protected SampleDB addSample(Sample sample) { + Sample prev = samples.get(sample.getID()); + if ( prev != null ) + sample = Sample.mergeSamples(prev, sample); + samples.put(sample.getID(), sample); + return this; + } + + // -------------------------------------------------------------------------------- + // + // Functions for getting a sample from the DB + // + // -------------------------------------------------------------------------------- + + /** + * Get a sample by its ID + * If an alias is passed in, return the main sample object + * @param id + * @return sample Object with this ID, or null if this does not exist + */ + public Sample getSample(String id) { + return samples.get(id); + } + + /** + * + * @param read + * @return sample Object with this ID, or null if this does not exist + */ + public Sample getSample(final SAMRecord read) { + return getSample(read.getReadGroup()); + } + + /** + * + * @param rg + * @return sample Object with this ID, or null if this does not exist + */ + public Sample getSample(final SAMReadGroupRecord rg) { + return getSample(rg.getSample()); + } + + 
/** + * @param g Genotype + * @return sample Object with this ID, or null if this does not exist + */ + public Sample getSample(final Genotype g) { + return getSample(g.getSampleName()); + } + + // -------------------------------------------------------------------------------- + // + // Functions for accessing samples in the DB + // + // -------------------------------------------------------------------------------- + + /** + * Get number of sample objects + * @return size of samples map + */ + public int sampleCount() { + return samples.size(); + } + + public Set getSamples() { + return new HashSet(samples.values()); + } + + public Collection getSampleNames() { + return Collections.unmodifiableCollection(samples.keySet()); + } + + + /** + * Takes a collection of sample names and returns their corresponding sample objects + * Note that, since a set is returned, if you pass in a list with duplicates names there will not be any duplicates in the returned set + * @param sampleNameList Set of sample names + * @return Corresponding set of samples + */ + public Set getSamples(Collection sampleNameList) { + HashSet samples = new HashSet(); + for (String name : sampleNameList) { + try { + samples.add(getSample(name)); + } + catch (Exception e) { + throw new StingException("Could not get sample with the following ID: " + name, e); + } + } + return samples; + } + + // -------------------------------------------------------------------------------- + // + // Higher level pedigree functions + // + // -------------------------------------------------------------------------------- + + /** + * Returns a sorted set of the family IDs in all samples (excluding null ids) + * @return + */ + public final Set getFamilyIDs() { + return getFamilies().keySet(); + } + + /** + * Returns a map from family ID -> set of family members for all samples with + * non-null family ids + * + * @return + */ + public final Map> getFamilies() { + final Map> families = new TreeMap>(); + + for ( final 
Sample sample : samples.values() ) { + final String famID = sample.getFamilyID(); + if ( famID != null ) { + if ( ! families.containsKey(famID) ) + families.put(famID, new TreeSet()); + families.get(famID).add(sample); + } + } + + return families; + } + + /** + * Return all samples with a given family ID + * @param familyId + * @return + */ + public Set getFamily(String familyId) { + return getFamilies().get(familyId); + } + + /** + * Returns all children of a given sample + * See note on the efficiency of getFamily() - since this depends on getFamily() it's also not efficient + * @param sample + * @return + */ + public Set getChildren(Sample sample) { + final HashSet children = new HashSet(); + for ( final Sample familyMember : getFamily(sample.getFamilyID())) { + if ( familyMember.getMother() == sample || familyMember.getFather() == sample ) { + children.add(familyMember); + } + } + return children; + } +} diff --git a/public/java/src/org/broadinstitute/sting/gatk/samples/SampleDBBuilder.java b/public/java/src/org/broadinstitute/sting/gatk/samples/SampleDBBuilder.java new file mode 100644 index 000000000..44a8600b0 --- /dev/null +++ b/public/java/src/org/broadinstitute/sting/gatk/samples/SampleDBBuilder.java @@ -0,0 +1,153 @@ +/* + * Copyright (c) 2011, The Broad Institute + * + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The above copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. 
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * OTHER DEALINGS IN THE SOFTWARE. + */ + +package org.broadinstitute.sting.gatk.samples; + +import net.sf.samtools.SAMFileHeader; +import org.broadinstitute.sting.gatk.GenomeAnalysisEngine; +import org.broadinstitute.sting.utils.SampleUtils; +import org.broadinstitute.sting.utils.exceptions.UserException; + +import java.io.File; +import java.io.FileNotFoundException; +import java.util.*; + +/** + * + */ +public class SampleDBBuilder { + PedigreeValidationType validationStrictness; + final SampleDB sampleDB = new SampleDB(); + final GenomeAnalysisEngine engine; + + Set samplesFromDataSources = new HashSet(); + Set samplesFromPedigrees = new HashSet(); + + /** for testing only */ + protected SampleDBBuilder(PedigreeValidationType validationStrictness) { + engine = null; + this.validationStrictness = validationStrictness; + } + + /** + * Constructor takes both a SAM header and sample files because the two must be integrated. 
+ */ + public SampleDBBuilder(GenomeAnalysisEngine engine, PedigreeValidationType validationStrictness) { + this.engine = engine; + this.validationStrictness = validationStrictness; + } + + /** + * Hallucinates sample objects for all the samples in the SAM file and stores them + */ + public SampleDBBuilder addSamplesFromSAMHeader(final SAMFileHeader header) { + addSamplesFromSampleNames(SampleUtils.getSAMFileSamples(header)); + return this; + } + + public SampleDBBuilder addSamplesFromSampleNames(final Collection sampleNames) { + for (final String sampleName : sampleNames) { + if (sampleDB.getSample(sampleName) == null) { + final Sample newSample = new Sample(sampleName, sampleDB); + sampleDB.addSample(newSample); + samplesFromDataSources.add(newSample); // keep track of data source samples + } + } + return this; + } + + public SampleDBBuilder addSamplesFromPedigreeFiles(final List pedigreeFiles) { + for (final File pedFile : pedigreeFiles) { + Collection samples = addSamplesFromPedigreeArgument(pedFile); + samplesFromPedigrees.addAll(samples); + } + + return this; + } + + public SampleDBBuilder addSamplesFromPedigreeStrings(final List pedigreeStrings) { + for (final String pedString : pedigreeStrings) { + Collection samples = addSamplesFromPedigreeArgument(pedString); + samplesFromPedigrees.addAll(samples); + } + + return this; + } + + /** + * Parse one sample file and integrate it with samples that are already there + * Fail quickly if we find any errors in the file + */ + private Collection addSamplesFromPedigreeArgument(File sampleFile) { + final PedReader reader = new PedReader(); + + try { + return reader.parse(sampleFile, getMissingFields(sampleFile), sampleDB); + } catch ( FileNotFoundException e ) { + throw new UserException.CouldNotReadInputFile(sampleFile, e); + } + } + + private Collection addSamplesFromPedigreeArgument(final String string) { + final PedReader reader = new PedReader(); + return reader.parse(string, getMissingFields(string), sampleDB); + 
} + + public SampleDB getFinalSampleDB() { + validate(); + return sampleDB; + } + + public EnumSet getMissingFields(final Object engineArg) { + if ( engine == null ) + return EnumSet.noneOf(PedReader.MissingPedField.class); + else { + final List posTags = engine.getTags(engineArg).getPositionalTags(); + return PedReader.parseMissingFieldTags(engineArg, posTags); + } + } + + // -------------------------------------------------------------------------------- + // + // Validation + // + // -------------------------------------------------------------------------------- + + protected final void validate() { + if ( validationStrictness == PedigreeValidationType.SILENT ) + return; + else { + // check that samples in data sources are all annotated, if anything is annotated + if ( ! samplesFromPedigrees.isEmpty() && ! samplesFromDataSources.isEmpty() ) { + final Set sampleNamesFromPedigrees = new HashSet(); + for ( final Sample pSample : samplesFromPedigrees ) + sampleNamesFromPedigrees.add(pSample.getID()); + + for ( final Sample dsSample : samplesFromDataSources ) + if ( ! 
sampleNamesFromPedigrees.contains(dsSample.getID()) ) + throw new UserException("Sample " + dsSample.getID() + " found in data sources but not in pedigree files with STRICT pedigree validation"); + } + } + } +} diff --git a/public/java/src/org/broadinstitute/sting/gatk/traversals/TraversalEngine.java b/public/java/src/org/broadinstitute/sting/gatk/traversals/TraversalEngine.java index c6321e2ad..fd691735f 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/traversals/TraversalEngine.java +++ b/public/java/src/org/broadinstitute/sting/gatk/traversals/TraversalEngine.java @@ -364,8 +364,8 @@ public abstract class TraversalEngine,Provide // count up the number of skipped reads by summing over all filters long nSkippedReads = 0L; - for ( Map.Entry countsByFilter: cumulativeMetrics.getCountsByFilter().entrySet()) - nSkippedReads += countsByFilter.getValue(); + for ( final long countsByFilter : cumulativeMetrics.getCountsByFilter().values()) + nSkippedReads += countsByFilter; logger.info(String.format("Total runtime %.2f secs, %.2f min, %.2f hours", elapsed, elapsed / 60, elapsed / 3600)); if ( cumulativeMetrics.getNumReadsSeen() > 0 ) @@ -373,10 +373,10 @@ public abstract class TraversalEngine,Provide nSkippedReads, cumulativeMetrics.getNumReadsSeen(), 100.0 * MathUtils.ratio(nSkippedReads,cumulativeMetrics.getNumReadsSeen()))); - for ( Map.Entry filterCounts : cumulativeMetrics.getCountsByFilter().entrySet() ) { + for ( Map.Entry filterCounts : cumulativeMetrics.getCountsByFilter().entrySet() ) { long count = filterCounts.getValue(); logger.info(String.format(" -> %d reads (%.2f%% of total) failing %s", - count, 100.0 * MathUtils.ratio(count,cumulativeMetrics.getNumReadsSeen()), Utils.getClassName(filterCounts.getKey()))); + count, 100.0 * MathUtils.ratio(count,cumulativeMetrics.getNumReadsSeen()), filterCounts.getKey())); } if ( performanceLog != null ) performanceLog.close(); diff --git 
a/public/java/src/org/broadinstitute/sting/gatk/traversals/TraverseDuplicates.java b/public/java/src/org/broadinstitute/sting/gatk/traversals/TraverseDuplicates.java index 046003154..3f349d86d 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/traversals/TraverseDuplicates.java +++ b/public/java/src/org/broadinstitute/sting/gatk/traversals/TraverseDuplicates.java @@ -34,6 +34,7 @@ import org.broadinstitute.sting.gatk.iterators.PushbackIterator; import org.broadinstitute.sting.gatk.walkers.DuplicateWalker; import org.broadinstitute.sting.utils.GenomeLoc; import org.broadinstitute.sting.utils.pileup.ReadBackedPileupImpl; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; import java.util.*; @@ -57,9 +58,9 @@ public class TraverseDuplicates extends TraversalEngine readsAtLoc(final SAMRecord read, PushbackIterator iter) { + private List readsAtLoc(final GATKSAMRecord read, PushbackIterator iter) { GenomeLoc site = engine.getGenomeLocParser().createGenomeLoc(read); - ArrayList l = new ArrayList(); + ArrayList l = new ArrayList(); l.add(read); for (SAMRecord read2 : iter) { @@ -70,7 +71,7 @@ public class TraverseDuplicates extends TraversalEngine extends TraversalEngine> uniqueReadSets(List reads) { - Set> readSets = new LinkedHashSet>(); + protected Set> uniqueReadSets(List reads) { + Set> readSets = new LinkedHashSet>(); // for each read, find duplicates, and either add the read to its duplicate list or start a new one - for ( SAMRecord read : reads ) { - List readSet = findDuplicateReads(read, readSets); + for ( GATKSAMRecord read : reads ) { + List readSet = findDuplicateReads(read, readSets); if ( readSet == null ) { - readSets.add(new ArrayList(Arrays.asList(read))); // copy so I can add to the list + readSets.add(new ArrayList(Arrays.asList(read))); // copy so I can add to the list } else { readSet.add(read); } @@ -110,13 +111,13 @@ public class TraverseDuplicates extends TraversalEngine findDuplicateReads(SAMRecord read, Set> readSets ) { + 
protected List findDuplicateReads(GATKSAMRecord read, Set> readSets ) { if ( read.getReadPairedFlag() ) { // paired final GenomeLoc readMateLoc = engine.getGenomeLocParser().createGenomeLoc(read.getMateReferenceName(), read.getMateAlignmentStart(), read.getMateAlignmentStart()); - for (List reads : readSets) { - SAMRecord key = reads.get(0); + for (List reads : readSets) { + GATKSAMRecord key = reads.get(0); // read and key start at the same place, and either the this read and the key // share a mate location or the read is flagged as a duplicate @@ -131,8 +132,8 @@ public class TraverseDuplicates extends TraversalEngine reads : readSets) { - SAMRecord key = reads.get(0); + for (List reads : readSets) { + GATKSAMRecord key = reads.get(0); boolean v = (! key.getReadPairedFlag()) && read.getAlignmentStart() == key.getAlignmentStart() && ( key.getDuplicateReadFlag() || read.getDuplicateReadFlag() ) && read.getReadLength() == key.getReadLength(); //System.out.printf("%s %s %b %b %d %d %d %d => %b%n", // read.getReadPairedFlag(), key.getReadPairedFlag(), read.getDuplicateReadFlag(), key.getDuplicateReadFlag(), @@ -179,7 +180,7 @@ public class TraverseDuplicates extends TraversalEngine> readSets = uniqueReadSets(readsAtLoc(read, iter)); + Set> readSets = uniqueReadSets(readsAtLoc((GATKSAMRecord) read, iter)); if ( DEBUG ) logger.debug(String.format("*** TraverseDuplicates.traverse at %s with %d read sets", site, readSets.size())); // Jump forward in the reference to this locus location diff --git a/public/java/src/org/broadinstitute/sting/gatk/traversals/TraverseReads.java b/public/java/src/org/broadinstitute/sting/gatk/traversals/TraverseReads.java index 27bbd50d5..24b8ac986 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/traversals/TraverseReads.java +++ b/public/java/src/org/broadinstitute/sting/gatk/traversals/TraverseReads.java @@ -13,6 +13,7 @@ import org.broadinstitute.sting.gatk.refdata.ReadMetaDataTracker; import 
org.broadinstitute.sting.gatk.walkers.DataSource; import org.broadinstitute.sting.gatk.walkers.ReadWalker; import org.broadinstitute.sting.utils.GenomeLoc; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; /* * Copyright (c) 2009 The Broad Institute @@ -100,9 +101,9 @@ public class TraverseReads extends TraversalEngine,Read // if the read is mapped, create a metadata tracker ReadMetaDataTracker tracker = (read.getReferenceIndex() >= 0) ? rodView.getReferenceOrderedDataForRead(read) : null; - final boolean keepMeP = walker.filter(refContext, read); + final boolean keepMeP = walker.filter(refContext, (GATKSAMRecord) read); if (keepMeP) { - M x = walker.map(refContext, read, tracker); // the tracker can be null + M x = walker.map(refContext, (GATKSAMRecord) read, tracker); // the tracker can be null sum = walker.reduce(x, sum); } diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/ClipReadsWalker.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/ClipReadsWalker.java index 6989f45b2..d1148cbd5 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/ClipReadsWalker.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/ClipReadsWalker.java @@ -28,7 +28,6 @@ package org.broadinstitute.sting.gatk.walkers; import net.sf.picard.reference.ReferenceSequence; import net.sf.picard.reference.ReferenceSequenceFile; import net.sf.picard.reference.ReferenceSequenceFileFactory; -import net.sf.samtools.SAMRecord; import net.sf.samtools.util.StringUtil; import org.broadinstitute.sting.commandline.Advanced; import org.broadinstitute.sting.commandline.Argument; @@ -43,6 +42,7 @@ import org.broadinstitute.sting.utils.clipreads.ClippingOp; import org.broadinstitute.sting.utils.clipreads.ClippingRepresentation; import org.broadinstitute.sting.utils.clipreads.ReadClipper; import org.broadinstitute.sting.utils.collections.Pair; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; import org.broadinstitute.sting.utils.sam.ReadUtils; 
import java.io.File; @@ -292,11 +292,12 @@ public class ClipReadsWalker extends ReadWalker strandAwarePositions(SAMRecord read, int start, int stop) { + private Pair strandAwarePositions(GATKSAMRecord read, int start, int stop) { if (read.getReadNegativeStrandFlag()) return new Pair(read.getReadLength() - stop - 1, read.getReadLength() - start - 1); else @@ -374,7 +375,7 @@ public class ClipReadsWalker extends ReadWalker p : cyclesToClip) { // iterate over each cycle range @@ -416,7 +417,7 @@ public class ClipReadsWalker extends ReadWalker clipSeqs) { + public ReadClipperWithData(GATKSAMRecord read, List clipSeqs) { super(read); data = new ClippingData(clipSeqs); } diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/DuplicateWalker.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/DuplicateWalker.java index e2db1dc52..905ecf273 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/DuplicateWalker.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/DuplicateWalker.java @@ -1,10 +1,10 @@ package org.broadinstitute.sting.gatk.walkers; -import net.sf.samtools.SAMRecord; import org.broadinstitute.sting.gatk.contexts.AlignmentContext; import org.broadinstitute.sting.gatk.filters.NotPrimaryAlignmentFilter; import org.broadinstitute.sting.gatk.filters.UnmappedReadFilter; import org.broadinstitute.sting.utils.GenomeLoc; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; import java.util.List; import java.util.Set; @@ -20,11 +20,11 @@ import java.util.Set; @ReadFilters({UnmappedReadFilter.class,NotPrimaryAlignmentFilter.class}) public abstract class DuplicateWalker extends Walker { // Do we actually want to operate on the context? 
- public boolean filter(GenomeLoc loc, AlignmentContext context, Set> readSets ) { + public boolean filter(GenomeLoc loc, AlignmentContext context, Set> readSets ) { return true; // We are keeping all the reads } - public abstract MapType map(GenomeLoc loc, AlignmentContext context, Set> readSets ); + public abstract MapType map(GenomeLoc loc, AlignmentContext context, Set> readSets ); // Given result of map function public abstract ReduceType reduceInit(); diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/FindReadsWithNamesWalker.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/FindReadsWithNamesWalker.java index 56287df31..7f9269725 100644 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/FindReadsWithNamesWalker.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/FindReadsWithNamesWalker.java @@ -33,6 +33,7 @@ import org.broadinstitute.sting.gatk.contexts.ReferenceContext; import org.broadinstitute.sting.gatk.refdata.ReadMetaDataTracker; import org.broadinstitute.sting.utils.baq.BAQ; import org.broadinstitute.sting.utils.exceptions.UserException; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; import org.broadinstitute.sting.utils.text.XReadLines; import java.io.File; @@ -71,21 +72,23 @@ public class FindReadsWithNamesWalker extends ReadWalker { private FlagStat myStat = new FlagStat(); - public Integer map( ReferenceContext ref, SAMRecord read, ReadMetaDataTracker metaDataTracker ) { + public Integer map( ReferenceContext ref, GATKSAMRecord read, ReadMetaDataTracker metaDataTracker ) { myStat.readCount++; if (read.getReadFailsVendorQualityCheckFlag()) { myStat.QC_failure++; diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/LocusWalker.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/LocusWalker.java index 8152f74c2..e94d01d5a 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/LocusWalker.java +++ 
b/public/java/src/org/broadinstitute/sting/gatk/walkers/LocusWalker.java @@ -17,7 +17,7 @@ import org.broadinstitute.sting.gatk.refdata.RefMetaDataTracker; */ @By(DataSource.READS) @Requires({DataSource.READS,DataSource.REFERENCE, DataSource.REFERENCE_BASES}) -@PartitionBy(PartitionType.INTERVAL) +@PartitionBy(PartitionType.LOCUS) @ReadFilters({UnmappedReadFilter.class,NotPrimaryAlignmentFilter.class,DuplicateReadFilter.class,FailsVendorQualityCheckFilter.class}) public abstract class LocusWalker extends Walker { // Do we actually want to operate on the context? diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/PartitionType.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/PartitionType.java index 361e222c2..f0d92ef8a 100644 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/PartitionType.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/PartitionType.java @@ -34,6 +34,12 @@ public enum PartitionType { */ NONE, + /** + * The walker inputs can be chunked down to individual + * reads. + */ + READ, + /** * The walker inputs can be chunked down to the * per-locus level. diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/PrintReadsWalker.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/PrintReadsWalker.java index 4f072e88c..ac69738d3 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/PrintReadsWalker.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/PrintReadsWalker.java @@ -40,6 +40,7 @@ import java.util.TreeSet; import org.broadinstitute.sting.gatk.contexts.ReferenceContext; import org.broadinstitute.sting.gatk.refdata.ReadMetaDataTracker; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; /** * Renders, in SAM/BAM format, all reads from the input data set in the order in which they appear in the input file. @@ -136,11 +137,12 @@ public class PrintReadsWalker extends ReadWalker { /** * The reads filter function. 
+ * * @param ref the reference bases that correspond to our read, if a reference was provided * @param read the read itself, as a SAMRecord * @return true if the read passes the filter, false if it doesn't */ - public boolean filter(ReferenceContext ref, SAMRecord read) { + public boolean filter(ReferenceContext ref, GATKSAMRecord read) { // check the read group if ( readGroup != null ) { SAMReadGroupRecord myReadGroup = read.getReadGroup(); @@ -180,11 +182,12 @@ public class PrintReadsWalker extends ReadWalker { /** * The reads map function. + * * @param ref the reference bases that correspond to our read, if a reference was provided * @param read the read itself, as a SAMRecord * @return the read itself */ - public SAMRecord map( ReferenceContext ref, SAMRecord read, ReadMetaDataTracker metaDataTracker ) { + public SAMRecord map( ReferenceContext ref, GATKSAMRecord read, ReadMetaDataTracker metaDataTracker ) { return read; } diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/ReadWalker.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/ReadWalker.java index db2038aa3..8933bd73e 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/ReadWalker.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/ReadWalker.java @@ -3,6 +3,7 @@ package org.broadinstitute.sting.gatk.walkers; import net.sf.samtools.SAMRecord; import org.broadinstitute.sting.gatk.contexts.ReferenceContext; import org.broadinstitute.sting.gatk.refdata.ReadMetaDataTracker; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; /** * Created by IntelliJ IDEA. @@ -12,7 +13,7 @@ import org.broadinstitute.sting.gatk.refdata.ReadMetaDataTracker; * To change this template use File | Settings | File Templates. 
*/ @Requires({DataSource.READS, DataSource.REFERENCE_BASES}) -@PartitionBy(PartitionType.CONTIG) +@PartitionBy(PartitionType.READ) public abstract class ReadWalker extends Walker { public boolean requiresOrderedReads() { return false; } @@ -20,11 +21,11 @@ public abstract class ReadWalker extends Walker { return toolkit; } + /** + * Gets the master sequence dictionary for this walker + * @link GenomeAnalysisEngine.getMasterSequenceDictionary + * @return + */ + protected SAMSequenceDictionary getMasterSequenceDictionary() { + return getToolkit().getMasterSequenceDictionary(); + } + + protected SampleDB getSampleDB() { + return getToolkit().getSampleDB(); + } + + protected Sample getSample(final String id) { + return getToolkit().getSampleDB().getSample(id); + } + /** * (conceptual static) method that states whether you want to see reads piling up at a locus * that contain a deletion at the locus. diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/AlleleBalance.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/AlleleBalance.java index e501258c5..e5f75f06d 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/AlleleBalance.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/AlleleBalance.java @@ -92,7 +92,7 @@ public class AlleleBalance extends InfoFieldAnnotation { continue; } // todo -- actually care about indel length from the pileup (agnostic at the moment) - int refCount = indelPileup.size(); + int refCount = indelPileup.getNumberOfElements(); int altCount = vc.isSimpleInsertion() ? 
indelPileup.getNumberOfInsertions() : indelPileup.getNumberOfDeletions(); if ( refCount + altCount == 0 ) { diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/AlleleBalanceBySample.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/AlleleBalanceBySample.java index 75c4037d5..820fd248a 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/AlleleBalanceBySample.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/AlleleBalanceBySample.java @@ -47,7 +47,7 @@ public class AlleleBalanceBySample extends GenotypeAnnotation implements Experim if (!g.isHet()) return null; - Set altAlleles = vc.getAlternateAlleles(); + Collection altAlleles = vc.getAlternateAlleles(); if ( altAlleles.size() == 0 ) return null; diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/AnnotationByDepth.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/AnnotationByDepth.java deleted file mode 100755 index 353fd1c2c..000000000 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/AnnotationByDepth.java +++ /dev/null @@ -1,32 +0,0 @@ -package org.broadinstitute.sting.gatk.walkers.annotator; - -import org.broadinstitute.sting.gatk.contexts.AlignmentContext; -import org.broadinstitute.sting.gatk.walkers.annotator.interfaces.InfoFieldAnnotation; -import org.broadinstitute.sting.utils.variantcontext.Genotype; - -import java.util.Map; - -/** - * Abstract base class for all annotations that are normalized by depth - */ -public abstract class AnnotationByDepth extends InfoFieldAnnotation { - - - protected int annotationByVariantDepth(final Map genotypes, Map stratifiedContexts) { - int depth = 0; - for ( Map.Entry genotype : genotypes.entrySet() ) { - - // we care only about variant calls - if ( genotype.getValue().isHomRef() ) - continue; - - AlignmentContext context = stratifiedContexts.get(genotype.getKey()); - if ( context != null ) - depth += 
context.size(); - } - - return depth; - } - - -} \ No newline at end of file diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/DepthOfCoverage.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/DepthOfCoverage.java index 864be55b7..8098de5b1 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/DepthOfCoverage.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/DepthOfCoverage.java @@ -41,7 +41,7 @@ public class DepthOfCoverage extends InfoFieldAnnotation implements StandardAnno int depth = 0; for ( Map.Entry sample : stratifiedContexts.entrySet() ) - depth += sample.getValue().size(); + depth += sample.getValue().hasBasePileup() ? sample.getValue().getBasePileup().depthOfCoverage() : sample.getValue().getExtendedEventPileup().depthOfCoverage(); Map map = new HashMap(); map.put(getKeyNames().get(0), String.format("%d", depth)); return map; diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/FisherStrand.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/FisherStrand.java index 393eb549c..2d1d1978c 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/FisherStrand.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/FisherStrand.java @@ -205,7 +205,7 @@ public class FisherStrand extends InfoFieldAnnotation implements StandardAnnotat for ( Map.Entry sample : stratifiedContexts.entrySet() ) { for (PileupElement p : sample.getValue().getBasePileup()) { - if ( p.isDeletion() ) // ignore deletions + if ( p.isDeletion() || p.isReducedRead() ) // ignore deletions and reduced reads continue; if ( p.getRead().getMappingQuality() < 20 || p.getQual() < 20 ) @@ -258,6 +258,8 @@ public class FisherStrand extends InfoFieldAnnotation implements StandardAnnotat continue; for (final PileupElement p: pileup) { + if ( p.isReducedRead() ) // ignore reduced reads + continue; if ( 
p.getRead().getMappingQuality() < 20) continue; if (indelLikelihoodMap.containsKey(p)) { diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/HaplotypeScore.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/HaplotypeScore.java index df6da3b85..c142109fa 100644 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/HaplotypeScore.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/HaplotypeScore.java @@ -34,12 +34,12 @@ import org.broadinstitute.sting.gatk.walkers.annotator.interfaces.InfoFieldAnnot import org.broadinstitute.sting.gatk.walkers.annotator.interfaces.StandardAnnotation; import org.broadinstitute.sting.gatk.walkers.genotyper.IndelGenotypeLikelihoodsCalculationModel; import org.broadinstitute.sting.utils.BaseUtils; +import org.broadinstitute.sting.utils.Haplotype; import org.broadinstitute.sting.utils.MathUtils; import org.broadinstitute.sting.utils.QualityUtils; import org.broadinstitute.sting.utils.codecs.vcf.VCFHeaderLineType; import org.broadinstitute.sting.utils.codecs.vcf.VCFInfoHeaderLine; import org.broadinstitute.sting.utils.exceptions.ReviewedStingException; -import org.broadinstitute.sting.utils.genotype.Haplotype; import org.broadinstitute.sting.utils.pileup.PileupElement; import org.broadinstitute.sting.utils.pileup.ReadBackedPileup; import org.broadinstitute.sting.utils.sam.AlignmentUtils; diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/MVLikelihoodRatio.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/MVLikelihoodRatio.java new file mode 100755 index 000000000..bd0d4e3fb --- /dev/null +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/MVLikelihoodRatio.java @@ -0,0 +1,58 @@ +package org.broadinstitute.sting.gatk.walkers.annotator; + +import org.broadinstitute.sting.gatk.contexts.AlignmentContext; +import org.broadinstitute.sting.gatk.contexts.ReferenceContext; +import 
org.broadinstitute.sting.gatk.refdata.RefMetaDataTracker; +import org.broadinstitute.sting.gatk.walkers.annotator.interfaces.AnnotatorCompatibleWalker; +import org.broadinstitute.sting.gatk.walkers.annotator.interfaces.ExperimentalAnnotation; +import org.broadinstitute.sting.gatk.walkers.annotator.interfaces.InfoFieldAnnotation; +import org.broadinstitute.sting.utils.BaseUtils; +import org.broadinstitute.sting.utils.MendelianViolation; +import org.broadinstitute.sting.utils.codecs.vcf.VCFFilterHeaderLine; +import org.broadinstitute.sting.utils.codecs.vcf.VCFHeaderLineType; +import org.broadinstitute.sting.utils.codecs.vcf.VCFInfoHeaderLine; +import org.broadinstitute.sting.utils.exceptions.UserException; +import org.broadinstitute.sting.utils.pileup.PileupElement; +import org.broadinstitute.sting.utils.variantcontext.VariantContext; + +import java.util.Arrays; +import java.util.HashMap; +import java.util.List; +import java.util.Map; + +/** + * Created by IntelliJ IDEA. + * User: chartl + * Date: 9/14/11 + * Time: 12:24 PM + * To change this template use File | Settings | File Templates. 
+ */ +public class MVLikelihoodRatio extends InfoFieldAnnotation implements ExperimentalAnnotation { + + private MendelianViolation mendelianViolation = null; + + public Map annotate(RefMetaDataTracker tracker, AnnotatorCompatibleWalker walker, ReferenceContext ref, Map stratifiedContexts, VariantContext vc) { + if ( mendelianViolation == null ) { + if ( walker instanceof VariantAnnotator && ((VariantAnnotator) walker).familyStr != null) { + mendelianViolation = new MendelianViolation(((VariantAnnotator)walker).familyStr, ((VariantAnnotator)walker).minGenotypeQualityP ); + } + else { + throw new UserException("Mendelian violation annotation can only be used from the Variant Annotator, and must be provided a valid Family String file (-family) on the command line."); + } + } + + Map toRet = new HashMap(1); + boolean hasAppropriateGenotypes = vc.hasGenotype(mendelianViolation.getSampleChild()) && vc.getGenotype(mendelianViolation.getSampleChild()).hasLikelihoods() && + vc.hasGenotype(mendelianViolation.getSampleDad()) && vc.getGenotype(mendelianViolation.getSampleDad()).hasLikelihoods() && + vc.hasGenotype(mendelianViolation.getSampleMom()) && vc.getGenotype(mendelianViolation.getSampleMom()).hasLikelihoods(); + if ( hasAppropriateGenotypes ) + toRet.put("MVLR",mendelianViolation.violationLikelihoodRatio(vc)); + + return toRet; + } + + // return the descriptions used for the VCF INFO meta field + public List getKeyNames() { return Arrays.asList("MVLR"); } + + public List getDescriptions() { return Arrays.asList(new VCFInfoHeaderLine("MVLR", 1, VCFHeaderLineType.Float, "Mendelian violation likelihood ratio: L[MV] - L[No MV]")); } +} diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/QualByDepth.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/QualByDepth.java index 552289309..ffc852903 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/QualByDepth.java +++ 
b/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/QualByDepth.java @@ -1,10 +1,10 @@ package org.broadinstitute.sting.gatk.walkers.annotator; -import org.broadinstitute.sting.commandline.Hidden; import org.broadinstitute.sting.gatk.contexts.AlignmentContext; import org.broadinstitute.sting.gatk.contexts.ReferenceContext; import org.broadinstitute.sting.gatk.refdata.RefMetaDataTracker; import org.broadinstitute.sting.gatk.walkers.annotator.interfaces.AnnotatorCompatibleWalker; +import org.broadinstitute.sting.gatk.walkers.annotator.interfaces.InfoFieldAnnotation; import org.broadinstitute.sting.gatk.walkers.annotator.interfaces.StandardAnnotation; import org.broadinstitute.sting.utils.codecs.vcf.VCFHeaderLineType; import org.broadinstitute.sting.utils.codecs.vcf.VCFInfoHeaderLine; @@ -21,7 +21,7 @@ import java.util.Map; * * Low scores are indicative of false positive calls and artifacts. */ -public class QualByDepth extends AnnotationByDepth implements StandardAnnotation { +public class QualByDepth extends InfoFieldAnnotation implements StandardAnnotation { public Map annotate(RefMetaDataTracker tracker, AnnotatorCompatibleWalker walker, ReferenceContext ref, Map stratifiedContexts, VariantContext vc) { if ( stratifiedContexts.size() == 0 ) @@ -43,14 +43,13 @@ public class QualByDepth extends AnnotationByDepth implements StandardAnnotation if ( context == null ) continue; - depth += context.size(); + depth += context.hasBasePileup() ? 
context.getBasePileup().depthOfCoverage() : context.getExtendedEventPileup().depthOfCoverage(); } if ( depth == 0 ) return null; - int qDepth = annotationByVariantDepth(genotypes, stratifiedContexts); - double QD = 10.0 * vc.getNegLog10PError() / (double)qDepth; + double QD = 10.0 * vc.getNegLog10PError() / (double)depth; Map map = new HashMap(); map.put(getKeyNames().get(0), String.format("%.2f", QD)); diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/ReadDepthAndAllelicFractionBySample.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/ReadDepthAndAllelicFractionBySample.java index 772541eb6..168fbdc49 100644 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/ReadDepthAndAllelicFractionBySample.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/ReadDepthAndAllelicFractionBySample.java @@ -79,7 +79,7 @@ public class ReadDepthAndAllelicFractionBySample extends GenotypeAnnotation { alleleCounts.put(allele.getBases()[0], 0); ReadBackedPileup pileup = stratifiedContext.getBasePileup(); - int totalDepth = pileup.size(); + int totalDepth = pileup.getNumberOfElements(); Map map = new HashMap(); map.put(getKeyNames().get(0), totalDepth); // put total depth in right away @@ -119,7 +119,7 @@ public class ReadDepthAndAllelicFractionBySample extends GenotypeAnnotation { ReadBackedExtendedEventPileup pileup = stratifiedContext.getExtendedEventPileup(); if ( pileup == null ) return null; - int totalDepth = pileup.size(); + int totalDepth = pileup.getNumberOfElements(); Map map = new HashMap(); map.put(getKeyNames().get(0), totalDepth); // put total depth in right away diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/SBByDepth.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/SBByDepth.java deleted file mode 100755 index efe96f226..000000000 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/SBByDepth.java +++ /dev/null @@ 
-1,59 +0,0 @@ -package org.broadinstitute.sting.gatk.walkers.annotator; - -import org.broadinstitute.sting.gatk.contexts.AlignmentContext; -import org.broadinstitute.sting.gatk.contexts.ReferenceContext; -import org.broadinstitute.sting.gatk.refdata.RefMetaDataTracker; -import org.broadinstitute.sting.gatk.walkers.annotator.interfaces.AnnotatorCompatibleWalker; -import org.broadinstitute.sting.utils.codecs.vcf.VCFConstants; -import org.broadinstitute.sting.utils.codecs.vcf.VCFHeaderLineType; -import org.broadinstitute.sting.utils.codecs.vcf.VCFInfoHeaderLine; -import org.broadinstitute.sting.utils.variantcontext.Genotype; -import org.broadinstitute.sting.utils.variantcontext.VariantContext; - -import java.util.Arrays; -import java.util.HashMap; -import java.util.List; -import java.util.Map; - -/** - * SB annotation value by depth of alt containing samples - */ -public class SBByDepth extends AnnotationByDepth { - - public Map annotate(RefMetaDataTracker tracker, AnnotatorCompatibleWalker walker, ReferenceContext ref, Map stratifiedContexts, VariantContext vc) { - if ( stratifiedContexts.size() == 0 ) - return null; - - if (!vc.hasAttribute(VCFConstants.STRAND_BIAS_KEY)) - return null; - - double sBias = Double.valueOf(vc.getAttributeAsString(VCFConstants.STRAND_BIAS_KEY)); - - final Map genotypes = vc.getGenotypes(); - if ( genotypes == null || genotypes.size() == 0 ) - return null; - - int sDepth = annotationByVariantDepth(genotypes, stratifiedContexts); - if ( sDepth == 0 ) - return null; - - - - double SbyD = (-sBias / (double)sDepth); - if (SbyD > 0) - SbyD = Math.log10(SbyD); - else - SbyD = -1000; - - Map map = new HashMap(); - map.put(getKeyNames().get(0), String.format("%.2f", SbyD)); - return map; - } - - public List getKeyNames() { return Arrays.asList("SBD"); } - - public List getDescriptions() { return Arrays.asList(new VCFInfoHeaderLine(getKeyNames().get(0), 1, VCFHeaderLineType.Float, "Strand Bias by Depth")); } - - - -} \ No newline at end of file 
diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/SampleList.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/SampleList.java index ff409484d..ee08cfa3b 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/SampleList.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/SampleList.java @@ -42,7 +42,7 @@ import java.util.List; import java.util.Map; /** - * List all of the samples in the info field + * List all of the polymorphic samples. */ public class SampleList extends InfoFieldAnnotation { diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/SpanningDeletions.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/SpanningDeletions.java index f747fbc2e..66d2ad318 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/SpanningDeletions.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/SpanningDeletions.java @@ -43,7 +43,7 @@ public class SpanningDeletions extends InfoFieldAnnotation implements StandardAn if (pileup != null) { deletions += pileup.getNumberOfDeletions(); - depth += pileup.size(); + depth += pileup.getNumberOfElements(); } } Map map = new HashMap(); diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/VariantAnnotator.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/VariantAnnotator.java index f6a1c4f31..c9937f3d6 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/VariantAnnotator.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/VariantAnnotator.java @@ -132,6 +132,13 @@ public class VariantAnnotator extends RodWalker implements Ann @Argument(fullName="annotation", shortName="A", doc="One or more specific annotations to apply to variant calls", required=false) protected List annotationsToUse = new ArrayList(); + /** + * Note that this argument has higher priority than the -A 
or -G arguments, + * so annotations will be excluded even if they are explicitly included with the other options. + */ + @Argument(fullName="excludeAnnotation", shortName="XA", doc="One or more specific annotations to exclude", required=false) + protected List annotationsToExclude = new ArrayList(); + /** * See the -list argument to view available groups. */ @@ -148,6 +155,9 @@ public class VariantAnnotator extends RodWalker implements Ann @Argument(fullName="expression", shortName="E", doc="One or more specific expressions to apply to variant calls; see documentation for more details", required=false) protected List expressionsToUse = new ArrayList(); + /** + * Note that the -XL argument can be used along with this one to exclude annotations. + */ @Argument(fullName="useAllAnnotations", shortName="all", doc="Use all possible annotations (not for the faint of heart)", required=false) protected Boolean USE_ALL_ANNOTATIONS = false; @@ -162,6 +172,12 @@ public class VariantAnnotator extends RodWalker implements Ann @Argument(fullName="vcfContainsOnlyIndels", shortName="dels",doc="Use if you are annotating an indel vcf, currently VERY experimental", required = false) protected boolean indelsOnly = false; + @Argument(fullName="family_string",shortName="family",required=false,doc="A family string of the form mom+dad=child for use with the mendelian violation ratio annotation") + public String familyStr = null; + + @Argument(fullName="MendelViolationGenotypeQualityThreshold",shortName="mvq",required=false,doc="The genotype quality treshold in order to annotate mendelian violation ratio") + public double minGenotypeQualityP = 0.0; + private VariantAnnotatorEngine engine; private Collection indelBufferContext; @@ -203,9 +219,9 @@ public class VariantAnnotator extends RodWalker implements Ann } if ( USE_ALL_ANNOTATIONS ) - engine = new VariantAnnotatorEngine(this, getToolkit()); + engine = new VariantAnnotatorEngine(annotationsToExclude, this, getToolkit()); else - engine = 
new VariantAnnotatorEngine(annotationGroupsToUse, annotationsToUse, this, getToolkit()); + engine = new VariantAnnotatorEngine(annotationGroupsToUse, annotationsToUse, annotationsToExclude, this, getToolkit()); engine.initializeExpressions(expressionsToUse); // setup the header fields @@ -216,6 +232,8 @@ public class VariantAnnotator extends RodWalker implements Ann if ( isUniqueHeaderLine(line, hInfo) ) hInfo.add(line); } + for ( String expression : expressionsToUse ) + hInfo.add(new VCFInfoHeaderLine(expression, VCFHeaderLineCount.UNBOUNDED, VCFHeaderLineType.String, "Value transferred from another external VCF resource")); engine.invokeAnnotationInitializationMethods(hInfo); diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/VariantAnnotatorEngine.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/VariantAnnotatorEngine.java index e5effe6d8..e4bc0d5d5 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/VariantAnnotatorEngine.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/annotator/VariantAnnotatorEngine.java @@ -73,19 +73,20 @@ public class VariantAnnotatorEngine { } // use this constructor if you want all possible annotations - public VariantAnnotatorEngine(AnnotatorCompatibleWalker walker, GenomeAnalysisEngine toolkit) { + public VariantAnnotatorEngine(List annotationsToExclude, AnnotatorCompatibleWalker walker, GenomeAnalysisEngine toolkit) { this.walker = walker; this.toolkit = toolkit; requestedInfoAnnotations = AnnotationInterfaceManager.createAllInfoFieldAnnotations(); requestedGenotypeAnnotations = AnnotationInterfaceManager.createAllGenotypeAnnotations(); + excludeAnnotations(annotationsToExclude); initializeDBs(); } // use this constructor if you want to select specific annotations (and/or interfaces) - public VariantAnnotatorEngine(List annotationGroupsToUse, List annotationsToUse, AnnotatorCompatibleWalker walker, GenomeAnalysisEngine toolkit) { + public 
VariantAnnotatorEngine(List annotationGroupsToUse, List annotationsToUse, List annotationsToExclude, AnnotatorCompatibleWalker walker, GenomeAnalysisEngine toolkit) { this.walker = walker; this.toolkit = toolkit; - initializeAnnotations(annotationGroupsToUse, annotationsToUse); + initializeAnnotations(annotationGroupsToUse, annotationsToUse, annotationsToExclude); initializeDBs(); } @@ -96,10 +97,30 @@ public class VariantAnnotatorEngine { requestedExpressions.add(new VAExpression(expression, walker.getResourceRodBindings())); } - private void initializeAnnotations(List annotationGroupsToUse, List annotationsToUse) { + private void initializeAnnotations(List annotationGroupsToUse, List annotationsToUse, List annotationsToExclude) { AnnotationInterfaceManager.validateAnnotations(annotationGroupsToUse, annotationsToUse); requestedInfoAnnotations = AnnotationInterfaceManager.createInfoFieldAnnotations(annotationGroupsToUse, annotationsToUse); requestedGenotypeAnnotations = AnnotationInterfaceManager.createGenotypeAnnotations(annotationGroupsToUse, annotationsToUse); + excludeAnnotations(annotationsToExclude); + } + + private void excludeAnnotations(List annotationsToExclude) { + if ( annotationsToExclude.size() == 0 ) + return; + + List tempRequestedInfoAnnotations = new ArrayList(requestedInfoAnnotations.size()); + for ( InfoFieldAnnotation annotation : requestedInfoAnnotations ) { + if ( !annotationsToExclude.contains(annotation.getClass().getSimpleName()) ) + tempRequestedInfoAnnotations.add(annotation); + } + requestedInfoAnnotations = tempRequestedInfoAnnotations; + + List tempRequestedGenotypeAnnotations = new ArrayList(requestedGenotypeAnnotations.size()); + for ( GenotypeAnnotation annotation : requestedGenotypeAnnotations ) { + if ( !annotationsToExclude.contains(annotation.getClass().getSimpleName()) ) + tempRequestedGenotypeAnnotations.add(annotation); + } + requestedGenotypeAnnotations = tempRequestedGenotypeAnnotations; } private void initializeDBs() { 
diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/beagle/ProduceBeagleInputWalker.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/beagle/ProduceBeagleInputWalker.java index 87695077d..b722220f9 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/beagle/ProduceBeagleInputWalker.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/beagle/ProduceBeagleInputWalker.java @@ -31,6 +31,7 @@ import org.broadinstitute.sting.gatk.arguments.StandardVariantContextInputArgume import org.broadinstitute.sting.gatk.contexts.AlignmentContext; import org.broadinstitute.sting.gatk.contexts.ReferenceContext; import org.broadinstitute.sting.gatk.refdata.RefMetaDataTracker; +import org.broadinstitute.sting.gatk.samples.Gender; import org.broadinstitute.sting.gatk.walkers.RodWalker; import org.broadinstitute.sting.gatk.walkers.variantrecalibration.VQSRCalibrationCurve; import org.broadinstitute.sting.utils.GenomeLoc; @@ -247,7 +248,7 @@ public class ProduceBeagleInputWalker extends RodWalker { Map preferredGenotypes = preferredVC.getGenotypes(); Map otherGenotypes = goodSite(otherVC) ? 
otherVC.getGenotypes() : null; for ( String sample : samples ) { - boolean isMaleOnChrX = CHECK_IS_MALE_ON_CHR_X && getToolkit().getSampleById(sample).isMale(); + boolean isMaleOnChrX = CHECK_IS_MALE_ON_CHR_X && getSample(sample).getGender() == Gender.MALE; Genotype genotype; boolean isValidation; diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/coverage/CallableLociWalker.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/coverage/CallableLociWalker.java index 32875a098..1dfc6fea0 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/coverage/CallableLociWalker.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/coverage/CallableLociWalker.java @@ -227,9 +227,8 @@ public class CallableLociWalker extends LocusWalker bases on the reference, or on the subset of the reference - * specified by the intervals provided. Moving to the next contig on the reference will always restart the - * count anew, even if the count of bases in the last chunk on the previous contig did not reach specified . 
- */ -public class CoarseCoverageWalker extends ReadWalker { - @Output - public PrintStream out; - - @Argument(fullName="granularity", shortName="G", doc="Granularity", required=true) - public Integer N; - - @Argument(fullName="dontZeroMissingContigs", shortName="Z", doc="If provided, we won't emit 0 counts for all sites on contigs skipped", required=true) - public boolean dontZeroMissingContigs; - - private int chunkStart = 1; // start of the current chunk we are counting reads for - private int contig = 0; // current contig we are on - private int count = 0; // number of reads overlapping with the current chunk - private static String zeroString = "0"; - - @Override - public void initialize() { - chunkStart = 1; - contig = 0; - count = 0; - } - - @Override - public Integer map(ReferenceContext ref, SAMRecord read, ReadMetaDataTracker metaDataTracker) { - - if ( read.getReadUnmappedFlag() || - read.getDuplicateReadFlag() || - read.getNotPrimaryAlignmentFlag() || - read.getMappingQuality() == 0 ) return 0; - - if ( read.getReferenceIndex() != contig ) { - // we jumped onto another contig - out.printf("%d%n", count); // print old count - count = 0; - - // if we skipped one or more contigs completely, make sure we print 0 counts over all of them: - for ( contig++ ; contig < read.getReferenceIndex() ; contig++) { - if ( ! 
dontZeroMissingContigs ) { - int contigSize = read.getHeader().getSequence(contig).getSequenceLength(); - for ( int k = 1 ; k < contigSize ; k+=N ) out.println(zeroString); - } - } - // by now we scrolled to the right contig - - chunkStart = 1; // reset chunk start - } - - // if our read is past the boundary of the current chunk, print old count(s) - // (for the current chunk and all chunks we may have skipped altogether) and reinitialize: - while ( chunkStart+N < read.getAlignmentStart() ) { - out.printf("%d%n", count); // print old count - count = 0; - chunkStart += N; - } - count++; - return 1; - } - - @Override - public Integer reduce(Integer value, Integer sum) { - return value+sum; - } - - @Override - public Integer reduceInit() { - return 0; - } - - @Override - public void onTraversalDone(Integer result) { - out.printf("%d%n", count); // print count from the last chunk - super.onTraversalDone(result); - - } - - -} diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/coverage/DepthOfCoverageWalker.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/coverage/DepthOfCoverageWalker.java index 664c319ab..cbbb3d43f 100644 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/coverage/DepthOfCoverageWalker.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/coverage/DepthOfCoverageWalker.java @@ -32,6 +32,7 @@ import org.broadinstitute.sting.gatk.contexts.AlignmentContext; import org.broadinstitute.sting.gatk.contexts.ReferenceContext; import org.broadinstitute.sting.gatk.refdata.RefMetaDataTracker; import org.broadinstitute.sting.gatk.refdata.SeekableRODIterator; +import org.broadinstitute.sting.utils.SampleUtils; import org.broadinstitute.sting.utils.codecs.refseq.RefSeqCodec; import org.broadinstitute.sting.utils.codecs.refseq.RefSeqFeature; import org.broadinstitute.sting.gatk.refdata.tracks.RMDTrack; @@ -112,6 +113,7 @@ import java.util.*; // todo -- allow for user to set linear binning (default is logarithmic) // todo 
-- formatting --> do something special for end bins in getQuantile(int[] foo), this gets mushed into the end+-1 bins for now @By(DataSource.REFERENCE) +@PartitionBy(PartitionType.INTERVAL) public class DepthOfCoverageWalker extends LocusWalker>, CoveragePartitioner> implements TreeReducible { @Output @Multiplex(value=DoCOutputMultiplexer.class,arguments={"partitionTypes","refSeqGeneList","omitDepthOutput","omitIntervals","omitSampleSummary","omitLocusTable"}) @@ -281,20 +283,14 @@ public class DepthOfCoverageWalker extends LocusWalker getSamplesFromToolKit(DoCOutputType.Partition type) { HashSet partition = new HashSet(); if ( type == DoCOutputType.Partition.sample ) { - for ( Set sampleSet : getToolkit().getSamplesByReaders() ) { - for ( String s : sampleSet ) { - partition.add(s); - } - } + partition.addAll(SampleUtils.getSAMFileSamples(getToolkit())); } else if ( type == DoCOutputType.Partition.readgroup ) { for ( SAMReadGroupRecord rg : getToolkit().getSAMFileHeader().getReadGroups() ) { partition.add(rg.getSample()+"_rg_"+rg.getReadGroupId()); } } else if ( type == DoCOutputType.Partition.library ) { - for ( Set libraries : getToolkit().getLibrariesByReaders() ) { - for ( String l : libraries ) { - partition.add(l); - } + for ( SAMReadGroupRecord rg : getToolkit().getSAMFileHeader().getReadGroups() ) { + partition.add(rg.getLibrary()); } } else if ( type == DoCOutputType.Partition.center ) { for ( SAMReadGroupRecord rg : getToolkit().getSAMFileHeader().getReadGroups() ) { diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/coverage/GCContentByIntervalWalker.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/coverage/GCContentByIntervalWalker.java index 5c2a967b9..17b17764b 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/coverage/GCContentByIntervalWalker.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/coverage/GCContentByIntervalWalker.java @@ -42,12 +42,12 @@ import java.util.List; * *

Input

*

- * One or more BAM files. + * A reference file *

* *

Output

*

- * GC content calculations per interval. + * GC content calculations per interval. *

* *

Examples

@@ -56,7 +56,6 @@ import java.util.List; * -R ref.fasta \ * -T GCContentByInterval \ * -o output.txt \ - * -I input.bam \ * -L input.intervals * * diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/diagnostics/ReadLengthDistribution.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/diagnostics/ReadLengthDistribution.java index 0f1cea2e1..2d88baf3f 100644 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/diagnostics/ReadLengthDistribution.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/diagnostics/ReadLengthDistribution.java @@ -1,13 +1,13 @@ package org.broadinstitute.sting.gatk.walkers.diagnostics; import net.sf.samtools.SAMReadGroupRecord; -import net.sf.samtools.SAMRecord; import org.broadinstitute.sting.commandline.Output; import org.broadinstitute.sting.gatk.contexts.ReferenceContext; import org.broadinstitute.sting.gatk.refdata.ReadMetaDataTracker; import org.broadinstitute.sting.gatk.report.GATKReport; import org.broadinstitute.sting.gatk.report.GATKReportTable; import org.broadinstitute.sting.gatk.walkers.ReadWalker; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; import java.io.PrintStream; import java.util.List; @@ -69,12 +69,12 @@ public class ReadLengthDistribution extends ReadWalker { } - public boolean filter(ReferenceContext ref, SAMRecord read) { + public boolean filter(ReferenceContext ref, GATKSAMRecord read) { return ( !read.getReadPairedFlag() || read.getReadPairedFlag() && read.getFirstOfPairFlag()); } @Override - public Integer map(ReferenceContext referenceContext, SAMRecord samRecord, ReadMetaDataTracker readMetaDataTracker) { + public Integer map(ReferenceContext referenceContext, GATKSAMRecord samRecord, ReadMetaDataTracker readMetaDataTracker) { GATKReportTable table = report.getTable("ReadLengthDistribution"); int length = Math.abs(samRecord.getReadLength()); diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/diffengine/DiffObjectsWalker.java 
b/public/java/src/org/broadinstitute/sting/gatk/walkers/diffengine/DiffObjectsWalker.java index 5889d19e5..04437fdd1 100644 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/diffengine/DiffObjectsWalker.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/diffengine/DiffObjectsWalker.java @@ -219,10 +219,10 @@ public class DiffObjectsWalker extends RodWalker { @Override public void onTraversalDone(Integer sum) { - out.printf("Reading master file %s%n", masterFile); + //out.printf("Reading master file %s%n", masterFile); DiffElement master = diffEngine.createDiffableFromFile(masterFile, MAX_OBJECTS_TO_READ); out.printf(" Read %d objects%n", master.size()); - out.printf("Reading test file %s%n", testFile); + //out.printf("Reading test file %s%n", testFile); DiffElement test = diffEngine.createDiffableFromFile(testFile, MAX_OBJECTS_TO_READ); out.printf(" Read %d objects%n", test.size()); diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/AlleleFrequencyCalculationModel.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/AlleleFrequencyCalculationModel.java index 70f3c6a1a..35a9fe31d 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/AlleleFrequencyCalculationModel.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/AlleleFrequencyCalculationModel.java @@ -33,6 +33,7 @@ import org.broadinstitute.sting.utils.variantcontext.Genotype; import org.broadinstitute.sting.utils.variantcontext.VariantContext; import java.io.PrintStream; +import java.util.List; import java.util.Map; import java.util.Set; @@ -67,16 +68,12 @@ public abstract class AlleleFrequencyCalculationModel implements Cloneable { /** * Must be overridden by concrete subclasses - * @param tracker rod data - * @param ref reference context * @param GLs genotype likelihoods * @param Alleles Alleles corresponding to GLs * @param log10AlleleFrequencyPriors priors * @param log10AlleleFrequencyPosteriors 
array (pre-allocated) to store results */ - protected abstract void getLog10PNonRef(RefMetaDataTracker tracker, - ReferenceContext ref, - Map GLs, Set Alleles, + protected abstract void getLog10PNonRef(Map GLs, List Alleles, double[] log10AlleleFrequencyPriors, double[] log10AlleleFrequencyPosteriors); diff --git a/public/java/src/org/broadinstitute/sting/utils/genotype/DiploidGenotype.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/DiploidGenotype.java similarity index 98% rename from public/java/src/org/broadinstitute/sting/utils/genotype/DiploidGenotype.java rename to public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/DiploidGenotype.java index 1c2cfe2e1..b5987963f 100755 --- a/public/java/src/org/broadinstitute/sting/utils/genotype/DiploidGenotype.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/DiploidGenotype.java @@ -23,7 +23,7 @@ * THE USE OR OTHER DEALINGS IN THE SOFTWARE. */ -package org.broadinstitute.sting.utils.genotype; +package org.broadinstitute.sting.gatk.walkers.genotyper; import org.broadinstitute.sting.utils.BaseUtils; @@ -34,7 +34,7 @@ import org.broadinstitute.sting.utils.BaseUtils; * Time: 6:46:09 PM * To change this template use File | Settings | File Templates. 
*/ -public enum DiploidGenotype { +enum DiploidGenotype { AA ('A', 'A'), AC ('A', 'C'), AG ('A', 'G'), diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/DiploidIndelGenotypePriors.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/DiploidIndelGenotypePriors.java index 696a74de8..d8c911092 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/DiploidIndelGenotypePriors.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/DiploidIndelGenotypePriors.java @@ -2,7 +2,6 @@ package org.broadinstitute.sting.gatk.walkers.genotyper; import org.broadinstitute.sting.gatk.walkers.indels.HaplotypeIndelErrorModel; import org.broadinstitute.sting.utils.MathUtils; -import org.broadinstitute.sting.utils.genotype.DiploidGenotype; /** * Created by IntelliJ IDEA. diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/DiploidSNPGenotypeLikelihoods.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/DiploidSNPGenotypeLikelihoods.java index 5f6865d04..666fe88a3 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/DiploidSNPGenotypeLikelihoods.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/DiploidSNPGenotypeLikelihoods.java @@ -27,14 +27,16 @@ package org.broadinstitute.sting.gatk.walkers.genotyper; import net.sf.samtools.SAMUtils; import org.broadinstitute.sting.utils.BaseUtils; +import org.broadinstitute.sting.utils.fragments.FragmentCollection; +import org.broadinstitute.sting.utils.fragments.FragmentUtils; import org.broadinstitute.sting.utils.MathUtils; import org.broadinstitute.sting.utils.QualityUtils; import org.broadinstitute.sting.utils.exceptions.UserException; -import org.broadinstitute.sting.utils.genotype.DiploidGenotype; -import org.broadinstitute.sting.utils.pileup.FragmentPileup; import org.broadinstitute.sting.utils.pileup.PileupElement; import 
org.broadinstitute.sting.utils.pileup.ReadBackedPileup; +import java.util.List; + import static java.lang.Math.log10; import static java.lang.Math.pow; @@ -260,35 +262,42 @@ public class DiploidSNPGenotypeLikelihoods implements Cloneable { int n = 0; // for each fragment, add to the likelihoods - FragmentPileup fpile = new FragmentPileup(pileup); + FragmentCollection fpile = pileup.toFragments(); - for ( PileupElement p : fpile.getOneReadPileup() ) + for ( PileupElement p : fpile.getSingletonReads() ) n += add(p, ignoreBadBases, capBaseQualsAtMappingQual, minBaseQual); - for ( FragmentPileup.TwoReadPileupElement twoRead : fpile.getTwoReadPileup() ) - n += add(twoRead, ignoreBadBases, capBaseQualsAtMappingQual, minBaseQual); + for ( List overlappingPair : fpile.getOverlappingPairs() ) + n += add(overlappingPair, ignoreBadBases, capBaseQualsAtMappingQual, minBaseQual); return n; } + public int add(PileupElement elt, boolean ignoreBadBases, boolean capBaseQualsAtMappingQual, int minBaseQual) { byte obsBase = elt.getBase(); if ( elt.isReducedRead() ) { // reduced read representation - byte qual = elt.getReducedQual(); - add(obsBase, qual, (byte)0, (byte)0, elt.getReducedCount()); // fast calculation of n identical likelihoods - return elt.getReducedCount(); // we added nObs bases here + byte qual = elt.getQual(); + if ( BaseUtils.isRegularBase( elt.getBase() )) { + add(obsBase, qual, (byte)0, (byte)0, elt.getRepresentativeCount()); // fast calculation of n identical likelihoods + return elt.getRepresentativeCount(); // we added nObs bases here + } else // odd bases or deletions => don't use them + return 0; } else { byte qual = qualToUse(elt, ignoreBadBases, capBaseQualsAtMappingQual, minBaseQual); return qual > 0 ? 
add(obsBase, qual, (byte)0, (byte)0, 1) : 0; } } - public int add(FragmentPileup.TwoReadPileupElement twoRead, boolean ignoreBadBases, boolean capBaseQualsAtMappingQual, int minBaseQual) { - final byte observedBase1 = twoRead.getFirst().getBase(); - final byte qualityScore1 = qualToUse(twoRead.getFirst(), ignoreBadBases, capBaseQualsAtMappingQual, minBaseQual); - final byte observedBase2 = twoRead.getSecond().getBase(); - final byte qualityScore2 = qualToUse(twoRead.getSecond(), ignoreBadBases, capBaseQualsAtMappingQual, minBaseQual); + public int add(List overlappingPair, boolean ignoreBadBases, boolean capBaseQualsAtMappingQual, int minBaseQual) { + final PileupElement p1 = overlappingPair.get(0); + final PileupElement p2 = overlappingPair.get(1); + + final byte observedBase1 = p1.getBase(); + final byte qualityScore1 = qualToUse(p1, ignoreBadBases, capBaseQualsAtMappingQual, minBaseQual); + final byte observedBase2 = p2.getBase(); + final byte qualityScore2 = qualToUse(p2, ignoreBadBases, capBaseQualsAtMappingQual, minBaseQual); if ( qualityScore1 == 0 ) { if ( qualityScore2 == 0 ) // abort early if we didn't see any good bases diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/DiploidSNPGenotypePriors.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/DiploidSNPGenotypePriors.java index b9ed17d3e..71854591f 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/DiploidSNPGenotypePriors.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/DiploidSNPGenotypePriors.java @@ -26,7 +26,6 @@ package org.broadinstitute.sting.gatk.walkers.genotyper; import org.broadinstitute.sting.utils.MathUtils; -import org.broadinstitute.sting.utils.genotype.DiploidGenotype; import java.util.Arrays; diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/ExactAFCalculationModel.java 
b/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/ExactAFCalculationModel.java index 6ae437b27..1c2d82ab7 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/ExactAFCalculationModel.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/ExactAFCalculationModel.java @@ -29,90 +29,37 @@ import org.apache.log4j.Logger; import org.broadinstitute.sting.gatk.contexts.ReferenceContext; import org.broadinstitute.sting.gatk.refdata.RefMetaDataTracker; import org.broadinstitute.sting.utils.MathUtils; -import org.broadinstitute.sting.utils.SimpleTimer; import org.broadinstitute.sting.utils.Utils; import org.broadinstitute.sting.utils.exceptions.UserException; import org.broadinstitute.sting.utils.variantcontext.Allele; import org.broadinstitute.sting.utils.variantcontext.Genotype; import org.broadinstitute.sting.utils.variantcontext.VariantContext; -import sun.reflect.generics.reflectiveObjects.NotImplementedException; import java.io.PrintStream; -import java.util.ArrayList; -import java.util.HashMap; -import java.util.Map; -import java.util.Set; +import java.util.*; public class ExactAFCalculationModel extends AlleleFrequencyCalculationModel { // // code for testing purposes // private final static boolean DEBUG = false; - private final static boolean PRINT_LIKELIHOODS = false; - private final static int N_CYCLES = 1; - private SimpleTimer timerExpt = new SimpleTimer("linearExactBanded"); - private SimpleTimer timerGS = new SimpleTimer("linearExactGS"); - private final static boolean COMPARE_TO_GS = false; - - public enum ExactCalculation { - N2_GOLD_STANDARD, - LINEAR_EXPERIMENTAL - } - private final static double MAX_LOG10_ERROR_TO_STOP_EARLY = 6; // we want the calculation to be accurate to 1 / 10^6 - - private boolean SIMPLE_GREEDY_GENOTYPER = false; - + private final boolean SIMPLE_GREEDY_GENOTYPER = false; private final static double SUM_GL_THRESH_NOCALL = -0.001; // if sum(gl) is bigger than this threshold, 
we treat GL's as non-informative and will force a no-call. - final private ExactCalculation calcToUse; protected ExactAFCalculationModel(UnifiedArgumentCollection UAC, int N, Logger logger, PrintStream verboseWriter) { super(UAC, N, logger, verboseWriter); - calcToUse = UAC.EXACT_CALCULATION_TYPE; } - public void getLog10PNonRef(RefMetaDataTracker tracker, - ReferenceContext ref, - Map GLs, Setalleles, + public void getLog10PNonRef(Map GLs, List alleles, double[] log10AlleleFrequencyPriors, double[] log10AlleleFrequencyPosteriors) { - // todo -- REMOVE ME AFTER TESTING - // todo -- REMOVE ME AFTER TESTING - // todo -- REMOVE ME AFTER TESTING - double[] gsPosteriors; - if ( COMPARE_TO_GS ) // due to annoying special values in incoming array, we have to clone up here - gsPosteriors = log10AlleleFrequencyPosteriors.clone(); - - int idxAA = GenotypeType.AA.ordinal(); - int idxAB = GenotypeType.AB.ordinal(); - int idxBB = GenotypeType.BB.ordinal(); - - // todo -- remove me after testing - if ( N_CYCLES > 1 ) { - for ( int i = 0; i < N_CYCLES; i++) { - timerGS.restart(); - linearExact(GLs, log10AlleleFrequencyPriors, log10AlleleFrequencyPosteriors.clone(), idxAA, idxAB, idxBB); - timerGS.stop(); - - timerExpt.restart(); - linearExactBanded(GLs, log10AlleleFrequencyPriors, log10AlleleFrequencyPosteriors.clone()); - timerExpt.stop(); - } - - System.out.printf("good = %.2f, expt = %.2f, delta = %.2f%n", - timerGS.getElapsedTime(), timerExpt.getElapsedTime(), timerExpt.getElapsedTime()-timerGS.getElapsedTime()); - } - - int lastK = -1; - - int numAlleles = alleles.size(); + final int numAlleles = alleles.size(); + final double[][] posteriorCache = numAlleles > 2 ? new double[numAlleles-1][] : null; + final double[] bestAFguess = numAlleles > 2 ? 
new double[numAlleles-1] : null; int idxDiag = numAlleles; int incr = numAlleles - 1; - - double[][] posteriorCache = new double[numAlleles-1][]; - double[] bestAFguess = new double[numAlleles-1]; - for (int k=1; k < numAlleles; k++) { // multi-allelic approximation, part 1: Ideally // for each alt allele compute marginal (suboptimal) posteriors - @@ -121,24 +68,17 @@ public class ExactAFCalculationModel extends AlleleFrequencyCalculationModel { // So, for example, with 2 alt alleles, likelihoods have AA,AB,AC,BB,BC,CC. // 3 alt alleles: AA,AB,AC,AD BB BC BD CC CD DD - idxAA = 0; - idxAB = k; + final int idxAA = 0; + final int idxAB = k; // yy is always element on the diagonal. // 2 alleles: BBelement 2 // 3 alleles: BB element 3. CC element 5 // 4 alleles: - idxBB = idxDiag; + final int idxBB = idxDiag; idxDiag += incr--; - // todo - possible cleanup - switch ( calcToUse ) { - case N2_GOLD_STANDARD: - lastK = gdaN2GoldStandard(GLs, log10AlleleFrequencyPriors, log10AlleleFrequencyPosteriors, idxAA, idxAB, idxBB); - break; - case LINEAR_EXPERIMENTAL: - lastK = linearExact(GLs, log10AlleleFrequencyPriors, log10AlleleFrequencyPosteriors, idxAA, idxAB, idxBB); - break; - } + final int lastK = linearExact(GLs, log10AlleleFrequencyPriors, log10AlleleFrequencyPosteriors, idxAA, idxAB, idxBB); + if (numAlleles > 2) { posteriorCache[k-1] = log10AlleleFrequencyPosteriors.clone(); bestAFguess[k-1] = (double)MathUtils.maxElementIndex(log10AlleleFrequencyPosteriors); @@ -153,39 +93,14 @@ public class ExactAFCalculationModel extends AlleleFrequencyCalculationModel { log10AlleleFrequencyPosteriors[k] = (posteriorCache[mostLikelyAlleleIdx][k]); } - // todo -- REMOVE ME AFTER TESTING - // todo -- REMOVE ME AFTER TESTING - // todo -- REMOVE ME AFTER TESTING - if ( COMPARE_TO_GS ) { - gdaN2GoldStandard(GLs, log10AlleleFrequencyPriors, gsPosteriors, idxAA, idxAB, idxBB); - - double log10thisPVar = Math.log10(MathUtils.normalizeFromLog10(log10AlleleFrequencyPosteriors)[0]); - double 
log10gsPVar = Math.log10(MathUtils.normalizeFromLog10(gsPosteriors)[0]); - boolean eq = (log10thisPVar == Double.NEGATIVE_INFINITY && log10gsPVar == Double.NEGATIVE_INFINITY) || MathUtils.compareDoubles(log10thisPVar, log10gsPVar, 1e-4) == 0; - - if ( ! eq || PRINT_LIKELIHOODS ) { - System.out.printf("----------------------------------------%n"); - for (int k=0; k < log10AlleleFrequencyPosteriors.length; k++) { - double x = log10AlleleFrequencyPosteriors[k]; - System.out.printf(" %d\t%.2f\t%.2f\t%b%n", k, - x < -1e10 ? Double.NEGATIVE_INFINITY : x, gsPosteriors[k], - log10AlleleFrequencyPosteriors[k] == gsPosteriors[k]); - } - System.out.printf("MAD_AC\t%d\t%d\t%.2f\t%.2f\t%.6f%n", - ref.getLocus().getStart(), lastK, log10thisPVar, log10gsPVar, log10thisPVar - log10gsPVar); - } - } - } private static final ArrayList getGLs(Map GLs) { ArrayList genotypeLikelihoods = new ArrayList(); - //int j = 0; genotypeLikelihoods.add(new double[]{0.0,0.0,0.0}); // dummy for ( Genotype sample : GLs.values() ) { if ( sample.hasLikelihoods() ) { - //double[] genotypeLikelihoods = MathUtils.normalizeFromLog10(GLs.get(sample).getLikelihoods()); double[] gls = sample.getLikelihoods().getAsVector(); if (MathUtils.sum(gls) < SUM_GL_THRESH_NOCALL) @@ -240,84 +155,6 @@ public class ExactAFCalculationModel extends AlleleFrequencyCalculationModel { } } - // now with banding - public int linearExactBanded(Map GLs, - double[] log10AlleleFrequencyPriors, - double[] log10AlleleFrequencyPosteriors) { - throw new NotImplementedException(); -// final int numSamples = GLs.size(); -// final int numChr = 2*numSamples; -// final double[][] genotypeLikelihoods = getGLs(GLs); -// -// final ExactACCache logY = new ExactACCache(numSamples+1); -// logY.getkMinus0()[0] = 0.0; // the zero case -// -// double maxLog10L = Double.NEGATIVE_INFINITY; -// boolean done = false; -// int lastK = -1; -// final int BAND_SIZE = 10; -// -// for (int k=0; k <= numChr && ! 
done; k++ ) { -// final double[] kMinus0 = logY.getkMinus0(); -// int jStart = Math.max(k - BAND_SIZE, 1); -// int jStop = Math.min(k + BAND_SIZE, numSamples); -// -// if ( k == 0 ) { // special case for k = 0 -// for ( int j=1; j <= numSamples; j++ ) { -// kMinus0[j] = kMinus0[j-1] + genotypeLikelihoods[j][GenotypeType.AA.ordinal()]; -// } -// } else { // k > 0 -// final double[] kMinus1 = logY.getkMinus1(); -// final double[] kMinus2 = logY.getkMinus2(); -// Arrays.fill(kMinus0,0); -// -// for ( int j = jStart; j <= jStop; j++ ) { -// final double[] gl = genotypeLikelihoods[j]; -// final double logDenominator = log10Cache[2*j] + log10Cache[2*j-1]; -// -// double aa = Double.NEGATIVE_INFINITY; -// double ab = Double.NEGATIVE_INFINITY; -// if (k < 2*j-1) -// aa = log10Cache[2*j-k] + log10Cache[2*j-k-1] + kMinus0[j-1] + gl[GenotypeType.AA.ordinal()]; -// -// if (k < 2*j) -// ab = log10Cache[2*k] + log10Cache[2*j-k]+ kMinus1[j-1] + gl[GenotypeType.AB.ordinal()]; -// -// double log10Max; -// if (k > 1) { -// final double bb = log10Cache[k] + log10Cache[k-1] + kMinus2[j-1] + gl[GenotypeType.BB.ordinal()]; -// log10Max = approximateLog10SumLog10(aa, ab, bb); -// } else { -// // we know we aren't considering the BB case, so we can use an optimized log10 function -// log10Max = approximateLog10SumLog10(aa, ab); -// } -// -// // finally, update the L(j,k) value -// kMinus0[j] = log10Max - logDenominator; -// -// String offset = Utils.dupString(' ',k); -// System.out.printf("%s%3d %3d %.2f%n", offset, k, j, kMinus0[j]); -// } -// } -// -// // update the posteriors vector -// final double log10LofK = kMinus0[jStop]; -// log10AlleleFrequencyPosteriors[k] = log10LofK + log10AlleleFrequencyPriors[k]; -// -// // can we abort early? 
-// lastK = k; -// maxLog10L = Math.max(maxLog10L, log10LofK); -// if ( log10LofK < maxLog10L - MAX_LOG10_ERROR_TO_STOP_EARLY ) { -// if ( DEBUG ) System.out.printf(" *** breaking early k=%d log10L=%.2f maxLog10L=%.2f%n", k, log10LofK, maxLog10L); -// done = true; -// } -// -// logY.rotate(); -// } -// -// return lastK; - } - public int linearExact(Map GLs, double[] log10AlleleFrequencyPriors, double[] log10AlleleFrequencyPosteriors, int idxAA, int idxAB, int idxBB) { @@ -605,82 +442,6 @@ public class ExactAFCalculationModel extends AlleleFrequencyCalculationModel { return calls; } - // ------------------------------------------------------------------------------------- - // - // Gold standard, but O(N^2), implementation. - // - // TODO -- remove me for clarity in this code - // - // ------------------------------------------------------------------------------------- - public int gdaN2GoldStandard(Map GLs, - double[] log10AlleleFrequencyPriors, - double[] log10AlleleFrequencyPosteriors, int idxAA, int idxAB, int idxBB) { - int numSamples = GLs.size(); - int numChr = 2*numSamples; - - double[][] logYMatrix = new double[1+numSamples][1+numChr]; - - for (int i=0; i <=numSamples; i++) - for (int j=0; j <=numChr; j++) - logYMatrix[i][j] = Double.NEGATIVE_INFINITY; - - //YMatrix[0][0] = 1.0; - logYMatrix[0][0] = 0.0; - int j=0; - - for ( Map.Entry sample : GLs.entrySet() ) { - j++; - - if ( !sample.getValue().hasLikelihoods() ) - continue; - - //double[] genotypeLikelihoods = MathUtils.normalizeFromLog10(GLs.get(sample).getLikelihoods()); - double[] genotypeLikelihoods = sample.getValue().getLikelihoods().getAsVector(); - //double logDenominator = Math.log10(2.0*j*(2.0*j-1)); - double logDenominator = MathUtils.log10Cache[2*j] + MathUtils.log10Cache[2*j-1]; - - // special treatment for k=0: iteration reduces to: - //YMatrix[j][0] = YMatrix[j-1][0]*genotypeLikelihoods[GenotypeType.AA.ordinal()]; - logYMatrix[j][0] = logYMatrix[j-1][0] + genotypeLikelihoods[idxAA]; - - 
for (int k=1; k <= 2*j; k++ ) { - - //double num = (2.0*j-k)*(2.0*j-k-1)*YMatrix[j-1][k] * genotypeLikelihoods[GenotypeType.AA.ordinal()]; - double logNumerator[]; - logNumerator = new double[3]; - if (k < 2*j-1) - logNumerator[0] = MathUtils.log10Cache[2*j-k] + MathUtils.log10Cache[2*j-k-1] + logYMatrix[j-1][k] + - genotypeLikelihoods[idxAA]; - else - logNumerator[0] = Double.NEGATIVE_INFINITY; - - - if (k < 2*j) - logNumerator[1] = MathUtils.log10Cache[2*k] + MathUtils.log10Cache[2*j-k]+ logYMatrix[j-1][k-1] + - genotypeLikelihoods[idxAB]; - else - logNumerator[1] = Double.NEGATIVE_INFINITY; - - if (k > 1) - logNumerator[2] = MathUtils.log10Cache[k] + MathUtils.log10Cache[k-1] + logYMatrix[j-1][k-2] + - genotypeLikelihoods[idxBB]; - else - logNumerator[2] = Double.NEGATIVE_INFINITY; - - double logNum = MathUtils.softMax(logNumerator); - - //YMatrix[j][k] = num/den; - logYMatrix[j][k] = logNum - logDenominator; - } - - } - - for (int k=0; k <= numChr; k++) - log10AlleleFrequencyPosteriors[k] = logYMatrix[j][k] + log10AlleleFrequencyPriors[k]; - - return numChr; - } - private final static void printLikelihoods(int numChr, double[][] logYMatrix, double[] log10AlleleFrequencyPriors) { int j = logYMatrix.length - 1; System.out.printf("-----------------------------------%n"); @@ -689,5 +450,4 @@ public class ExactAFCalculationModel extends AlleleFrequencyCalculationModel { System.out.printf(" %4d\t%8.2f\t%8.2f\t%8.2f%n", k, logYMatrix[j][k], log10AlleleFrequencyPriors[k], posterior); } } - } diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/GenotypeLikelihoodsCalculationModel.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/GenotypeLikelihoodsCalculationModel.java index 60dfe4fe7..489e963e8 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/GenotypeLikelihoodsCalculationModel.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/GenotypeLikelihoodsCalculationModel.java @@ 
-53,7 +53,7 @@ public abstract class GenotypeLikelihoodsCalculationModel implements Cloneable { } public enum GENOTYPING_MODE { - /** the default; the Unified Genotyper will choose the most likely alternate allele */ + /** the Unified Genotyper will choose the most likely alternate allele */ DISCOVERY, /** only the alleles passed in from a VCF rod bound to the -alleles argument will be used for genotyping */ GENOTYPE_GIVEN_ALLELES diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/GridSearchAFEstimation.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/GridSearchAFEstimation.java index 10b646d63..27842a8bf 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/GridSearchAFEstimation.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/GridSearchAFEstimation.java @@ -52,9 +52,7 @@ public class GridSearchAFEstimation extends AlleleFrequencyCalculationModel { AFMatrix = new AlleleFrequencyMatrix(N); } - protected void getLog10PNonRef(RefMetaDataTracker tracker, - ReferenceContext ref, - Map GLs, Setalleles, + protected void getLog10PNonRef(Map GLs, List alleles, double[] log10AlleleFrequencyPriors, double[] log10AlleleFrequencyPosteriors) { initializeAFMatrix(GLs); diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/IndelGenotypeLikelihoodsCalculationModel.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/IndelGenotypeLikelihoodsCalculationModel.java index ec5eefd60..aea63b61d 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/IndelGenotypeLikelihoodsCalculationModel.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/IndelGenotypeLikelihoodsCalculationModel.java @@ -30,14 +30,11 @@ import org.broadinstitute.sting.gatk.contexts.AlignmentContext; import org.broadinstitute.sting.gatk.contexts.AlignmentContextUtils; import org.broadinstitute.sting.gatk.contexts.ReferenceContext; import 
org.broadinstitute.sting.gatk.refdata.RefMetaDataTracker; -import org.broadinstitute.sting.gatk.walkers.indels.HaplotypeIndelErrorModel; import org.broadinstitute.sting.gatk.walkers.indels.PairHMMIndelErrorModel; import org.broadinstitute.sting.utils.BaseUtils; import org.broadinstitute.sting.utils.GenomeLoc; -import org.broadinstitute.sting.utils.MathUtils; -import org.broadinstitute.sting.utils.collections.Pair; +import org.broadinstitute.sting.utils.Haplotype; import org.broadinstitute.sting.utils.exceptions.StingException; -import org.broadinstitute.sting.utils.genotype.Haplotype; import org.broadinstitute.sting.utils.pileup.ExtendedEventPileupElement; import org.broadinstitute.sting.utils.pileup.PileupElement; import org.broadinstitute.sting.utils.pileup.ReadBackedExtendedEventPileup; @@ -72,9 +69,6 @@ public class IndelGenotypeLikelihoodsCalculationModel extends GenotypeLikelihood // gdebug removeme // todo -cleanup - private HaplotypeIndelErrorModel model; - private boolean useOldWrongHorribleHackedUpLikelihoodModel = false; -// private GenomeLoc lastSiteVisited; private ArrayList alleleList; @@ -85,26 +79,8 @@ public class IndelGenotypeLikelihoodsCalculationModel extends GenotypeLikelihood protected IndelGenotypeLikelihoodsCalculationModel(UnifiedArgumentCollection UAC, Logger logger) { super(UAC, logger); - if (UAC.GSA_PRODUCTION_ONLY == false) { - pairModel = new PairHMMIndelErrorModel(UAC.INDEL_GAP_OPEN_PENALTY,UAC.INDEL_GAP_CONTINUATION_PENALTY, - UAC.OUTPUT_DEBUG_INDEL_INFO, UAC.DO_CONTEXT_DEPENDENT_PENALTIES, UAC.dovit, UAC.GET_GAP_PENALTIES_FROM_DATA, UAC.INDEL_RECAL_FILE); - useOldWrongHorribleHackedUpLikelihoodModel = false; - } - else { - useOldWrongHorribleHackedUpLikelihoodModel = true; - double INSERTION_START_PROBABILITY = 1e-3; - - double INSERTION_END_PROBABILITY = 0.5; - - double ALPHA_DELETION_PROBABILITY = 1e-3; - - - model = new HaplotypeIndelErrorModel(3, INSERTION_START_PROBABILITY, - 
INSERTION_END_PROBABILITY,ALPHA_DELETION_PROBABILITY,UAC.INDEL_HAPLOTYPE_SIZE, false, UAC.OUTPUT_DEBUG_INDEL_INFO); - } - pairModel = new PairHMMIndelErrorModel(UAC.INDEL_GAP_OPEN_PENALTY,UAC.INDEL_GAP_CONTINUATION_PENALTY, - UAC.OUTPUT_DEBUG_INDEL_INFO, UAC.DO_CONTEXT_DEPENDENT_PENALTIES, UAC.dovit, UAC.GET_GAP_PENALTIES_FROM_DATA, UAC.INDEL_RECAL_FILE); + UAC.OUTPUT_DEBUG_INDEL_INFO, UAC.BANDED_INDEL_COMPUTATION); alleleList = new ArrayList(); getAlleleListFromVCF = UAC.GenotypingMode == GENOTYPING_MODE.GENOTYPE_GIVEN_ALLELES; minIndelCountForGenotyping = UAC.MIN_INDEL_COUNT_FOR_GENOTYPING; @@ -123,10 +99,6 @@ public class IndelGenotypeLikelihoodsCalculationModel extends GenotypeLikelihood GenomeLoc loc = ref.getLocus(); ArrayList aList = new ArrayList(); - if (DEBUG) { - System.out.println("'''''''''''''''''''''"); - System.out.println("Loc:"+loc.toString()); - } HashMap consensusIndelStrings = new HashMap(); int insCount = 0, delCount = 0; @@ -160,12 +132,12 @@ public class IndelGenotypeLikelihoodsCalculationModel extends GenotypeLikelihood continue; } - if (DEBUG && p.isIndel()) { +/* if (DEBUG && p.isIndel()) { System.out.format("Read: %s, cigar: %s, aln start: %d, aln end: %d, p.len:%d, Type:%s, EventBases:%s\n", read.getReadName(),read.getCigar().toString(),read.getAlignmentStart(),read.getAlignmentEnd(), p.getEventLength(),p.getType().toString(), p.getEventBases()); } - + */ String indelString = p.getEventBases(); if (p.isInsertion()) { @@ -235,7 +207,7 @@ public class IndelGenotypeLikelihoodsCalculationModel extends GenotypeLikelihood } } - if (DEBUG) { +/* if (DEBUG) { int icount = indelPileup.getNumberOfInsertions(); int dcount = indelPileup.getNumberOfDeletions(); if (icount + dcount > 0) @@ -249,7 +221,7 @@ public class IndelGenotypeLikelihoodsCalculationModel extends GenotypeLikelihood } System.out.println(); } - } + } */ } int maxAlleleCnt = 0; @@ -260,8 +232,8 @@ public class IndelGenotypeLikelihoodsCalculationModel extends GenotypeLikelihood 
maxAlleleCnt = curCnt; bestAltAllele = s; } - if (DEBUG) - System.out.format("Key:%s, number: %d\n",s,consensusIndelStrings.get(s) ); +// if (DEBUG) +// System.out.format("Key:%s, number: %d\n",s,consensusIndelStrings.get(s) ); } //gdebug- if (maxAlleleCnt < minIndelCountForGenotyping) @@ -384,20 +356,13 @@ public class IndelGenotypeLikelihoodsCalculationModel extends GenotypeLikelihood } } } - int eventLength = altAllele.getBaseString().length() - refAllele.getBaseString().length(); - int hsize = (int)ref.getWindow().size()-Math.abs(eventLength)-1; - int numPrefBases= ref.getLocus().getStart()-ref.getWindow().getStart()+1; - if (useOldWrongHorribleHackedUpLikelihoodModel) { - numPrefBases = 20; - hsize=80; - } - if (DEBUG) - System.out.format("hsize: %d eventLength: %d refSize: %d, locStart: %d numpr: %d\n",hsize,eventLength, - (int)ref.getWindow().size(), loc.getStart(), numPrefBases); - //System.out.println(eventLength); - haplotypeMap = Haplotype.makeHaplotypeListFromAlleles( alleleList, loc.getStart(), - ref, hsize, numPrefBases); + final int eventLength = altAllele.getBaseString().length() - refAllele.getBaseString().length(); + final int hsize = (int)ref.getWindow().size()-Math.abs(eventLength)-1; + final int numPrefBases= ref.getLocus().getStart()-ref.getWindow().getStart()+1; + + haplotypeMap = Haplotype.makeHaplotypeListFromAlleles(alleleList, loc.getStart(), + ref, hsize, numPrefBases); // For each sample, get genotype likelihoods based on pileup // compute prior likelihoods on haplotypes, and initialize haplotype likelihood matrix with them. 
@@ -414,13 +379,7 @@ public class IndelGenotypeLikelihoodsCalculationModel extends GenotypeLikelihood pileup = context.getBasePileup(); if (pileup != null ) { - double[] genotypeLikelihoods; - - if (useOldWrongHorribleHackedUpLikelihoodModel) - genotypeLikelihoods = model.computeReadHaplotypeLikelihoods( pileup, haplotypeMap); - else - genotypeLikelihoods = pairModel.computeReadHaplotypeLikelihoods( pileup, haplotypeMap, ref, eventLength, getIndelLikelihoodMap()); - + final double[] genotypeLikelihoods = pairModel.computeReadHaplotypeLikelihoods( pileup, haplotypeMap, ref, eventLength, getIndelLikelihoodMap()); GLs.put(sample.getKey(), new MultiallelicGenotypeLikelihoods(sample.getKey(), alleleList, diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/MultiallelicGenotypeLikelihoods.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/MultiallelicGenotypeLikelihoods.java index 3652763de..4f378b24a 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/MultiallelicGenotypeLikelihoods.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/MultiallelicGenotypeLikelihoods.java @@ -4,6 +4,7 @@ import org.broadinstitute.sting.utils.exceptions.StingException; import org.broadinstitute.sting.utils.variantcontext.Allele; import java.util.ArrayList; +import java.util.List; /** * Created by IntelliJ IDEA. 
@@ -15,11 +16,11 @@ import java.util.ArrayList; public class MultiallelicGenotypeLikelihoods { private String sample; private double[] GLs; - private ArrayList alleleList; + private List alleleList; private int depth; public MultiallelicGenotypeLikelihoods(String sample, - ArrayList A, + List A, double[] log10Likelihoods, int depth) { /* Check for consistency between likelihood vector and number of alleles */ int numAlleles = A.size(); @@ -40,7 +41,7 @@ public class MultiallelicGenotypeLikelihoods { return GLs; } - public ArrayList getAlleles() { + public List getAlleles() { return alleleList; } diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/SNPGenotypeLikelihoodsCalculationModel.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/SNPGenotypeLikelihoodsCalculationModel.java index 6905ce4a4..9bdc754e9 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/SNPGenotypeLikelihoodsCalculationModel.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/SNPGenotypeLikelihoodsCalculationModel.java @@ -31,9 +31,9 @@ import org.broadinstitute.sting.gatk.contexts.AlignmentContextUtils; import org.broadinstitute.sting.gatk.contexts.ReferenceContext; import org.broadinstitute.sting.gatk.refdata.RefMetaDataTracker; import org.broadinstitute.sting.utils.BaseUtils; +import org.broadinstitute.sting.utils.MathUtils; import org.broadinstitute.sting.utils.baq.BAQ; import org.broadinstitute.sting.utils.exceptions.StingException; -import org.broadinstitute.sting.utils.genotype.DiploidGenotype; import org.broadinstitute.sting.utils.pileup.PileupElement; import org.broadinstitute.sting.utils.pileup.ReadBackedPileup; import org.broadinstitute.sting.utils.pileup.ReadBackedPileupImpl; @@ -122,8 +122,10 @@ public class SNPGenotypeLikelihoodsCalculationModel extends GenotypeLikelihoodsC aList.add(refAllele); aList.add(altAllele); double[] dlike = new 
double[]{likelihoods[refGenotype.ordinal()],likelihoods[hetGenotype.ordinal()],likelihoods[homGenotype.ordinal()]} ; + + // normalize in log space so that max element is zero. GLs.put(sample.getKey(), new MultiallelicGenotypeLikelihoods(sample.getKey(), - aList, dlike, getFilteredDepth(pileup))); + aList, MathUtils.normalizeFromLog10(dlike, false, true), getFilteredDepth(pileup))); } return refAllele; diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/UGCallVariants.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/UGCallVariants.java index 500b11360..d88e55687 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/UGCallVariants.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/UGCallVariants.java @@ -30,7 +30,6 @@ import org.broadinstitute.sting.commandline.Output; import org.broadinstitute.sting.commandline.RodBinding; import org.broadinstitute.sting.gatk.contexts.AlignmentContext; import org.broadinstitute.sting.gatk.contexts.ReferenceContext; -import org.broadinstitute.sting.gatk.datasources.rmd.ReferenceOrderedDataSource; import org.broadinstitute.sting.gatk.refdata.RefMetaDataTracker; import org.broadinstitute.sting.gatk.walkers.RodWalker; import org.broadinstitute.sting.utils.SampleUtils; diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/UnifiedArgumentCollection.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/UnifiedArgumentCollection.java index 7b8045581..07d9892a1 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/UnifiedArgumentCollection.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/UnifiedArgumentCollection.java @@ -31,8 +31,6 @@ import org.broadinstitute.sting.commandline.Input; import org.broadinstitute.sting.commandline.RodBinding; import org.broadinstitute.sting.utils.variantcontext.VariantContext; -import java.io.File; - public class 
UnifiedArgumentCollection { @@ -103,18 +101,13 @@ public class UnifiedArgumentCollection { @Argument(fullName = "assume_single_sample_reads", shortName = "single_sample", doc = "The single sample that we should assume is represented in the input bam (and therefore associate with all reads regardless of whether they have read groups)", required = false) public String ASSUME_SINGLE_SAMPLE = null; - // TODO -- delete me - @Hidden - @Argument(fullName = "abort_at_too_much_coverage", doc = "Don't call a site if the downsampled coverage is greater than this value", required = false) - public int COVERAGE_AT_WHICH_TO_ABORT = -1; - - // control the various parameters to be used + /** + * The minimum confidence needed in a given base for it to be used in variant calling. Note that the base quality of a base + * is capped by the mapping quality so that bases on reads with low mapping quality may get filtered out depending on this value. + */ @Argument(fullName = "min_base_quality_score", shortName = "mbq", doc = "Minimum base quality required to consider a base for calling", required = false) public int MIN_BASE_QUALTY_SCORE = 17; - @Argument(fullName = "min_mapping_quality_score", shortName = "mmq", doc = "Minimum read mapping quality required to consider a read for calling", required = false) - public int MIN_MAPPING_QUALTY_SCORE = 20; - @Argument(fullName = "max_deletion_fraction", shortName = "deletions", doc = "Maximum fraction of reads with deletions spanning this locus for it to be callable [to disable, set to < 0 or > 1; default:0.05]", required = false) public Double MAX_DELETION_FRACTION = 0.05; @@ -143,47 +136,28 @@ public class UnifiedArgumentCollection { @Hidden @Argument(fullName = "indelHaplotypeSize", shortName = "indelHSize", doc = "Indel haplotype size", required = false) public int INDEL_HAPLOTYPE_SIZE = 80; - @Hidden - @Argument(fullName = "doContextDependentGapPenalties", shortName = "doCDP", doc = "Vary gap penalties by context", required = false) - 
public boolean DO_CONTEXT_DEPENDENT_PENALTIES = true; + //gdebug+ // experimental arguments, NOT TO BE USED BY ANYONE WHOSE INITIALS AREN'T GDA!!! +// @Hidden +// @Argument(fullName = "getGapPenaltiesFromData", shortName = "dataGP", doc = "Vary gap penalties by context - EXPERIMENTAL, DO NO USE", required = false) +// public boolean GET_GAP_PENALTIES_FROM_DATA = false; +// +// @Hidden +// @Argument(fullName="indel_recal_file", shortName="recalFile", required=false, doc="Filename for the input covariates table recalibration .csv file - EXPERIMENTAL, DO NO USE") +// public File INDEL_RECAL_FILE = new File("indel.recal_data.csv"); @Hidden - @Argument(fullName = "getGapPenaltiesFromData", shortName = "dataGP", doc = "Vary gap penalties by context - EXPERIMENTAL, DO NO USE", required = false) - public boolean GET_GAP_PENALTIES_FROM_DATA = false; - - @Hidden - @Argument(fullName="indel_recal_file", shortName="recalFile", required=false, doc="Filename for the input covariates table recalibration .csv file - EXPERIMENTAL, DO NO USE") - public File INDEL_RECAL_FILE = new File("indel.recal_data.csv"); + @Argument(fullName = "bandedIndel", shortName = "bandedIndel", doc = "Banded Indel likelihood computation", required = false) + public boolean BANDED_INDEL_COMPUTATION = false; @Hidden @Argument(fullName = "indelDebug", shortName = "indelDebug", doc = "Output indel debug info", required = false) public boolean OUTPUT_DEBUG_INDEL_INFO = false; - @Hidden - @Argument(fullName = "dovit", shortName = "dovit", doc = "Perform full Viterbi calculation when evaluating the HMM", required = false) - public boolean dovit = false; - - @Hidden - @Argument(fullName = "GSA_PRODUCTION_ONLY", shortName = "GSA_PRODUCTION_ONLY", doc = "don't ever use me", required = false) - public boolean GSA_PRODUCTION_ONLY = false; - - @Hidden - @Argument(fullName = "exactCalculation", shortName = "exactCalculation", doc = "expt", required = false) - public ExactAFCalculationModel.ExactCalculation 
EXACT_CALCULATION_TYPE = ExactAFCalculationModel.ExactCalculation.LINEAR_EXPERIMENTAL; - @Hidden @Argument(fullName = "ignoreSNPAlleles", shortName = "ignoreSNPAlleles", doc = "expt", required = false) public boolean IGNORE_SNP_ALLELES = false; - @Deprecated - @Argument(fullName="output_all_callable_bases", shortName="all_bases", doc="Please use --output_mode EMIT_ALL_SITES instead" ,required=false) - private Boolean ALL_BASES_DEPRECATED = false; - - @Deprecated - @Argument(fullName="genotype", shortName="genotype", doc="Please use --output_mode EMIT_ALL_CONFIDENT_SITES instead" ,required=false) - private Boolean GENOTYPE_DEPRECATED = false; - // Developers must remember to add any newly added arguments to the list here as well otherwise they won't get changed from their default value! public UnifiedArgumentCollection clone() { @@ -191,7 +165,6 @@ public class UnifiedArgumentCollection { uac.GLmodel = GLmodel; uac.AFmodel = AFmodel; - uac.EXACT_CALCULATION_TYPE = EXACT_CALCULATION_TYPE; uac.heterozygosity = heterozygosity; uac.PCR_error = PCR_error; uac.GenotypingMode = GenotypingMode; @@ -201,7 +174,6 @@ public class UnifiedArgumentCollection { uac.STANDARD_CONFIDENCE_FOR_CALLING = STANDARD_CONFIDENCE_FOR_CALLING; uac.STANDARD_CONFIDENCE_FOR_EMITTING = STANDARD_CONFIDENCE_FOR_EMITTING; uac.MIN_BASE_QUALTY_SCORE = MIN_BASE_QUALTY_SCORE; - uac.MIN_MAPPING_QUALTY_SCORE = MIN_MAPPING_QUALTY_SCORE; uac.MAX_DELETION_FRACTION = MAX_DELETION_FRACTION; uac.MIN_INDEL_COUNT_FOR_GENOTYPING = MIN_INDEL_COUNT_FOR_GENOTYPING; uac.INDEL_HETEROZYGOSITY = INDEL_HETEROZYGOSITY; @@ -209,17 +181,11 @@ public class UnifiedArgumentCollection { uac.INDEL_GAP_CONTINUATION_PENALTY = INDEL_GAP_CONTINUATION_PENALTY; uac.OUTPUT_DEBUG_INDEL_INFO = OUTPUT_DEBUG_INDEL_INFO; uac.INDEL_HAPLOTYPE_SIZE = INDEL_HAPLOTYPE_SIZE; - uac.DO_CONTEXT_DEPENDENT_PENALTIES = DO_CONTEXT_DEPENDENT_PENALTIES; uac.alleles = alleles; - uac.GET_GAP_PENALTIES_FROM_DATA = GET_GAP_PENALTIES_FROM_DATA; - 
uac.INDEL_RECAL_FILE = INDEL_RECAL_FILE; // todo- arguments to remove - uac.COVERAGE_AT_WHICH_TO_ABORT = COVERAGE_AT_WHICH_TO_ABORT; - uac.dovit = dovit; - uac.GSA_PRODUCTION_ONLY = GSA_PRODUCTION_ONLY; uac.IGNORE_SNP_ALLELES = IGNORE_SNP_ALLELES; - + uac.BANDED_INDEL_COMPUTATION = BANDED_INDEL_COMPUTATION; return uac; } diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/UnifiedGenotyper.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/UnifiedGenotyper.java index 9fdf65015..72dc217e1 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/UnifiedGenotyper.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/UnifiedGenotyper.java @@ -149,6 +149,13 @@ public class UnifiedGenotyper extends LocusWalker annotationsToUse = new ArrayList(); + /** + * Which annotations to exclude from output in the VCF file. Note that this argument has higher priority than the -A or -G arguments, + * so annotations will be excluded even if they are explicitly included with the other options. + */ + @Argument(fullName="excludeAnnotation", shortName="XA", doc="One or more specific annotations to exclude", required=false) + protected List annotationsToExclude = new ArrayList(); + /** * Which groups of annotations to add to the output VCF file. See the VariantAnnotator -list argument to view available groups. 
*/ @@ -210,7 +217,7 @@ public class UnifiedGenotyper extends LocusWalker(samples); // note that, because we cap the base quality by the mapping quality, minMQ cannot be less than minBQ this.UAC = UAC.clone(); - this.UAC.MIN_MAPPING_QUALTY_SCORE = Math.max(UAC.MIN_MAPPING_QUALTY_SCORE, UAC.MIN_BASE_QUALTY_SCORE); this.logger = logger; this.verboseWriter = verboseWriter; @@ -146,9 +145,6 @@ public class UnifiedGenotyperEngine { * @return the VariantCallContext object */ public VariantCallContext calculateLikelihoodsAndGenotypes(RefMetaDataTracker tracker, ReferenceContext refContext, AlignmentContext rawContext) { - if ( UAC.COVERAGE_AT_WHICH_TO_ABORT > 0 && rawContext.size() > UAC.COVERAGE_AT_WHICH_TO_ABORT ) - return null; - final GenotypeLikelihoodsCalculationModel.Model model = getCurrentGLModel(tracker, refContext, rawContext ); if( model == null ) { return (UAC.OutputMode == OUTPUT_MODE.EMIT_ALL_SITES && UAC.GenotypingMode == GenotypeLikelihoodsCalculationModel.GENOTYPING_MODE.GENOTYPE_GIVEN_ALLELES ? 
generateEmptyContext(tracker, refContext, null, rawContext) : null); @@ -325,7 +321,7 @@ public class UnifiedGenotyperEngine { // 'zero' out the AFs (so that we don't have to worry if not all samples have reads at this position) clearAFarray(log10AlleleFrequencyPosteriors.get()); - afcm.get().getLog10PNonRef(tracker, refContext, vc.getGenotypes(), vc.getAlleles(), getAlleleFrequencyPriors(model), log10AlleleFrequencyPosteriors.get()); + afcm.get().getLog10PNonRef(vc.getGenotypes(), vc.getAlleles(), getAlleleFrequencyPriors(model), log10AlleleFrequencyPosteriors.get()); // find the most likely frequency int bestAFguess = MathUtils.maxElementIndex(log10AlleleFrequencyPosteriors.get()); @@ -383,7 +379,7 @@ public class UnifiedGenotyperEngine { // the overall lod VariantContext vcOverall = calculateLikelihoods(tracker, refContext, stratifiedContexts, AlignmentContextUtils.ReadOrientation.COMPLETE, vc.getAlternateAllele(0), false, model); clearAFarray(log10AlleleFrequencyPosteriors.get()); - afcm.get().getLog10PNonRef(tracker, refContext, vcOverall.getGenotypes(), vc.getAlleles(), getAlleleFrequencyPriors(model), log10AlleleFrequencyPosteriors.get()); + afcm.get().getLog10PNonRef(vcOverall.getGenotypes(), vc.getAlleles(), getAlleleFrequencyPriors(model), log10AlleleFrequencyPosteriors.get()); //double overallLog10PofNull = log10AlleleFrequencyPosteriors.get()[0]; double overallLog10PofF = MathUtils.log10sumLog10(log10AlleleFrequencyPosteriors.get(), 1); //if ( DEBUG_SLOD ) System.out.println("overallLog10PofF=" + overallLog10PofF); @@ -391,7 +387,7 @@ public class UnifiedGenotyperEngine { // the forward lod VariantContext vcForward = calculateLikelihoods(tracker, refContext, stratifiedContexts, AlignmentContextUtils.ReadOrientation.FORWARD, vc.getAlternateAllele(0), false, model); clearAFarray(log10AlleleFrequencyPosteriors.get()); - afcm.get().getLog10PNonRef(tracker, refContext, vcForward.getGenotypes(), vc.getAlleles(), getAlleleFrequencyPriors(model), 
log10AlleleFrequencyPosteriors.get()); + afcm.get().getLog10PNonRef(vcForward.getGenotypes(), vc.getAlleles(), getAlleleFrequencyPriors(model), log10AlleleFrequencyPosteriors.get()); //double[] normalizedLog10Posteriors = MathUtils.normalizeFromLog10(log10AlleleFrequencyPosteriors.get(), true); double forwardLog10PofNull = log10AlleleFrequencyPosteriors.get()[0]; double forwardLog10PofF = MathUtils.log10sumLog10(log10AlleleFrequencyPosteriors.get(), 1); @@ -400,7 +396,7 @@ public class UnifiedGenotyperEngine { // the reverse lod VariantContext vcReverse = calculateLikelihoods(tracker, refContext, stratifiedContexts, AlignmentContextUtils.ReadOrientation.REVERSE, vc.getAlternateAllele(0), false, model); clearAFarray(log10AlleleFrequencyPosteriors.get()); - afcm.get().getLog10PNonRef(tracker, refContext, vcReverse.getGenotypes(), vc.getAlleles(), getAlleleFrequencyPriors(model), log10AlleleFrequencyPosteriors.get()); + afcm.get().getLog10PNonRef(vcReverse.getGenotypes(), vc.getAlleles(), getAlleleFrequencyPriors(model), log10AlleleFrequencyPosteriors.get()); //normalizedLog10Posteriors = MathUtils.normalizeFromLog10(log10AlleleFrequencyPosteriors.get(), true); double reverseLog10PofNull = log10AlleleFrequencyPosteriors.get()[0]; double reverseLog10PofF = MathUtils.log10sumLog10(log10AlleleFrequencyPosteriors.get(), 1); @@ -423,7 +419,7 @@ public class UnifiedGenotyperEngine { int endLoc = calculateEndPos(vc.getAlleles(), vc.getReference(), loc); - Set myAlleles = vc.getAlleles(); + Set myAlleles = new HashSet(vc.getAlleles()); // strip out the alternate allele if it's a ref call if ( bestAFguess == 0 && UAC.GenotypingMode == GenotypeLikelihoodsCalculationModel.GENOTYPING_MODE.DISCOVERY ) { myAlleles = new HashSet(1); @@ -447,7 +443,79 @@ public class UnifiedGenotyperEngine { return new VariantCallContext(vcCall, confidentlyCalled(phredScaledConfidence, PofF)); } - private int calculateEndPos(Set alleles, Allele refAllele, GenomeLoc loc) { + // A barebones entry point 
to the exact model when there is no tracker or stratified contexts available -- only GLs + public VariantCallContext calculateGenotypes(final VariantContext vc, final GenomeLoc loc, final GenotypeLikelihoodsCalculationModel.Model model) { + + // initialize the data for this thread if that hasn't been done yet + if ( afcm.get() == null ) { + log10AlleleFrequencyPosteriors.set(new double[N+1]); + afcm.set(getAlleleFrequencyCalculationObject(N, logger, verboseWriter, UAC)); + } + + // estimate our confidence in a reference call and return + if ( vc.getNSamples() == 0 ) + return null; + + // 'zero' out the AFs (so that we don't have to worry if not all samples have reads at this position) + clearAFarray(log10AlleleFrequencyPosteriors.get()); + afcm.get().getLog10PNonRef(vc.getGenotypes(), vc.getAlleles(), getAlleleFrequencyPriors(model), log10AlleleFrequencyPosteriors.get()); + + // find the most likely frequency + int bestAFguess = MathUtils.maxElementIndex(log10AlleleFrequencyPosteriors.get()); + + // calculate p(f>0) + double[] normalizedPosteriors = MathUtils.normalizeFromLog10(log10AlleleFrequencyPosteriors.get()); + double sum = 0.0; + for (int i = 1; i <= N; i++) + sum += normalizedPosteriors[i]; + double PofF = Math.min(sum, 1.0); // deal with precision errors + + double phredScaledConfidence; + if ( bestAFguess != 0 || UAC.GenotypingMode == GenotypeLikelihoodsCalculationModel.GENOTYPING_MODE.GENOTYPE_GIVEN_ALLELES ) { + phredScaledConfidence = QualityUtils.phredScaleErrorRate(normalizedPosteriors[0]); + if ( Double.isInfinite(phredScaledConfidence) ) + phredScaledConfidence = -10.0 * log10AlleleFrequencyPosteriors.get()[0]; + } else { + phredScaledConfidence = QualityUtils.phredScaleErrorRate(PofF); + if ( Double.isInfinite(phredScaledConfidence) ) { + sum = 0.0; + for (int i = 1; i <= N; i++) { + if ( log10AlleleFrequencyPosteriors.get()[i] == AlleleFrequencyCalculationModel.VALUE_NOT_CALCULATED ) + break; + sum += log10AlleleFrequencyPosteriors.get()[i]; + } 
+ phredScaledConfidence = (MathUtils.compareDoubles(sum, 0.0) == 0 ? 0 : -10.0 * sum); + } + } + + // return a null call if we don't pass the confidence cutoff or the most likely allele frequency is zero + if ( UAC.OutputMode != OUTPUT_MODE.EMIT_ALL_SITES && !passesEmitThreshold(phredScaledConfidence, bestAFguess) ) { + // technically, at this point our confidence in a reference call isn't accurately estimated + // because it didn't take into account samples with no data, so let's get a better estimate + return null; + } + + // create the genotypes + Map genotypes = afcm.get().assignGenotypes(vc, log10AlleleFrequencyPosteriors.get(), bestAFguess); + + // *** note that calculating strand bias involves overwriting data structures, so we do that last + HashMap attributes = new HashMap(); + + int endLoc = calculateEndPos(vc.getAlleles(), vc.getReference(), loc); + + Set myAlleles = new HashSet(vc.getAlleles()); + // strip out the alternate allele if it's a ref call + if ( bestAFguess == 0 && UAC.GenotypingMode == GenotypeLikelihoodsCalculationModel.GENOTYPING_MODE.DISCOVERY ) { + myAlleles = new HashSet(1); + myAlleles.add(vc.getReference()); + } + VariantContext vcCall = new VariantContext("UG_call", loc.getContig(), loc.getStart(), endLoc, + myAlleles, genotypes, phredScaledConfidence/10.0, passesCallThreshold(phredScaledConfidence) ? 
null : filter, attributes, vc.getReferenceBaseForIndel()); + + return new VariantCallContext(vcCall, confidentlyCalled(phredScaledConfidence, PofF)); + } + + private int calculateEndPos(Collection alleles, Allele refAllele, GenomeLoc loc) { // TODO - temp fix until we can deal with extended events properly // for indels, stop location is one more than ref allele length boolean isSNP = true, hasNullAltAllele = false; @@ -494,10 +562,10 @@ public class UnifiedGenotyperEngine { if (UAC.GenotypingMode == GenotypeLikelihoodsCalculationModel.GENOTYPING_MODE.GENOTYPE_GIVEN_ALLELES) { // regular pileup in this case - ReadBackedPileup pileup = rawContext.getBasePileup() .getMappingFilteredPileup(UAC.MIN_MAPPING_QUALTY_SCORE); + ReadBackedPileup pileup = rawContext.getBasePileup() .getMappingFilteredPileup(UAC.MIN_BASE_QUALTY_SCORE); // don't call when there is no coverage - if ( pileup.size() == 0 && UAC.OutputMode != OUTPUT_MODE.EMIT_ALL_SITES ) + if ( pileup.getNumberOfElements() == 0 && UAC.OutputMode != OUTPUT_MODE.EMIT_ALL_SITES ) return null; // stratify the AlignmentContext and cut by sample @@ -511,10 +579,10 @@ public class UnifiedGenotyperEngine { ReadBackedExtendedEventPileup rawPileup = rawContext.getExtendedEventPileup(); // filter the context based on min mapping quality - ReadBackedExtendedEventPileup pileup = rawPileup.getMappingFilteredPileup(UAC.MIN_MAPPING_QUALTY_SCORE); + ReadBackedExtendedEventPileup pileup = rawPileup.getMappingFilteredPileup(UAC.MIN_BASE_QUALTY_SCORE); // don't call when there is no coverage - if ( pileup.size() == 0 && UAC.OutputMode != OUTPUT_MODE.EMIT_ALL_SITES ) + if ( pileup.getNumberOfElements() == 0 && UAC.OutputMode != OUTPUT_MODE.EMIT_ALL_SITES ) return null; // stratify the AlignmentContext and cut by sample @@ -530,7 +598,7 @@ public class UnifiedGenotyperEngine { for( final PileupElement p : rawContext.getBasePileup() ) { if( p.isDeletion() ) { numDeletions++; } } - if( ((double) numDeletions) / ((double) 
rawContext.getBasePileup().size()) > UAC.MAX_DELETION_FRACTION ) { + if( ((double) numDeletions) / ((double) rawContext.getBasePileup().getNumberOfElements()) > UAC.MAX_DELETION_FRACTION ) { return null; } } @@ -544,6 +612,21 @@ public class UnifiedGenotyperEngine { AFs[i] = AlleleFrequencyCalculationModel.VALUE_NOT_CALCULATED; } + private final static double[] binomialProbabilityDepthCache = new double[10000]; + static { + for ( int i = 1; i < binomialProbabilityDepthCache.length; i++ ) { + binomialProbabilityDepthCache[i] = MathUtils.binomialProbability(0, i, 0.5); + } + } + + private final double getRefBinomialProb(final int depth) { + if ( depth < binomialProbabilityDepthCache.length ) + return binomialProbabilityDepthCache[depth]; + else + return MathUtils.binomialProbability(0, depth, 0.5); + } + + private VariantCallContext estimateReferenceConfidence(VariantContext vc, Map contexts, double theta, boolean ignoreCoveredSamples, double initialPofRef) { if ( contexts == null ) return null; @@ -562,12 +645,12 @@ public class UnifiedGenotyperEngine { if (isCovered) { AlignmentContext context = contexts.get(sample); if (context.hasBasePileup()) - depth = context.getBasePileup().size(); + depth = context.getBasePileup().depthOfCoverage(); else if (context.hasExtendedEventPileup()) - depth = context.getExtendedEventPileup().size(); + depth = context.getExtendedEventPileup().depthOfCoverage(); } - P_of_ref *= 1.0 - (theta / 2.0) * MathUtils.binomialProbability(0, depth, 0.5); + P_of_ref *= 1.0 - (theta / 2.0) * getRefBinomialProb(depth); } return new VariantCallContext(vc, QualityUtils.phredScaleErrorRate(1.0 - P_of_ref) >= UAC.STANDARD_CONFIDENCE_FOR_CALLING, false); diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/indels/ConstrainedMateFixingManager.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/indels/ConstrainedMateFixingManager.java index adb7c4c38..3dd51fa7d 100755 --- 
a/public/java/src/org/broadinstitute/sting/gatk/walkers/indels/ConstrainedMateFixingManager.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/indels/ConstrainedMateFixingManager.java @@ -9,6 +9,7 @@ import org.apache.log4j.Logger; import org.broadinstitute.sting.utils.GenomeLoc; import org.broadinstitute.sting.utils.GenomeLocParser; import org.broadinstitute.sting.utils.exceptions.UserException; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; import java.util.*; @@ -180,8 +181,8 @@ public class ConstrainedMateFixingManager { addRead(newRead, readWasModified, true); } - public void addReads(List newReads, Set modifiedReads) { - for ( SAMRecord newRead : newReads ) + public void addReads(List newReads, Set modifiedReads) { + for ( GATKSAMRecord newRead : newReads ) addRead(newRead, modifiedReads.contains(newRead), false); } diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/indels/HaplotypeIndelErrorModel.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/indels/HaplotypeIndelErrorModel.java index e68aa31e0..3b3f54b05 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/indels/HaplotypeIndelErrorModel.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/indels/HaplotypeIndelErrorModel.java @@ -26,9 +26,9 @@ package org.broadinstitute.sting.gatk.walkers.indels; import net.sf.samtools.SAMRecord; +import org.broadinstitute.sting.utils.Haplotype; import org.broadinstitute.sting.utils.MathUtils; import org.broadinstitute.sting.utils.QualityUtils; -import org.broadinstitute.sting.utils.genotype.Haplotype; import org.broadinstitute.sting.utils.pileup.ReadBackedPileup; import org.broadinstitute.sting.utils.sam.ReadUtils; import org.broadinstitute.sting.utils.variantcontext.Allele; @@ -73,7 +73,7 @@ public class HaplotypeIndelErrorModel { baseMatchArray = new double[MAX_CACHED_QUAL+1]; baseMismatchArray = new double[MAX_CACHED_QUAL+1]; for (int k=1; k <= MAX_CACHED_QUAL; k++) { - double baseProb = 
QualityUtils.qualToProb(k); + double baseProb = QualityUtils.qualToProb((byte)k); baseMatchArray[k] = probToQual(baseProb); diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/indels/IndelRealigner.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/indels/IndelRealigner.java index 36e4db1c5..ba031c497 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/indels/IndelRealigner.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/indels/IndelRealigner.java @@ -30,9 +30,9 @@ import net.sf.samtools.*; import net.sf.samtools.util.RuntimeIOException; import net.sf.samtools.util.SequenceUtil; import net.sf.samtools.util.StringUtil; +import org.broad.tribble.Feature; import org.broadinstitute.sting.commandline.*; import org.broadinstitute.sting.gatk.GenomeAnalysisEngine; -import org.broadinstitute.sting.gatk.arguments.ValidationExclusion; import org.broadinstitute.sting.gatk.contexts.ReferenceContext; import org.broadinstitute.sting.gatk.io.StingSAMFileWriter; import org.broadinstitute.sting.gatk.refdata.ReadMetaDataTracker; @@ -46,11 +46,8 @@ import org.broadinstitute.sting.utils.exceptions.ReviewedStingException; import org.broadinstitute.sting.utils.exceptions.StingException; import org.broadinstitute.sting.utils.exceptions.UserException; import org.broadinstitute.sting.utils.fasta.CachingIndexedFastaSequenceFile; -import org.broadinstitute.sting.utils.interval.IntervalFileMergingIterator; -import org.broadinstitute.sting.utils.interval.IntervalMergingRule; -import org.broadinstitute.sting.utils.interval.IntervalUtils; -import org.broadinstitute.sting.utils.interval.NwayIntervalMergingIterator; import org.broadinstitute.sting.utils.sam.AlignmentUtils; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; import org.broadinstitute.sting.utils.sam.NWaySAMFileWriter; import org.broadinstitute.sting.utils.sam.ReadUtils; import org.broadinstitute.sting.utils.text.TextFormattingUtils; @@ -138,14 +135,14 @@ public class 
IndelRealigner extends ReadWalker { * Any number of VCF files representing known indels to be used for constructing alternate consenses. * Could be e.g. dbSNP and/or official 1000 Genomes indel calls. Non-indel variants in these files will be ignored. */ - @Input(fullName="known", shortName = "known", doc="Input VCF file(s) with known indels", required=false) + @Input(fullName="knownAlleles", shortName = "known", doc="Input VCF file(s) with known indels", required=false) public List> known = Collections.emptyList(); /** * The interval list output from the RealignerTargetCreator tool using the same bam(s), reference, and known indel file(s). */ @Input(fullName="targetIntervals", shortName="targetIntervals", doc="intervals file output from RealignerTargetCreator", required=true) - protected String intervalsFile = null; + protected IntervalBinding intervalsFile = null; /** * This term is equivalent to "significance" - i.e. is the improvement significant enough to merit realignment? Note that this number @@ -230,14 +227,6 @@ public class IndelRealigner extends ReadWalker { @Argument(fullName="noOriginalAlignmentTags", shortName="noTags", required=false, doc="Don't output the original cigar or alignment start tags for each realigned read in the output bam") protected boolean NO_ORIGINAL_ALIGNMENT_TAGS = false; - /** - * For expert users only! This tool assumes that the target interval list is sorted; if the list turns out to be unsorted, it will throw an exception. - * Use this argument when your interval list is not sorted to instruct the Realigner to first sort it in memory. - */ - @Advanced - @Argument(fullName="targetIntervalsAreNotSorted", shortName="targetNotSorted", required=false, doc="The target intervals are not sorted") - protected boolean TARGET_NOT_SORTED = false; - /** * Reads from all input files will be realigned together, but then each read will be saved in the output file corresponding to the input file that * the read came from. 
There are two ways to generate output bam file names: 1) if the value of this argument is a general string (e.g. '.cleaned.bam'), @@ -263,6 +252,12 @@ public class IndelRealigner extends ReadWalker { doc="Don't output the usual PG tag in the realigned bam file header. FOR DEBUGGING PURPOSES ONLY. This option is required in order to pass integration tests.") protected boolean NO_PG_TAG = false; + @Hidden + @Argument(fullName="keepPGTags", shortName="keepPG", required=false, + doc="Keep older PG tags left in the bam header by previous runs of this tool (by default, all these "+ + "historical tags will be replaced by the latest tag generated in the current run).") + protected boolean KEEP_ALL_PG_RECORDS = false; + @Hidden @Output(fullName="indelsFileForDebugging", shortName="indels", required=false, doc="Output file (text) for the indels found; FOR DEBUGGING PURPOSES ONLY") protected String OUT_INDELS = null; @@ -287,10 +282,10 @@ public class IndelRealigner extends ReadWalker { // the reads and known indels that fall into the current interval private final ReadBin readsToClean = new ReadBin(); - private final ArrayList readsNotToClean = new ArrayList(); + private final ArrayList readsNotToClean = new ArrayList(); private final ArrayList knownIndelsToTry = new ArrayList(); private final HashSet indelRodsSeen = new HashSet(); - private final HashSet readsActuallyCleaned = new HashSet(); + private final HashSet readsActuallyCleaned = new HashSet(); private static final int MAX_QUAL = 99; @@ -367,48 +362,23 @@ public class IndelRealigner extends ReadWalker { catch(FileNotFoundException ex) { throw new UserException.CouldNotReadInputFile(getToolkit().getArguments().referenceFile,ex); } - - if ( !TARGET_NOT_SORTED ) { - NwayIntervalMergingIterator merger = new NwayIntervalMergingIterator(IntervalMergingRule.OVERLAPPING_ONLY); - List rawIntervals = new ArrayList(); - // separate argument on semicolon first - for (String fileOrInterval : intervalsFile.split(";")) { - // if 
it's a file, add items to raw interval list - if (IntervalUtils.isIntervalFile(fileOrInterval)) { - merger.add(new IntervalFileMergingIterator( getToolkit().getGenomeLocParser(), new java.io.File(fileOrInterval), IntervalMergingRule.OVERLAPPING_ONLY ) ); - } else { - rawIntervals.add(getToolkit().getGenomeLocParser().parseGenomeLoc(fileOrInterval)); - } - } - if ( ! rawIntervals.isEmpty() ) merger.add(rawIntervals.iterator()); - // prepare to read intervals one-by-one, as needed (assuming they are sorted). - intervals = merger; - } else { - // read in the whole list of intervals for cleaning - boolean allowEmptyIntervalList = (getToolkit().getArguments().unsafe == ValidationExclusion.TYPE.ALLOW_EMPTY_INTERVAL_LIST || - getToolkit().getArguments().unsafe == ValidationExclusion.TYPE.ALL); - GenomeLocSortedSet locs = IntervalUtils.sortAndMergeIntervals(getToolkit().getGenomeLocParser(), - IntervalUtils.parseIntervalArguments(getToolkit().getGenomeLocParser(),Arrays.asList(intervalsFile),allowEmptyIntervalList), - IntervalMergingRule.OVERLAPPING_ONLY); - intervals = locs.iterator(); - } + intervals = intervalsFile.getIntervals(getToolkit()).iterator(); + currentInterval = intervals.hasNext() ? 
intervals.next() : null; writerToUse = writer; if ( N_WAY_OUT != null ) { - // Map args = getToolkit().getArguments().walkerArgs; boolean createIndex = true; - // if ( args.containsKey("disable_bam_indexing") ) { System.out.println("NO INDEXING!!"); System.exit(1); createIndex = false; } - if ( N_WAY_OUT.toUpperCase().endsWith(".MAP") ) { - writerToUse = new NWaySAMFileWriter(getToolkit(),loadFileNameMap(N_WAY_OUT),SAMFileHeader.SortOrder.coordinate,true, createIndex, generateMD5s); + writerToUse = new NWaySAMFileWriter(getToolkit(),loadFileNameMap(N_WAY_OUT), + SAMFileHeader.SortOrder.coordinate,true, createIndex, generateMD5s,createProgramRecord(),KEEP_ALL_PG_RECORDS); } else { - writerToUse = new NWaySAMFileWriter(getToolkit(),N_WAY_OUT,SAMFileHeader.SortOrder.coordinate,true, createIndex, generateMD5s); + writerToUse = new NWaySAMFileWriter(getToolkit(),N_WAY_OUT,SAMFileHeader.SortOrder.coordinate,true, + createIndex, generateMD5s,createProgramRecord(),KEEP_ALL_PG_RECORDS); } - } else { // set up the output writer @@ -448,18 +418,12 @@ public class IndelRealigner extends ReadWalker { private void setupWriter(SAMFileHeader header) { if ( !NO_PG_TAG ) { - final SAMProgramRecord programRecord = new SAMProgramRecord(PROGRAM_RECORD_NAME); - final ResourceBundle headerInfo = TextFormattingUtils.loadResourceBundle("StingText"); - try { - final String version = headerInfo.getString("org.broadinstitute.sting.gatk.version"); - programRecord.setProgramVersion(version); - } catch (MissingResourceException e) {} - programRecord.setCommandLine(getToolkit().createApproximateCommandLineArgumentString(getToolkit(), this)); + final SAMProgramRecord programRecord = createProgramRecord(); List oldRecords = header.getProgramRecords(); List newRecords = new ArrayList(oldRecords.size()+1); for ( SAMProgramRecord record : oldRecords ) { - if ( !record.getId().startsWith(PROGRAM_RECORD_NAME) ) + if ( !record.getId().startsWith(PROGRAM_RECORD_NAME) || KEEP_ALL_PG_RECORDS ) 
newRecords.add(record); } newRecords.add(programRecord); @@ -470,6 +434,20 @@ public class IndelRealigner extends ReadWalker { writer.setPresorted(true); } + + private SAMProgramRecord createProgramRecord() { + if ( NO_PG_TAG ) return null; + + final SAMProgramRecord programRecord = new SAMProgramRecord(PROGRAM_RECORD_NAME); + final ResourceBundle headerInfo = TextFormattingUtils.loadResourceBundle("StingText"); + try { + final String version = headerInfo.getString("org.broadinstitute.sting.gatk.version"); + programRecord.setProgramVersion(version); + } catch (MissingResourceException e) {} + programRecord.setCommandLine(getToolkit().createApproximateCommandLineArgumentString(getToolkit(), this)); + return programRecord; + } + private void emit(final SAMRecord read) { // check to see whether the read was modified by looking at the temporary tag @@ -492,7 +470,7 @@ public class IndelRealigner extends ReadWalker { readsActuallyCleaned.clear(); } - public Integer map(ReferenceContext ref, SAMRecord read, ReadMetaDataTracker metaDataTracker) { + public Integer map(ReferenceContext ref, GATKSAMRecord read, ReadMetaDataTracker metaDataTracker) { if ( currentInterval == null ) { emit(read); return 0; @@ -558,7 +536,7 @@ public class IndelRealigner extends ReadWalker { // TODO -- it would be nice if we could use indels from 454 reads as alternate consenses } - private void cleanAndCallMap(ReferenceContext ref, SAMRecord read, ReadMetaDataTracker metaDataTracker, GenomeLoc readLoc) { + private void cleanAndCallMap(ReferenceContext ref, GATKSAMRecord read, ReadMetaDataTracker metaDataTracker, GenomeLoc readLoc) { if ( readsToClean.size() > 0 ) { GenomeLoc earliestPossibleMove = getToolkit().getGenomeLocParser().createGenomeLoc(readsToClean.getReads().get(0)); if ( manager.canMoveReads(earliestPossibleMove) ) @@ -574,7 +552,7 @@ public class IndelRealigner extends ReadWalker { } while ( currentInterval != null && (readLoc == null || currentInterval.isBefore(readLoc)) ); } 
catch (ReviewedStingException e) { - throw new UserException.MissortedFile(new File(intervalsFile), " *** Are you sure that your interval file is sorted? If not, you must use the --targetIntervalsAreNotSorted argument. ***", e); + throw new UserException.MissortedFile(new File(intervalsFile.getSource()), " *** Are you sure that your interval file is sorted? If not, you must use the --targetIntervalsAreNotSorted argument. ***", e); } sawReadInCurrentInterval = false; @@ -679,14 +657,14 @@ public class IndelRealigner extends ReadWalker { private void clean(ReadBin readsToClean) { - final List reads = readsToClean.getReads(); + final List reads = readsToClean.getReads(); if ( reads.size() == 0 ) return; byte[] reference = readsToClean.getReference(referenceReader); int leftmostIndex = readsToClean.getLocation().getStart(); - final ArrayList refReads = new ArrayList(); // reads that perfectly match ref + final ArrayList refReads = new ArrayList(); // reads that perfectly match ref final ArrayList altReads = new ArrayList(); // reads that don't perfectly match final LinkedList altAlignmentsToTest = new LinkedList(); // should we try to make an alt consensus from the read? final Set altConsenses = new LinkedHashSet(); // list of alt consenses @@ -838,8 +816,9 @@ public class IndelRealigner extends ReadWalker { // however we don't have enough info to use the proper MAQ scoring system. // For now, we will just arbitrarily add 10 to the mapping quality. [EB, 6/7/2010]. 
// TODO -- we need a better solution here - SAMRecord read = aRead.getRead(); - read.setMappingQuality(Math.min(aRead.getRead().getMappingQuality() + 10, 254)); + GATKSAMRecord read = aRead.getRead(); + if ( read.getMappingQuality() != 255 ) // 255 == Unknown, so don't modify it + read.setMappingQuality(Math.min(aRead.getRead().getMappingQuality() + 10, 254)); // before we fix the attribute tags we first need to make sure we have enough of the reference sequence int neededBasesToLeft = leftmostIndex - read.getAlignmentStart(); @@ -897,8 +876,8 @@ public class IndelRealigner extends ReadWalker { } } - private long determineReadsThatNeedCleaning(final List reads, - final ArrayList refReadsToPopulate, + private long determineReadsThatNeedCleaning(final List reads, + final ArrayList refReadsToPopulate, final ArrayList altReadsToPopulate, final LinkedList altAlignmentsToTest, final Set altConsenses, @@ -907,7 +886,7 @@ public class IndelRealigner extends ReadWalker { long totalRawMismatchSum = 0L; - for ( final SAMRecord read : reads ) { + for ( final GATKSAMRecord read : reads ) { // we can not deal with screwy records if ( read.getCigar().numCigarElements() == 0 ) { @@ -1395,7 +1374,7 @@ public class IndelRealigner extends ReadWalker { } private class AlignedRead { - private final SAMRecord read; + private final GATKSAMRecord read; private byte[] readBases = null; private byte[] baseQuals = null; private Cigar newCigar = null; @@ -1403,12 +1382,12 @@ public class IndelRealigner extends ReadWalker { private int mismatchScoreToReference = 0; private long alignerMismatchScore = 0; - public AlignedRead(SAMRecord read) { + public AlignedRead(GATKSAMRecord read) { this.read = read; mismatchScoreToReference = 0; } - public SAMRecord getRead() { + public GATKSAMRecord getRead() { return read; } @@ -1592,7 +1571,7 @@ public class IndelRealigner extends ReadWalker { private class ReadBin implements HasGenomeLocation { - private final ArrayList reads = new ArrayList(); + private 
final ArrayList reads = new ArrayList(); private byte[] reference = null; private GenomeLoc loc = null; @@ -1600,7 +1579,7 @@ public class IndelRealigner extends ReadWalker { // Return false if we can't process this read bin because the reads are not correctly overlapping. // This can happen if e.g. there's a large known indel with no overlapping reads. - public void add(SAMRecord read) { + public void add(GATKSAMRecord read) { GenomeLoc locForRead = getToolkit().getGenomeLocParser().createGenomeLoc(read); if ( loc == null ) @@ -1611,7 +1590,7 @@ public class IndelRealigner extends ReadWalker { reads.add(read); } - public List getReads() { return reads; } + public List getReads() { return reads; } public byte[] getReference(IndexedFastaSequenceFile referenceReader) { // set up the reference if we haven't done so yet diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/indels/LeftAlignIndels.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/indels/LeftAlignIndels.java index 17d5a8e9b..7490262f2 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/indels/LeftAlignIndels.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/indels/LeftAlignIndels.java @@ -34,6 +34,7 @@ import org.broadinstitute.sting.gatk.io.StingSAMFileWriter; import org.broadinstitute.sting.gatk.refdata.ReadMetaDataTracker; import org.broadinstitute.sting.gatk.walkers.ReadWalker; import org.broadinstitute.sting.utils.sam.AlignmentUtils; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; /** @@ -88,7 +89,7 @@ public class LeftAlignIndels extends ReadWalker { writer.addAlignment(read); } - public Integer map(ReferenceContext ref, SAMRecord read, ReadMetaDataTracker metaDataTracker) { + public Integer map(ReferenceContext ref, GATKSAMRecord read, ReadMetaDataTracker metaDataTracker) { // we can not deal with screwy records if ( read.getCigar().numCigarElements() == 0 ) { emit(read); diff --git 
a/public/java/src/org/broadinstitute/sting/gatk/walkers/indels/PairHMMIndelErrorModel.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/indels/PairHMMIndelErrorModel.java index 2d7969230..319f41d53 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/indels/PairHMMIndelErrorModel.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/indels/PairHMMIndelErrorModel.java @@ -28,62 +28,25 @@ package org.broadinstitute.sting.gatk.walkers.indels; import net.sf.samtools.Cigar; import net.sf.samtools.CigarElement; import net.sf.samtools.CigarOperator; +import net.sf.samtools.SAMRecord; import org.broadinstitute.sting.gatk.contexts.ReferenceContext; +import org.broadinstitute.sting.utils.Haplotype; import org.broadinstitute.sting.utils.MathUtils; -import org.broadinstitute.sting.utils.genotype.Haplotype; import org.broadinstitute.sting.utils.pileup.PileupElement; import org.broadinstitute.sting.utils.pileup.ReadBackedPileup; -import org.broadinstitute.sting.utils.sam.GATKSAMRecord; import org.broadinstitute.sting.utils.sam.ReadUtils; import org.broadinstitute.sting.utils.variantcontext.Allele; -import java.io.File; import java.util.Arrays; import java.util.HashMap; import java.util.LinkedHashMap; -/*import org.broadinstitute.sting.oneoffprojects.walkers.IndelCountCovariates.Covariate; -import org.broadinstitute.sting.oneoffprojects.walkers.IndelCountCovariates.RecalDataManager; -import org.broadinstitute.sting.oneoffprojects.walkers.IndelCountCovariates.RecalDatum; -import org.broadinstitute.sting.oneoffprojects.walkers.IndelCountCovariates.RecalibrationArgumentCollection; -*/ - public class PairHMMIndelErrorModel { - - public static final int BASE_QUAL_THRESHOLD = 20; - - private static final int MATCH_OFFSET = 0; - private static final int X_OFFSET = 1; - private static final int Y_OFFSET = 2; - - private static final int DIAG = 0; - private static final int UP = 1; - private static final int LEFT = 2; - - private static final int 
DIAG_GOTO_M = 0; - private static final int DIAG_GOTO_X = 1; - private static final int DIAG_GOTO_Y = 2; - - private static final int UP_GOTO_M = 4; - private static final int UP_GOTO_X = 5; - private static final int UP_GOTO_Y = 6; - - private static final int LEFT_GOTO_M = 8; - private static final int LEFT_GOTO_X = 9; - private static final int LEFT_GOTO_Y = 10; - - private static final int[] ACTIONS_M = {DIAG_GOTO_M, DIAG_GOTO_X, DIAG_GOTO_Y}; - private static final int[] ACTIONS_X = {UP_GOTO_M, UP_GOTO_X, UP_GOTO_Y}; - private static final int[] ACTIONS_Y = {LEFT_GOTO_M, LEFT_GOTO_X, LEFT_GOTO_Y}; - - - private final double logGapOpenProbability; - private final double logGapContinuationProbability; - private boolean DEBUG = false; + private boolean bandedLikelihoods = false; private static final int MAX_CACHED_QUAL = 127; @@ -100,36 +63,13 @@ public class PairHMMIndelErrorModel { private static final double MIN_GAP_CONT_PENALTY = 10.0; private static final double GAP_PENALTY_HRUN_STEP = 1.0; // each increase in hrun decreases gap penalty by this. 
- - private boolean doViterbi = false; - - private final boolean useAffineGapModel = true; - private boolean doContextDependentPenalties = false; - private final double[] GAP_OPEN_PROB_TABLE; private final double[] GAP_CONT_PROB_TABLE; - private boolean getGapPenaltiesFromFile = false; - - private int SMOOTHING = 1; - private int MAX_QUALITY_SCORE = 50; - private int PRESERVE_QSCORES_LESS_THAN = 5; - ///////////////////////////// // Private Member Variables ///////////////////////////// -//copy+ -/* private RecalDataManager dataManager; // Holds the data HashMap, mostly used by TableRecalibrationWalker to create collapsed data hashmaps - private final ArrayList requestedCovariates = new ArrayList(); // List of covariates to be used in this calculation - private static final Pattern COMMENT_PATTERN = Pattern.compile("^#.*"); - private static final Pattern OLD_RECALIBRATOR_HEADER = Pattern.compile("^rg,.*"); - private static final Pattern COVARIATE_PATTERN = Pattern.compile("^ReadGroup,QualityScore,.*"); - protected static final String EOF_MARKER = "EOF"; - private long numReadsWithMalformedColorSpace = 0; - private RecalibrationArgumentCollection RAC = new RecalibrationArgumentCollection(); - private NestedHashMap qualityScoreByFullCovariateKey = new NestedHashMap(); // Caches the result of performSequentialQualityCalculation(..) for all sets of covariate values. 
- */ -//copy- + static { LOG_ONE_HALF= -Math.log10(2.0); END_GAP_COST = LOG_ONE_HALF; @@ -145,155 +85,22 @@ public class PairHMMIndelErrorModel { } } - public PairHMMIndelErrorModel(double indelGOP, double indelGCP, boolean deb, boolean doCDP, boolean dovit,boolean gpf, File RECAL_FILE) { - - this(indelGOP, indelGCP, deb, doCDP, dovit); - this.getGapPenaltiesFromFile = gpf; - - // read data from recal file - // gdebug - start copy from TableRecalibrationWalker -/* if (gpf) { - boolean sawEOF = false; - boolean REQUIRE_EOF = false; - - int lineNumber = 0; - boolean foundAllCovariates = false; - // Get a list of all available covariates - final List> classes = new PluginManager(Covariate.class).getPlugins(); - - try { - for ( String line : new XReadLines(RECAL_FILE) ) { - lineNumber++; - if ( EOF_MARKER.equals(line) ) { - sawEOF = true; - } else if( COMMENT_PATTERN.matcher(line).matches() || OLD_RECALIBRATOR_HEADER.matcher(line).matches() ) { - ; // Skip over the comment lines, (which start with '#') - } - // Read in the covariates that were used from the input file - else if( COVARIATE_PATTERN.matcher(line).matches() ) { // The line string is either specifying a covariate or is giving csv data - if( foundAllCovariates ) { - throw new UserException.MalformedFile( RECAL_FILE, "Malformed input recalibration file. Found covariate names intermingled with data in file: " + RECAL_FILE ); - } else { // Found the covariate list in input file, loop through all of them and instantiate them - String[] vals = line.split(","); - for( int iii = 0; iii < vals.length - 3; iii++ ) { // There are n-3 covariates. 
The last three items are nObservations, nMismatch, and Qempirical - boolean foundClass = false; - for( Class covClass : classes ) { - if( (vals[iii] + "Covariate").equalsIgnoreCase( covClass.getSimpleName() ) ) { - foundClass = true; - try { - Covariate covariate = (Covariate)covClass.newInstance(); - requestedCovariates.add( covariate ); - } catch (Exception e) { - throw new DynamicClassResolutionException(covClass, e); - } - - } - } - - if( !foundClass ) { - throw new UserException.MalformedFile(RECAL_FILE, "Malformed input recalibration file. The requested covariate type (" + (vals[iii] + "Covariate") + ") isn't a valid covariate option." ); - } - } - } - - } else { // Found a line of data - if( !foundAllCovariates ) { - foundAllCovariates = true; - - // At this point all the covariates should have been found and initialized - if( requestedCovariates.size() < 2 ) { - throw new UserException.MalformedFile(RECAL_FILE, "Malformed input recalibration csv file. Covariate names can't be found in file: " + RECAL_FILE ); - } - - final boolean createCollapsedTables = true; - - // Initialize any covariate member variables using the shared argument collection - for( Covariate cov : requestedCovariates ) { - cov.initialize( RAC ); - } - // Initialize the data hashMaps - dataManager = new RecalDataManager( createCollapsedTables, requestedCovariates.size() ); - - } - addCSVData(RECAL_FILE, line); // Parse the line and add the data to the HashMap - } - } - - } catch ( FileNotFoundException e ) { - throw new UserException.CouldNotReadInputFile(RECAL_FILE, "Can not find input file", e); - } catch ( NumberFormatException e ) { - throw new UserException.MalformedFile(RECAL_FILE, "Error parsing recalibration data at line " + lineNumber + ". 
Perhaps your table was generated by an older version of CovariateCounterWalker."); - } - - if ( !sawEOF ) { - final String errorMessage = "No EOF marker was present in the recal covariates table; this could mean that the file is corrupted or was generated with an old version of the CountCovariates tool."; - if ( REQUIRE_EOF ) - throw new UserException.MalformedFile(RECAL_FILE, errorMessage); - } - - if( dataManager == null ) { - throw new UserException.MalformedFile(RECAL_FILE, "Can't initialize the data manager. Perhaps the recal csv file contains no data?"); - } - - // Create the tables of empirical quality scores that will be used in the sequential calculation - dataManager.generateEmpiricalQualities( SMOOTHING, MAX_QUALITY_SCORE ); - } - // debug end copy - */ - } - /** - * For each covariate read in a value and parse it. Associate those values with the data itself (num observation and num mismatches) - */ - /* - private void addCSVData(final File file, final String line) { - final String[] vals = line.split(","); - - // Check if the data line is malformed, for example if the read group string contains a comma then it won't be parsed correctly - if( vals.length != requestedCovariates.size() + 3 ) { // +3 because of nObservations, nMismatch, and Qempirical - throw new UserException.MalformedFile(file, "Malformed input recalibration file. 
Found data line with too many fields: " + line + - " --Perhaps the read group string contains a comma and isn't being parsed correctly."); - } - - final Object[] key = new Object[requestedCovariates.size()]; - Covariate cov; - int iii; - for( iii = 0; iii < requestedCovariates.size(); iii++ ) { - cov = requestedCovariates.get( iii ); - key[iii] = cov.getValue( vals[iii] ); - } - - // Create a new datum using the number of observations, number of mismatches, and reported quality score - final RecalDatum datum = new RecalDatum( Long.parseLong( vals[iii] ), Long.parseLong( vals[iii + 1] ), Double.parseDouble( vals[1] ), 0.0 ); - // Add that datum to all the collapsed tables which will be used in the sequential calculation - dataManager.addToAllTables( key, datum, PRESERVE_QSCORES_LESS_THAN ); - } - -*/ - public PairHMMIndelErrorModel(double indelGOP, double indelGCP, boolean deb, boolean doCDP, boolean dovit) { - this(indelGOP, indelGCP, deb, doCDP); - this.doViterbi = dovit; - } - - public PairHMMIndelErrorModel(double indelGOP, double indelGCP, boolean deb, boolean doCDP) { - - - this.logGapOpenProbability = -indelGOP/10.0; // QUAL to log prob - this.logGapContinuationProbability = -indelGCP/10.0; // QUAL to log prob - this.doContextDependentPenalties = doCDP; + public PairHMMIndelErrorModel(double indelGOP, double indelGCP, boolean deb, boolean bandedLikelihoods) { this.DEBUG = deb; - + this.bandedLikelihoods = bandedLikelihoods; // fill gap penalty table, affine naive model: this.GAP_CONT_PROB_TABLE = new double[MAX_HRUN_GAP_IDX]; this.GAP_OPEN_PROB_TABLE = new double[MAX_HRUN_GAP_IDX]; + double gop = -indelGOP/10.0; + double gcp = -indelGCP/10.0; + for (int i = 0; i < START_HRUN_GAP_IDX; i++) { - GAP_OPEN_PROB_TABLE[i] = logGapOpenProbability; - GAP_CONT_PROB_TABLE[i] = logGapContinuationProbability; + GAP_OPEN_PROB_TABLE[i] = gop; + GAP_CONT_PROB_TABLE[i] = gcp; } - double gop = logGapOpenProbability; - double gcp = logGapContinuationProbability; double step = 
GAP_PENALTY_HRUN_STEP/10.0; double maxGOP = -MIN_GAP_OPEN_PENALTY/10.0; // phred to log prob @@ -313,132 +120,6 @@ public class PairHMMIndelErrorModel { } - private double computeReadLikelihoodGivenHaplotype(byte[] haplotypeBases, byte[] readBases, byte[] readQuals) { - final int X_METRIC_LENGTH = readBases.length+1; - final int Y_METRIC_LENGTH = haplotypeBases.length+1; - - // initialize path metric and traceback memories for likelihood computation - double[][] pathMetricArray = new double[X_METRIC_LENGTH][Y_METRIC_LENGTH]; - int[][] bestMetricArray = new int[X_METRIC_LENGTH][Y_METRIC_LENGTH]; - - pathMetricArray[0][0]= 0;//Double.NEGATIVE_INFINITY; - - for (int i=1; i < X_METRIC_LENGTH; i++) { - pathMetricArray[i][0] = 0; - bestMetricArray[i][0] = UP; - } - - for (int j=1; j < Y_METRIC_LENGTH; j++) { - pathMetricArray[0][j] = 0;//logGapOpenProbability + (j-1) * logGapContinuationProbability; - bestMetricArray[0][j] = LEFT; - } - - for (int indI=1; indI < X_METRIC_LENGTH; indI++) { - for (int indJ=1; indJ < Y_METRIC_LENGTH; indJ++) { - - byte x = readBases[indI-1]; - byte y = haplotypeBases[indJ-1]; - byte qual = readQuals[indI-1]; - - double bestMetric = 0.0; - int bestMetricIdx = 0; - - // compute metric for match/mismatch - // workaround for reads whose bases quality = 0, - if (qual < 1) - qual = 1; - - if (qual > MAX_CACHED_QUAL) - qual = MAX_CACHED_QUAL; - - double pBaseRead = (x == y)? 
baseMatchArray[(int)qual]:baseMismatchArray[(int)qual]; - double[] metrics = new double[3]; - - metrics[DIAG] = pathMetricArray[indI-1][indJ-1] + pBaseRead; - metrics[UP] = pathMetricArray[indI-1][indJ] + logGapOpenProbability;//(end?0.0:logGapOpenProbability); - metrics[LEFT] = pathMetricArray[indI][indJ-1] + logGapOpenProbability;//(end?0.0:logGapOpenProbability); - - if (doViterbi) { - bestMetricIdx = MathUtils.maxElementIndex(metrics); - bestMetric = metrics[bestMetricIdx]; - } - else - bestMetric = MathUtils.softMax(metrics); - - pathMetricArray[indI][indJ] = bestMetric; - bestMetricArray[indI][indJ] = bestMetricIdx; - - } - } - - - double bestMetric=0.0; - int bestMetricIdx=0,bestI=X_METRIC_LENGTH - 1, bestJ=Y_METRIC_LENGTH - 1; - - for (int i=0; i < X_METRIC_LENGTH; i ++ ) { - int j= Y_METRIC_LENGTH-1; - - if (pathMetricArray[i][j] > bestMetric) { - bestMetric = pathMetricArray[i][j]; - bestI = i; - bestJ = j; - } - } - for (int j=0; j < Y_METRIC_LENGTH; j++ ) { - int i= X_METRIC_LENGTH-1; - if (pathMetricArray[i][j] >= bestMetric) { - bestMetric = pathMetricArray[i][j]; - bestI = i; - bestJ = j; - } - } - - if (DEBUG && doViterbi) { - - String haplotypeString = new String (haplotypeBases); - String readString = new String(readBases); - - - int i = bestI; - int j = bestJ; - - - System.out.println("Simple NW"); - - while (i >0 || j >0) { - bestMetricIdx = bestMetricArray[i][j]; - System.out.print(bestMetricIdx); - if (bestMetricIdx == UP) { - // insert gap in Y - haplotypeString = haplotypeString.substring(0,j)+"-"+haplotypeString.substring(j); - i--; - } else if (bestMetricIdx == LEFT) { - readString = readString.substring(0,i)+"-"+readString.substring(i); - j--; - } - else { - i--; j--; - } - } - - - - - System.out.println("\nAlignment: "); - System.out.println("R:"+readString); - System.out.println("H:"+haplotypeString); - System.out.println(); - - - } - if (DEBUG) - System.out.format("Likelihood: %5.4f\n", bestMetric); - - return bestMetric; - - - } - 
static private void getContextHomopolymerLength(final byte[] refBytes, int[] hrunArray) { // compute forward hrun length, example: // AGGTGACCCCCCTGAGAG @@ -472,221 +153,199 @@ public class PairHMMIndelErrorModel { } + private void updateCell(final int indI, final int indJ, final int X_METRIC_LENGTH, final int Y_METRIC_LENGTH, byte[] readBases, byte[] readQuals, byte[] haplotypeBases, + double[] currentGOP, double[] currentGCP, double[][] matchMetricArray, double[][] XMetricArray, double[][] YMetricArray) { + if (indI > 0 && indJ > 0) { + final int im1 = indI -1; + final int jm1 = indJ - 1; + // update current point + final byte x = readBases[im1]; + final byte y = haplotypeBases[jm1]; + final byte qual = readQuals[im1] < 1 ? 1 : (readQuals[im1] > MAX_CACHED_QUAL ? MAX_CACHED_QUAL : readQuals[im1]); + + final double pBaseRead = (x == y)? baseMatchArray[(int)qual]:baseMismatchArray[(int)qual]; + + matchMetricArray[indI][indJ] = MathUtils.softMax(matchMetricArray[im1][jm1] + pBaseRead, XMetricArray[im1][jm1] + pBaseRead, + YMetricArray[im1][jm1] + pBaseRead); + + final double c1 = indJ == Y_METRIC_LENGTH-1 ? END_GAP_COST : currentGOP[jm1]; + final double d1 = indJ == Y_METRIC_LENGTH-1 ? END_GAP_COST : currentGCP[jm1]; + + XMetricArray[indI][indJ] = MathUtils.softMax(matchMetricArray[im1][indJ] + c1, XMetricArray[im1][indJ] + d1); + + // update Y array + final double c2 = indI == X_METRIC_LENGTH-1 ? END_GAP_COST : currentGOP[jm1]; + final double d2 = indI == X_METRIC_LENGTH-1 ? 
END_GAP_COST : currentGCP[jm1]; + YMetricArray[indI][indJ] = MathUtils.softMax(matchMetricArray[indI][jm1] + c2, YMetricArray[indI][jm1] + d2); + } + } + private double computeReadLikelihoodGivenHaplotypeAffineGaps(byte[] haplotypeBases, byte[] readBases, byte[] readQuals, - double[] currentGOP, double[] currentGCP) { + double[] currentGOP, double[] currentGCP, int indToStart, + double[][] matchMetricArray, double[][] XMetricArray, double[][] YMetricArray) { final int X_METRIC_LENGTH = readBases.length+1; final int Y_METRIC_LENGTH = haplotypeBases.length+1; - // initialize path metric and traceback memories for likelihood computation - double[][] matchMetricArray = new double[X_METRIC_LENGTH][Y_METRIC_LENGTH]; - double[][] XMetricArray = new double[X_METRIC_LENGTH][Y_METRIC_LENGTH]; - double[][] YMetricArray = new double[X_METRIC_LENGTH][Y_METRIC_LENGTH]; - int[][] bestActionArrayM = new int[X_METRIC_LENGTH][Y_METRIC_LENGTH]; - int[][] bestActionArrayX = new int[X_METRIC_LENGTH][Y_METRIC_LENGTH]; - int[][] bestActionArrayY = new int[X_METRIC_LENGTH][Y_METRIC_LENGTH]; + if (indToStart == 0) { + // default initialization for all arrays - double c,d; - matchMetricArray[0][0]= END_GAP_COST;//Double.NEGATIVE_INFINITY; + for (int i=0; i < X_METRIC_LENGTH; i++) { + Arrays.fill(matchMetricArray[i],Double.NEGATIVE_INFINITY); + Arrays.fill(YMetricArray[i],Double.NEGATIVE_INFINITY); + Arrays.fill(XMetricArray[i],Double.NEGATIVE_INFINITY); + } - for (int i=1; i < X_METRIC_LENGTH; i++) { - //initialize first column - matchMetricArray[i][0] = Double.NEGATIVE_INFINITY; - YMetricArray[i][0] = Double.NEGATIVE_INFINITY; - XMetricArray[i][0] = END_GAP_COST*(i);//logGapOpenProbability + (i-1)*logGapContinuationProbability; + for (int i=1; i < X_METRIC_LENGTH; i++) { + //initialize first column + XMetricArray[i][0] = END_GAP_COST*(i); + } - bestActionArrayX[i][0] = bestActionArrayY[i][0] = bestActionArrayM[i][0] = UP_GOTO_X; + for (int j=1; j < Y_METRIC_LENGTH; j++) { + // initialize 
first row + YMetricArray[0][j] = END_GAP_COST*(j); + } + matchMetricArray[0][0]= END_GAP_COST;//Double.NEGATIVE_INFINITY; + XMetricArray[0][0]= YMetricArray[0][0] = 0; } - for (int j=1; j < Y_METRIC_LENGTH; j++) { - // initialize first row - matchMetricArray[0][j] = Double.NEGATIVE_INFINITY; - XMetricArray[0][j] = Double.NEGATIVE_INFINITY; - YMetricArray[0][j] = END_GAP_COST*(j);//logGapOpenProbability + (j-1) * logGapContinuationProbability; - bestActionArrayY[0][j] = bestActionArrayM[0][j] = bestActionArrayX[0][j] = LEFT_GOTO_Y; + if (bandedLikelihoods) { + final double DIAG_TOL = 20; // means that max - min element in diags have to be > this number for banding to take effect. + + final int numDiags = X_METRIC_LENGTH + Y_METRIC_LENGTH -1; + final int elemsInDiag = Math.min(X_METRIC_LENGTH, Y_METRIC_LENGTH); + + int idxWithMaxElement = 0; + + for (int diag=indToStart; diag < numDiags; diag++) { + // compute default I and J start positions at edge of diagonals + int indI = 0; + int indJ = diag; + if (diag >= Y_METRIC_LENGTH ) { + indI = diag-(Y_METRIC_LENGTH-1); + indJ = Y_METRIC_LENGTH-1; + } + + // first pass: from max element to edge + int idxLow = idxWithMaxElement; + + // reset diag max value before starting + double maxElementInDiag = Double.NEGATIVE_INFINITY; + // set indI, indJ to correct values + indI += idxLow; + indJ -= idxLow; + if (indI >= X_METRIC_LENGTH || indJ < 0) { + idxLow--; + indI--; + indJ++; + } + + + for (int el = idxLow; el < elemsInDiag; el++) { + updateCell(indI, indJ, X_METRIC_LENGTH, Y_METRIC_LENGTH, readBases, readQuals, haplotypeBases, + currentGOP, currentGCP, matchMetricArray, XMetricArray, YMetricArray); + // update max in diagonal + final double bestMetric = MathUtils.max(matchMetricArray[indI][indJ], XMetricArray[indI][indJ], YMetricArray[indI][indJ]); + + // check if we've fallen off diagonal value by threshold + if (bestMetric > maxElementInDiag) { + maxElementInDiag = bestMetric; + idxWithMaxElement = el; + } + else if 
(bestMetric < maxElementInDiag - DIAG_TOL && idxWithMaxElement > 0) + break; // done w/current diagonal + + indI++; + if (indI >=X_METRIC_LENGTH ) + break; + indJ--; + if (indJ <= 0) + break; + } + if (idxLow > 0) { + // now do second part in opposite direction + indI = 0; + indJ = diag; + if (diag >= Y_METRIC_LENGTH ) { + indI = diag-(Y_METRIC_LENGTH-1); + indJ = Y_METRIC_LENGTH-1; + } + + indI += idxLow-1; + indJ -= idxLow-1; + for (int el = idxLow-1; el >= 0; el--) { + + updateCell(indI, indJ, X_METRIC_LENGTH, Y_METRIC_LENGTH, readBases, readQuals, haplotypeBases, + currentGOP, currentGCP, matchMetricArray, XMetricArray, YMetricArray); + // update max in diagonal + final double bestMetric = MathUtils.max(matchMetricArray[indI][indJ], XMetricArray[indI][indJ], YMetricArray[indI][indJ]); + + // check if we've fallen off diagonal value by threshold + if (bestMetric > maxElementInDiag) { + maxElementInDiag = bestMetric; + idxWithMaxElement = el; + } + else if (bestMetric < maxElementInDiag - DIAG_TOL) + break; // done w/current diagonal + + indJ++; + if (indJ >= Y_METRIC_LENGTH ) + break; + indI--; + if (indI <= 0) + break; + } + } + // if (DEBUG) + // System.out.format("Max:%4.1f el:%d\n",maxElementInDiag, idxWithMaxElement); + } } + else { + // simplified rectangular version of update loop + for (int indI=1; indI < X_METRIC_LENGTH; indI++) { + for (int indJ=indToStart+1; indJ < Y_METRIC_LENGTH; indJ++) { + updateCell(indI, indJ, X_METRIC_LENGTH, Y_METRIC_LENGTH, readBases, readQuals, haplotypeBases, + currentGOP, currentGCP, matchMetricArray, XMetricArray, YMetricArray); - for (int indI=1; indI < X_METRIC_LENGTH; indI++) { - int im1 = indI-1; - for (int indJ=1; indJ < Y_METRIC_LENGTH; indJ++) { - int jm1 = indJ-1; - byte x = readBases[im1]; - byte y = haplotypeBases[jm1]; - byte qual = readQuals[im1]; - - double bestMetric = 0.0; - int bestMetricIdx = 0; - - // compute metric for match/mismatch - // workaround for reads whose bases quality = 0, - if (qual < 1) - 
qual = 1; - - if (qual > MAX_CACHED_QUAL) - qual = MAX_CACHED_QUAL; - - double pBaseRead = (x == y)? baseMatchArray[(int)qual]:baseMismatchArray[(int)qual]; - - - double[] metrics = new double[3]; - - - if (doViterbi) { - // update match array - metrics[MATCH_OFFSET] = matchMetricArray[im1][jm1] + pBaseRead; - metrics[X_OFFSET] = XMetricArray[im1][jm1] + pBaseRead; - metrics[Y_OFFSET] = YMetricArray[im1][jm1] + pBaseRead; - - bestMetricIdx = MathUtils.maxElementIndex(metrics); - bestMetric = metrics[bestMetricIdx]; } - else - bestMetric = MathUtils.softMax(matchMetricArray[im1][jm1] + pBaseRead, XMetricArray[im1][jm1] + pBaseRead, - YMetricArray[im1][jm1] + pBaseRead); - - matchMetricArray[indI][indJ] = bestMetric; - bestActionArrayM[indI][indJ] = ACTIONS_M[bestMetricIdx]; - - // update X array - // State X(i,j): X(1:i) aligned to a gap in Y(1:j). - // When in last column of X, ie X(1:i) aligned to full Y, we don't want to penalize gaps - - //c = (indJ==Y_METRIC_LENGTH-1? END_GAP_COST: currentGOP[jm1]); - //d = (indJ==Y_METRIC_LENGTH-1? END_GAP_COST: currentGCP[jm1]); - if (getGapPenaltiesFromFile) { - c = currentGOP[im1]; - d = logGapContinuationProbability; - - } else { - c = currentGOP[jm1]; - d = currentGCP[jm1]; - } - if (indJ == Y_METRIC_LENGTH-1) - c = d = END_GAP_COST; - - if (doViterbi) { - metrics[MATCH_OFFSET] = matchMetricArray[im1][indJ] + c; - metrics[X_OFFSET] = XMetricArray[im1][indJ] + d; - metrics[Y_OFFSET] = Double.NEGATIVE_INFINITY; //YMetricArray[indI-1][indJ] + logGapOpenProbability; - - bestMetricIdx = MathUtils.maxElementIndex(metrics); - bestMetric = metrics[bestMetricIdx]; - } - else - bestMetric = MathUtils.softMax(matchMetricArray[im1][indJ] + c, XMetricArray[im1][indJ] + d); - - XMetricArray[indI][indJ] = bestMetric; - bestActionArrayX[indI][indJ] = ACTIONS_X[bestMetricIdx]; - - // update Y array - //c = (indI==X_METRIC_LENGTH-1? END_GAP_COST: currentGOP[jm1]); - //d = (indI==X_METRIC_LENGTH-1? 
END_GAP_COST: currentGCP[jm1]); - if (getGapPenaltiesFromFile) { - c = currentGOP[im1]; - d = logGapContinuationProbability; - } - else { - c = currentGOP[jm1]; - d = currentGCP[jm1]; - } - if (indI == X_METRIC_LENGTH-1) - c = d = END_GAP_COST; - - - - if (doViterbi) { - metrics[MATCH_OFFSET] = matchMetricArray[indI][jm1] + c; - metrics[X_OFFSET] = Double.NEGATIVE_INFINITY; //XMetricArray[indI][indJ-1] + logGapOpenProbability; - metrics[Y_OFFSET] = YMetricArray[indI][jm1] + d; - - bestMetricIdx = MathUtils.maxElementIndex(metrics); - bestMetric = metrics[bestMetricIdx]; - } - else - bestMetric = MathUtils.softMax(matchMetricArray[indI][jm1] + c, YMetricArray[indI][jm1] + d); - - YMetricArray[indI][indJ] = bestMetric; - bestActionArrayY[indI][indJ] = ACTIONS_Y[bestMetricIdx]; - - - } } - double bestMetric; - double metrics[] = new double[3]; - int bestTable=0, bestI=X_METRIC_LENGTH - 1, bestJ=Y_METRIC_LENGTH - 1; - metrics[MATCH_OFFSET] = matchMetricArray[bestI][bestJ]; - metrics[X_OFFSET] = XMetricArray[bestI][bestJ]; - metrics[Y_OFFSET] = YMetricArray[bestI][bestJ]; - if (doViterbi) { - bestTable = MathUtils.maxElementIndex(metrics); - bestMetric = metrics[bestTable]; + + + final int bestI = X_METRIC_LENGTH - 1, bestJ = Y_METRIC_LENGTH - 1; + final double bestMetric = MathUtils.softMax(matchMetricArray[bestI][bestJ], + XMetricArray[bestI][bestJ], + YMetricArray[bestI][bestJ]); + + /* + if (DEBUG) { + PrintStream outx, outy, outm, outs; + double[][] sumMetrics = new double[X_METRIC_LENGTH][Y_METRIC_LENGTH]; + try { + outx = new PrintStream("datax.txt"); + outy = new PrintStream("datay.txt"); + outm = new PrintStream("datam.txt"); + outs = new PrintStream("datas.txt"); + double metrics[] = new double[3]; + for (int indI=0; indI < X_METRIC_LENGTH; indI++) { + for (int indJ=0; indJ < Y_METRIC_LENGTH; indJ++) { + metrics[0] = matchMetricArray[indI][indJ]; + metrics[1] = XMetricArray[indI][indJ]; + metrics[2] = YMetricArray[indI][indJ]; + //sumMetrics[indI][indJ] = 
MathUtils.softMax(metrics); + outx.format("%4.1f ", metrics[1]); + outy.format("%4.1f ", metrics[2]); + outm.format("%4.1f ", metrics[0]); + outs.format("%4.1f ", MathUtils.softMax(metrics)); + } + outx.println(); outm.println();outy.println(); outs.println(); + } + outm.close(); outx.close(); outy.close(); + } catch (java.io.IOException e) { throw new UserException("bla");} } - else - bestMetric = MathUtils.softMax(metrics); - - // Do traceback (needed only for debugging!) - if (DEBUG && doViterbi) { - - int bestAction; - int i = bestI; - int j = bestJ; - - - System.out.println("Affine gap NW"); - - - String haplotypeString = new String (haplotypeBases); - String readString = new String(readBases); - - - while (i >0 || j >0) { - if (bestTable == X_OFFSET) { - // insert gap in Y - haplotypeString = haplotypeString.substring(0,j)+"-"+haplotypeString.substring(j); - bestAction = bestActionArrayX[i][j]; - } - else if (bestTable == Y_OFFSET) { - readString = readString.substring(0,i)+"-"+readString.substring(i); - bestAction = bestActionArrayY[i][j]; - - } - else { - bestAction = bestActionArrayM[i][j]; - } - System.out.print(bestAction); - - - // bestAction contains action to take at next step - // encoding of bestAction: upper 2 bits = direction, lower 2 bits = next table - - // bestTable and nextDirection for next step - bestTable = bestAction & 0x3; - int nextDirection = bestAction >> 2; - if (nextDirection == UP) { - i--; - } else if (nextDirection == LEFT) { - j--; - } else { // if (nextDirection == DIAG) - i--; j--; - } - - } - - - - - System.out.println("\nAlignment: "); - System.out.println("R:"+readString); - System.out.println("H:"+haplotypeString); - System.out.println(); - - - } - if (DEBUG) - System.out.format("Likelihood: %5.4f\n", bestMetric); + */ return bestMetric; @@ -707,50 +366,38 @@ public class PairHMMIndelErrorModel { } } public synchronized double[] computeReadHaplotypeLikelihoods(ReadBackedPileup pileup, LinkedHashMap haplotypeMap, - 
ReferenceContext ref, int eventLength, - HashMap> indelLikelihoodMap){ + ReferenceContext ref, int eventLength, + HashMap> indelLikelihoodMap){ int numHaplotypes = haplotypeMap.size(); - double[][] haplotypeLikehoodMatrix = new double[numHaplotypes][numHaplotypes]; - double readLikelihoods[][] = new double[pileup.getReads().size()][numHaplotypes]; + final double readLikelihoods[][] = new double[pileup.getNumberOfElements()][numHaplotypes]; + final int readCounts[] = new int[pileup.getNumberOfElements()]; int readIdx=0; LinkedHashMap gapOpenProbabilityMap = new LinkedHashMap(); LinkedHashMap gapContProbabilityMap = new LinkedHashMap(); - if (DEBUG) { - System.out.println("Reference bases:"); - System.out.println(new String(ref.getBases())); + // will context dependent probabilities based on homopolymer run. Probabilities are filled based on total complete haplotypes. + // todo -- refactor into separate function + for (Allele a: haplotypeMap.keySet()) { + Haplotype haplotype = haplotypeMap.get(a); + byte[] haplotypeBases = haplotype.getBasesAsBytes(); + double[] contextLogGapOpenProbabilities = new double[haplotypeBases.length]; + double[] contextLogGapContinuationProbabilities = new double[haplotypeBases.length]; + + // get homopolymer length profile for current haplotype + int[] hrunProfile = new int[haplotypeBases.length]; + getContextHomopolymerLength(haplotypeBases,hrunProfile); + fillGapProbabilities(hrunProfile, contextLogGapOpenProbabilities, contextLogGapContinuationProbabilities); + + gapOpenProbabilityMap.put(a,contextLogGapOpenProbabilities); + gapContProbabilityMap.put(a,contextLogGapContinuationProbabilities); + } - if (doContextDependentPenalties && !getGapPenaltiesFromFile) { - // will context dependent probabilities based on homopolymer run. Probabilities are filled based on total complete haplotypes. 
- - - for (Allele a: haplotypeMap.keySet()) { - Haplotype haplotype = haplotypeMap.get(a); - byte[] haplotypeBases = haplotype.getBasesAsBytes(); - double[] contextLogGapOpenProbabilities = new double[haplotypeBases.length]; - double[] contextLogGapContinuationProbabilities = new double[haplotypeBases.length]; - - // get homopolymer length profile for current haplotype - int[] hrunProfile = new int[haplotypeBases.length]; - getContextHomopolymerLength(haplotypeBases,hrunProfile); - if (DEBUG) { - System.out.println("Haplotype bases:"); - System.out.println(new String(haplotypeBases)); - for (int i=0; i < hrunProfile.length; i++) - System.out.format("%d",hrunProfile[i]); - System.out.println(); - } - fillGapProbabilities(hrunProfile, contextLogGapOpenProbabilities, contextLogGapContinuationProbabilities); - - gapOpenProbabilityMap.put(a,contextLogGapOpenProbabilities); - gapContProbabilityMap.put(a,contextLogGapContinuationProbabilities); - - } - } for (PileupElement p: pileup) { + // > 1 when the read is a consensus read representing multiple independent observations + readCounts[readIdx] = p.getRepresentativeCount(); // check if we've already computed likelihoods for this pileup element (i.e. 
for this read at this location) if (indelLikelihoodMap.containsKey(p)) { @@ -762,61 +409,14 @@ public class PairHMMIndelErrorModel { } else { //System.out.format("%d %s\n",p.getRead().getAlignmentStart(), p.getRead().getClass().getName()); - GATKSAMRecord read = ReadUtils.hardClipAdaptorSequence(p.getRead()); + SAMRecord read = ReadUtils.hardClipAdaptorSequence(p.getRead()); if (read == null) continue; - if(ReadUtils.is454Read(read) && !getGapPenaltiesFromFile) { + if(ReadUtils.is454Read(read)) { continue; } - double[] recalQuals = null; - - /* - if (getGapPenaltiesFromFile) { - RecalDataManager.parseSAMRecord( read, RAC ); - - - recalQuals = new double[read.getReadLength()]; - - //compute all covariate values for this read - final Comparable[][] covariateValues_offset_x_covar = - RecalDataManager.computeCovariates((GATKSAMRecord) read, requestedCovariates); - // For each base in the read - for( int offset = 0; offset < read.getReadLength(); offset++ ) { - - final Object[] fullCovariateKey = covariateValues_offset_x_covar[offset]; - - Byte qualityScore = (Byte) qualityScoreByFullCovariateKey.get(fullCovariateKey); - if(qualityScore == null) - { - qualityScore = performSequentialQualityCalculation( fullCovariateKey ); - qualityScoreByFullCovariateKey.put(qualityScore, fullCovariateKey); - } - - recalQuals[offset] = -((double)qualityScore)/10.0; - } - - // for each read/haplotype combination, compute likelihoods, ie -10*log10(Pr(R | Hi)) - // = sum_j(-10*log10(Pr(R_j | Hi) since reads are assumed to be independent - if (DEBUG) { - System.out.format("\n\nStarting read:%s S:%d US:%d E:%d UE:%d C:%s\n",read.getReadName(), - read.getAlignmentStart(), - read.getUnclippedStart(), read.getAlignmentEnd(), read.getUnclippedEnd(), - read.getCigarString()); - - byte[] bases = read.getReadBases(); - for (int k = 0; k < recalQuals.length; k++) { - System.out.format("%c",bases[k]); - } - System.out.println(); - - for (int k = 0; k < recalQuals.length; k++) { - 
System.out.format("%.0f ",recalQuals[k]); - } - System.out.println(); - } - } */ // get bases of candidate haplotypes that overlap with reads final int trailingBases = 3; @@ -910,18 +510,16 @@ public class PairHMMIndelErrorModel { // ok, we now figured out total number of clipped bases on both ends. // Figure out where we want to place the haplotype to score read against - if (DEBUG) - System.out.format("numStartClippedBases: %d numEndClippedBases: %d WinStart:%d WinStop:%d start: %d stop: %d readLength: %d\n", - numStartClippedBases, numEndClippedBases, ref.getWindow().getStart(), ref.getWindow().getStop(), start, stop, read.getReadLength()); - + /* + if (DEBUG) + System.out.format("numStartClippedBases: %d numEndClippedBases: %d WinStart:%d WinStop:%d start: %d stop: %d readLength: %d\n", + numStartClippedBases, numEndClippedBases, ref.getWindow().getStart(), ref.getWindow().getStop(), start, stop, read.getReadLength()); + */ LinkedHashMap readEl = new LinkedHashMap(); if (numStartClippedBases + numEndClippedBases >= unclippedReadBases.length) { - if (DEBUG) - System.out.println("BAD READ!!"); - int j=0; for (Allele a: haplotypeMap.keySet()) { readEl.put(a,0.0); @@ -930,25 +528,20 @@ public class PairHMMIndelErrorModel { } else { - byte[] readBases = Arrays.copyOfRange(unclippedReadBases,numStartClippedBases, + final byte[] readBases = Arrays.copyOfRange(unclippedReadBases,numStartClippedBases, unclippedReadBases.length-numEndClippedBases); - byte[] readQuals = Arrays.copyOfRange(unclippedReadQuals,numStartClippedBases, + final byte[] readQuals = Arrays.copyOfRange(unclippedReadQuals,numStartClippedBases, unclippedReadBases.length-numEndClippedBases); - double[] recalCDP = null; - if (getGapPenaltiesFromFile) { - recalCDP = Arrays.copyOfRange(recalQuals,numStartClippedBases, - unclippedReadBases.length-numEndClippedBases); - - } - - if (DEBUG) { - System.out.println("Read bases:"); - System.out.println(new String(readBases)); - } - int j=0; + + // initialize path 
metric and traceback memories for likelihood computation + double[][] matchMetricArray = null, XMetricArray = null, YMetricArray = null; + byte[] previousHaplotypeSeen = null; + double[] previousGOP = null; + double[] previousGCP = null; + int startIdx; for (Allele a: haplotypeMap.keySet()) { @@ -963,36 +556,41 @@ public class PairHMMIndelErrorModel { long indStart = start - haplotype.getStartPosition(); long indStop = stop - haplotype.getStartPosition(); - byte[] haplotypeBases = Arrays.copyOfRange(haplotype.getBasesAsBytes(), + final byte[] haplotypeBases = Arrays.copyOfRange(haplotype.getBasesAsBytes(), (int)indStart, (int)indStop); + double readLikelihood; + if (matchMetricArray == null) { + final int X_METRIC_LENGTH = readBases.length+1; + final int Y_METRIC_LENGTH = haplotypeBases.length+1; + + matchMetricArray = new double[X_METRIC_LENGTH][Y_METRIC_LENGTH]; + XMetricArray = new double[X_METRIC_LENGTH][Y_METRIC_LENGTH]; + YMetricArray = new double[X_METRIC_LENGTH][Y_METRIC_LENGTH]; + } + final double[] currentContextGOP = Arrays.copyOfRange(gapOpenProbabilityMap.get(a), (int)indStart, (int)indStop); + final double[] currentContextGCP = Arrays.copyOfRange(gapContProbabilityMap.get(a), (int)indStart, (int)indStop); + if (previousHaplotypeSeen == null) + startIdx = 0; + else { + final int s1 = computeFirstDifferingPosition(haplotypeBases, previousHaplotypeSeen); + final int s2 = computeFirstDifferingPosition(currentContextGOP, previousGOP); + final int s3 = computeFirstDifferingPosition(currentContextGCP, previousGCP); + startIdx = Math.min(Math.min(s1, s2), s3); + } + previousHaplotypeSeen = haplotypeBases.clone(); + previousGOP = currentContextGOP.clone(); + previousGCP = currentContextGCP.clone(); + + + readLikelihood = computeReadLikelihoodGivenHaplotypeAffineGaps(haplotypeBases, readBases, readQuals, + currentContextGOP, currentContextGCP, startIdx, matchMetricArray, XMetricArray, YMetricArray); if (DEBUG) { - System.out.println("Haplotype to test:"); - 
System.out.println(new String(haplotypeBases)); + System.out.println("H:"+new String(haplotypeBases)); + System.out.println("R:"+new String(readBases)); + System.out.format("L:%4.2f\n",readLikelihood); + System.out.format("StPos:%d\n", startIdx); } - - Double readLikelihood = 0.0; - if (useAffineGapModel) { - - double[] currentContextGOP = null; - double[] currentContextGCP = null; - - if (doContextDependentPenalties) { - - if (getGapPenaltiesFromFile) { - readLikelihood = computeReadLikelihoodGivenHaplotypeAffineGaps(haplotypeBases, readBases, readQuals, recalCDP, null); - - } else { - currentContextGOP = Arrays.copyOfRange(gapOpenProbabilityMap.get(a), (int)indStart, (int)indStop); - currentContextGCP = Arrays.copyOfRange(gapContProbabilityMap.get(a), (int)indStart, (int)indStop); - readLikelihood = computeReadLikelihoodGivenHaplotypeAffineGaps(haplotypeBases, readBases, readQuals, currentContextGOP, currentContextGCP); - } - } - - } - else - readLikelihood = computeReadLikelihoodGivenHaplotype(haplotypeBases, readBases, readQuals); - readEl.put(a,readLikelihood); readLikelihoods[readIdx][j++] = readLikelihood; } @@ -1004,7 +602,7 @@ public class PairHMMIndelErrorModel { if (DEBUG) { System.out.println("\nLikelihood summary"); - for (readIdx=0; readIdx < pileup.getReads().size(); readIdx++) { + for (readIdx=0; readIdx < pileup.getNumberOfElements(); readIdx++) { System.out.format("Read Index: %d ",readIdx); for (int i=0; i < readLikelihoods[readIdx].length; i++) System.out.format("L%d: %f ",i,readLikelihoods[readIdx][i]); @@ -1012,123 +610,63 @@ public class PairHMMIndelErrorModel { } } + + return getHaplotypeLikelihoods(numHaplotypes, readCounts, readLikelihoods); + } + + private int computeFirstDifferingPosition(byte[] b1, byte[] b2) { + if (b1.length != b2.length) + return 0; // sanity check + + for (int i=0; i < b1.length; i++ ){ + if ( b1[i]!= b2[i]) + return i; + } + return b1.length; + } + + private int computeFirstDifferingPosition(double[] b1, double[] 
b2) { + if (b1.length != b2.length) + return 0; // sanity check + + for (int i=0; i < b1.length; i++ ){ + if ( b1[i]!= b2[i]) + return i; + } + return b1.length; + } + + private final static double[] getHaplotypeLikelihoods(final int numHaplotypes, final int readCounts[], final double readLikelihoods[][]) { + final double[][] haplotypeLikehoodMatrix = new double[numHaplotypes][numHaplotypes]; + + // todo: MAD 09/26/11 -- I'm almost certain this calculation can be simplied to just a single loop without the intermediate NxN matrix for (int i=0; i < numHaplotypes; i++) { for (int j=i; j < numHaplotypes; j++){ // combine likelihoods of haplotypeLikelihoods[i], haplotypeLikelihoods[j] // L(Hi, Hj) = sum_reads ( Pr(R|Hi)/2 + Pr(R|Hj)/2) //readLikelihoods[k][j] has log10(Pr(R_k) | H[j] ) - for (readIdx=0; readIdx < pileup.getReads().size(); readIdx++) { - + for (int readIdx = 0; readIdx < readLikelihoods.length; readIdx++) { // Compute log10(10^x1/2 + 10^x2/2) = log10(10^x1+10^x2)-log10(2) // First term is approximated by Jacobian log with table lookup. 
if (Double.isInfinite(readLikelihoods[readIdx][i]) && Double.isInfinite(readLikelihoods[readIdx][j])) continue; - haplotypeLikehoodMatrix[i][j] += ( MathUtils.softMax(readLikelihoods[readIdx][i], - readLikelihoods[readIdx][j]) + LOG_ONE_HALF); - + final double li = readLikelihoods[readIdx][i]; + final double lj = readLikelihoods[readIdx][j]; + final int readCount = readCounts[readIdx]; + haplotypeLikehoodMatrix[i][j] += readCount * (MathUtils.softMax(li, lj) + LOG_ONE_HALF); } - - } } - return getHaplotypeLikelihoods(haplotypeLikehoodMatrix); - - } - - public static double[] getHaplotypeLikelihoods(double[][] haplotypeLikehoodMatrix) { - int hSize = haplotypeLikehoodMatrix.length; - double[] genotypeLikelihoods = new double[hSize*(hSize+1)/2]; - + final double[] genotypeLikelihoods = new double[numHaplotypes*(numHaplotypes+1)/2]; int k=0; - double maxElement = Double.NEGATIVE_INFINITY; - for (int j=0; j < hSize; j++) { + for (int j=0; j < numHaplotypes; j++) { for (int i=0; i <= j; i++){ genotypeLikelihoods[k++] = haplotypeLikehoodMatrix[i][j]; - if (haplotypeLikehoodMatrix[i][j] > maxElement) - maxElement = haplotypeLikehoodMatrix[i][j]; } } - // renormalize - for (int i=0; i < genotypeLikelihoods.length; i++) - genotypeLikelihoods[i] -= maxElement; - - return genotypeLikelihoods; + // renormalize so that max element is zero. + return MathUtils.normalizeFromLog10(genotypeLikelihoods, false, true); } - - /** - * Implements a serial recalibration of the reads using the combinational table. - * First, we perform a positional recalibration, and then a subsequent dinuc correction. 
- * - * Given the full recalibration table, we perform the following preprocessing steps: - * - * - calculate the global quality score shift across all data [DeltaQ] - * - calculate for each of cycle and dinuc the shift of the quality scores relative to the global shift - * -- i.e., DeltaQ(dinuc) = Sum(pos) Sum(Qual) Qempirical(pos, qual, dinuc) - Qreported(pos, qual, dinuc) / Npos * Nqual - * - The final shift equation is: - * - * Qrecal = Qreported + DeltaQ + DeltaQ(pos) + DeltaQ(dinuc) + DeltaQ( ... any other covariate ... ) - * @param key The list of Comparables that were calculated from the covariates - * @return A recalibrated quality score as a byte - */ - /* - private byte performSequentialQualityCalculation( final Object... key ) { - - final byte qualFromRead = (byte)Integer.parseInt(key[1].toString()); - final Object[] readGroupCollapsedKey = new Object[1]; - final Object[] qualityScoreCollapsedKey = new Object[2]; - final Object[] covariateCollapsedKey = new Object[3]; - - // The global quality shift (over the read group only) - readGroupCollapsedKey[0] = key[0]; - final RecalDatum globalRecalDatum = ((RecalDatum)dataManager.getCollapsedTable(0).get( readGroupCollapsedKey )); - double globalDeltaQ = 0.0; - if( globalRecalDatum != null ) { - final double globalDeltaQEmpirical = globalRecalDatum.getEmpiricalQuality(); - final double aggregrateQReported = globalRecalDatum.getEstimatedQReported(); - globalDeltaQ = globalDeltaQEmpirical - aggregrateQReported; - } - - // The shift in quality between reported and empirical - qualityScoreCollapsedKey[0] = key[0]; - qualityScoreCollapsedKey[1] = key[1]; - final RecalDatum qReportedRecalDatum = ((RecalDatum)dataManager.getCollapsedTable(1).get( qualityScoreCollapsedKey )); - double deltaQReported = 0.0; - if( qReportedRecalDatum != null ) { - final double deltaQReportedEmpirical = qReportedRecalDatum.getEmpiricalQuality(); - deltaQReported = deltaQReportedEmpirical - qualFromRead - globalDeltaQ; - } - - // The 
shift in quality due to each covariate by itself in turn - double deltaQCovariates = 0.0; - double deltaQCovariateEmpirical; - covariateCollapsedKey[0] = key[0]; - covariateCollapsedKey[1] = key[1]; - for( int iii = 2; iii < key.length; iii++ ) { - covariateCollapsedKey[2] = key[iii]; // The given covariate - final RecalDatum covariateRecalDatum = ((RecalDatum)dataManager.getCollapsedTable(iii).get( covariateCollapsedKey )); - if( covariateRecalDatum != null ) { - deltaQCovariateEmpirical = covariateRecalDatum.getEmpiricalQuality(); - deltaQCovariates += ( deltaQCovariateEmpirical - qualFromRead - (globalDeltaQ + deltaQReported) ); - } - } - - final double newQuality = qualFromRead + globalDeltaQ + deltaQReported + deltaQCovariates; - return QualityUtils.boundQual( (int)Math.round(newQuality), (byte)MAX_QUALITY_SCORE ); - - // Verbose printouts used to validate with old recalibrator - //if(key.contains(null)) { - // System.out.println( key + String.format(" => %d + %.2f + %.2f + %.2f + %.2f = %d", - // qualFromRead, globalDeltaQ, deltaQReported, deltaQPos, deltaQDinuc, newQualityByte)); - //} - //else { - // System.out.println( String.format("%s %s %s %s => %d + %.2f + %.2f + %.2f + %.2f = %d", - // key.get(0).toString(), key.get(3).toString(), key.get(2).toString(), key.get(1).toString(), qualFromRead, globalDeltaQ, deltaQReported, deltaQPos, deltaQDinuc, newQualityByte) ); - //} - - //return newQualityByte; - - } -*/ } diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/indels/RealignedReadCounter.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/indels/RealignedReadCounter.java deleted file mode 100755 index 2c89b907b..000000000 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/indels/RealignedReadCounter.java +++ /dev/null @@ -1,147 +0,0 @@ -/* - * Copyright (c) 2010. 
- * - * Permission is hereby granted, free of charge, to any person - * obtaining a copy of this software and associated documentation - * files (the "Software"), to deal in the Software without - * restriction, including without limitation the rights to use, - * copy, modify, merge, publish, distribute, sublicense, and/or sell - * copies of the Software, and to permit persons to whom the - * Software is furnished to do so, subject to the following - * conditions: - * - * The above copyright notice and this permission notice shall be - * included in all copies or substantial portions of the Software. - * - * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, - * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES - * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND - * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT - * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, - * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING - * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR - * THE USE OR OTHER DEALINGS IN THE SOFTWARE. 
- */ - -package org.broadinstitute.sting.gatk.walkers.indels; - -import net.sf.samtools.CigarElement; -import net.sf.samtools.CigarOperator; -import net.sf.samtools.SAMRecord; -import org.broadinstitute.sting.commandline.Argument; -import org.broadinstitute.sting.gatk.contexts.ReferenceContext; -import org.broadinstitute.sting.gatk.filters.BadMateFilter; -import org.broadinstitute.sting.gatk.refdata.ReadMetaDataTracker; -import org.broadinstitute.sting.gatk.walkers.By; -import org.broadinstitute.sting.gatk.walkers.DataSource; -import org.broadinstitute.sting.gatk.walkers.ReadWalker; -import org.broadinstitute.sting.utils.GenomeLoc; -import org.broadinstitute.sting.utils.interval.IntervalFileMergingIterator; -import org.broadinstitute.sting.utils.interval.IntervalMergingRule; -import org.broadinstitute.sting.utils.sam.ReadUtils; - -import java.io.File; -import java.util.Iterator; - -@By(DataSource.READS) -// walker to count realigned reads -public class RealignedReadCounter extends ReadWalker { - - public static final String ORIGINAL_CIGAR_TAG = "OC"; - public static final String ORIGINAL_POSITION_TAG = "OP"; - - @Argument(fullName="targetIntervals", shortName="targetIntervals", doc="intervals file output from RealignerTargetCreator", required=true) - protected String intervalsFile = null; - - // the intervals input by the user - private Iterator intervals = null; - - // the current interval in the list - private GenomeLoc currentInterval = null; - - private long updatedIntervals = 0, updatedReads = 0, affectedBases = 0; - private boolean intervalWasUpdated = false; - - public void initialize() { - // prepare to read intervals one-by-one, as needed (assuming they are sorted). - intervals = new IntervalFileMergingIterator( getToolkit().getGenomeLocParser(), new File(intervalsFile), IntervalMergingRule.OVERLAPPING_ONLY ); - currentInterval = intervals.hasNext() ? 
intervals.next() : null; - } - - public Integer map(ReferenceContext ref, SAMRecord read, ReadMetaDataTracker metaDataTracker) { - if ( currentInterval == null ) { - return 0; - } - - GenomeLoc readLoc = ref.getGenomeLocParser().createGenomeLoc(read); - // hack to get around unmapped reads having screwy locations - if ( readLoc.getStop() == 0 ) - readLoc = ref.getGenomeLocParser().createGenomeLoc(readLoc.getContig(), readLoc.getStart(), readLoc.getStart()); - - if ( readLoc.isBefore(currentInterval) || ReadUtils.is454Read(read) ) - return 0; - - if ( readLoc.overlapsP(currentInterval) ) { - if ( doNotTryToClean(read) ) - return 0; - - if ( read.getAttribute(ORIGINAL_CIGAR_TAG) != null ) { - String newCigar = (String)read.getAttribute(ORIGINAL_CIGAR_TAG); - // deal with an old bug - if ( read.getCigar().toString().equals(newCigar) ) { - //System.out.println(currentInterval + ": " + read.getReadName() + " " + read.getCigarString() + " " + newCigar); - return 0; - } - - if ( !intervalWasUpdated ) { - intervalWasUpdated = true; - updatedIntervals++; - affectedBases += 20 + getIndelSize(read); - } - updatedReads++; - - } - } else { - do { - intervalWasUpdated = false; - currentInterval = intervals.hasNext() ? 
intervals.next() : null; - } while ( currentInterval != null && currentInterval.isBefore(readLoc) ); - } - - return 0; - } - - private int getIndelSize(SAMRecord read) { - for ( CigarElement ce : read.getCigar().getCigarElements() ) { - if ( ce.getOperator() == CigarOperator.I ) - return 0; - if ( ce.getOperator() == CigarOperator.D ) - return ce.getLength(); - } - logger.warn("We didn't see an indel for this read: " + read.getReadName() + " " + read.getAlignmentStart() + " " + read.getCigar()); - return 0; - } - - private boolean doNotTryToClean(SAMRecord read) { - return read.getReadUnmappedFlag() || - read.getNotPrimaryAlignmentFlag() || - read.getReadFailsVendorQualityCheckFlag() || - read.getMappingQuality() == 0 || - read.getAlignmentStart() == SAMRecord.NO_ALIGNMENT_START || - (BadMateFilter.hasBadMate(read)); - } - - public Integer reduceInit() { - return 0; - } - - public Integer reduce(Integer value, Integer sum) { - return sum + value; - } - - public void onTraversalDone(Integer result) { - System.out.println(updatedIntervals + " intervals were updated"); - System.out.println(updatedReads + " reads were updated"); - System.out.println(affectedBases + " bases were affected"); - } -} diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/indels/RealignerTargetCreator.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/indels/RealignerTargetCreator.java index bede50a0b..424e05c20 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/indels/RealignerTargetCreator.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/indels/RealignerTargetCreator.java @@ -50,6 +50,7 @@ import java.io.PrintStream; import java.util.ArrayList; import java.util.Collections; import java.util.List; +import java.util.TreeSet; /** * Emits intervals for the Local Indel Realigner to target for realignment. 
@@ -103,7 +104,7 @@ import java.util.List; @Allows(value={DataSource.READS, DataSource.REFERENCE}) @By(DataSource.REFERENCE) @BAQMode(ApplicationTime = BAQ.ApplicationTime.FORBIDDEN) -public class RealignerTargetCreator extends RodWalker { +public class RealignerTargetCreator extends RodWalker implements TreeReducible { /** * The target intervals for realignment. @@ -227,7 +228,7 @@ public class RealignerTargetCreator extends RodWalker 0.0 && mismatchThreshold <= 1.0 && - pileup.size() >= minReadsAtLocus && + pileup.getNumberOfElements() >= minReadsAtLocus && (double)mismatchQualities / (double)totalQualities >= mismatchThreshold ) hasPointEvent = true; } @@ -251,43 +252,125 @@ public class RealignerTargetCreator extends RodWalker= right.loc.getStart(); + } + + @com.google.java.contract.Requires({"left != null", "right != null"}) + static private Event mergeEvents(Event left, Event right) { + left.merge(right); + return left; + } + private enum EVENT_TYPE { POINT_EVENT, INDEL_EVENT, BOTH } + class EventPair { + public Event left, right; + public TreeSet intervals = new TreeSet(); + + public EventPair(Event left, Event right) { + this.left = left; + this.right = right; + } + + public EventPair(Event left, Event right, TreeSet set1, TreeSet set2) { + this.left = left; + this.right = right; + intervals.addAll(set1); + intervals.addAll(set2); + } + } + class Event { public int furthestStopPos; - public GenomeLoc loc; - public int eventStartPos; + private GenomeLoc loc; + private int eventStartPos; private int eventStopPos; private EVENT_TYPE type; private ArrayList pointEvents = new ArrayList(); @@ -332,6 +415,10 @@ public class RealignerTargetCreator extends RodWalker= 0 && eventStopPos - eventStartPos < maxIntervalSize; } - public String toString() { - return String.format("%s:%d-%d", loc.getContig(), eventStartPos, eventStopPos); + public GenomeLoc getLoc() { + return getToolkit().getGenomeLocParser().createGenomeLoc(loc.getContig(), eventStartPos, eventStopPos); } 
} } \ No newline at end of file diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/indels/SomaticIndelDetectorWalker.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/indels/SomaticIndelDetectorWalker.java index 8bba8eac2..414ffa09c 100644 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/indels/SomaticIndelDetectorWalker.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/indels/SomaticIndelDetectorWalker.java @@ -26,22 +26,16 @@ package org.broadinstitute.sting.gatk.walkers.indels; import net.sf.samtools.*; -import org.broadinstitute.sting.commandline.Argument; -import org.broadinstitute.sting.commandline.Hidden; -import org.broadinstitute.sting.commandline.Output; -import org.broadinstitute.sting.commandline.Tags; +import org.broad.tribble.Feature; +import org.broadinstitute.sting.commandline.*; import org.broadinstitute.sting.gatk.contexts.ReferenceContext; import org.broadinstitute.sting.gatk.datasources.reads.SAMReaderID; import org.broadinstitute.sting.gatk.datasources.reference.ReferenceDataSource; import org.broadinstitute.sting.gatk.filters.MappingQualityZeroFilter; import org.broadinstitute.sting.gatk.filters.Platform454Filter; import org.broadinstitute.sting.gatk.filters.PlatformUnitFilter; -import org.broadinstitute.sting.gatk.filters.PlatformUnitFilterHelper; import org.broadinstitute.sting.gatk.refdata.ReadMetaDataTracker; import org.broadinstitute.sting.gatk.refdata.SeekableRODIterator; -import org.broadinstitute.sting.utils.codecs.refseq.Transcript; -import org.broadinstitute.sting.utils.codecs.refseq.RefSeqCodec; -import org.broadinstitute.sting.utils.codecs.refseq.RefSeqFeature; import org.broadinstitute.sting.gatk.refdata.tracks.RMDTrack; import org.broadinstitute.sting.gatk.refdata.tracks.RMDTrackBuilder; import org.broadinstitute.sting.gatk.refdata.utils.LocationAwareSeekableRODIterator; @@ -51,16 +45,19 @@ import org.broadinstitute.sting.gatk.walkers.ReadWalker; import 
org.broadinstitute.sting.utils.GenomeLoc; import org.broadinstitute.sting.utils.GenomeLocSortedSet; import org.broadinstitute.sting.utils.SampleUtils; +import org.broadinstitute.sting.utils.codecs.refseq.RefSeqCodec; +import org.broadinstitute.sting.utils.codecs.refseq.RefSeqFeature; +import org.broadinstitute.sting.utils.codecs.refseq.Transcript; import org.broadinstitute.sting.utils.codecs.vcf.*; import org.broadinstitute.sting.utils.collections.CircularArray; import org.broadinstitute.sting.utils.collections.PrimitivePair; import org.broadinstitute.sting.utils.exceptions.StingException; import org.broadinstitute.sting.utils.exceptions.UserException; -import org.broadinstitute.sting.utils.interval.IntervalFileMergingIterator; import org.broadinstitute.sting.utils.interval.IntervalMergingRule; import org.broadinstitute.sting.utils.interval.IntervalUtils; import org.broadinstitute.sting.utils.interval.OverlappingIntervalIterator; import org.broadinstitute.sting.utils.sam.AlignmentUtils; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; import org.broadinstitute.sting.utils.variantcontext.Allele; import org.broadinstitute.sting.utils.variantcontext.Genotype; import org.broadinstitute.sting.utils.variantcontext.VariantContext; @@ -134,17 +131,9 @@ public class SomaticIndelDetectorWalker extends ReadWalker { // boolean FORMAT_VCF = false; @Hidden - @Argument(fullName = "genotype_intervals", shortName = "genotype", + @Input(fullName = "genotype_intervals", shortName = "genotype", doc = "Calls will be made at each position within the specified interval(s), whether there is an indel or not", required = false) - public String genotypeIntervalsFile = null; - - @Hidden - @Argument(fullName="genotypeIntervalsAreNotSorted", shortName="giNotSorted", required=false, - doc="This tool assumes that the genotyping interval list (--genotype_intervals) is sorted; "+ - "if the list turns out to be unsorted, it will throw an exception. 
"+ - "Use this argument when your interval list is not sorted to instruct the IndelGenotyper "+ - "to sort and keep it in memory (increases memory usage!).") - protected boolean GENOTYPE_NOT_SORTED = false; + public IntervalBinding genotypeIntervalsFile = null; @Hidden @Argument(fullName="unpaired", shortName="unpaired", @@ -265,7 +254,7 @@ public class SomaticIndelDetectorWalker extends ReadWalker { Set headerInfo = new HashSet(); // first, the basic info - headerInfo.add(new VCFHeaderLine("source", "IndelGenotyperV2")); + headerInfo.add(new VCFHeaderLine("source", "SomaticIndelDetector")); headerInfo.add(new VCFHeaderLine("reference", getToolkit().getArguments().referenceFile.getName())); // FORMAT and INFO fields @@ -283,10 +272,10 @@ public class SomaticIndelDetectorWalker extends ReadWalker { args.addAll(getToolkit().getFilters()); Map commandLineArgs = getToolkit().getApproximateCommandLineArguments(args); for ( Map.Entry commandLineArg : commandLineArgs.entrySet() ) - headerInfo.add(new VCFHeaderLine(String.format("IGv2_%s", commandLineArg.getKey()), commandLineArg.getValue())); + headerInfo.add(new VCFHeaderLine(String.format("SID_%s", commandLineArg.getKey()), commandLineArg.getValue())); // also, the list of input bams for ( String fileName : getToolkit().getArguments().samFiles ) - headerInfo.add(new VCFHeaderLine("IGv2_bam_file_used", fileName)); + headerInfo.add(new VCFHeaderLine("SID_bam_file_used", fileName)); return headerInfo; } @@ -366,16 +355,9 @@ public class SomaticIndelDetectorWalker extends ReadWalker { } if ( genotypeIntervalsFile != null ) { - if ( ! GENOTYPE_NOT_SORTED && IntervalUtils.isIntervalFile(genotypeIntervalsFile)) { - // prepare to read intervals one-by-one, as needed (assuming they are sorted). 
- genotypeIntervalIterator = new IntervalFileMergingIterator(getToolkit().getGenomeLocParser(), - new java.io.File(genotypeIntervalsFile), IntervalMergingRule.OVERLAPPING_ONLY ); - } else { - // read in the whole list of intervals for cleaning - GenomeLocSortedSet locs = IntervalUtils.sortAndMergeIntervals(getToolkit().getGenomeLocParser(), - IntervalUtils.parseIntervalArguments(getToolkit().getGenomeLocParser(),Arrays.asList(genotypeIntervalsFile),true), IntervalMergingRule.OVERLAPPING_ONLY); - genotypeIntervalIterator = locs.iterator(); - } + // read in the whole list of intervals for cleaning + GenomeLocSortedSet locs = IntervalUtils.sortAndMergeIntervals(getToolkit().getGenomeLocParser(), genotypeIntervalsFile.getIntervals(getToolkit()), IntervalMergingRule.OVERLAPPING_ONLY); + genotypeIntervalIterator = locs.iterator(); // wrap intervals requested for genotyping inside overlapping iterator, so that we actually // genotype only on the intersections of the requested intervals with the -L intervals @@ -392,7 +374,7 @@ public class SomaticIndelDetectorWalker extends ReadWalker { location = getToolkit().getGenomeLocParser().createGenomeLoc(getToolkit().getSAMFileHeader().getSequence(0).getSequenceName(),1); - normalSamples = getToolkit().getSamplesByReaders().get(0); + normalSamples = SampleUtils.getSAMFileSamples(getToolkit().getSAMFileHeaders().get(0)); try { // we already checked that bedOutput and output_file are not set simultaneously @@ -413,7 +395,7 @@ public class SomaticIndelDetectorWalker extends ReadWalker { @Override - public Integer map(ReferenceContext ref, SAMRecord read, ReadMetaDataTracker metaDataTracker) { + public Integer map(ReferenceContext ref, GATKSAMRecord read, ReadMetaDataTracker metaDataTracker) { // if ( read.getReadName().equals("428EFAAXX090610:2:36:1384:639#0") ) System.out.println("GOT READ"); diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/phasing/PhasingRead.java 
b/public/java/src/org/broadinstitute/sting/gatk/walkers/phasing/PhasingRead.java index a56c9e21e..63fb33295 100644 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/phasing/PhasingRead.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/phasing/PhasingRead.java @@ -37,7 +37,7 @@ public class PhasingRead extends BaseArray { public PhasingRead(int length, int mappingQual) { super(length); - this.mappingProb = new PreciseNonNegativeDouble(QualityUtils.qualToProb(mappingQual)); + this.mappingProb = new PreciseNonNegativeDouble(QualityUtils.qualToProb((byte)mappingQual)); this.baseProbs = new PreciseNonNegativeDouble[length]; Arrays.fill(this.baseProbs, null); diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/phasing/ReadBackedPhasingWalker.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/phasing/ReadBackedPhasingWalker.java index 17a6e20f1..68fbe8ce2 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/phasing/ReadBackedPhasingWalker.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/phasing/ReadBackedPhasingWalker.java @@ -30,7 +30,6 @@ import org.broadinstitute.sting.commandline.Output; import org.broadinstitute.sting.gatk.arguments.StandardVariantContextInputArgumentCollection; import org.broadinstitute.sting.gatk.contexts.AlignmentContext; import org.broadinstitute.sting.gatk.contexts.ReferenceContext; -import org.broadinstitute.sting.gatk.datasources.sample.Sample; import org.broadinstitute.sting.gatk.filters.MappingQualityZeroFilter; import org.broadinstitute.sting.gatk.refdata.RefMetaDataTracker; import org.broadinstitute.sting.gatk.walkers.*; @@ -76,9 +75,8 @@ import static org.broadinstitute.sting.utils.codecs.vcf.VCFUtils.getVCFHeadersFr * -T ReadBackedPhasing * -R reference.fasta * -I reads.bam - * --variant:vcf SNPs.vcf - * -BTI variant - * -BTIMR INTERSECTION + * --variant SNPs.vcf + * -L SNPs.vcf * -o phased_SNPs.vcf * --phaseQualityThresh 20.0 * @@ -260,10 +258,10 @@ public 
class ReadBackedPhasingWalker extends RodWalker entriesToNames = new HashMap(); - Integer numRecords = vc.getAttributeAsIntegerNoException(NUM_RECORDS_KEY); - if (numRecords != null) { + int numRecords = vc.getAttributeAsInt(NUM_RECORDS_KEY, -1); + if (numRecords != -1) { boolean done = false; if (numRecords == 1) { // Check if perhaps the single record doesn't end with "_1": - String name = vc.getAttributeAsStringNoException(nameKeyToUse); + String name = vc.getAttributeAsString(nameKeyToUse, null); if (name != null) { entriesToNames.put(nameKeyToUse, name); done = true; @@ -59,14 +59,14 @@ public class RefSeqDataParser { if (!done) { for (int i = 1; i <= numRecords; i++) { String key = nameKeyToUseMultiplePrefix + i; - String name = vc.getAttributeAsStringNoException(key); + String name = vc.getAttributeAsString(key, null); if (name != null) entriesToNames.put(key, name); } } } else { // no entry with the # of records: - String name = vc.getAttributeAsStringNoException(nameKeyToUse); + String name = vc.getAttributeAsString(nameKeyToUse, null); if (name != null) { entriesToNames.put(nameKeyToUse, name); } diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/qc/CountMalesWalker.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/qc/CountMalesWalker.java new file mode 100644 index 000000000..dbbd8e761 --- /dev/null +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/qc/CountMalesWalker.java @@ -0,0 +1,53 @@ +/* + * Copyright (c) 2011, The Broad Institute + * + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The above 
copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * OTHER DEALINGS IN THE SOFTWARE. + */ + +package org.broadinstitute.sting.gatk.walkers.qc; + +import org.broadinstitute.sting.gatk.contexts.ReferenceContext; +import org.broadinstitute.sting.gatk.refdata.ReadMetaDataTracker; +import org.broadinstitute.sting.gatk.samples.Gender; +import org.broadinstitute.sting.gatk.samples.Sample; +import org.broadinstitute.sting.gatk.walkers.DataSource; +import org.broadinstitute.sting.gatk.walkers.ReadWalker; +import org.broadinstitute.sting.gatk.walkers.Requires; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; + +/** + * Walks over the input data set, calculating the number of reads seen for diagnostic purposes. + * Can also count the number of reads matching a given criterion using read filters (see the + * --read-filter command line argument). Simplest example of a read-backed analysis. + */ +@Requires({DataSource.READS, DataSource.REFERENCE}) +public class CountMalesWalker extends ReadWalker { + public Integer map(ReferenceContext ref, GATKSAMRecord read, ReadMetaDataTracker tracker) { + Sample sample = getSampleDB().getSample(read); + return sample.getGender() == Gender.MALE ? 
1 : 0; + } + + public Integer reduceInit() { return 0; } + + public Integer reduce(Integer value, Integer sum) { + return value + sum; + } +} \ No newline at end of file diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/qc/CountReadsWalker.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/qc/CountReadsWalker.java index 9ce9c4eec..b5a2d183f 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/qc/CountReadsWalker.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/qc/CountReadsWalker.java @@ -1,11 +1,11 @@ package org.broadinstitute.sting.gatk.walkers.qc; -import net.sf.samtools.SAMRecord; import org.broadinstitute.sting.gatk.contexts.ReferenceContext; import org.broadinstitute.sting.gatk.refdata.ReadMetaDataTracker; import org.broadinstitute.sting.gatk.walkers.DataSource; import org.broadinstitute.sting.gatk.walkers.ReadWalker; import org.broadinstitute.sting.gatk.walkers.Requires; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; /** * Walks over the input data set, calculating the number of reads seen for diagnostic purposes. 
@@ -38,7 +38,7 @@ import org.broadinstitute.sting.gatk.walkers.Requires; */ @Requires({DataSource.READS, DataSource.REFERENCE}) public class CountReadsWalker extends ReadWalker { - public Integer map(ReferenceContext ref, SAMRecord read, ReadMetaDataTracker tracker) { + public Integer map(ReferenceContext ref, GATKSAMRecord read, ReadMetaDataTracker tracker) { return 1; } diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/qc/CycleQualityWalker.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/qc/CycleQualityWalker.java index b5f5442cd..1cb1579d0 100644 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/qc/CycleQualityWalker.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/qc/CycleQualityWalker.java @@ -1,434 +1,434 @@ -/* - * Copyright (c) 2010 The Broad Institute - * - * Permission is hereby granted, free of charge, to any person - * obtaining a copy of this software and associated documentation - * files (the "Software"), to deal in the Software without - * restriction, including without limitation the rights to use, - * copy, modify, merge, publish, distribute, sublicense, and/or sell - * copies of the Software, and to permit persons to whom the - * Software is furnished to do so, subject to the following - * conditions: - * - * The above copyright notice and this permission notice shall be - * included in all copies or substantial portions of the Software. - * - * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, - * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES - * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND - * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT - * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, - * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING - * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR - * OTHER DEALINGS IN THE SOFTWARE. 
- */ - -package org.broadinstitute.sting.gatk.walkers.qc; - -import net.sf.samtools.SAMReadGroupRecord; -import net.sf.samtools.SAMRecord; -import org.broadinstitute.sting.commandline.Argument; -import org.broadinstitute.sting.commandline.Output; -import org.broadinstitute.sting.gatk.contexts.ReferenceContext; -import org.broadinstitute.sting.gatk.refdata.ReadMetaDataTracker; -import org.broadinstitute.sting.gatk.walkers.DataSource; -import org.broadinstitute.sting.gatk.walkers.ReadWalker; -import org.broadinstitute.sting.gatk.walkers.Requires; -import org.broadinstitute.sting.utils.collections.PrimitivePair; -import org.broadinstitute.sting.utils.exceptions.ReviewedStingException; -import org.broadinstitute.sting.utils.exceptions.UserException; -import org.broadinstitute.sting.utils.sam.AlignmentUtils; - -import java.io.*; -import java.util.*; - -/** - * Created by IntelliJ IDEA. - * User: asivache - * Date: Apr 9, 2010 - * Time: 12:16:41 PM - * To change this template use File | Settings | File Templates. - */ - -/** - * Walks over the input data set, calculating the number of reads seen for diagnostic purposes. - * Can also count the number of reads matching a given criterion using read filters (see the - * --read-filter command line argument). Simplest example of a read-backed analysis. 
- */ -@Requires({DataSource.READS}) -public class CycleQualityWalker extends ReadWalker { - @Output - protected PrintStream out; - - @Argument(fullName="mappedOnly", shortName="mo", doc="when this flag is set (default), statistics will be collected "+ - "on mapped reads only, while unmapped reads will be discarded", required=false) - protected boolean MAPPED_ONLY = true; - @Argument(fullName="maxReadLength", shortName="rl", doc="maximum read length", required=false) - protected int MAX_READ_LENGTH = 500; - @Argument(fullName="out_prefix",shortName="p",doc="prefix for output report and statistics files",required=true) - protected String PREFIX = null; -// @Argument(fullName="html",shortName="html",doc="produce html-formatted output (starting with h3-level tags) rather than plain text",required=false) - protected boolean HTML = false; - @Argument(fullName="qualThreshold", shortName="Q",doc="flag as problematic all cycles with av. qualities below the threshold (applies only to the generated report)",required=false) - protected double QTHRESHOLD = 10.0; - @Argument(fullName="useBothQualities",shortName="bothQ",required=false,doc="Generate statistics both for currently set and for "+ - "original base qualities (OQ tag, must be present in the bam); two separate data files will be generated.") - protected boolean ASSESS_BOTH_QUALS = false; - - private Map cyclesByLaneMap = null; - private Map cyclesByLibraryMap = null; - private Map cyclesByLaneMapOrig = null; - private Map cyclesByLibraryMapOrig = null; - - public void initialize() { - if ( PREFIX == null ) throw new ReviewedStingException("Prefix for output file(s) must be specified"); - cyclesByLaneMap = new HashMap(); - cyclesByLibraryMap = new HashMap(); - cyclesByLaneMapOrig = new HashMap(); - cyclesByLibraryMapOrig = new HashMap(); - } - - - public Integer map(ReferenceContext ref, SAMRecord read, ReadMetaDataTracker metaDataTracker) { - - if ( AlignmentUtils.isReadUnmapped(read) ) return 0; - - SAMReadGroupRecord 
rg = read.getReadGroup(); - - if ( rg == null ) throw new UserException.ReadMissingReadGroup(read); - - String lane = read.getReadGroup().getPlatformUnit(); - String library = read.getReadGroup().getLibrary(); - - if ( lane == null ) throw new UserException.MalformedBAM(read, "Read "+read.getReadName()+" has no platform unit information"); - if ( library == null ) throw new UserException.MalformedBAM(read, "Read "+read.getReadName()+" has no library information"); - - int end = 0; - - if ( read.getReadPairedFlag() ) { - - if ( read.getFirstOfPairFlag() ) { - if ( read.getSecondOfPairFlag() ) - throw new UserException.MalformedBAM(read, "Read "+read.getReadName()+" has conflicting first/second in pair attributes"); - end = 1; - } else { - if ( ! read.getSecondOfPairFlag() ) - throw new UserException.MalformedBAM(read, "Read "+read.getReadName()+" has conflicting first/second in pair attributes"); - end = 2; - } - } - - CycleStats[] byLane = cyclesByLaneMap.get(lane); - CycleStats[] byLib = cyclesByLibraryMap.get(library); - - //byte [] quals = USE_ORIGINAL_QUALS ? AlignmentUtils.getOriginalQualsInCycleOrder(read) : AlignmentUtils.getQualsInCycleOrder(read); - - byte [] quals = AlignmentUtils.getQualsInCycleOrder(read); - - // if end == 0 (single end lane), we allocate array of length 1, otherwise we need two - // elements in the array in order to be able to collect statistics for each end in the pair independently - if ( byLane == null ) cyclesByLaneMap.put(lane,byLane = new CycleStats[(end==0?1:2)]); - if ( byLib == null ) cyclesByLibraryMap.put(library, byLib =new CycleStats[2]); - - if ( end != 0 ) end--; // we will now use 'end' as index into the array of stats - - if ( byLane[end] == null ) byLane[end] = new CycleStats(MAX_READ_LENGTH); - if ( byLib[end] == null ) byLib[end] =new CycleStats(MAX_READ_LENGTH); - byLane[end].add(quals); - byLib[end].add(quals); - - return 1; //To change body of implemented methods use File | Settings | File Templates. 
- } - - /** - * Provide an initial value for reduce computations. - * - * @return Initial value of reduce. - */ - public Integer reduceInit() { - return 0; //To change body of implemented methods use File | Settings | File Templates. - } - - /** - * Reduces a single map with the accumulator provided as the ReduceType. - * - * @param value result of the map. - * @param sum accumulator for the reduce. - * @return accumulator with result of the map taken into account. - */ - public Integer reduce(Integer value, Integer sum) { - return sum.intValue()+value.intValue(); //To change body of implemented methods use File | Settings | File Templates. - } - - public void onTraversalDone(Integer result) { - if ( HTML ) { - out.println("

Cycle Quality QC

\n"); - out.println("File(s) analyzed:
"); - for ( String fileName : getToolkit().getArguments().samFiles) out.println(fileName+"
"); - out.println("
"); - } - if ( HTML ) out.println("

"); - out.println("\n"+result+" reads analyzed\n"); - if ( HTML ) out.println("

"); - out.println("by platform unit:"); - if ( HTML ) out.println("
"); - report2(cyclesByLaneMap, new File(PREFIX+".byLane.txt"),true); - out.println(); - if ( HTML ) out.println("

"); - out.println("\nby library:"); - if ( HTML ) out.println("
"); - report2(cyclesByLibraryMap, new File(PREFIX+".byLibrary.txt"),true); - out.println(); - if ( HTML ) out.println("

"); - } - - - - private void report2(Map m, File f,boolean summaryReport) { - long totalReads_1 =0; - long totalReads_2 =0; - long totalReads_unpaired = 0; - SortedSet columns = new TreeSet(); - int maxLength = 0; // maximum read length across all lanes/read ends analyzed - - for( Map.Entry e : m.entrySet() ) { - if ( e.getValue()[0].getMaxReadLength() > maxLength ) maxLength = e.getValue()[0].getMaxReadLength(); - - if ( e.getValue().length == 1 || e.getValue().length == 2 && e.getValue()[1] == null ) { - totalReads_unpaired += e.getValue()[0].getReadCount(); // single end lane - } else { - totalReads_1 += e.getValue()[0].getReadCount(); - totalReads_2 += e.getValue()[1].getReadCount(); - if ( e.getValue()[1].getMaxReadLength() > maxLength ) maxLength = e.getValue()[1].getMaxReadLength(); - } - - columns.add(e.getKey()); - } - - if ( summaryReport ) { - if ( totalReads_1 == 0 && totalReads_2 != 0) { - out.println(" End 1: No reads"); - if ( HTML ) out.println("
"); - } - if ( totalReads_2 == 0 && totalReads_1 != 0 ) { - out.println(" End 2: No reads"); - if ( HTML ) out.println("
"); - } - if ( totalReads_1 == 0 && totalReads_2 == 0 && totalReads_unpaired == 0 ) { - out.println(" No reads found."); - if ( HTML ) out.println("
"); - } - } - - if ( totalReads_1 == 0 && totalReads_2 == 0 && totalReads_unpaired == 0 ) return; - - try { - BufferedWriter w = new BufferedWriter(new FileWriter(f)); - - w.write("cycle"); - - for( String col : columns ) { - CycleStats[] data = m.get(col); - if ( summaryReport ) { - out.print(" "); - out.print(col); - } - - CycleStats end1 = data[0]; - int minL = ( end1 == null ? 0 : end1.getMinReadLength() ); - int maxL = ( end1 == null ? 0 : end1.getMaxReadLength() ); - - if ( data.length == 2 && data[1] != null ) { - if ( summaryReport ) { - out.println(": paired"); - if ( HTML ) out.println("
"); - out.println(" Reads analyzed:"); - if ( HTML ) out.println("
"); - } - CycleStats end2 = data[1]; - - out.print( " End 1: "+ ( end1 == null ? 0 : end1.getReadCount()) ); - if ( minL == maxL ) out.println("; read length = "+minL); - else out.println("; WARNING: variable read length = "+minL+"-"+maxL); - if ( HTML ) out.println("
"); - - out.print( " End 2: "+ ( end2 == null ? 0 : end2.getReadCount()) ); - minL = ( end2 == null ? 0 : end2.getMinReadLength() ); - maxL = ( end2 == null ? 0 : end2.getMaxReadLength() ); - if ( minL == maxL ) out.println("; read length = "+minL); - else out.println("; WARNING: variable read length = "+minL+"-"+maxL); - if ( HTML ) out.println("
"); - } - else { - out.println(": unpaired"); - if ( HTML ) out.println("
"); - out.print( " Reads analyzed: "+ ( end1 == null ? 0 : end1.getReadCount()) ); - if ( minL == maxL ) out.println("; read length = "+minL); - else out.println("; WARNING: variable read length = "+minL+"-"+maxL); - if ( HTML ) out.println("
"); - } - - w.write('\t') ; - w.write(col); - if ( data.length == 1 || data.length == 2 && data[1] == null ) { - w.write(".unpaired"); - w.write('\t'); - w.write(col); - w.write(".unpaired.stddev"); - } else { - w.write(".end1"); - w.write('\t'); - w.write(col); - w.write(".end1.stddev"); - w.write('\t') ; - w.write(col); - w.write(".end2"); - w.write('\t'); - w.write(col); - w.write(".end2.stddev"); - } - } - - w.write('\n'); - - int cycle = 0; - - Map> problems = new HashMap>(); - - while ( cycle < maxLength ) { - w.write(Integer.toString(cycle+1)); - for ( String col : columns ) { - - CycleStats[] data = m.get(col); - CycleStats end1 = data[0]; - w.write('\t'); - if ( end1 == null || cycle >= end1.getMaxReadLength() ) w.write(".\t."); - else { - double aq = end1.getCycleQualAverage(cycle); - w.write(String.format("%.4f\t%.4f",aq,end1.getCycleQualStdDev(cycle))); - recordProblem(aq,cycle, problems,col+".End1"); - } - if ( data.length > 1 && data[1] != null ) { - w.write('\t'); - CycleStats end2 = data[1]; - if ( end2 == null || cycle >= end2.getMaxReadLength() ) w.write(".\t."); - else { - double aq = end2.getCycleQualAverage(cycle); - w.write(String.format("%.4f\t%.4f",aq,end2.getCycleQualStdDev(cycle))); - recordProblem(aq,cycle, problems,col+".End2"); - } - } - } - w.write('\n'); - cycle++; - } - w.close(); - - if ( HTML ) out.println("
"); - - if ( HTML ) out.println("
"); - out.println("\nOUTCOME (threshold at Q="+QTHRESHOLD+"):"); - if ( HTML ) out.println("
"); - for ( String col : columns ) { - List lp = problems.get(col+".End1"); - out.print(" "+col+" End1:"); - if ( lp == null ) { - out.print(" GOOD"); - } else { - for ( PrimitivePair.Int p : lp ) { - out.print(" "+(p.first+1)+"-"); - if ( p.second >= 0 ) out.print((p.second+1)); - else out.print("END"); - } - } - out.println(); - if ( HTML ) out.println("
"); - - lp = problems.get(col+".End2"); - out.print(" "+col+" End2:"); - if ( lp == null ) { - out.print(" GOOD"); - } else { - for ( PrimitivePair.Int p : lp ) { - out.print(" "+(p.first+1)+"-"); - if ( p.second >= 0 ) out.print(p.second); - else out.print("END"); - } - } - out.println(); - if ( HTML ) out.println("
"); - } - - } catch (IOException ioe) { - throw new UserException.CouldNotCreateOutputFile(f, "Failed to write report", ioe); - } - } - - - private void recordProblem(double q, int cycle, Map> problems, String name) { - - PrimitivePair.Int p = null; - List lp = null; - if ( q < QTHRESHOLD ) { // there is a problem - if ( ! problems.containsKey(name) ) { - lp = new ArrayList(); - p = new PrimitivePair.Int(cycle,-1); - lp.add(p); - problems.put(name,lp); - } else { - lp = problems.get(name); - p = lp.get(lp.size()-1); - } - if ( p.second != -1 ) { // if we are not already inside a run of bad qual bases - lp.add(new PrimitivePair.Int(cycle,-1)); // start new run - } - } else { // good base - if ( problems.containsKey(name) ) { // only if we had problem intervals at all, we need to check if the last one needs to be closed - lp = problems.get(name); - p = lp.get(lp.size()-1); - if ( p.second == -1 ) p.second = cycle - 1; - } - } - } - - - static class CycleStats { - private long readCount = 0; - private double[] cycleQualsAv = null; - private double[] cycleQualsSd = null; - private int minL = 1000000000; // read min. length - private int maxL = 0; // read max. length - - public CycleStats(int N) { - readCount = 0; - cycleQualsAv = new double[N]; - cycleQualsSd = new double[N]; - } - - public void add(byte[] quals) { - if ( quals.length > cycleQualsAv.length ) - throw new UserException("A read of length "+quals.length+" encountered, which exceeds specified maximum read length"); - if ( quals.length > maxL ) maxL = quals.length; - if ( quals.length < minL ) minL = quals.length; - readCount++; - for ( int i = 0 ; i < quals.length ; i++ ) { - // NOTE: in the update equaltions below, there is no need to check if readCount == 1 (i.e. - // we are initializing with the very first record) or not. 
Indeed, the arrays are initialized with - // 0; when the very first value arrives, readCount is 1 and cycleQuals[i] gets set to quals[i] (correct!); - // this will also make the second term in the update equation for Sd (quals[i]-cycleQualsAv[i]) equal - // to 0, so Sd will be initially set to 0. - double oldAvg = cycleQualsAv[i]; // save old mean, will need it for calculation of the variance - cycleQualsAv[i] += ( quals[i] - cycleQualsAv[i] ) / readCount; // update mean - cycleQualsSd[i] += ( quals[i] - oldAvg ) * ( quals[i] - cycleQualsAv[i] ); - } - } - - public long getReadCount() { return readCount; } - public int getMaxReadLength() { return maxL; } - public int getMinReadLength() { return minL; } -// long [] getCycleQualSums() { return cycleQuals; } -// long getCycleQualSum(int i) { return cycleQuals[i]; } - double getCycleQualAverage(int i) { return cycleQualsAv[i]; } - double getCycleQualStdDev(int i) { return Math.sqrt( cycleQualsSd[i]/(readCount-1) ); } - } -} +/* + * Copyright (c) 2010 The Broad Institute + * + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The above copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. + * + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. 
IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * OTHER DEALINGS IN THE SOFTWARE. + */ + +package org.broadinstitute.sting.gatk.walkers.qc; + +import net.sf.samtools.SAMReadGroupRecord; +import org.broadinstitute.sting.commandline.Argument; +import org.broadinstitute.sting.commandline.Output; +import org.broadinstitute.sting.gatk.contexts.ReferenceContext; +import org.broadinstitute.sting.gatk.refdata.ReadMetaDataTracker; +import org.broadinstitute.sting.gatk.walkers.DataSource; +import org.broadinstitute.sting.gatk.walkers.ReadWalker; +import org.broadinstitute.sting.gatk.walkers.Requires; +import org.broadinstitute.sting.utils.collections.PrimitivePair; +import org.broadinstitute.sting.utils.exceptions.ReviewedStingException; +import org.broadinstitute.sting.utils.exceptions.UserException; +import org.broadinstitute.sting.utils.sam.AlignmentUtils; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; + +import java.io.*; +import java.util.*; + +/** + * Created by IntelliJ IDEA. + * User: asivache + * Date: Apr 9, 2010 + * Time: 12:16:41 PM + * To change this template use File | Settings | File Templates. + */ + +/** + * Walks over the input data set, calculating the number of reads seen for diagnostic purposes. + * Can also count the number of reads matching a given criterion using read filters (see the + * --read-filter command line argument). Simplest example of a read-backed analysis. 
+ */ +@Requires({DataSource.READS}) +public class CycleQualityWalker extends ReadWalker { + @Output + protected PrintStream out; + + @Argument(fullName="mappedOnly", shortName="mo", doc="when this flag is set (default), statistics will be collected "+ + "on mapped reads only, while unmapped reads will be discarded", required=false) + protected boolean MAPPED_ONLY = true; + @Argument(fullName="maxReadLength", shortName="rl", doc="maximum read length", required=false) + protected int MAX_READ_LENGTH = 500; + @Argument(fullName="out_prefix",shortName="p",doc="prefix for output report and statistics files",required=true) + protected String PREFIX = null; +// @Argument(fullName="html",shortName="html",doc="produce html-formatted output (starting with h3-level tags) rather than plain text",required=false) + protected boolean HTML = false; + @Argument(fullName="qualThreshold", shortName="Q",doc="flag as problematic all cycles with av. qualities below the threshold (applies only to the generated report)",required=false) + protected double QTHRESHOLD = 10.0; + @Argument(fullName="useBothQualities",shortName="bothQ",required=false,doc="Generate statistics both for currently set and for "+ + "original base qualities (OQ tag, must be present in the bam); two separate data files will be generated.") + protected boolean ASSESS_BOTH_QUALS = false; + + private Map cyclesByLaneMap = null; + private Map cyclesByLibraryMap = null; + private Map cyclesByLaneMapOrig = null; + private Map cyclesByLibraryMapOrig = null; + + public void initialize() { + if ( PREFIX == null ) throw new ReviewedStingException("Prefix for output file(s) must be specified"); + cyclesByLaneMap = new HashMap(); + cyclesByLibraryMap = new HashMap(); + cyclesByLaneMapOrig = new HashMap(); + cyclesByLibraryMapOrig = new HashMap(); + } + + + public Integer map(ReferenceContext ref, GATKSAMRecord read, ReadMetaDataTracker metaDataTracker) { + + if ( AlignmentUtils.isReadUnmapped(read) ) return 0; + + 
SAMReadGroupRecord rg = read.getReadGroup(); + + if ( rg == null ) throw new UserException.ReadMissingReadGroup(read); + + String lane = read.getReadGroup().getPlatformUnit(); + String library = read.getReadGroup().getLibrary(); + + if ( lane == null ) throw new UserException.MalformedBAM(read, "Read "+read.getReadName()+" has no platform unit information"); + if ( library == null ) throw new UserException.MalformedBAM(read, "Read "+read.getReadName()+" has no library information"); + + int end = 0; + + if ( read.getReadPairedFlag() ) { + + if ( read.getFirstOfPairFlag() ) { + if ( read.getSecondOfPairFlag() ) + throw new UserException.MalformedBAM(read, "Read "+read.getReadName()+" has conflicting first/second in pair attributes"); + end = 1; + } else { + if ( ! read.getSecondOfPairFlag() ) + throw new UserException.MalformedBAM(read, "Read "+read.getReadName()+" has conflicting first/second in pair attributes"); + end = 2; + } + } + + CycleStats[] byLane = cyclesByLaneMap.get(lane); + CycleStats[] byLib = cyclesByLibraryMap.get(library); + + //byte [] quals = USE_ORIGINAL_QUALS ? 
AlignmentUtils.getOriginalQualsInCycleOrder(read) : AlignmentUtils.getQualsInCycleOrder(read); + + byte [] quals = AlignmentUtils.getQualsInCycleOrder(read); + + // if end == 0 (single end lane), we allocate array of length 1, otherwise we need two + // elements in the array in order to be able to collect statistics for each end in the pair independently + if ( byLane == null ) cyclesByLaneMap.put(lane,byLane = new CycleStats[(end==0?1:2)]); + if ( byLib == null ) cyclesByLibraryMap.put(library, byLib =new CycleStats[2]); + + if ( end != 0 ) end--; // we will now use 'end' as index into the array of stats + + if ( byLane[end] == null ) byLane[end] = new CycleStats(MAX_READ_LENGTH); + if ( byLib[end] == null ) byLib[end] =new CycleStats(MAX_READ_LENGTH); + byLane[end].add(quals); + byLib[end].add(quals); + + return 1; //To change body of implemented methods use File | Settings | File Templates. + } + + /** + * Provide an initial value for reduce computations. + * + * @return Initial value of reduce. + */ + public Integer reduceInit() { + return 0; //To change body of implemented methods use File | Settings | File Templates. + } + + /** + * Reduces a single map with the accumulator provided as the ReduceType. + * + * @param value result of the map. + * @param sum accumulator for the reduce. + * @return accumulator with result of the map taken into account. + */ + public Integer reduce(Integer value, Integer sum) { + return sum.intValue()+value.intValue(); //To change body of implemented methods use File | Settings | File Templates. + } + + public void onTraversalDone(Integer result) { + if ( HTML ) { + out.println("

Cycle Quality QC

\n"); + out.println("File(s) analyzed:
"); + for ( String fileName : getToolkit().getArguments().samFiles) out.println(fileName+"
"); + out.println("
"); + } + if ( HTML ) out.println("

"); + out.println("\n"+result+" reads analyzed\n"); + if ( HTML ) out.println("

"); + out.println("by platform unit:"); + if ( HTML ) out.println("
"); + report2(cyclesByLaneMap, new File(PREFIX+".byLane.txt"),true); + out.println(); + if ( HTML ) out.println("

"); + out.println("\nby library:"); + if ( HTML ) out.println("
"); + report2(cyclesByLibraryMap, new File(PREFIX+".byLibrary.txt"),true); + out.println(); + if ( HTML ) out.println("

"); + } + + + + private void report2(Map m, File f,boolean summaryReport) { + long totalReads_1 =0; + long totalReads_2 =0; + long totalReads_unpaired = 0; + SortedSet columns = new TreeSet(); + int maxLength = 0; // maximum read length across all lanes/read ends analyzed + + for( Map.Entry e : m.entrySet() ) { + if ( e.getValue()[0].getMaxReadLength() > maxLength ) maxLength = e.getValue()[0].getMaxReadLength(); + + if ( e.getValue().length == 1 || e.getValue().length == 2 && e.getValue()[1] == null ) { + totalReads_unpaired += e.getValue()[0].getReadCount(); // single end lane + } else { + totalReads_1 += e.getValue()[0].getReadCount(); + totalReads_2 += e.getValue()[1].getReadCount(); + if ( e.getValue()[1].getMaxReadLength() > maxLength ) maxLength = e.getValue()[1].getMaxReadLength(); + } + + columns.add(e.getKey()); + } + + if ( summaryReport ) { + if ( totalReads_1 == 0 && totalReads_2 != 0) { + out.println(" End 1: No reads"); + if ( HTML ) out.println("
"); + } + if ( totalReads_2 == 0 && totalReads_1 != 0 ) { + out.println(" End 2: No reads"); + if ( HTML ) out.println("
"); + } + if ( totalReads_1 == 0 && totalReads_2 == 0 && totalReads_unpaired == 0 ) { + out.println(" No reads found."); + if ( HTML ) out.println("
"); + } + } + + if ( totalReads_1 == 0 && totalReads_2 == 0 && totalReads_unpaired == 0 ) return; + + try { + BufferedWriter w = new BufferedWriter(new FileWriter(f)); + + w.write("cycle"); + + for( String col : columns ) { + CycleStats[] data = m.get(col); + if ( summaryReport ) { + out.print(" "); + out.print(col); + } + + CycleStats end1 = data[0]; + int minL = ( end1 == null ? 0 : end1.getMinReadLength() ); + int maxL = ( end1 == null ? 0 : end1.getMaxReadLength() ); + + if ( data.length == 2 && data[1] != null ) { + if ( summaryReport ) { + out.println(": paired"); + if ( HTML ) out.println("
"); + out.println(" Reads analyzed:"); + if ( HTML ) out.println("
"); + } + CycleStats end2 = data[1]; + + out.print( " End 1: "+ ( end1 == null ? 0 : end1.getReadCount()) ); + if ( minL == maxL ) out.println("; read length = "+minL); + else out.println("; WARNING: variable read length = "+minL+"-"+maxL); + if ( HTML ) out.println("
"); + + out.print( " End 2: "+ ( end2 == null ? 0 : end2.getReadCount()) ); + minL = ( end2 == null ? 0 : end2.getMinReadLength() ); + maxL = ( end2 == null ? 0 : end2.getMaxReadLength() ); + if ( minL == maxL ) out.println("; read length = "+minL); + else out.println("; WARNING: variable read length = "+minL+"-"+maxL); + if ( HTML ) out.println("
"); + } + else { + out.println(": unpaired"); + if ( HTML ) out.println("
"); + out.print( " Reads analyzed: "+ ( end1 == null ? 0 : end1.getReadCount()) ); + if ( minL == maxL ) out.println("; read length = "+minL); + else out.println("; WARNING: variable read length = "+minL+"-"+maxL); + if ( HTML ) out.println("
"); + } + + w.write('\t') ; + w.write(col); + if ( data.length == 1 || data.length == 2 && data[1] == null ) { + w.write(".unpaired"); + w.write('\t'); + w.write(col); + w.write(".unpaired.stddev"); + } else { + w.write(".end1"); + w.write('\t'); + w.write(col); + w.write(".end1.stddev"); + w.write('\t') ; + w.write(col); + w.write(".end2"); + w.write('\t'); + w.write(col); + w.write(".end2.stddev"); + } + } + + w.write('\n'); + + int cycle = 0; + + Map> problems = new HashMap>(); + + while ( cycle < maxLength ) { + w.write(Integer.toString(cycle+1)); + for ( String col : columns ) { + + CycleStats[] data = m.get(col); + CycleStats end1 = data[0]; + w.write('\t'); + if ( end1 == null || cycle >= end1.getMaxReadLength() ) w.write(".\t."); + else { + double aq = end1.getCycleQualAverage(cycle); + w.write(String.format("%.4f\t%.4f",aq,end1.getCycleQualStdDev(cycle))); + recordProblem(aq,cycle, problems,col+".End1"); + } + if ( data.length > 1 && data[1] != null ) { + w.write('\t'); + CycleStats end2 = data[1]; + if ( end2 == null || cycle >= end2.getMaxReadLength() ) w.write(".\t."); + else { + double aq = end2.getCycleQualAverage(cycle); + w.write(String.format("%.4f\t%.4f",aq,end2.getCycleQualStdDev(cycle))); + recordProblem(aq,cycle, problems,col+".End2"); + } + } + } + w.write('\n'); + cycle++; + } + w.close(); + + if ( HTML ) out.println("
"); + + if ( HTML ) out.println("
"); + out.println("\nOUTCOME (threshold at Q="+QTHRESHOLD+"):"); + if ( HTML ) out.println("
"); + for ( String col : columns ) { + List lp = problems.get(col+".End1"); + out.print(" "+col+" End1:"); + if ( lp == null ) { + out.print(" GOOD"); + } else { + for ( PrimitivePair.Int p : lp ) { + out.print(" "+(p.first+1)+"-"); + if ( p.second >= 0 ) out.print((p.second+1)); + else out.print("END"); + } + } + out.println(); + if ( HTML ) out.println("
"); + + lp = problems.get(col+".End2"); + out.print(" "+col+" End2:"); + if ( lp == null ) { + out.print(" GOOD"); + } else { + for ( PrimitivePair.Int p : lp ) { + out.print(" "+(p.first+1)+"-"); + if ( p.second >= 0 ) out.print(p.second); + else out.print("END"); + } + } + out.println(); + if ( HTML ) out.println("
"); + } + + } catch (IOException ioe) { + throw new UserException.CouldNotCreateOutputFile(f, "Failed to write report", ioe); + } + } + + + private void recordProblem(double q, int cycle, Map> problems, String name) { + + PrimitivePair.Int p = null; + List lp = null; + if ( q < QTHRESHOLD ) { // there is a problem + if ( ! problems.containsKey(name) ) { + lp = new ArrayList(); + p = new PrimitivePair.Int(cycle,-1); + lp.add(p); + problems.put(name,lp); + } else { + lp = problems.get(name); + p = lp.get(lp.size()-1); + } + if ( p.second != -1 ) { // if we are not already inside a run of bad qual bases + lp.add(new PrimitivePair.Int(cycle,-1)); // start new run + } + } else { // good base + if ( problems.containsKey(name) ) { // only if we had problem intervals at all, we need to check if the last one needs to be closed + lp = problems.get(name); + p = lp.get(lp.size()-1); + if ( p.second == -1 ) p.second = cycle - 1; + } + } + } + + + static class CycleStats { + private long readCount = 0; + private double[] cycleQualsAv = null; + private double[] cycleQualsSd = null; + private int minL = 1000000000; // read min. length + private int maxL = 0; // read max. length + + public CycleStats(int N) { + readCount = 0; + cycleQualsAv = new double[N]; + cycleQualsSd = new double[N]; + } + + public void add(byte[] quals) { + if ( quals.length > cycleQualsAv.length ) + throw new UserException("A read of length "+quals.length+" encountered, which exceeds specified maximum read length"); + if ( quals.length > maxL ) maxL = quals.length; + if ( quals.length < minL ) minL = quals.length; + readCount++; + for ( int i = 0 ; i < quals.length ; i++ ) { + // NOTE: in the update equaltions below, there is no need to check if readCount == 1 (i.e. + // we are initializing with the very first record) or not. 
Indeed, the arrays are initialized with + // 0; when the very first value arrives, readCount is 1 and cycleQuals[i] gets set to quals[i] (correct!); + // this will also make the second term in the update equation for Sd (quals[i]-cycleQualsAv[i]) equal + // to 0, so Sd will be initially set to 0. + double oldAvg = cycleQualsAv[i]; // save old mean, will need it for calculation of the variance + cycleQualsAv[i] += ( quals[i] - cycleQualsAv[i] ) / readCount; // update mean + cycleQualsSd[i] += ( quals[i] - oldAvg ) * ( quals[i] - cycleQualsAv[i] ); + } + } + + public long getReadCount() { return readCount; } + public int getMaxReadLength() { return maxL; } + public int getMinReadLength() { return minL; } +// long [] getCycleQualSums() { return cycleQuals; } +// long getCycleQualSum(int i) { return cycleQuals[i]; } + double getCycleQualAverage(int i) { return cycleQualsAv[i]; } + double getCycleQualStdDev(int i) { return Math.sqrt( cycleQualsSd[i]/(readCount-1) ); } + } +} diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/qc/PrintLocusContextWalker.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/qc/PrintLocusContextWalker.java index d3b992cb5..ac0b3e7d5 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/qc/PrintLocusContextWalker.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/qc/PrintLocusContextWalker.java @@ -1,12 +1,12 @@ package org.broadinstitute.sting.gatk.walkers.qc; -import net.sf.samtools.SAMRecord; import org.broadinstitute.sting.commandline.Output; import org.broadinstitute.sting.gatk.contexts.AlignmentContext; import org.broadinstitute.sting.gatk.contexts.ReferenceContext; import org.broadinstitute.sting.gatk.refdata.RefMetaDataTracker; import org.broadinstitute.sting.gatk.walkers.LocusWalker; import org.broadinstitute.sting.gatk.walkers.TreeReducible; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; import java.io.PrintStream; import java.util.Arrays; @@ -40,7 +40,7 @@ public class 
PrintLocusContextWalker extends LocusWalker reads ) { + private String[] getReadNames( List reads ) { String[] readNames = new String[ reads.size() ]; for( int i = 0; i < reads.size(); i++ ) { readNames[i] = String.format("%nname = %s, start = %d, end = %d", reads.get(i).getReadName(), reads.get(i).getAlignmentStart(), reads.get(i).getAlignmentEnd()); diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/qc/ReadClippingStatsWalker.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/qc/ReadClippingStatsWalker.java index 908e389a8..27f9d7b6d 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/qc/ReadClippingStatsWalker.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/qc/ReadClippingStatsWalker.java @@ -1,142 +1,142 @@ -/* - * Copyright (c) 2009 The Broad Institute - * Permission is hereby granted, free of charge, to any person - * obtaining a copy of this software and associated documentation - * files (the "Software"), to deal in the Software without - * restriction, including without limitation the rights to use, - * copy, modify, merge, publish, distribute, sublicense, and/or sell - * copies of the Software, and to permit persons to whom the - * Software is furnished to do so, subject to the following - * conditions: - * The above copyright notice and this permission notice shall be - * included in all copies or substantial portions of the Software. - * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, - * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES - * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND - * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT - * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, - * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING - * * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR - * * OTHER DEALINGS IN THE SOFTWARE. 
- */ - -package org.broadinstitute.sting.gatk.walkers.qc; - -import net.sf.samtools.CigarElement; -import net.sf.samtools.CigarOperator; -import net.sf.samtools.SAMReadGroupRecord; -import net.sf.samtools.SAMRecord; -import org.broadinstitute.sting.commandline.Argument; -import org.broadinstitute.sting.commandline.Output; -import org.broadinstitute.sting.gatk.contexts.ReferenceContext; -import org.broadinstitute.sting.gatk.refdata.ReadMetaDataTracker; -import org.broadinstitute.sting.gatk.walkers.DataSource; -import org.broadinstitute.sting.gatk.walkers.ReadWalker; -import org.broadinstitute.sting.gatk.walkers.Requires; -import org.broadinstitute.sting.utils.MathUtils; -import org.broadinstitute.sting.utils.Utils; -import org.broadinstitute.sting.utils.exceptions.UserException; -import org.broadinstitute.sting.utils.sam.AlignmentUtils; - -import java.io.PrintStream; -import java.util.Arrays; - -/** - * User: depristo - * Date: May 5, 2010 - * Time: 12:16:41 PM - */ - -/** - * Walks over the input reads, printing out statistics about the read length, number of clipping events, and length - * of the clipping to the output stream. 
- */ -@Requires({DataSource.READS}) -public class ReadClippingStatsWalker extends ReadWalker { - @Output - protected PrintStream out; - - @Argument(fullName="mappedOnly", shortName="mo", doc="when this flag is set (default), statistics will be collected "+ - "on mapped reads only, while unmapped reads will be discarded", required=false) - protected boolean MAPPED_ONLY = true; - - @Argument(fullName="skip", shortName="skip", doc="When provided, only every skip reads are analyzed", required=false) - protected int SKIP = 1; - -// public void initialize() { -// -// } - - public class ReadClippingInfo { - SAMReadGroupRecord rg; - int readLength, nClippingEvents, nClippedBases; - } - - public ReadClippingInfo map(ReferenceContext ref, SAMRecord read, ReadMetaDataTracker metaDataTracker) { - if ( AlignmentUtils.isReadUnmapped(read) && MAPPED_ONLY) - return null; - - ReadClippingInfo info = new ReadClippingInfo(); - info.rg = read.getReadGroup(); - - if ( info.rg == null ) throw new UserException.ReadMissingReadGroup(read); - - for ( CigarElement elt : read.getCigar().getCigarElements() ) { - if ( elt.getOperator() != CigarOperator.N ) - - switch ( elt.getOperator()) { - case H : // ignore hard clips - case S : // soft clip - info.nClippingEvents++; - info.nClippedBases += elt.getLength(); - // note the fall through here - case M : - case D : // deletion w.r.t. the reference - case P : // ignore pads - case I : // insertion w.r.t. the reference - info.readLength += elt.getLength(); // Unless we have a reference skip, the read gets longer - break; - case N : // reference skip (looks and gets processed just like a "deletion", just different logical meaning) - break; - default : throw new IllegalStateException("Case statement didn't deal with cigar op: " + elt.getOperator()); - } - } - - return info; //To change body of implemented methods use File | Settings | File Templates. - } - - /** - * Provide an initial value for reduce computations. 
- * - * @return Initial value of reduce. - */ - public Integer reduceInit() { - out.println(Utils.join(" \t", Arrays.asList("ReadGroup", "ReadLength", "NClippingEvents", "NClippedBases", "PercentClipped"))); - return 0; - } - - /** - * Reduces a single map with the accumulator provided as the ReduceType. - * - * @param info result of the map. - * @param sum accumulator for the reduce. - * @return accumulator with result of the map taken into account. - */ - public Integer reduce(ReadClippingInfo info, Integer sum) { - if ( info != null ) { - if ( sum % SKIP == 0 ) { - String id = info.rg.getReadGroupId(); - out.printf("%s\t %d\t %d\t %d\t %.2f%n", - id, info.readLength, info.nClippingEvents, info.nClippedBases, - 100.0 * MathUtils.ratio(info.nClippedBases, info.readLength)); - } - return sum + 1; //To change body of implemented methods use File | Settings | File Templates. - } else { - return sum; - } - } - - public void onTraversalDone(Integer result) { - - } +/* + * Copyright (c) 2009 The Broad Institute + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * The above copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. 
IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * * OTHER DEALINGS IN THE SOFTWARE. + */ + +package org.broadinstitute.sting.gatk.walkers.qc; + +import net.sf.samtools.CigarElement; +import net.sf.samtools.CigarOperator; +import net.sf.samtools.SAMReadGroupRecord; +import org.broadinstitute.sting.commandline.Argument; +import org.broadinstitute.sting.commandline.Output; +import org.broadinstitute.sting.gatk.contexts.ReferenceContext; +import org.broadinstitute.sting.gatk.refdata.ReadMetaDataTracker; +import org.broadinstitute.sting.gatk.walkers.DataSource; +import org.broadinstitute.sting.gatk.walkers.ReadWalker; +import org.broadinstitute.sting.gatk.walkers.Requires; +import org.broadinstitute.sting.utils.MathUtils; +import org.broadinstitute.sting.utils.Utils; +import org.broadinstitute.sting.utils.exceptions.UserException; +import org.broadinstitute.sting.utils.sam.AlignmentUtils; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; + +import java.io.PrintStream; +import java.util.Arrays; + +/** + * User: depristo + * Date: May 5, 2010 + * Time: 12:16:41 PM + */ + +/** + * Walks over the input reads, printing out statistics about the read length, number of clipping events, and length + * of the clipping to the output stream. 
+ */ +@Requires({DataSource.READS}) +public class ReadClippingStatsWalker extends ReadWalker { + @Output + protected PrintStream out; + + @Argument(fullName="mappedOnly", shortName="mo", doc="when this flag is set (default), statistics will be collected "+ + "on mapped reads only, while unmapped reads will be discarded", required=false) + protected boolean MAPPED_ONLY = true; + + @Argument(fullName="skip", shortName="skip", doc="When provided, only every skip reads are analyzed", required=false) + protected int SKIP = 1; + +// public void initialize() { +// +// } + + public class ReadClippingInfo { + SAMReadGroupRecord rg; + int readLength, nClippingEvents, nClippedBases; + } + + public ReadClippingInfo map(ReferenceContext ref, GATKSAMRecord read, ReadMetaDataTracker metaDataTracker) { + if ( AlignmentUtils.isReadUnmapped(read) && MAPPED_ONLY) + return null; + + ReadClippingInfo info = new ReadClippingInfo(); + info.rg = read.getReadGroup(); + + if ( info.rg == null ) throw new UserException.ReadMissingReadGroup(read); + + for ( CigarElement elt : read.getCigar().getCigarElements() ) { + if ( elt.getOperator() != CigarOperator.N ) + + switch ( elt.getOperator()) { + case H : // ignore hard clips + case S : // soft clip + info.nClippingEvents++; + info.nClippedBases += elt.getLength(); + // note the fall through here + case M : + case D : // deletion w.r.t. the reference + case P : // ignore pads + case I : // insertion w.r.t. the reference + info.readLength += elt.getLength(); // Unless we have a reference skip, the read gets longer + break; + case N : // reference skip (looks and gets processed just like a "deletion", just different logical meaning) + break; + default : throw new IllegalStateException("Case statement didn't deal with cigar op: " + elt.getOperator()); + } + } + + return info; //To change body of implemented methods use File | Settings | File Templates. + } + + /** + * Provide an initial value for reduce computations. 
+ * + * @return Initial value of reduce. + */ + public Integer reduceInit() { + out.println(Utils.join(" \t", Arrays.asList("ReadGroup", "ReadLength", "NClippingEvents", "NClippedBases", "PercentClipped"))); + return 0; + } + + /** + * Reduces a single map with the accumulator provided as the ReduceType. + * + * @param info result of the map. + * @param sum accumulator for the reduce. + * @return accumulator with result of the map taken into account. + */ + public Integer reduce(ReadClippingInfo info, Integer sum) { + if ( info != null ) { + if ( sum % SKIP == 0 ) { + String id = info.rg.getReadGroupId(); + out.printf("%s\t %d\t %d\t %d\t %.2f%n", + id, info.readLength, info.nClippingEvents, info.nClippedBases, + 100.0 * MathUtils.ratio(info.nClippedBases, info.readLength)); + } + return sum + 1; //To change body of implemented methods use File | Settings | File Templates. + } else { + return sum; + } + } + + public void onTraversalDone(Integer result) { + + } } \ No newline at end of file diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/qc/ReadValidationWalker.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/qc/ReadValidationWalker.java index fa1bb4d55..4425f92c4 100644 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/qc/ReadValidationWalker.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/qc/ReadValidationWalker.java @@ -6,6 +6,7 @@ import org.broadinstitute.sting.gatk.contexts.ReferenceContext; import org.broadinstitute.sting.gatk.refdata.ReadMetaDataTracker; import org.broadinstitute.sting.gatk.walkers.ReadWalker; import org.broadinstitute.sting.utils.exceptions.ReviewedStingException; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; import java.security.MessageDigest; import java.security.NoSuchAlgorithmException; @@ -64,21 +65,23 @@ public class ReadValidationWalker extends ReadWalker { /** * The reads filter function. 
+ * * @param ref the reference bases that correspond to our read, if a reference was provided * @param read the read itself, as a SAMRecord * @return true if the read passes the filter, false if it doesn't */ - public boolean filter(ReferenceContext ref, SAMRecord read) { + public boolean filter(ReferenceContext ref, GATKSAMRecord read) { return true; } /** * The reads map function. + * * @param ref the reference bases that correspond to our read, if a reference was provided * @param read the read itself, as a SAMRecord * @return the read itself */ - public SAMRecord map( ReferenceContext ref, SAMRecord read, ReadMetaDataTracker metaDataTracker ) { + public SAMRecord map( ReferenceContext ref, GATKSAMRecord read, ReadMetaDataTracker metaDataTracker ) { return read; } diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/qc/ValidatingPileupWalker.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/qc/ValidatingPileupWalker.java index ca30d875b..cd17e4592 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/qc/ValidatingPileupWalker.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/qc/ValidatingPileupWalker.java @@ -78,7 +78,7 @@ public class ValidatingPileupWalker extends LocusWalker DISCRETE_CYCLE_PLATFORMS = EnumSet.of(NGSPlatform.ILLUMINA, NGSPlatform.SOLID, NGSPlatform.PACBIO, NGSPlatform.COMPLETE_GENOMICS); + private final static EnumSet FLOW_CYCLE_PLATFORMS = EnumSet.of(NGSPlatform.LS454, NGSPlatform.ION_TORRENT); + // Initialize any member variables using the command-line arguments passed to the walkers public void initialize( final RecalibrationArgumentCollection RAC ) { if( RAC.DEFAULT_PLATFORM != null ) { @@ -58,129 +64,15 @@ public class CycleCovariate implements StandardCovariate { } } - /* - // Used to pick out the covariate's value from attributes of the read - public final Comparable getValue( final SAMRecord read, final int offset ) { - - int cycle = 1; - - //----------------------------- - // 
ILLUMINA and SOLID - //----------------------------- - - if( read.getReadGroup().getPlatform().equalsIgnoreCase( "ILLUMINA" ) || read.getReadGroup().getPlatform().equalsIgnoreCase( "SLX" ) || // Some bams have "illumina" and others have "SLX" - read.getReadGroup().getPlatform().equalsIgnoreCase( "SOLID" ) || read.getReadGroup().getPlatform().equalsIgnoreCase( "ABI_SOLID" )) { // Some bams have "solid" and others have "ABI_SOLID" - cycle = offset + 1; - if( read.getReadNegativeStrandFlag() ) { - cycle = read.getReadLength() - offset; - } - } - - //----------------------------- - // 454 - //----------------------------- - - else if( read.getReadGroup().getPlatform().contains( "454" ) ) { // Some bams have "LS454" and others have just "454" - final byte[] bases = read.getReadBases(); - - // BUGBUG: Consider looking at degradation of base quality scores in homopolymer runs to detect when the cycle incremented even though the nucleotide didn't change - // For example, AAAAAAA was probably read in two flow cycles but here we count it as one - if( !read.getReadNegativeStrandFlag() ) { // Forward direction - int iii = 0; - while( iii <= offset ) - { - while( iii <= offset && bases[iii] == (byte)'T' ) { iii++; } - while( iii <= offset && bases[iii] == (byte)'A' ) { iii++; } - while( iii <= offset && bases[iii] == (byte)'C' ) { iii++; } - while( iii <= offset && bases[iii] == (byte)'G' ) { iii++; } - if( iii <= offset ) { cycle++; } - if( iii <= offset && !BaseUtils.isRegularBase(bases[iii]) ) { iii++; } - - } - } else { // Negative direction - int iii = bases.length-1; - while( iii >= offset ) - { - while( iii >= offset && bases[iii] == (byte)'T' ) { iii--; } - while( iii >= offset && bases[iii] == (byte)'A' ) { iii--; } - while( iii >= offset && bases[iii] == (byte)'C' ) { iii--; } - while( iii >= offset && bases[iii] == (byte)'G' ) { iii--; } - if( iii >= offset ) { cycle++; } - if( iii >= offset && !BaseUtils.isRegularBase(bases[iii]) ) { iii--; } - } - } - } - - 
//----------------------------- - // SOLID (unused), only to be used in conjunction with PrimerRoundCovariate - //----------------------------- - - //else if( read.getReadGroup().getPlatform().equalsIgnoreCase( "SOLID" ) ) { - // // The ligation cycle according to http://www3.appliedbiosystems.com/cms/groups/mcb_marketing/documents/generaldocuments/cms_057511.pdf - // int pos = offset + 1; - // if( read.getReadNegativeStrandFlag() ) { - // pos = read.getReadLength() - offset; - // } - // cycle = pos / 5; // integer division - //} - - //----------------------------- - // UNRECOGNIZED PLATFORM - //----------------------------- - - else { // Platform is unrecognized so revert to the default platform but warn the user first - if( defaultPlatform != null) { // The user set a default platform - if( !warnedUserBadPlatform ) { - Utils.warnUser( "Platform string (" + read.getReadGroup().getPlatform() + ") unrecognized in CycleCovariate. " + - "Defaulting to platform = " + defaultPlatform + "." ); - } - warnedUserBadPlatform = true; - - read.getReadGroup().setPlatform( defaultPlatform ); - return getValue( read, offset ); // A recursive call - } else { // The user did not set a default platform - throw new StingException( "Platform string (" + read.getReadGroup().getPlatform() + ") unrecognized in CycleCovariate. " + - "No default platform specified. Users must set the default platform using the --default_platform argument." ); - } - } - - // Differentiate between first and second of pair. - // The sequencing machine cycle keeps incrementing for the second read in a pair. So it is possible for a read group - // to have an error affecting quality at a particular cycle on the first of pair which carries over to the second of pair. - // Therefore the cycle covariate must differentiate between first and second of pair reads. 
- // This effect can not be corrected by pulling out the first of pair and second of pair flags into a separate covariate because - // the current sequential model would consider the effects independently instead of jointly. - if( read.getReadPairedFlag() && read.getSecondOfPairFlag() ) { - cycle *= -1; - } - - return cycle; - } - */ - - // todo -- this should be put into a common place in the code base - private static List PACBIO_NAMES = Arrays.asList("PACBIO"); - private static List ILLUMINA_NAMES = Arrays.asList("ILLUMINA", "SLX", "SOLEXA"); - private static List SOLID_NAMES = Arrays.asList("SOLID"); - private static List LS454_NAMES = Arrays.asList("454"); - - private static boolean isPlatform(SAMRecord read, List names) { - String pl = read.getReadGroup().getPlatform().toUpperCase(); - for ( String name : names ) - if ( pl.contains( name ) ) - return true; - return false; - } - // Used to pick out the covariate's value from attributes of the read public void getValues(SAMRecord read, Comparable[] comparable) { //----------------------------- - // ILLUMINA and SOLID + // Illumina, Solid, PacBio, and Complete Genomics //----------------------------- - - if( isPlatform(read, ILLUMINA_NAMES) || isPlatform(read, SOLID_NAMES) || isPlatform(read, PACBIO_NAMES)) { + final NGSPlatform ngsPlatform = ((GATKSAMRecord)read).getNGSPlatform(); + if( DISCRETE_CYCLE_PLATFORMS.contains(ngsPlatform) ) { final int init; final int increment; if( !read.getReadNegativeStrandFlag() ) { @@ -222,7 +114,11 @@ public class CycleCovariate implements StandardCovariate { cycle += increment; } } - else if ( isPlatform(read, LS454_NAMES) ) { // Some bams have "LS454" and others have just "454" + + //----------------------------- + // 454 and Ion Torrent + //----------------------------- + else if( FLOW_CYCLE_PLATFORMS.contains(ngsPlatform) ) { final int readLength = read.getReadLength(); final byte[] bases = read.getReadBases(); @@ -267,8 +163,6 @@ public class CycleCovariate implements 
StandardCovariate { else { throw new IllegalStateException("This method hasn't been implemented yet for " + read.getReadGroup().getPlatform()); } - - } // Used to get the covariate's value from input csv file in TableRecalibrationWalker diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/recalibration/RecalDataManager.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/recalibration/RecalDataManager.java index ac25d4f13..a0c928afa 100644 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/recalibration/RecalDataManager.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/recalibration/RecalDataManager.java @@ -35,6 +35,7 @@ import org.broadinstitute.sting.utils.collections.NestedHashMap; import org.broadinstitute.sting.utils.exceptions.ReviewedStingException; import org.broadinstitute.sting.utils.exceptions.UserException; import org.broadinstitute.sting.utils.sam.AlignmentUtils; +import org.broadinstitute.sting.utils.sam.GATKSAMReadGroupRecord; import org.broadinstitute.sting.utils.sam.GATKSAMRecord; import java.util.ArrayList; @@ -228,8 +229,7 @@ public class RecalDataManager { * @param RAC The list of shared command line arguments */ public static void parseSAMRecord( final SAMRecord read, final RecalibrationArgumentCollection RAC ) { - - SAMReadGroupRecord readGroup = read.getReadGroup(); + GATKSAMReadGroupRecord readGroup = ((GATKSAMRecord)read).getReadGroup(); // If there are no read groups we have to default to something, and that something could be specified by the user using command line arguments if( readGroup == null ) { @@ -241,18 +241,17 @@ public class RecalDataManager { warnUserNullReadGroup = true; } // There is no readGroup so defaulting to these values - readGroup = new SAMReadGroupRecord( RAC.DEFAULT_READ_GROUP ); + readGroup = new GATKSAMReadGroupRecord( RAC.DEFAULT_READ_GROUP ); readGroup.setPlatform( RAC.DEFAULT_PLATFORM ); ((GATKSAMRecord)read).setReadGroup( readGroup ); } else { - throw new 
UserException.MalformedBAM(read, "The input .bam file contains reads with no read group. First observed at read with name = " + read.getReadName() + - " Users must set both the default read group using the --default_read_group argument and the default platform using the --default_platform argument." ); + throw new UserException.MalformedBAM(read, "The input .bam file contains reads with no read group. First observed at read with name = " + read.getReadName() ); } } if( RAC.FORCE_READ_GROUP != null && !readGroup.getReadGroupId().equals(RAC.FORCE_READ_GROUP) ) { // Collapse all the read groups into a single common String provided by the user final String oldPlatform = readGroup.getPlatform(); - readGroup = new SAMReadGroupRecord( RAC.FORCE_READ_GROUP ); + readGroup = new GATKSAMReadGroupRecord( RAC.FORCE_READ_GROUP ); readGroup.setPlatform( oldPlatform ); ((GATKSAMRecord)read).setReadGroup( readGroup ); } @@ -271,8 +270,7 @@ public class RecalDataManager { } readGroup.setPlatform( RAC.DEFAULT_PLATFORM ); } else { - throw new UserException.MalformedBAM(read, "The input .bam file contains reads with no platform information. First observed at read with name = " + read.getReadName() + - " Users must set the default platform using the --default_platform argument." ); + throw new UserException.MalformedBAM(read, "The input .bam file contains reads with no platform information. 
First observed at read with name = " + read.getReadName() ); } } } diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/recalibration/RecalibrationArgumentCollection.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/recalibration/RecalibrationArgumentCollection.java index f31e2fc5b..75de84cb4 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/recalibration/RecalibrationArgumentCollection.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/recalibration/RecalibrationArgumentCollection.java @@ -26,6 +26,7 @@ package org.broadinstitute.sting.gatk.walkers.recalibration; import org.broadinstitute.sting.commandline.Argument; +import org.broadinstitute.sting.commandline.Hidden; /** * Created by IntelliJ IDEA. @@ -41,22 +42,29 @@ public class RecalibrationArgumentCollection { ////////////////////////////////// // Shared Command Line Arguments ////////////////////////////////// + @Hidden @Argument(fullName="default_read_group", shortName="dRG", required=false, doc="If a read has no read group then default to the provided String.") public String DEFAULT_READ_GROUP = null; + @Hidden @Argument(fullName="default_platform", shortName="dP", required=false, doc="If a read has no platform then default to the provided String. Valid options are illumina, 454, and solid.") public String DEFAULT_PLATFORM = null; + @Hidden @Argument(fullName="force_read_group", shortName="fRG", required=false, doc="If provided, the read group ID of EVERY read will be forced to be the provided String. This is useful to collapse all data into a single read group.") public String FORCE_READ_GROUP = null; + @Hidden @Argument(fullName="force_platform", shortName="fP", required=false, doc="If provided, the platform of EVERY read will be forced to be the provided String. 
Valid options are illumina, 454, and solid.") public String FORCE_PLATFORM = null; + @Hidden @Argument(fullName = "window_size_nqs", shortName="nqs", doc="The window size used by MinimumNQSCovariate for its calculation", required=false) public int WINDOW_SIZE = 5; /** * This window size tells the module in how big of a neighborhood around the current base it should look for the minimum base quality score. */ + @Hidden @Argument(fullName = "homopolymer_nback", shortName="nback", doc="The number of previous bases to look at in HomopolymerCovariate", required=false) public int HOMOPOLYMER_NBACK = 7; + @Hidden @Argument(fullName = "exception_if_no_tile", shortName="throwTileException", doc="If provided, TileCovariate will throw an exception when no tile can be found. The default behavior is to use tile = -1", required=false) public boolean EXCEPTION_IF_NO_TILE = false; diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/recalibration/TableRecalibrationWalker.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/recalibration/TableRecalibrationWalker.java index 174e810c2..1ce02a3cf 100644 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/recalibration/TableRecalibrationWalker.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/recalibration/TableRecalibrationWalker.java @@ -170,9 +170,9 @@ public class TableRecalibrationWalker extends ReadWalker requestedCovariates = new ArrayList(); // List of covariates to be used in this calculation - private static final Pattern COMMENT_PATTERN = Pattern.compile("^#.*"); - private static final Pattern OLD_RECALIBRATOR_HEADER = Pattern.compile("^rg,.*"); - private static final Pattern COVARIATE_PATTERN = Pattern.compile("^ReadGroup,QualityScore,.*"); + public static final Pattern COMMENT_PATTERN = Pattern.compile("^#.*"); + public static final Pattern OLD_RECALIBRATOR_HEADER = Pattern.compile("^rg,.*"); + public static final Pattern COVARIATE_PATTERN = 
Pattern.compile("^ReadGroup,QualityScore,.*"); public static final String EOF_MARKER = "EOF"; private long numReadsWithMalformedColorSpace = 0; @@ -364,11 +364,12 @@ public class TableRecalibrationWalker extends ReadWalkerAdditional Details *
    *
  • - * You should always use -BTI on your VCF track, so that the GATK only looks at the sites on the VCF file. + * You should always use -L on your VCF track, so that the GATK only looks at the sites on the VCF file. * This speeds up the process a lot. *
  • *
  • @@ -165,7 +164,7 @@ import static org.broadinstitute.sting.utils.IndelUtils.isInsideExtendedIndel; * -R human_g1k_v37.fasta * -I myNewTechReads.bam * -alleles handAnnotatedVCF.vcf - * -BTI alleles + * -L handAnnotatedVCF.vcf * * *
  • @@ -179,7 +178,7 @@ import static org.broadinstitute.sting.utils.IndelUtils.isInsideExtendedIndel; * -R human_g1k_v37.fasta * -I myTruthDataset.bam * -alleles callsToValidate.vcf - * -BTI alleles + * -L callsToValidate.vcf * -bt * -o gav.vcf * @@ -266,8 +265,13 @@ public class GenotypeAndValidateWalker extends RodWalker 0 && context.getBasePileup().getBases().length < minDepth)) { counter.nUncovered = 1L; + if (vcComp.getAttribute("GV").equals("T")) + counter.nAltNotCalled = 1L; + else if (vcComp.getAttribute("GV").equals("F")) + counter.nRefNotCalled = 1L; + else + counter.nNoStatusNotCalled = 1L; + return counter; } @@ -382,7 +398,7 @@ public class GenotypeAndValidateWalker extends RodWalker 0) ? 100 * ((double) reduceSum.nRefCalledRef /( reduceSum.nRefCalledRef + reduceSum.nRefCalledAlt)) : 100; logger.info(String.format("Resulting Truth Table Output\n\n" + - "---------------------------------------------------\n" + - "\t\t|\tALT\t|\tREF\t\n" + - "---------------------------------------------------\n" + - "called alt\t|\t%d\t|\t%d\n" + - "called ref\t|\t%d\t|\t%d\n" + - "---------------------------------------------------\n" + + "------------------------------------------------------------------\n" + + "\t\t|\tALT\t|\tREF\t|\tNo Status\n" + + "------------------------------------------------------------------\n" + + "called alt\t|\t%d\t|\t%d\t|\t%d\n" + + "called ref\t|\t%d\t|\t%d\t|\t%d\n" + + "not called\t|\t%d\t|\t%d\t|\t%d\n" + + "------------------------------------------------------------------\n" + "positive predictive value: %f%%\n" + "negative predictive value: %f%%\n" + - "---------------------------------------------------\n" + + "------------------------------------------------------------------\n" + "sensitivity: %f%%\n" + "specificity: %f%%\n" + - "---------------------------------------------------\n" + + "------------------------------------------------------------------\n" + "not confident: %d\n" + "not covered: %d\n" + - 
"---------------------------------------------------\n", reduceSum.nAltCalledAlt, reduceSum.nRefCalledAlt, reduceSum.nAltCalledRef, reduceSum.nRefCalledRef, ppv, npv, sensitivity, specificity, reduceSum.nNotConfidentCalls, reduceSum.nUncovered)); + "------------------------------------------------------------------\n", reduceSum.nAltCalledAlt, reduceSum.nRefCalledAlt, reduceSum.nNoStatusCalledAlt, reduceSum.nAltCalledRef, reduceSum.nRefCalledRef, reduceSum.nNoStatusCalledRef, reduceSum.nAltNotCalled, reduceSum.nRefNotCalled, reduceSum.nNoStatusNotCalled, ppv, npv, sensitivity, specificity, reduceSum.nNotConfidentCalls, reduceSum.nUncovered)); } } diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/validation/ValidationAmplicons.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/validation/ValidationAmplicons.java index 48cba6a1a..035d8d2ca 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/validation/ValidationAmplicons.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/validation/ValidationAmplicons.java @@ -80,7 +80,7 @@ import java.util.List; * -jar GenomeAnalysisTK.jar * -T ValidationAmplicons * -R /humgen/1kg/reference/human_g1k_v37.fasta - * -BTI ProbeIntervals + * -L:table interval_table.table * -ProbeIntervals:table interval_table.table * -ValidateAlleles:vcf sites_to_validate.vcf * -MaskAlleles:vcf mask_sites.vcf diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/evaluators/CountVariants.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/evaluators/CountVariants.java index 2913c97a6..e83434037 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/evaluators/CountVariants.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/evaluators/CountVariants.java @@ -110,12 +110,12 @@ public class CountVariants extends VariantEvaluator implements StandardEval { case SNP: nVariantLoci++; nSNPs++; - if 
(vc1.getAttributeAsBoolean("ISSINGLETON")) nSingletons++; + if (vc1.getAttributeAsBoolean("ISSINGLETON", false)) nSingletons++; break; case MNP: nVariantLoci++; nMNPs++; - if (vc1.getAttributeAsBoolean("ISSINGLETON")) nSingletons++; + if (vc1.getAttributeAsBoolean("ISSINGLETON", false)) nSingletons++; break; case INDEL: nVariantLoci++; @@ -130,6 +130,10 @@ public class CountVariants extends VariantEvaluator implements StandardEval { nVariantLoci++; nMixed++; break; + case SYMBOLIC: + // ignore symbolic alleles, but don't fail + // todo - consistent way of treating symbolic alleles thgoughout codebase? + break; default: throw new ReviewedStingException("Unexpected VariantContext type " + vc1.getType()); } @@ -137,7 +141,7 @@ public class CountVariants extends VariantEvaluator implements StandardEval { String refStr = vc1.getReference().getBaseString().toUpperCase(); - String aaStr = vc1.hasAttribute("ANCESTRALALLELE") ? vc1.getAttributeAsString("ANCESTRALALLELE").toUpperCase() : null; + String aaStr = vc1.hasAttribute("ANCESTRALALLELE") ? vc1.getAttributeAsString("ANCESTRALALLELE", null).toUpperCase() : null; // if (aaStr.equals(".")) { // aaStr = refStr; // } diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/evaluators/GenotypePhasingEvaluator.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/evaluators/GenotypePhasingEvaluator.java index a476a2680..e69dbfb28 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/evaluators/GenotypePhasingEvaluator.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/evaluators/GenotypePhasingEvaluator.java @@ -219,7 +219,8 @@ public class GenotypePhasingEvaluator extends VariantEvaluator { } public static Double getPQ(Genotype gt) { - return gt.getAttributeAsDoubleNoException(ReadBackedPhasingWalker.PQ_KEY); + Double d = gt.getAttributeAsDouble(ReadBackedPhasingWalker.PQ_KEY, -1); + return d == -1 ? 
null : d; } public static boolean topMatchesTop(AllelePair b1, AllelePair b2) { diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/evaluators/SimpleMetricsByAC.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/evaluators/SimpleMetricsByAC.java index 203c15a85..2d0163206 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/evaluators/SimpleMetricsByAC.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/evaluators/SimpleMetricsByAC.java @@ -120,7 +120,7 @@ public class SimpleMetricsByAC extends VariantEvaluator implements StandardEval if ( eval.hasGenotypes() ) ac = eval.getChromosomeCount(eval.getAlternateAllele(0)); else if ( eval.hasAttribute("AC") ) { - ac = Integer.valueOf(eval.getAttributeAsString("AC")); + ac = eval.getAttributeAsInt("AC", -1); } if ( ac != -1 ) { diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/evaluators/TiTvVariantEvaluator.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/evaluators/TiTvVariantEvaluator.java index 1feb37e01..9b6e145e6 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/evaluators/TiTvVariantEvaluator.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/evaluators/TiTvVariantEvaluator.java @@ -49,18 +49,14 @@ public class TiTvVariantEvaluator extends VariantEvaluator implements StandardEv else nTv++; } - String refStr = vc.getReference().getBaseString().toUpperCase(); - String aaStr = vc.getAttributeAsString("ANCESTRALALLELE").toUpperCase(); - - if (aaStr != null && !aaStr.equalsIgnoreCase("null") && !aaStr.equals(".")) { - BaseUtils.BaseSubstitutionType aaSubType = BaseUtils.SNPSubstitutionType(aaStr.getBytes()[0], vc.getAlternateAllele(0).getBases()[0]); - - //System.out.println(refStr + " " + vc.getAttributeAsString("ANCESTRALALLELE").toUpperCase() + " " + aaSubType); - - if (aaSubType == 
BaseUtils.BaseSubstitutionType.TRANSITION) { - nTiDerived++; - } else if (aaSubType == BaseUtils.BaseSubstitutionType.TRANSVERSION) { - nTvDerived++; + if (vc.hasAttribute("ANCESTRALALLELE")) { + final String aaStr = vc.getAttributeAsString("ANCESTRALALLELE", "null").toUpperCase(); + if ( ! aaStr.equals(".") ) { + switch ( BaseUtils.SNPSubstitutionType(aaStr.getBytes()[0], vc.getAlternateAllele(0).getBases()[0] ) ) { + case TRANSITION: nTiDerived++; break; + case TRANSVERSION: nTvDerived++; break; + default: break; + } } } } diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/evaluators/ValidationReport.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/evaluators/ValidationReport.java index 307b4f684..3b4967cad 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/evaluators/ValidationReport.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/evaluators/ValidationReport.java @@ -10,6 +10,7 @@ import org.broadinstitute.sting.utils.exceptions.ReviewedStingException; import org.broadinstitute.sting.utils.variantcontext.Allele; import org.broadinstitute.sting.utils.variantcontext.VariantContext; +import java.util.Collection; import java.util.Set; /** @@ -131,7 +132,7 @@ public class ValidationReport extends VariantEvaluator implements StandardEval { //// System.out.printf(" ac = %d%n", ac); } else - ac = vc.getAttributeAsInt(VCFConstants.ALLELE_COUNT_KEY); + ac = vc.getAttributeAsInt(VCFConstants.ALLELE_COUNT_KEY, 0); return ac > 0 ? SiteStatus.POLY : SiteStatus.MONO; } else { return TREAT_ALL_SITES_IN_EVAL_VCF_AS_CALLED ? 
SiteStatus.POLY : SiteStatus.NO_CALL; // we can't figure out what to do @@ -142,8 +143,8 @@ public class ValidationReport extends VariantEvaluator implements StandardEval { public boolean haveDifferentAltAlleles(VariantContext eval, VariantContext comp) { - Set evalAlts = eval.getAlternateAlleles(); - Set compAlts = comp.getAlternateAlleles(); + Collection evalAlts = eval.getAlternateAlleles(); + Collection compAlts = comp.getAlternateAlleles(); if ( evalAlts.size() != compAlts.size() ) { return true; } else { diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/stratifications/AlleleCount.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/stratifications/AlleleCount.java index 3cc22cc52..c7bea93b2 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/stratifications/AlleleCount.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/stratifications/AlleleCount.java @@ -44,7 +44,7 @@ public class AlleleCount extends VariantStratifier { if (eval != null) { int AC = -1; if ( eval.hasAttribute("AC") && eval.getAttribute("AC") instanceof Integer ) { - AC = eval.getAttributeAsInt("AC"); + AC = eval.getAttributeAsInt("AC", 0); } else if ( eval.isVariant() ) { for (Allele allele : eval.getAlternateAlleles()) AC = Math.max(AC, eval.getChromosomeCount(allele)); diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/stratifications/AlleleFrequency.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/stratifications/AlleleFrequency.java index 3d2dda651..cd2b8e475 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/stratifications/AlleleFrequency.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/stratifications/AlleleFrequency.java @@ -28,7 +28,7 @@ public class AlleleFrequency extends VariantStratifier { if (eval != null) { try { - relevantStates.add(String.format("%.3f", (5.0 * 
MathUtils.round(eval.getAttributeAsDouble("AF") / 5.0, 3)))); + relevantStates.add(String.format("%.3f", (5.0 * MathUtils.round(eval.getAttributeAsDouble("AF", 0.0) / 5.0, 3)))); } catch (Exception e) { return relevantStates; } diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/stratifications/Degeneracy.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/stratifications/Degeneracy.java index 3223626c0..91c96e490 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/stratifications/Degeneracy.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/stratifications/Degeneracy.java @@ -90,8 +90,8 @@ public class Degeneracy extends VariantStratifier { Integer frame = null; if (eval.hasAttribute("refseq.functionalClass")) { - aa = eval.getAttributeAsString("refseq.variantAA"); - frame = eval.getAttributeAsInt("refseq.frame"); + aa = eval.getAttributeAsString("refseq.variantAA", null); + frame = eval.getAttributeAsInt("refseq.frame", 0); } else if (eval.hasAttribute("refseq.functionalClass_1")) { int annotationId = 1; String key; @@ -99,7 +99,7 @@ public class Degeneracy extends VariantStratifier { do { key = String.format("refseq.functionalClass_%d", annotationId); - String newtype = eval.getAttributeAsString(key); + String newtype = eval.getAttributeAsString(key, null); if ( newtype != null && ( type == null || @@ -109,13 +109,13 @@ public class Degeneracy extends VariantStratifier { type = newtype; String aakey = String.format("refseq.variantAA_%d", annotationId); - aa = eval.getAttributeAsString(aakey); + aa = eval.getAttributeAsString(aakey, null); if (aa != null) { String framekey = String.format("refseq.frame_%d", annotationId); if (eval.hasAttribute(framekey)) { - frame = eval.getAttributeAsInt(framekey); + frame = eval.getAttributeAsInt(framekey, 0); } } } diff --git 
a/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/stratifications/FunctionalClass.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/stratifications/FunctionalClass.java index 1dc047b5d..f5dcf527a 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/stratifications/FunctionalClass.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/stratifications/FunctionalClass.java @@ -28,7 +28,7 @@ public class FunctionalClass extends VariantStratifier { } - public List getRelevantStates(ReferenceContext ref, RefMetaDataTracker tracker, VariantContext comp, String compName, VariantContext eval, String evalName, String sampleName) { +public List getRelevantStates(ReferenceContext ref, RefMetaDataTracker tracker, VariantContext comp, String compName, VariantContext eval, String evalName, String sampleName) { ArrayList relevantStates = new ArrayList(); relevantStates.add("all"); @@ -38,7 +38,7 @@ public class FunctionalClass extends VariantStratifier { if (eval.hasAttribute("refseq.functionalClass")) { try { - type = FunctionalType.valueOf(eval.getAttributeAsString("refseq.functionalClass")); + type = FunctionalType.valueOf(eval.getAttributeAsString("refseq.functionalClass", null)); } catch ( Exception e ) {} // don't error out if the type isn't supported } else if (eval.hasAttribute("refseq.functionalClass_1")) { int annotationId = 1; @@ -47,7 +47,7 @@ public class FunctionalClass extends VariantStratifier { do { key = String.format("refseq.functionalClass_%d", annotationId); - String newtypeStr = eval.getAttributeAsString(key); + String newtypeStr = eval.getAttributeAsString(key, null); if ( newtypeStr != null && !newtypeStr.equalsIgnoreCase("null") ) { try { FunctionalType newType = FunctionalType.valueOf(newtypeStr); diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/stratifications/IndelSize.java 
b/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/stratifications/IndelSize.java new file mode 100644 index 000000000..1b9513b9a --- /dev/null +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/stratifications/IndelSize.java @@ -0,0 +1,52 @@ +package org.broadinstitute.sting.gatk.walkers.varianteval.stratifications; + +import org.broadinstitute.sting.gatk.contexts.ReferenceContext; +import org.broadinstitute.sting.gatk.refdata.RefMetaDataTracker; +import org.broadinstitute.sting.utils.MathUtils; +import org.broadinstitute.sting.utils.variantcontext.VariantContext; + +import java.util.ArrayList; +import java.util.List; + +/** + * Stratifies the eval RODs by the indel size + * + * Indel sizes are stratified from sizes -100 to +100. Sizes greater than this are lumped in the +/- 100 bin + * This stratification ignores multi-allelic indels (whose size is not defined uniquely) + */ +public class IndelSize extends VariantStratifier { + static final int MAX_INDEL_SIZE = 100; + @Override + public void initialize() { + states = new ArrayList(); + for( int a=-MAX_INDEL_SIZE; a <=MAX_INDEL_SIZE; a++ ) { + states.add(String.format("%d", a)); + } + } + + public List getRelevantStates(ReferenceContext ref, RefMetaDataTracker tracker, VariantContext comp, String compName, VariantContext eval, String evalName, String sampleName) { + ArrayList relevantStates = new ArrayList(); + + if (eval != null && eval.isIndel() && eval.isBiallelic()) { + try { + int eventLength = 0; + if ( eval.isSimpleInsertion() ) { + eventLength = eval.getAlternateAllele(0).length(); + } else if ( eval.isSimpleDeletion() ) { + eventLength = -eval.getReference().length(); + } + + if (eventLength > MAX_INDEL_SIZE) + eventLength = MAX_INDEL_SIZE; + else if (eventLength < -MAX_INDEL_SIZE) + eventLength = -MAX_INDEL_SIZE; + + relevantStates.add(String.format("%d",eventLength)); + } catch (Exception e) { + return relevantStates; + } + } + + return relevantStates; + } +} diff 
--git a/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/util/VariantEvalUtils.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/util/VariantEvalUtils.java index 92e7c6554..6a057a456 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/util/VariantEvalUtils.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/varianteval/util/VariantEvalUtils.java @@ -354,7 +354,7 @@ public class VariantEvalUtils { private void addMapping(HashMap> mappings, String sample, VariantContext vc) { if ( !mappings.containsKey(sample) ) - mappings.put(sample, new HashSet()); + mappings.put(sample, new LinkedHashSet()); mappings.get(sample).add(vc); } diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/variantrecalibration/ApplyRecalibration.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/variantrecalibration/ApplyRecalibration.java index 16f1abf1b..1d5493daf 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/variantrecalibration/ApplyRecalibration.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/variantrecalibration/ApplyRecalibration.java @@ -32,6 +32,8 @@ import org.broadinstitute.sting.commandline.RodBinding; import org.broadinstitute.sting.gatk.contexts.AlignmentContext; import org.broadinstitute.sting.gatk.contexts.ReferenceContext; import org.broadinstitute.sting.gatk.refdata.RefMetaDataTracker; +import org.broadinstitute.sting.gatk.walkers.PartitionBy; +import org.broadinstitute.sting.gatk.walkers.PartitionType; import org.broadinstitute.sting.gatk.walkers.RodWalker; import org.broadinstitute.sting.utils.SampleUtils; import org.broadinstitute.sting.utils.codecs.vcf.*; @@ -84,6 +86,7 @@ import java.util.*; * */ +@PartitionBy(PartitionType.NONE) public class ApplyRecalibration extends RodWalker { ///////////////////////////// diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/variantrecalibration/VQSRCalibrationCurve.java 
b/public/java/src/org/broadinstitute/sting/gatk/walkers/variantrecalibration/VQSRCalibrationCurve.java index bc7252ec2..04ba3ff14 100644 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/variantrecalibration/VQSRCalibrationCurve.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/variantrecalibration/VQSRCalibrationCurve.java @@ -115,7 +115,7 @@ public class VQSRCalibrationCurve { if ( vc.isFiltered() ) return 0.0; else if ( vc.hasAttribute(VQSRQualKey) ) { - double qual = vc.getAttributeAsDouble(VQSRQualKey); + double qual = vc.getAttributeAsDouble(VQSRQualKey, 0.0); return probTrueVariant(qual); } else { throw new UserException.VariantContextMissingRequiredField(VQSRQualKey, vc); @@ -143,7 +143,7 @@ public class VQSRCalibrationCurve { for ( int i = 0; i < log10Likelihoods.length; i++) { double p = Math.pow(10, log10Likelihoods[i]); double q = alpha * p + (1-alpha) * noInfoPr; - if ( DEBUG ) System.out.printf(" vqslod = %.2f, p = %.2e, alpha = %.2e, q = %.2e%n", vc.getAttributeAsDouble(VQSRQualKey), p, alpha, q); + if ( DEBUG ) System.out.printf(" vqslod = %.2f, p = %.2e, alpha = %.2e, q = %.2e%n", vc.getAttributeAsDouble(VQSRQualKey, 0.0), p, alpha, q); updated[i] = Math.log10(q); } diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/variantrecalibration/VariantRecalibrator.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/variantrecalibration/VariantRecalibrator.java index 89e702b64..f60a94a22 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/variantrecalibration/VariantRecalibrator.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/variantrecalibration/VariantRecalibrator.java @@ -29,13 +29,17 @@ import org.broadinstitute.sting.commandline.*; import org.broadinstitute.sting.gatk.contexts.AlignmentContext; import org.broadinstitute.sting.gatk.contexts.ReferenceContext; import org.broadinstitute.sting.gatk.refdata.RefMetaDataTracker; +import 
org.broadinstitute.sting.gatk.walkers.PartitionBy; +import org.broadinstitute.sting.gatk.walkers.PartitionType; import org.broadinstitute.sting.gatk.walkers.RodWalker; import org.broadinstitute.sting.gatk.walkers.TreeReducible; import org.broadinstitute.sting.utils.MathUtils; import org.broadinstitute.sting.utils.QualityUtils; +import org.broadinstitute.sting.utils.R.RScriptExecutor; import org.broadinstitute.sting.utils.Utils; import org.broadinstitute.sting.utils.collections.ExpandingArrayList; import org.broadinstitute.sting.utils.exceptions.UserException; +import org.broadinstitute.sting.utils.io.Resource; import org.broadinstitute.sting.utils.variantcontext.VariantContext; import org.broadinstitute.sting.utils.variantcontext.VariantContextUtils; @@ -62,6 +66,10 @@ import java.util.*; * the log odds ratio of being a true variant versus being false under the trained Gaussian mixture model. * *

    + * NOTE: In order to create the model reporting plots Rscript needs to be in your environment PATH (this is the scripting version of R, not the interactive version). + * See http://www.r-project.org for more info on how to download and install R. + * + *

    * See the GATK wiki for a tutorial and example recalibration accuracy plots. * http://www.broadinstitute.org/gsa/wiki/index.php/Variant_quality_score_recalibration * @@ -94,10 +102,12 @@ import java.util.*; * */ +@PartitionBy(PartitionType.NONE) public class VariantRecalibrator extends RodWalker, ExpandingArrayList> implements TreeReducible> { public static final String VQS_LOD_KEY = "VQSLOD"; // Log odds ratio of being a true variant versus being false under the trained gaussian mixture model public static final String CULPRIT_KEY = "culprit"; // The annotation which was the worst performing in the Gaussian mixture model, likely the reason why the variant was filtered out + private static final String PLOT_TRANCHES_RSCRIPT = "plot_Tranches.R"; @ArgumentCollection private VariantRecalibratorArgumentCollection VRAC = new VariantRecalibratorArgumentCollection(); @@ -155,12 +165,8 @@ public class VariantRecalibrator extends RodWalker(Arrays.asList(USE_ANNOTATIONS)), VRAC ); + if (RSCRIPT_FILE != null && !RScriptExecutor.RSCRIPT_EXISTS) + Utils.warnUser(logger, String.format( + "Rscript not found in environment path. 
%s will be generated but PDF plots will not.", + RSCRIPT_FILE)); + if( IGNORE_INPUT_FILTERS != null ) { ignoreInputFilterSet.addAll( Arrays.asList(IGNORE_INPUT_FILTERS) ); } @@ -324,20 +334,13 @@ public class VariantRecalibrator extends RodWalker randomData, final GaussianMixtureModel goodModel, final GaussianMixtureModel badModel, final double lodCutoff ) { @@ -345,15 +348,18 @@ public class VariantRecalibrator extends RodWalker { if (minimumN > 1 && (vcs.size() - numFilteredRecords < minimumN)) return 0; - + List mergedVCs = new ArrayList(); Map> VCsByType = VariantContextUtils.separateVariantContextsByType(vcs); // iterate over the types so that it's deterministic @@ -244,7 +244,7 @@ public class CombineVariants extends RodWalker { SET_KEY, filteredAreUncalled, MERGE_INFO_WITH_MAX_AC)); } - for ( VariantContext mergedVC : mergedVCs ) { + for ( VariantContext mergedVC : mergedVCs ) { // only operate at the start of events if ( mergedVC == null ) continue; diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/variantutils/LiftoverVariants.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/variantutils/LiftoverVariants.java index 1c76a21ea..a932d44ed 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/variantutils/LiftoverVariants.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/variantutils/LiftoverVariants.java @@ -99,7 +99,7 @@ public class LiftoverVariants extends RodWalker { final VCFHeader vcfHeader = new VCFHeader(metaData, samples); - writer = new StandardVCFWriter(file, false); + writer = new StandardVCFWriter(file, getMasterSequenceDictionary(), false); writer.writeHeader(vcfHeader); } diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/variantutils/RandomlySplitVariants.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/variantutils/RandomlySplitVariants.java index 1fefd20fc..88de12f9a 100755 --- 
a/public/java/src/org/broadinstitute/sting/gatk/walkers/variantutils/RandomlySplitVariants.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/variantutils/RandomlySplitVariants.java @@ -58,15 +58,12 @@ public class RandomlySplitVariants extends RodWalker { @Argument(fullName="fractionToOut1", shortName="fraction", doc="Fraction of records to be placed in out1 (must be 0 >= fraction <= 1); all other records are placed in out2", required=false) protected double fraction = 0.5; - protected int iFraction; - /** * Set up the VCF writer, the sample expressions and regexs, and the JEXL matcher */ public void initialize() { if ( fraction < 0.0 || fraction > 1.0 ) throw new UserException.BadArgumentValue("fractionToOut1", "this value needs to be a number between 0 and 1"); - iFraction = (int)(fraction * 1000.0); // setup the header info final List inputNames = Arrays.asList(variantCollection.variants.getName()); @@ -75,7 +72,7 @@ public class RandomlySplitVariants extends RodWalker { hInfo.addAll(VCFUtils.getHeaderFields(getToolkit(), inputNames)); vcfWriter1.writeHeader(new VCFHeader(hInfo, samples)); - vcfWriter2 = new StandardVCFWriter(file2, true); + vcfWriter2 = new StandardVCFWriter(file2, getMasterSequenceDictionary(), true); vcfWriter2.writeHeader(new VCFHeader(hInfo, samples)); } @@ -93,8 +90,8 @@ public class RandomlySplitVariants extends RodWalker { Collection vcs = tracker.getValues(variantCollection.variants, context.getLocation()); for ( VariantContext vc : vcs ) { - int random = GenomeAnalysisEngine.getRandomGenerator().nextInt(1000); - if ( random < iFraction ) + double random = GenomeAnalysisEngine.getRandomGenerator().nextDouble(); + if ( random < fraction ) vcfWriter1.add(vc); else vcfWriter2.add(vc); @@ -107,5 +104,8 @@ public class RandomlySplitVariants extends RodWalker { public Integer reduce(Integer value, Integer sum) { return value + sum; } - public void onTraversalDone(Integer result) { logger.info(result + " records processed."); } 
+ public void onTraversalDone(Integer result) { + logger.info(result + " records processed."); + vcfWriter2.close(); + } } diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/variantutils/SelectVariants.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/variantutils/SelectVariants.java index 459ffb75e..609593acc 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/variantutils/SelectVariants.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/variantutils/SelectVariants.java @@ -255,14 +255,6 @@ public class SelectVariants extends RodWalker { @Argument(fullName="keepOriginalAC", shortName="keepOriginalAC", doc="Don't update the AC, AF, or AN values in the INFO field after selecting", required=false) private boolean KEEP_ORIGINAL_CHR_COUNTS = false; - @Hidden - @Argument(fullName="keepAFSpectrum", shortName="keepAF", doc="Don't include loci found to be non-variant after the subsetting procedure", required=false) - private boolean KEEP_AF_SPECTRUM = false; - - @Hidden - @Argument(fullName="afFile", shortName="afFile", doc="The output recal file used by ApplyRecalibration", required=false) - private File AF_FILE = new File(""); - @Hidden @Argument(fullName="family_structure_file", shortName="familyFile", doc="use -family unless you know what you're doing", required=false) private File FAMILY_STRUCTURE_FILE = null; @@ -442,7 +434,7 @@ public class SelectVariants extends RodWalker { mvSet.add(mv); } } catch ( FileNotFoundException e ) { - throw new UserException.CouldNotReadInputFile(AF_FILE, e); + throw new UserException.CouldNotReadInputFile(FAMILY_STRUCTURE_FILE, e); } if (outMVFile != null) try { @@ -452,7 +444,7 @@ public class SelectVariants extends RodWalker { throw new UserException.CouldNotCreateOutputFile(outMVFile, "Can't open output file", e); } } else - mvSet.add(new MendelianViolation(getToolkit(), MENDELIAN_VIOLATION_QUAL_THRESHOLD)); + mvSet.add(new MendelianViolation(FAMILY_STRUCTURE, 
MENDELIAN_VIOLATION_QUAL_THRESHOLD)); } else if (!FAMILY_STRUCTURE.isEmpty()) { mvSet.add(new MendelianViolation(FAMILY_STRUCTURE, MENDELIAN_VIOLATION_QUAL_THRESHOLD)); @@ -469,31 +461,7 @@ public class SelectVariants extends RodWalker { if (SELECT_RANDOM_FRACTION) logger.info("Selecting approximately " + 100.0*fractionRandom + "% of the variants at random from the variant track"); - if (KEEP_AF_SPECTRUM) { - try { - afBreakpoints = new ArrayList(); - afBoosts = new ArrayList(); - logger.info("Reading in AF boost table..."); - boolean firstLine = false; - for ( final String line : new XReadLines( AF_FILE ) ) { - if (!firstLine) { - firstLine = true; - continue; - } - final String[] vals = line.split(" "); - double bkp = Double.valueOf(vals[0]); - double afb = Double.valueOf(vals[1]); - afBreakpoints.add(bkp); - afBoosts.add(afb); - - } - bkDelta = afBreakpoints.get(0); - } catch ( FileNotFoundException e ) { - throw new UserException.CouldNotReadInputFile(AF_FILE, e); - } - - } } /** @@ -566,61 +534,11 @@ public class SelectVariants extends RodWalker { if (SELECT_RANDOM_NUMBER) { randomlyAddVariant(++variantNumber, sub, ref.getBase()); } - else if (!SELECT_RANDOM_FRACTION || (!KEEP_AF_SPECTRUM && GenomeAnalysisEngine.getRandomGenerator().nextDouble() < fractionRandom)) { + else if (!SELECT_RANDOM_FRACTION || ( GenomeAnalysisEngine.getRandomGenerator().nextDouble() < fractionRandom)) { vcfWriter.add(sub); } - else { - if (SELECT_RANDOM_FRACTION && KEEP_AF_SPECTRUM ) { - // ok we have a comp VC and we need to match the AF spectrum of inputAFRodName. 
- // We then pick a variant with probablity AF*desiredFraction - if ( sub.hasAttribute(VCFConstants.ALLELE_FREQUENCY_KEY) ) { - String afo = sub.getAttributeAsString(VCFConstants.ALLELE_FREQUENCY_KEY); - - double af; - double afBoost = 1.0; - if (afo.contains(",")) { - String[] afs = afo.split(","); - afs[0] = afs[0].substring(1,afs[0].length()); - afs[afs.length-1] = afs[afs.length-1].substring(0,afs[afs.length-1].length()-1); - - double[] afd = new double[afs.length]; - - for (int k=0; k < afd.length; k++) - afd[k] = Double.valueOf(afs[k]); - - af = MathUtils.arrayMax(afd); - //af = Double.valueOf(afs[0]); - - } - else - af = Double.valueOf(afo); - - // now boost af by table read from file if desired - //double bkpt = 0.0; - int bkidx = 0; - if (!afBreakpoints.isEmpty()) { - for ( Double bkpt : afBreakpoints) { - if (af < bkpt + bkDelta) - break; - else bkidx++; - } - if (bkidx >=afBoosts.size()) - bkidx = afBoosts.size()-1; - afBoost = afBoosts.get(bkidx); - //System.out.formatPrin("af:%f bkidx:%d afboost:%f\n",af,bkidx,afBoost); - - } - - //System.out.format("%s .. 
%4.4f\n",afo.toString(), af); - if (GenomeAnalysisEngine.getRandomGenerator().nextDouble() < fractionRandom * afBoost * afBoost) - vcfWriter.add(sub); - } - - - } - } } } @@ -638,9 +556,9 @@ public class SelectVariants extends RodWalker { if (vc == null) return false; - // if we're not looking at specific samples then the absense of a compVC means discordance - if (NO_SAMPLES_SPECIFIED && (compVCs == null || compVCs.isEmpty())) - return true; + // if we're not looking at specific samples then the absence of a compVC means discordance + if (NO_SAMPLES_SPECIFIED) + return (compVCs == null || compVCs.isEmpty()); // check if we find it in the variant rod Map genotypes = vc.getGenotypes(samples); diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/variantutils/VariantValidationAssessor.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/variantutils/VariantValidationAssessor.java index 8eaf976d0..4e6cc722d 100644 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/variantutils/VariantValidationAssessor.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/variantutils/VariantValidationAssessor.java @@ -237,7 +237,7 @@ public class VariantValidationAssessor extends RodWalker infoMap.put("HomVarPct", String.format("%.1f", 100.0*homVarProp)); infoMap.put("HetPct", String.format("%.1f", 100.0*hetProp)); infoMap.put("HW", String.format("%.2f", hwScore)); - Set altAlleles = vContext.getAlternateAlleles(); + Collection altAlleles = vContext.getAlternateAlleles(); int altAlleleCount = altAlleles.size() == 0 ? 
0 : vContext.getChromosomeCount(altAlleles.iterator().next()); if ( !isViolation && altAlleleCount > 0 ) numTrueVariants++; diff --git a/public/java/src/org/broadinstitute/sting/gatk/walkers/variantutils/VariantsToTable.java b/public/java/src/org/broadinstitute/sting/gatk/walkers/variantutils/VariantsToTable.java index 2a877fb09..454909634 100755 --- a/public/java/src/org/broadinstitute/sting/gatk/walkers/variantutils/VariantsToTable.java +++ b/public/java/src/org/broadinstitute/sting/gatk/walkers/variantutils/VariantsToTable.java @@ -27,6 +27,7 @@ package org.broadinstitute.sting.gatk.walkers.variantutils; import org.broadinstitute.sting.commandline.*; import org.broadinstitute.sting.gatk.arguments.StandardVariantContextInputArgumentCollection; import org.broadinstitute.sting.utils.MathUtils; +import org.broadinstitute.sting.utils.variantcontext.Allele; import org.broadinstitute.sting.utils.variantcontext.VariantContext; import org.broadinstitute.sting.gatk.contexts.AlignmentContext; import org.broadinstitute.sting.gatk.contexts.ReferenceContext; @@ -65,12 +66,14 @@ import java.util.*; * *

    Output

    *

    - * A table deliminated file containing the values of the requested fields in the VCF file + * A tab-delimited file containing the values of the requested fields in the VCF file *

    * *

    Examples

    *
    - *     -T $WalkerName \
    + *     java -jar GenomeAnalysisTK.jar \
    + *     -R reference.fasta
    + *     -T VariantsToTable \
      *     -V file.vcf \
      *     -F CHROM -F POS -F ID -F QUAL -F AC \
      *     -o results.table
    @@ -103,7 +106,7 @@ public class VariantsToTable extends RodWalker {
     
         /**
          * By default this tool only emits values for fields where the FILTER field is either PASS or . (unfiltered).
    -     * Throwing this flag will cause $WalkerName to emit values regardless of the FILTER field value.
    +     * Throwing this flag will cause VariantsToTable to emit values regardless of the FILTER field value.
          */
         @Advanced
         @Argument(fullName="showFiltered", shortName="raw", doc="If provided, field values from filtered records will be included in the output", required=false)
    @@ -133,7 +136,7 @@ public class VariantsToTable extends RodWalker {
     
         /**
          * By default, this tool throws a UserException when it encounters a field without a value in some record.  This
    -     * is generally useful when you mistype -F CHRMO, so that you get a friendly warning about CHRMO not being
    +     * is generally useful when you mistype -F CHROM, so that you get a friendly warning about CHROM not being
          * found before the tool runs through 40M 1000G records.  However, in some cases you genuinely want to allow such
          * fields (e.g., AC not being calculated for filtered records, if included).  When provided, this argument
          * will cause VariantsToTable to write out NA values for missing fields instead of throwing an error.
    @@ -192,7 +195,7 @@ public class VariantsToTable extends RodWalker {
                 if ( getters.containsKey(field) ) {
                     val = getters.get(field).get(vc);
                 } else if ( vc.hasAttribute(field) ) {
    -                val = vc.getAttributeAsString(field);
    +                val = vc.getAttributeAsString(field, null);
                 } else if ( isWildCard(field) ) {
                     Set wildVals = new HashSet();
                     for ( Map.Entry elt : vc.getAttributes().entrySet()) {
    @@ -294,6 +297,14 @@ public class VariantsToTable extends RodWalker {
                     return x.toString();
                 }
             });
    +        getters.put("EVENTLENGTH", new Getter() { public String get(VariantContext vc) {
    +            int maxLength = 0;
    +            for ( final Allele a : vc.getAlternateAlleles() ) {
    +                final int length = a.length() - vc.getReference().length();
    +                if( Math.abs(length) > Math.abs(maxLength) ) { maxLength = length; }
    +            }
    +            return Integer.toString(maxLength);
    +        }});
             getters.put("QUAL", new Getter() { public String get(VariantContext vc) { return Double.toString(vc.getPhredScaledQual()); } });
             getters.put("TRANSITION", new Getter() { public String get(VariantContext vc) {
                 if ( vc.isSNP() && vc.isBiallelic() )
    @@ -304,11 +315,12 @@ public class VariantsToTable extends RodWalker {
             getters.put("FILTER", new Getter() { public String get(VariantContext vc) {
                 return vc.isNotFiltered() ? "PASS" : Utils.join(",", vc.getFilters()); }
             });
    -
    +        getters.put("ID", new Getter() { public String get(VariantContext vc) { return vc.hasID() ? vc.getID() : "."; } });
             getters.put("HET", new Getter() { public String get(VariantContext vc) { return Integer.toString(vc.getHetCount()); } });
             getters.put("HOM-REF", new Getter() { public String get(VariantContext vc) { return Integer.toString(vc.getHomRefCount()); } });
             getters.put("HOM-VAR", new Getter() { public String get(VariantContext vc) { return Integer.toString(vc.getHomVarCount()); } });
             getters.put("NO-CALL", new Getter() { public String get(VariantContext vc) { return Integer.toString(vc.getNoCallCount()); } });
    +        getters.put("TYPE", new Getter() { public String get(VariantContext vc) { return vc.getType().toString(); } });
             getters.put("VAR", new Getter() { public String get(VariantContext vc) { return Integer.toString(vc.getHetCount() + vc.getHomVarCount()); } });
             getters.put("NSAMPLES", new Getter() { public String get(VariantContext vc) { return Integer.toString(vc.getNSamples()); } });
             getters.put("NCALLED", new Getter() { public String get(VariantContext vc) { return Integer.toString(vc.getNSamples() - vc.getNoCallCount()); } });
    diff --git a/public/java/src/org/broadinstitute/sting/utils/GenomeLoc.java b/public/java/src/org/broadinstitute/sting/utils/GenomeLoc.java
    index b96923589..c1479bc69 100644
    --- a/public/java/src/org/broadinstitute/sting/utils/GenomeLoc.java
    +++ b/public/java/src/org/broadinstitute/sting/utils/GenomeLoc.java
    @@ -5,6 +5,10 @@ import com.google.java.contract.Requires;
     import org.broadinstitute.sting.utils.exceptions.ReviewedStingException;
     
     import java.io.Serializable;
    +import java.util.ArrayList;
    +import java.util.Arrays;
    +import java.util.Collections;
    +import java.util.List;
     
     /**
      * Created by IntelliJ IDEA.
    @@ -174,6 +178,8 @@ public class GenomeLoc implements Comparable, Serializable, HasGenome
             return new GenomeLoc[] { new GenomeLoc(getContig(),contigIndex,getStart(),splitPoint-1), new GenomeLoc(getContig(),contigIndex,splitPoint,getStop()) };
         }
     
    +    public GenomeLoc union( GenomeLoc that ) { return merge(that); }
    +
         @Requires("that != null")
         @Ensures("result != null")
         public GenomeLoc intersect( GenomeLoc that ) throws ReviewedStingException {
    @@ -192,6 +198,79 @@ public class GenomeLoc implements Comparable, Serializable, HasGenome
                                  Math.min( getStop(), that.getStop()) );
         }
     
    +    @Requires("that != null")
    +    public final List subtract( final GenomeLoc that ) {
    +        if(GenomeLoc.isUnmapped(this) || GenomeLoc.isUnmapped(that)) {
    +            if(! GenomeLoc.isUnmapped(this) || !GenomeLoc.isUnmapped(that))
    +                throw new ReviewedStingException("Tried to intersect a mapped and an unmapped genome loc");
    +            return Arrays.asList(UNMAPPED);
    +        }
    +
    +        if (!(this.overlapsP(that))) {
    +            throw new ReviewedStingException("GenomeLoc::minus(): The two genome loc's need to overlap");
    +        }
    +
    +        if (equals(that)) {
    +            return Collections.emptyList();
    +        } else if (containsP(that)) {
    +            List l = new ArrayList(2);
    +
    +            /**
    +             * we have to create two new region, one for the before part, one for the after
    +             * The old region:
    +             * |----------------- old region (g) -------------|
    +             *        |----- to delete (e) ------|
    +             *
    +             * product (two new regions):
    +             * |------|  + |--------|
    +             *
    +             */
    +            int afterStop = this.getStop(), afterStart = that.getStop() + 1;
    +            int beforeStop = that.getStart() - 1, beforeStart = this.getStart();
    +            if (afterStop - afterStart >= 0) {
    +                GenomeLoc after = new GenomeLoc(this.getContig(), getContigIndex(), afterStart, afterStop);
    +                l.add(after);
    +            }
    +            if (beforeStop - beforeStart >= 0) {
    +                GenomeLoc before = new GenomeLoc(this.getContig(), getContigIndex(), beforeStart, beforeStop);
    +                l.add(before);
    +            }
    +
    +            return l;
    +        } else if (that.containsP(this)) {
    +            /**
    +             * e completely contains g, delete g, but keep looking, there may be more regions
    +             * i.e.:
    +             *   |--------------------- e --------------------|
    +             *       |--- g ---|    |---- others ----|
    +             */
    +            return Collections.emptyList();   // don't need to do anything
    +        } else {
    +            /**
    +             * otherwise e overlaps some part of g
    +             *
    +             * figure out which region occurs first on the genome.  I.e., is it:
    +             * |------------- g ----------|
    +             *       |------------- e ----------|
    +             *
    +             * or:
    +             *       |------------- g ----------|
    +             * |------------ e -----------|
    +             *
    +             */
    +
    +            GenomeLoc n;
    +            if (that.getStart() < this.getStart()) {
    +                n = new GenomeLoc(this.getContig(), getContigIndex(), that.getStop() + 1, this.getStop());
    +            } else {
    +                n = new GenomeLoc(this.getContig(), getContigIndex(), this.getStart(), that.getStart() - 1);
    +            }
    +
    +            // replace g with the new region
    +            return Arrays.asList(n);
    +        }
    +    }
    +
         @Requires("that != null")
         public final boolean containsP(GenomeLoc that) {
             return onSameContig(that) && getStart() <= that.getStart() && getStop() >= that.getStop();
    @@ -203,19 +282,14 @@ public class GenomeLoc implements Comparable, Serializable, HasGenome
         }
     
         @Requires("that != null")
    -    public final int minus( final GenomeLoc that ) {
    +    @Ensures("result >= 0")
    +    public final int distance( final GenomeLoc that ) {
             if ( this.onSameContig(that) )
    -            return this.getStart() - that.getStart();
    +            return Math.abs(this.getStart() - that.getStart());
             else
                 return Integer.MAX_VALUE;
         }
     
    -    @Requires("that != null")
    -    @Ensures("result >= 0")
    -    public final int distance( final GenomeLoc that ) {
    -        return Math.abs(minus(that));
    -    }    
    -
         @Requires({"left != null", "right != null"})
         public final boolean isBetween( final GenomeLoc left, final GenomeLoc right ) {
             return this.compareTo(left) > -1 && this.compareTo(right) < 1;
    @@ -306,7 +380,7 @@ public class GenomeLoc implements Comparable, Serializable, HasGenome
         
         @Override
         public int hashCode() {
    -        return (int)( start << 16 + stop << 4 + contigIndex );
    +        return start << 16 | stop << 4 | contigIndex;
         }
     
     
    diff --git a/public/java/src/org/broadinstitute/sting/utils/GenomeLocComparator.java b/public/java/src/org/broadinstitute/sting/utils/GenomeLocComparator.java
    new file mode 100644
    index 000000000..7aa9fdd65
    --- /dev/null
    +++ b/public/java/src/org/broadinstitute/sting/utils/GenomeLocComparator.java
    @@ -0,0 +1,56 @@
    +package org.broadinstitute.sting.utils;
    +
    +import com.google.java.contract.Ensures;
    +import com.google.java.contract.Requires;
    +
    +import java.util.Comparator;
    +
    +/**
    + *
    + * @author Mauricio Carneiro
    + * @since 9/28/11
    + */
    +public class GenomeLocComparator implements Comparator {
    +    /**
    +     * compares genomeLoc's contigs
    +     *
    +     * @param gl1 the genome loc to compare contigs
    +     * @param gl2 the genome loc to compare contigs
    +     * @return 0 if equal, -1 if gl2.contig is greater, 1 if gl1.contig is greater
    +     */
    +    @Requires("gl2 != null")
    +    @Ensures("result == 0 || result == 1 || result == -1")
    +    public final int compareContigs( GenomeLoc gl1, GenomeLoc gl2 ) {
    +        if (gl1.contigIndex == gl2.contigIndex)
    +            return 0;
    +        else if (gl1.contigIndex > gl2.contigIndex)
    +            return 1;
    +        return -1;
    +    }
    +
    +    @Requires("gl2 != null")
    +    @Ensures("result == 0 || result == 1 || result == -1")
    +    public int compare ( GenomeLoc gl1, GenomeLoc gl2 ) {
    +        int result = 0;
    +
    +        if ( gl1 == gl2 ) {
    +            result = 0;
    +        }
    +        else if(GenomeLoc.isUnmapped(gl1))
    +            result = 1;
    +        else if(GenomeLoc.isUnmapped(gl2))
    +            result = -1;
    +        else {
    +            final int cmpContig = compareContigs(gl1, gl2);
    +
    +            if ( cmpContig != 0 ) {
    +                result = cmpContig;
    +            } else {
    +                if ( gl1.getStart() < gl2.getStart() ) result = -1;
    +                if ( gl1.getStart() > gl2.getStart() ) result = 1;
    +            }
    +        }
    +
    +        return result;
    +    }
    +}
    diff --git a/public/java/src/org/broadinstitute/sting/utils/GenomeLocSortedSet.java b/public/java/src/org/broadinstitute/sting/utils/GenomeLocSortedSet.java
    index fd7a79f48..26be0e59e 100755
    --- a/public/java/src/org/broadinstitute/sting/utils/GenomeLocSortedSet.java
    +++ b/public/java/src/org/broadinstitute/sting/utils/GenomeLocSortedSet.java
    @@ -215,7 +215,7 @@ public class GenomeLocSortedSet extends AbstractSet {
     
                 if ( p.overlapsP(e) ) {
                     toProcess.pop();
    -                for ( GenomeLoc newP : subtractRegion(p, e) )
    +                for ( GenomeLoc newP : p.subtract(e) )
                         toProcess.push(newP);
                 } else if ( p.compareContigs(e) < 0 ) {
                     good.add(toProcess.pop());         // p is now good
    @@ -236,69 +236,6 @@ public class GenomeLocSortedSet extends AbstractSet {
             return createSetFromList(genomeLocParser,good);
         }
     
    -    private static final List EMPTY_LIST = new ArrayList();
    -    private List subtractRegion(GenomeLoc g, GenomeLoc e) {
    -        if (g.equals(e)) {
    -            return EMPTY_LIST;
    -        } else if (g.containsP(e)) {
    -            List l = new ArrayList();
    -
    -            /**
    -             * we have to create two new region, one for the before part, one for the after
    -             * The old region:
    -             * |----------------- old region (g) -------------|
    -             *        |----- to delete (e) ------|
    -             *
    -             * product (two new regions):
    -             * |------|  + |--------|
    -             *
    -             */
    -            int afterStop = g.getStop(), afterStart = e.getStop() + 1;
    -            int beforeStop = e.getStart() - 1, beforeStart = g.getStart();
    -            if (afterStop - afterStart >= 0) {
    -                GenomeLoc after = genomeLocParser.createGenomeLoc(g.getContig(), afterStart, afterStop);
    -                l.add(after);
    -            }
    -            if (beforeStop - beforeStart >= 0) {
    -                GenomeLoc before = genomeLocParser.createGenomeLoc(g.getContig(), beforeStart, beforeStop);
    -                l.add(before);
    -            }
    -
    -            return l;
    -        } else if (e.containsP(g)) {
    -            /**
    -             * e completely contains g, delete g, but keep looking, there may be more regions
    -             * i.e.:
    -             *   |--------------------- e --------------------|
    -             *       |--- g ---|    |---- others ----|
    -             */
    -            return EMPTY_LIST;   // don't need to do anything
    -        } else {
    -            /**
    -             * otherwise e overlaps some part of g
    -             *
    -             * figure out which region occurs first on the genome.  I.e., is it:
    -             * |------------- g ----------|
    -             *       |------------- e ----------|
    -             *
    -             * or:
    -             *       |------------- g ----------|
    -             * |------------ e -----------|
    -             *
    -             */
    -
    -            GenomeLoc n;
    -            if (e.getStart() < g.getStart()) {
    -                n = genomeLocParser.createGenomeLoc(g.getContig(), e.getStop() + 1, g.getStop());
    -            } else {
    -                n = genomeLocParser.createGenomeLoc(g.getContig(), g.getStart(), e.getStart() - 1);
    -            }
    -
    -            // replace g with the new region
    -            return Arrays.asList(n);
    -        }
    -    }
    -
     
         /**
          * a simple removal of an interval contained in this list.  The interval must be identical to one in the list (no partial locations or overlapping)
    diff --git a/public/java/src/org/broadinstitute/sting/utils/genotype/Haplotype.java b/public/java/src/org/broadinstitute/sting/utils/Haplotype.java
    similarity index 98%
    rename from public/java/src/org/broadinstitute/sting/utils/genotype/Haplotype.java
    rename to public/java/src/org/broadinstitute/sting/utils/Haplotype.java
    index a17e81461..ce2ca2c28 100755
    --- a/public/java/src/org/broadinstitute/sting/utils/genotype/Haplotype.java
    +++ b/public/java/src/org/broadinstitute/sting/utils/Haplotype.java
    @@ -22,10 +22,9 @@
      * OTHER DEALINGS IN THE SOFTWARE.
      */
     
    -package org.broadinstitute.sting.utils.genotype;
    +package org.broadinstitute.sting.utils;
     
     import org.broadinstitute.sting.gatk.contexts.ReferenceContext;
    -import org.broadinstitute.sting.utils.GenomeLoc;
     import org.broadinstitute.sting.utils.exceptions.ReviewedStingException;
     import org.broadinstitute.sting.utils.variantcontext.Allele;
     
    diff --git a/public/java/src/org/broadinstitute/sting/utils/MathUtils.java b/public/java/src/org/broadinstitute/sting/utils/MathUtils.java
    index 0d85f9606..17f458f31 100644
    --- a/public/java/src/org/broadinstitute/sting/utils/MathUtils.java
    +++ b/public/java/src/org/broadinstitute/sting/utils/MathUtils.java
    @@ -408,12 +408,12 @@ public class MathUtils {
             return Math.sqrt(rms);
         }
     
    -    public static double rms(Collection l) {
    +    public static double rms(Collection l) {
             if (l.size() == 0)
                 return 0.0;
     
             double rms = 0.0;
    -        for (Double i : l)
    +        for (int i : l)
                 rms += i*i;
             rms /= l.size();
             return Math.sqrt(rms);
    @@ -444,11 +444,25 @@ public class MathUtils {
          * @return a newly allocated array corresponding the normalized values in array, maybe log10 transformed
         */
         public static double[] normalizeFromLog10(double[] array, boolean takeLog10OfOutput) {
    -        double[] normalized = new double[array.length];
    +        return normalizeFromLog10(array, takeLog10OfOutput, false);
    +    }
    +
    +    public static double[] normalizeFromLog10(double[] array, boolean takeLog10OfOutput, boolean keepInLogSpace) {
     
             // for precision purposes, we need to add (or really subtract, since they're
             // all negative) the largest value; also, we need to convert to normal-space.
             double maxValue = Utils.findMaxEntry(array);
    +
    +        // we may decide to just normalize in log space with converting to linear space
    +        if (keepInLogSpace) {
    +            for (int i = 0; i < array.length; i++)
    +                array[i] -= maxValue;
    +            return array;
    +        }
    +
    +        // default case: go to linear space
    +        double[] normalized = new double[array.length];
    +
             for (int i = 0; i < array.length; i++)
                 normalized[i] = Math.pow(10, array[i] - maxValue);
     
    diff --git a/public/java/src/org/broadinstitute/sting/utils/MendelianViolation.java b/public/java/src/org/broadinstitute/sting/utils/MendelianViolation.java
    index c6a07b5ce..cf45dab79 100755
    --- a/public/java/src/org/broadinstitute/sting/utils/MendelianViolation.java
    +++ b/public/java/src/org/broadinstitute/sting/utils/MendelianViolation.java
    @@ -1,7 +1,6 @@
     package org.broadinstitute.sting.utils;
     
    -import org.broadinstitute.sting.gatk.GenomeAnalysisEngine;
    -import org.broadinstitute.sting.gatk.datasources.sample.Sample;
    +import org.broadinstitute.sting.gatk.samples.Sample;
     import org.broadinstitute.sting.utils.exceptions.UserException;
     import org.broadinstitute.sting.utils.variantcontext.Genotype;
     import org.broadinstitute.sting.utils.variantcontext.VariantContext;
    @@ -17,9 +16,6 @@ import java.util.regex.Pattern;
      * Time: 12:38 PM
      */
     public class MendelianViolation {
    -
    -
    -
         String sampleMom;
         String sampleDad;
         String sampleChild;
    @@ -30,21 +26,20 @@ public class MendelianViolation {
     
         double minGenotypeQuality;
     
    -    private static Pattern FAMILY_PATTERN = Pattern.compile("(.*)\\+(.*)=(.*)");
    +    static final int[] mvOffsets = new int[] { 1,2,5,6,8,11,15,18,20,21,24,25 };
    +    static final int[] nonMVOffsets = new int[]{ 0,3,4,7,9,10,12,13,14,16,17,19,22,23,26 };
     
    +    private static Pattern FAMILY_PATTERN = Pattern.compile("(.*)\\+(.*)=(.*)");
     
         public String getSampleMom() {
             return sampleMom;
         }
    -
         public String getSampleDad() {
             return sampleDad;
         }
    -
         public String getSampleChild() {
             return sampleChild;
         }
    -
         public double getMinGenotypeQuality() {
             return minGenotypeQuality;
         }
    @@ -85,37 +80,12 @@ public class MendelianViolation {
          * @param minGenotypeQualityP - the minimum phred scaled genotype quality score necessary to asses mendelian violation
          */
         public MendelianViolation(Sample sample, double minGenotypeQualityP) {
    -        sampleMom = sample.getMother().getId();
    -        sampleDad = sample.getFather().getId();
    -        sampleChild = sample.getId();
    +        sampleMom = sample.getMother().getID();
    +        sampleDad = sample.getFather().getID();
    +        sampleChild = sample.getID();
             minGenotypeQuality = minGenotypeQualityP;
         }
     
    -
    -    /**
    -     * The most common constructor to be used when give a YAML file with the relationships to the engine with the -SM option.
    -     * @param engine - The GATK engine, use getToolkit(). That's where the sample information is stored.
    -     * @param minGenotypeQualityP - the minimum phred scaled genotype quality score necessary to asses mendelian violation
    -     */
    -    public MendelianViolation(GenomeAnalysisEngine engine, double minGenotypeQualityP) {
    -        boolean gotSampleInformation = false;
    -        Collection samples = engine.getSamples();
    -        // Iterate through all samples in the sample_metadata file but we really can only take one.
    -        for (Sample sample : samples) {
    -            if (sample.getMother() != null && sample.getFather() != null) {
    -                sampleMom = sample.getMother().getId();
    -                sampleDad = sample.getFather().getId();
    -                sampleChild = sample.getId();
    -                minGenotypeQuality = minGenotypeQualityP;
    -                gotSampleInformation = true;
    -                break; // we can only deal with one trio information
    -            }
    -        }
    -        if (!gotSampleInformation)
    -            throw new UserException("YAML file has no sample with relationship information (mother/father)");
    -    }
    -
    -
         /**
          * This method prepares the object to evaluate for violation. Typically you won't call it directly, a call to
          * isViolation(vc) will take care of this. But if you want to know whether your site was a valid comparison site
    @@ -153,7 +123,7 @@ public class MendelianViolation {
          * @return False if we can't determine (lack of information), or it's not a violation. True if it is a violation.
          *
          */
    -    public boolean isViolation (VariantContext vc)
    +    public boolean isViolation(VariantContext vc)
         {
             return setAlleles(vc) && isViolation();
         }
    @@ -168,4 +138,42 @@ public class MendelianViolation {
             return true;
         }
     
    +    /**
    +     * @return the likelihood ratio for a mendelian violation
    +     */
    +    public double violationLikelihoodRatio(VariantContext vc) {
    +        double[] logLikAssignments = new double[27];
    +        // the matrix to set up is
    +        // MOM   DAD    CHILD
    +        //                    |-  AA
    +        //   AA     AA    |    AB
    +        //                    |-   BB
    +        //                    |- AA
    +        //  AA     AB     |   AB
    +        //                    |- BB
    +        // etc. The leaves are counted as 0-11 for MVs and 0-14 for non-MVs
    +        double[] momGL = vc.getGenotype(sampleMom).getLikelihoods().getAsVector();
    +        double[] dadGL = vc.getGenotype(sampleDad).getLikelihoods().getAsVector();
    +        double[] childGL = vc.getGenotype(sampleChild).getLikelihoods().getAsVector();
    +        int offset = 0;
    +        for ( int oMom = 0; oMom < 3; oMom++ ) {
    +            for ( int oDad = 0; oDad < 3; oDad++ ) {
    +                for ( int oChild = 0; oChild < 3; oChild ++ ) {
    +                    logLikAssignments[offset++] = momGL[oMom] + dadGL[oDad] + childGL[oChild];
    +                }
    +            }
    +        }
    +        double[] mvLiks = new double[12];
    +        double[] nonMVLiks = new double[15];
    +        for ( int i = 0; i < 12; i ++ ) {
    +            mvLiks[i] = logLikAssignments[mvOffsets[i]];
    +        }
    +
    +        for ( int i = 0; i < 15; i++) {
    +            nonMVLiks[i] = logLikAssignments[nonMVOffsets[i]];
    +        }
    +
    +        return MathUtils.log10sumLog10(mvLiks) - MathUtils.log10sumLog10(nonMVLiks);
    +    }
    +
     }
    diff --git a/public/java/src/org/broadinstitute/sting/utils/NGSPlatform.java b/public/java/src/org/broadinstitute/sting/utils/NGSPlatform.java
    new file mode 100644
    index 000000000..4f01f2b7a
    --- /dev/null
    +++ b/public/java/src/org/broadinstitute/sting/utils/NGSPlatform.java
    @@ -0,0 +1,108 @@
    +/*
    + * Copyright (c) 2011, The Broad Institute
    + *
    + * Permission is hereby granted, free of charge, to any person
    + * obtaining a copy of this software and associated documentation
    + * files (the "Software"), to deal in the Software without
    + * restriction, including without limitation the rights to use,
    + * copy, modify, merge, publish, distribute, sublicense, and/or sell
    + * copies of the Software, and to permit persons to whom the
    + * Software is furnished to do so, subject to the following
    + * conditions:
    + *
    + * The above copyright notice and this permission notice shall be
    + * included in all copies or substantial portions of the Software.
    + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
    + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
    + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
    + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
    + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
    + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
    + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
    + * OTHER DEALINGS IN THE SOFTWARE.
    + */
    +
    +package org.broadinstitute.sting.utils;
    +
    +import net.sf.samtools.SAMReadGroupRecord;
    +import net.sf.samtools.SAMRecord;
    +
    +/**
    + * A canonical, master list of the standard NGS platforms.  These values
    + * can be obtained (efficiently) from a GATKSAMRecord object with the
    + * getNGSPlatform method.
    + *
    + * @author Mark DePristo
    + * @since 2011
    + */
    +public enum NGSPlatform {
    +    ILLUMINA("ILLUMINA", "SLX", "SOLEXA"),
    +    SOLID("SOLID"),
    +    LS454("454"),
    +    COMPLETE_GENOMICS("COMPLETE"),
    +    PACBIO("PACBIO"),
    +    ION_TORRENT("IONTORRENT"),
    +    UNKNOWN("UNKNOWN");
    +
    +    /**
    +     * Array of the prefix names in a BAM file for each of the platforms.
    +     */
    +    private final String[] BAM_PL_NAMES;
    +
    +    NGSPlatform(final String... BAM_PL_NAMES) {
    +        for ( int i = 0; i < BAM_PL_NAMES.length; i++ )
    +            BAM_PL_NAMES[i] = BAM_PL_NAMES[i].toUpperCase();
    +        this.BAM_PL_NAMES = BAM_PL_NAMES;
    +    }
    +
    +    /**
    +     * Returns a representative PL string for this platform
    +     * @return
    +     */
    +    public final String getDefaultPlatform() {
    +        return BAM_PL_NAMES[0];
    +    }
    +
    +    /**
    +     * Convenience constructor -- calculates the NGSPlatfrom from a SAMRecord.
    +     * Note you should not use this function if you have a GATKSAMRecord -- use the
    +     * accessor method instead.
    +     *
    +     * @param read
    +     * @return an NGSPlatform object matching the PL field of the header, of UNKNOWN if there was no match
    +     */
    +    public static final NGSPlatform fromRead(SAMRecord read) {
    +        return fromReadGroup(read.getReadGroup());
    +    }
    +
    +    /**
    +     * Returns the NGSPlatform corresponding to the PL tag in the read group
    +     * @param rg
    +     * @return an NGSPlatform object matching the PL field of the header, of UNKNOWN if there was no match
    +     */
    +    public static final NGSPlatform fromReadGroup(SAMReadGroupRecord rg) {
    +        return fromReadGroupPL(rg.getPlatform());
    +    }
    +
    +    /**
    +     * Returns the NGSPlatform corresponding to the PL tag in the read group
    +     * @param plFromRG -- the PL field (or equivalent) in a ReadGroup object
    +     * @return an NGSPlatform object matching the PL field of the header, of UNKNOWN if there was no match
    +     */
    +    public static final NGSPlatform fromReadGroupPL(final String plFromRG) {
    +        if ( plFromRG == null ) return UNKNOWN;
    +
    +        // todo -- algorithm could be implemented more efficiently, as the list of all
    +        // todo -- names is known upfront, so a decision tree could be used to identify
    +        // todo -- a prefix common to PL
    +        final String pl = plFromRG.toUpperCase();
    +        for ( final NGSPlatform ngsPlatform : NGSPlatform.values() ) {
    +            for ( final String bamPLName : ngsPlatform.BAM_PL_NAMES ) {
    +                if ( pl.contains(bamPLName) )
    +                    return ngsPlatform;
    +            }
    +        }
    +
    +        return UNKNOWN;
    +    }
    +}
    diff --git a/public/java/src/org/broadinstitute/sting/utils/QualityUtils.java b/public/java/src/org/broadinstitute/sting/utils/QualityUtils.java
    index fad2320fc..19e03a19d 100755
    --- a/public/java/src/org/broadinstitute/sting/utils/QualityUtils.java
    +++ b/public/java/src/org/broadinstitute/sting/utils/QualityUtils.java
    @@ -9,14 +9,17 @@ import net.sf.samtools.SAMUtils;
      * @author Kiran Garimella
      */
     public class QualityUtils {
    -
         public final static byte MAX_QUAL_SCORE = SAMUtils.MAX_PHRED_SCORE;
         public final static double MIN_REASONABLE_ERROR = 0.0001;
         public final static byte MAX_REASONABLE_Q_SCORE = 40;
         public final static byte MIN_USABLE_Q_SCORE = 6;
    -
         public final static int MAPPING_QUALITY_UNAVAILABLE = 255;
     
    +    private static double qualToErrorProbCache[] = new double[256];
    +    static {
    +        for (int i = 0; i < 256; i++) qualToErrorProbCache[i] = qualToErrorProbRaw((byte)i);
    +    }
    +
         /**
          * Private constructor.  No instantiating this class!
          */
    @@ -33,10 +36,6 @@ public class QualityUtils {
             return 1.0 - qualToErrorProb(qual);
         }
     
    -    static public double qualToProb(int qual) {
    -        return qualToProb( (double)qual );
    -    }
    -
         static public double qualToProb(double qual) {
             return 1.0 - Math.pow(10.0, qual/(-10.0));
         }
    @@ -48,10 +47,14 @@ public class QualityUtils {
          * @param qual a quality score (0-40)
          * @return a probability (0.0-1.0)
          */
    -    static public double qualToErrorProb(byte qual) {
    +    static public double qualToErrorProbRaw(byte qual) {
             return Math.pow(10.0, ((double) qual)/-10.0);
         }
     
    +    static public double qualToErrorProb(byte qual) {
    +        return qualToErrorProbCache[qual];
    +    }
    +
         /**
          * Convert a probability to a quality score.  Note, this is capped at Q40.
          *
    @@ -110,88 +113,4 @@ public class QualityUtils {
             //return (byte) Math.min(qual, maxQual);
             return (byte) Math.max(Math.min(qual, maxQual), 1);
         }
    -
    -    /**
    -     * Compress a base and a probability into a single byte so that it can be output in a SAMRecord's SQ field.
    -     * Note: the highest probability this function can encode is 64%, so this function should only never be used on the best base hypothesis.
    -     * Another note: the probability encoded here gets rounded to the nearest 1%.
    -     *
    -     * @param baseIndex the base index
    -     * @param prob      the base probability
    -     * @return a byte containing the index and the probability
    -     */
    -    static public byte baseAndProbToCompressedQuality(int baseIndex, double prob) {
    -        byte compressedQual = 0;
    -
    -        compressedQual = (byte) baseIndex;
    -
    -        byte cprob = (byte) (100.0*prob);
    -        byte qualmask = (byte) 252;
    -        compressedQual += ((cprob << 2) & qualmask);
    -        
    -        return compressedQual;
    -    }
    -
    -    /**
    -     * From a compressed base, extract the base index (0:A, 1:C, 2:G, 3:T)
    -     *
    -     * @param compressedQual the compressed quality score, as returned by baseAndProbToCompressedQuality
    -     * @return base index
    -     */
    -    static public int compressedQualityToBaseIndex(byte compressedQual) {
    -        return (int) (compressedQual & 0x3);
    -    }
    -
    -    /**
    -     * From a compressed base, extract the base probability
    -     *
    -     * @param compressedQual the compressed quality score, as returned by baseAndProbToCompressedQuality
    -     * @return the probability
    -     */
    -    static public double compressedQualityToProb(byte compressedQual) {
    -        // Because java natives are signed, extra care must be taken to avoid
    -        // shifting a 1 into the sign bit in the implicit promotion of 2 to an int.
    -        int x2 = ((int) compressedQual) & 0xff;
    -        x2 = (x2 >>> 2);
    -
    -        return ((double) x2)/100.0;
    -    }
    -
    -    /**
    -     * Return the complement of a compressed quality
    -     *
    -     * @param compressedQual  the compressed quality score (as returned by baseAndProbToCompressedQuality)
    -     * @return the complementary compressed quality
    -     */
    -    static public byte complementCompressedQuality(byte compressedQual) {
    -        int baseIndex = compressedQualityToBaseIndex(compressedQual);
    -        double prob = compressedQualityToProb(compressedQual);
    -
    -        return baseAndProbToCompressedQuality(BaseUtils.complementIndex(baseIndex), prob);
    -    }
    -
    -    /**
    -     * Return the reverse complement of a byte array of compressed qualities
    -     *
    -     * @param compressedQuals  a byte array of compressed quality scores
    -     * @return the reverse complement of the byte array
    -     */
    -    static public byte[] reverseComplementCompressedQualityArray(byte[] compressedQuals) {
    -        byte[] rcCompressedQuals = new byte[compressedQuals.length];
    -
    -        for (int pos = 0; pos < compressedQuals.length; pos++) {
    -            rcCompressedQuals[compressedQuals.length - pos - 1] = complementCompressedQuality(compressedQuals[pos]);
    -        }
    -
    -        return rcCompressedQuals;
    -    }
    -
    -    /**
    -     * Return the reverse of a byte array of qualities (compressed or otherwise)
    -     * @param quals   the array of bytes to be reversed
    -     * @return the reverse of the quality array
    -     */
    -    static public byte[] reverseQualityArray( byte[] quals ) {
    -        return Utils.reverse(quals); // no sense in duplicating functionality
    -    }
     }
    diff --git a/public/java/src/org/broadinstitute/sting/utils/R/RScriptExecutor.java b/public/java/src/org/broadinstitute/sting/utils/R/RScriptExecutor.java
    index 58f7942fe..d8176ff4e 100644
    --- a/public/java/src/org/broadinstitute/sting/utils/R/RScriptExecutor.java
    +++ b/public/java/src/org/broadinstitute/sting/utils/R/RScriptExecutor.java
    @@ -25,104 +25,164 @@
     package org.broadinstitute.sting.utils.R;
     
     import org.apache.commons.io.FileUtils;
    +import org.apache.commons.lang.StringUtils;
     import org.apache.log4j.Logger;
    -import org.broadinstitute.sting.commandline.Advanced;
    -import org.broadinstitute.sting.commandline.Argument;
    -import org.broadinstitute.sting.commandline.ArgumentCollection;
    -import org.broadinstitute.sting.gatk.walkers.recalibration.Covariate;
    -import org.broadinstitute.sting.utils.PathUtils;
     import org.broadinstitute.sting.utils.Utils;
    +import org.broadinstitute.sting.utils.exceptions.StingException;
     import org.broadinstitute.sting.utils.exceptions.UserException;
    +import org.broadinstitute.sting.utils.io.IOUtils;
    +import org.broadinstitute.sting.utils.io.Resource;
    +import org.broadinstitute.sting.utils.runtime.ProcessController;
    +import org.broadinstitute.sting.utils.runtime.ProcessSettings;
    +import org.broadinstitute.sting.utils.runtime.RuntimeUtils;
     
     import java.io.File;
    -import java.io.IOException;
    -import java.util.Arrays;
    +import java.util.ArrayList;
     import java.util.List;
     
     /**
    - * Generic service for executing RScripts in the GATK directory
    - *
    - * @author Your Name
    - * @since Date created
    + * Generic service for executing RScripts
      */
     public class RScriptExecutor {
    +    private static final String RSCRIPT_BINARY = "Rscript";
    +    private static final File RSCRIPT_PATH = RuntimeUtils.which(RSCRIPT_BINARY);
    +    public static final boolean RSCRIPT_EXISTS = (RSCRIPT_PATH != null);
    +    private static final String RSCRIPT_MISSING_MESSAGE = "Please add the Rscript directory to your environment ${PATH}";
    +
         /**
          * our log
          */
    -    protected static Logger logger = Logger.getLogger(RScriptExecutor.class);
    +    private static Logger logger = Logger.getLogger(RScriptExecutor.class);
     
    -    public static class RScriptArgumentCollection {
    -        @Advanced
    -        @Argument(fullName = "path_to_Rscript", shortName = "Rscript", doc = "The path to your implementation of Rscript. For Broad users this is maybe /broad/software/free/Linux/redhat_5_x86_64/pkgs/r_2.12.0/bin/Rscript", required = false)
    -        public String PATH_TO_RSCRIPT = "Rscript";
    +    private boolean exceptOnError = false;
    +    private final List libraries = new ArrayList();
    +    private final List scriptResources = new ArrayList();
    +    private final List scriptFiles = new ArrayList();
    +    private final List args = new ArrayList();
     
    -        @Advanced
    -        @Argument(fullName = "path_to_Rresources", shortName = "Rresources", doc = "Path to resources folder holding the Sting R scripts.", required = false)
    -        public List PATH_TO_RESOURCES = Arrays.asList("public/R/", "private/R/");
    -
    -        public RScriptArgumentCollection() {}
    -
    -        /** For testing and convenience */
    -        public RScriptArgumentCollection(final String PATH_TO_RSCRIPT, final List PATH_TO_RESOURCES) {
    -            this.PATH_TO_RSCRIPT = PATH_TO_RSCRIPT;
    -            this.PATH_TO_RESOURCES = PATH_TO_RESOURCES;
    -        }
    -    }
    -
    -    final RScriptArgumentCollection myArgs;
    -    final boolean exceptOnError;
    -
    -    public RScriptExecutor(final RScriptArgumentCollection myArgs, final boolean exceptOnError) {
    -        this.myArgs = myArgs;
    +    public void setExceptOnError(boolean exceptOnError) {
             this.exceptOnError = exceptOnError;
         }
     
    -    public void callRScripts(String scriptName, Object... scriptArgs) {
    -        callRScripts(scriptName, Arrays.asList(scriptArgs));
    +    public void addLibrary(RScriptLibrary library) {
    +        this.libraries.add(library);
         }
     
    -    public void callRScripts(String scriptName, List scriptArgs) {
    -        try {
    -            final File pathToScript = findScript(scriptName);
    -            if ( pathToScript == null ) return; // we failed but shouldn't exception out
    -            final String argString = Utils.join(" ", scriptArgs);
    -            final String cmdLine = Utils.join(" ", Arrays.asList(myArgs.PATH_TO_RSCRIPT, pathToScript, argString));
    -            logger.info("Executing RScript: " + cmdLine);
    -            Runtime.getRuntime().exec(cmdLine).waitFor();
    -        } catch (InterruptedException e) {
    -            generateException(e);
    -        } catch (IOException e) {
    -            generateException("Fatal Exception: Perhaps RScript jobs are being spawned too quickly?", e);
    -        }
    +    public void addScript(Resource script) {
    +        this.scriptResources.add(script);
         }
     
    -    public File findScript(final String scriptName) {
    -        for ( String pathToResource : myArgs.PATH_TO_RESOURCES ) {
    -            final File f = new File(pathToResource + "/" + scriptName);
    -            if ( f.exists() ) {
    -                if ( f.canRead() )
    -                    return f;
    -                else
    -                    generateException("Script exists but couldn't be read: " + scriptName);
    +    public void addScript(File script) {
    +        this.scriptFiles.add(script);
    +    }
    +
    +    /**
    +     * Adds args to the end of the Rscript command line.
    +     * @param args the args.
    +     * @throws NullPointerException if any of the args are null.
    +     */
    +    public void addArgs(Object... args) {
    +        for (Object arg: args)
    +            this.args.add(arg.toString());
    +    }
    +
    +    public String getApproximateCommandLine() {
    +        StringBuilder command = new StringBuilder("Rscript");
    +        for (Resource script: this.scriptResources)
    +            command.append(" (resource)").append(script.getFullPath());
    +        for (File script: this.scriptFiles)
    +            command.append(" ").append(script.getAbsolutePath());
    +        for (String arg: this.args)
    +            command.append(" ").append(arg);
    +        return command.toString();
    +    }
    +
    +    public boolean exec() {
    +        if (!RSCRIPT_EXISTS) {
    +            if (exceptOnError) {
    +                throw new UserException.CannotExecuteRScript(RSCRIPT_MISSING_MESSAGE);
    +            } else {
    +                logger.warn("Skipping: " + getApproximateCommandLine());
    +                return false;
                 }
             }
     
    -        generateException("Couldn't find script: " + scriptName + " in " + myArgs.PATH_TO_RESOURCES);
    -        return null;
    -    }
    +        List tempFiles = new ArrayList();
    +        try {
    +            File tempLibDir = IOUtils.tempDir("R.", ".lib");
    +            tempFiles.add(tempLibDir);
     
    -    private void generateException(String msg) {
    -        generateException(msg, null);
    -    }
    +            StringBuilder expression = new StringBuilder("tempLibDir = '").append(tempLibDir).append("';");
     
    -    private void generateException(Throwable e) {
    -        generateException("", e);
    -    }
    +            if (this.libraries.size() > 0) {
    +                List tempLibraryPaths = new ArrayList();
    +                for (RScriptLibrary library: this.libraries) {
    +                    File tempLibrary = library.writeTemp();
    +                    tempFiles.add(tempLibrary);
    +                    tempLibraryPaths.add(tempLibrary.getAbsolutePath());
    +                }
     
    -    private void generateException(String msg, Throwable e) {
    -        if ( exceptOnError )
    -            throw new UserException(msg, e);
    -        else
    -            logger.warn(msg + (e == null ? "" : ":" + e.getMessage()));
    +                expression.append("install.packages(");
    +                expression.append("pkgs=c('").append(StringUtils.join(tempLibraryPaths, "', '")).append("'), lib=tempLibDir, repos=NULL, type='source', ");
    +                // Install faster by eliminating cruft.
    +                expression.append("INSTALL_opts=c('--no-libs', '--no-data', '--no-help', '--no-demo', '--no-exec')");
    +                expression.append(");");
    +
    +                for (RScriptLibrary library: this.libraries) {
    +                    expression.append("library('").append(library.getLibraryName()).append("', lib.loc=tempLibDir);");
    +                }
    +            }
    +
    +            for (Resource script: this.scriptResources) {
    +                File tempScript = IOUtils.writeTempResource(script);
    +                tempFiles.add(tempScript);
    +                expression.append("source('").append(tempScript.getAbsolutePath()).append("');");
    +            }
    +
    +            for (File script: this.scriptFiles) {
    +                expression.append("source('").append(script.getAbsolutePath()).append("');");
    +            }
    +
    +            String[] cmd = new String[this.args.size() + 3];
    +            int i = 0;
    +            cmd[i++] = RSCRIPT_BINARY;
    +            cmd[i++] = "-e";
    +            cmd[i++] = expression.toString();
    +            for (String arg: this.args)
    +                cmd[i++] = arg;
    +
    +            ProcessSettings processSettings = new ProcessSettings(cmd);
    +            if (logger.isDebugEnabled()) {
    +                processSettings.getStdoutSettings().printStandard(true);
    +                processSettings.getStderrSettings().printStandard(true);
    +            }
    +
    +            ProcessController controller = ProcessController.getThreadLocal();
    +
    +            if (logger.isDebugEnabled()) {
    +                logger.debug("Executing:");
    +                for (String arg: cmd)
    +                    logger.debug("  " + arg);
    +            }
    +            int exitValue = controller.exec(processSettings).getExitValue();
    +            logger.debug("Result: " + exitValue);
    +
    +            if (exitValue != 0)
    +                throw new RScriptExecutorException(
    +                        "RScript exited with " + exitValue +
    +                                (logger.isDebugEnabled() ? "" : ". Run with -l DEBUG for more info."));
    +
    +            return true;
    +        } catch (StingException e) {
    +            if (exceptOnError) {
    +                throw e;
    +            } else {
    +                logger.warn(e.getMessage());
    +                return false;
    +            }
    +        } finally {
    +            for (File temp: tempFiles)
    +                FileUtils.deleteQuietly(temp);
    +        }
         }
     }
    diff --git a/public/java/src/org/broadinstitute/sting/utils/R/RScriptExecutorException.java b/public/java/src/org/broadinstitute/sting/utils/R/RScriptExecutorException.java
    new file mode 100644
    index 000000000..794c3ade4
    --- /dev/null
    +++ b/public/java/src/org/broadinstitute/sting/utils/R/RScriptExecutorException.java
    @@ -0,0 +1,33 @@
    +/*
    + * Copyright (c) 2011, The Broad Institute
    + *
    + * Permission is hereby granted, free of charge, to any person
    + * obtaining a copy of this software and associated documentation
    + * files (the "Software"), to deal in the Software without
    + * restriction, including without limitation the rights to use,
    + * copy, modify, merge, publish, distribute, sublicense, and/or sell
    + * copies of the Software, and to permit persons to whom the
    + * Software is furnished to do so, subject to the following
    + * conditions:
    + *
    + * The above copyright notice and this permission notice shall be
    + * included in all copies or substantial portions of the Software.
    + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
    + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
    + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
    + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
    + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
    + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
    + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
    + * OTHER DEALINGS IN THE SOFTWARE.
    + */
    +
    +package org.broadinstitute.sting.utils.R;
    +
    +import org.broadinstitute.sting.utils.exceptions.ReviewedStingException;
    +
    +public class RScriptExecutorException extends ReviewedStingException {
    +    public RScriptExecutorException(String msg) {
    +        super(msg);
    +    }
    +}
    diff --git a/public/java/src/org/broadinstitute/sting/utils/R/RScriptLibrary.java b/public/java/src/org/broadinstitute/sting/utils/R/RScriptLibrary.java
    new file mode 100644
    index 000000000..60cd7504b
    --- /dev/null
    +++ b/public/java/src/org/broadinstitute/sting/utils/R/RScriptLibrary.java
    @@ -0,0 +1,59 @@
    +/*
    + * Copyright (c) 2011, The Broad Institute
    + *
    + * Permission is hereby granted, free of charge, to any person
    + * obtaining a copy of this software and associated documentation
    + * files (the "Software"), to deal in the Software without
    + * restriction, including without limitation the rights to use,
    + * copy, modify, merge, publish, distribute, sublicense, and/or sell
    + * copies of the Software, and to permit persons to whom the
    + * Software is furnished to do so, subject to the following
    + * conditions:
    + *
    + * The above copyright notice and this permission notice shall be
    + * included in all copies or substantial portions of the Software.
    + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
    + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
    + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
    + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
    + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
    + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
    + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
    + * OTHER DEALINGS IN THE SOFTWARE.
    + */
    +
    +package org.broadinstitute.sting.utils.R;
    +
    +import org.broadinstitute.sting.utils.io.IOUtils;
    +import org.broadinstitute.sting.utils.io.Resource;
    +
    +import java.io.File;
    +
    +/**
    + * Libraries embedded in the StingUtils package.
    + */
    +public enum RScriptLibrary {
    +    GSALIB("gsalib");
    +
    +    private final String name;
    +
    +    private RScriptLibrary(String name) {
    +        this.name = name;
    +    }
    +
    +    public String getLibraryName() {
    +        return this.name;
    +    }
    +
    +    public String getResourcePath() {
    +        return name + ".tar.gz";
    +    }
    +
    +    /**
    +     * Writes the library source code to a temporary tar.gz file and returns the path.
    +     * @return The path to the library source code. The caller must delete the code when done.
    +     */
    +    public File writeTemp() {
    +        return IOUtils.writeTempResource(new Resource(getResourcePath(), RScriptLibrary.class));
    +    }
    +}
    diff --git a/public/java/src/org/broadinstitute/sting/utils/SampleUtils.java b/public/java/src/org/broadinstitute/sting/utils/SampleUtils.java
    index f9997bfd8..edc1413ba 100755
    --- a/public/java/src/org/broadinstitute/sting/utils/SampleUtils.java
    +++ b/public/java/src/org/broadinstitute/sting/utils/SampleUtils.java
    @@ -69,6 +69,18 @@ public class SampleUtils {
             return samples;
         }
     
    +
    +    /**
     +     * Same as {@link #getSAMFileSamples} but gets all of the samples
    +     * in the SAM files loaded by the engine
    +     *
     +     * @param engine the GATK engine whose loaded SAM file header is queried
     +     * @return the set of unique sample names found in the engine's SAM file header
    +     */
    +    public final static Set getSAMFileSamples(GenomeAnalysisEngine engine) {
    +        return SampleUtils.getSAMFileSamples(engine.getSAMFileHeader());
    +    }
    +
         /**
          * Gets all of the unique sample names from all VCF rods input by the user
          *
    @@ -190,11 +202,21 @@ public class SampleUtils {
     
         }
     
    -    public static List getSamplesFromCommandLineInput(Collection sampleArgs) {
    +    /**
    +     * Returns a new set of samples, containing a final list of samples expanded from sampleArgs
    +     *
    +     * Each element E of sampleArgs can either be a literal sample name or a file.  For each E,
    +     * we try to read a file named E from disk, and if possible all lines from that file are expanded
    +     * into unique sample names.
    +     *
     +     * @param sampleArgs collection of literal sample names and/or names of files listing samples, one per line
     +     * @return set of unique sample names expanded from sampleArgs; an empty set if sampleArgs is null
    +     */
    +    public static Set getSamplesFromCommandLineInput(Collection sampleArgs) {
             if (sampleArgs != null) {
                 // Let's first go through the list and see if we were given any files.  We'll add every entry in the file to our
                 // sample list set, and treat the entries as if they had been specified on the command line.
    -            List samplesFromFiles = new ArrayList();
    +            Set samplesFromFiles = new HashSet();
                 for (String SAMPLE_EXPRESSION : sampleArgs) {
                     File sampleFile = new File(SAMPLE_EXPRESSION);
     
    @@ -203,7 +225,7 @@ public class SampleUtils {
     
                         List lines = reader.readLines();
                         for (String line : lines) {
    -                        samplesFromFiles.add(line);
    +                        samplesFromFiles.add(line.trim());
                         }
                     } catch (FileNotFoundException e) {
                         samplesFromFiles.add(SAMPLE_EXPRESSION); // not a file, so must be a sample
    @@ -212,7 +234,8 @@ public class SampleUtils {
     
                 return samplesFromFiles;
             }
    -        return new ArrayList();
    +
    +        return new HashSet();
         }
     
         public static Set getSamplesFromCommandLineInput(Collection vcfSamples, Collection sampleExpressions) {
    diff --git a/public/java/src/org/broadinstitute/sting/utils/SimpleTimer.java b/public/java/src/org/broadinstitute/sting/utils/SimpleTimer.java
    index a5ac10250..15d34a348 100644
    --- a/public/java/src/org/broadinstitute/sting/utils/SimpleTimer.java
    +++ b/public/java/src/org/broadinstitute/sting/utils/SimpleTimer.java
    @@ -1,10 +1,5 @@
     package org.broadinstitute.sting.utils;
     
    -import com.google.java.contract.Ensures;
    -import com.google.java.contract.Invariant;
    -import com.google.java.contract.Requires;
    -
    -import java.io.PrintStream;
     
     /**
      * A useful simple system for timing code.  This code is not thread safe!
    @@ -13,11 +8,6 @@ import java.io.PrintStream;
      * Date: Dec 10, 2010
      * Time: 9:07:44 AM
      */
    -@Invariant({
    -        "elapsed >= 0",
    -        "startTime >= 0",
    -        "name != null",
    -        "! running || startTime > 0"})
     public class SimpleTimer {
         final private String name;
         private long elapsed = 0l;
    @@ -27,7 +17,6 @@ public class SimpleTimer {
         /**
          * Creates an anonymous simple timer
          */
    -    @Ensures("name != null && name.equals(\"Anonymous\")")
         public SimpleTimer() {
             this("Anonymous");
         }
    @@ -36,8 +25,6 @@ public class SimpleTimer {
          * Creates a simple timer named name
          * @param name of the timer, must not be null
          */
    -    @Requires("name != null")
    -    @Ensures("this.name != null && this.name.equals(name)")
         public SimpleTimer(String name) {
             this.name = name;
         }
    @@ -45,7 +32,6 @@ public class SimpleTimer {
         /**
          * @return the name associated with this timer
          */
    -    @Ensures("result != null")
         public synchronized String getName() {
             return name;
         }
    @@ -56,8 +42,6 @@ public class SimpleTimer {
          *
          * @return this object, for programming convenience
          */
    -    @Requires("running == false")
    -    @Ensures({"result != null", "elapsed == 0l"})
         public synchronized SimpleTimer start() {
             elapsed = 0l;
             restart();
    @@ -71,8 +55,6 @@ public class SimpleTimer {
          *
          * @return this object, for programming convenience
          */
    -    @Requires("running == false")
    -    @Ensures("result != null")
         public synchronized SimpleTimer restart() {
             running = true;
             startTime = currentTime();
    @@ -99,8 +81,6 @@ public class SimpleTimer {
          *
          * @return this object, for programming convenience
          */
    -    @Requires("running == true")
    -    @Ensures({"result != null", "elapsed >= old(elapsed)", "running == false"})
         public synchronized SimpleTimer stop() {
             running = false;
             elapsed += currentTime() - startTime;
    @@ -113,9 +93,6 @@ public class SimpleTimer {
          *
          * @return this time, in seconds
          */
    -    @Ensures({
    -            "result >= (elapsed/1000.0)",
    -            "result >= 0"})
         public synchronized double getElapsedTime() {
             return (running ? (currentTime() - startTime + elapsed) : elapsed) / 1000.0;
         }
    diff --git a/public/java/src/org/broadinstitute/sting/utils/Utils.java b/public/java/src/org/broadinstitute/sting/utils/Utils.java
    index 6ce492c63..f0eb5d399 100755
    --- a/public/java/src/org/broadinstitute/sting/utils/Utils.java
    +++ b/public/java/src/org/broadinstitute/sting/utils/Utils.java
    @@ -58,33 +58,6 @@ public class Utils {
             return (int)(maxElements / JAVA_DEFAULT_HASH_LOAD_FACTOR) + 2;
         }
     
    -    public static String getClassName(Class c) {
    -        String FQClassName = c.getName();
    -        int firstChar;
    -        firstChar = FQClassName.lastIndexOf ('.') + 1;
    -        if ( firstChar > 0 ) {
    -            FQClassName = FQClassName.substring ( firstChar );
    -        }
    -        return FQClassName;
    -    }
    -
    -
    -    // returns package and class name
    -    public static String getFullClassName(Class c) {
    -        return  c.getName();
    -    }
    -
    -    // returns the package without the classname, empty string if
    -    // there is no package
    -    public static String getPackageName(Class c) {
    -        String fullyQualifiedName = c.getName();
    -        int lastDot = fullyQualifiedName.lastIndexOf ('.');
    -        if (lastDot==-1){ return ""; }
    -        return fullyQualifiedName.substring (0, lastDot);
    -    }
    -
    -
    -
         /**
          * Compares two objects, either of which might be null.
          *
    @@ -107,20 +80,24 @@ public class Utils {
         }
     
         public static void warnUser(final String msg) {
    +        warnUser(logger, msg);
    +    }
    +    
    +    public static void warnUser(final Logger logger, final String msg) {
             logger.warn(String.format("********************************************************************************"));
             logger.warn(String.format("* WARNING:"));
             logger.warn(String.format("*"));
    -        prettyPrintWarningMessage(msg);
    +        prettyPrintWarningMessage(logger, msg);
             logger.warn(String.format("********************************************************************************"));
         }
    -    
     
         /**
          * pretty print the warning message supplied
          *
    +     * @param logger logger for the message
          * @param message the message
          */
    -    private static void prettyPrintWarningMessage(String message) {
    +    private static void prettyPrintWarningMessage(Logger logger, String message) {
             StringBuilder builder = new StringBuilder(message);
             while (builder.length() > 70) {
                 int space = builder.lastIndexOf(" ", 70);
    @@ -609,6 +586,12 @@ public class Utils {
             return rcbases;
         }
     
    +    static public final  List reverse(final List l) {
    +        final List newL = new ArrayList(l);
    +        Collections.reverse(newL);
    +        return newL;
    +    }
    +
         /**
          * Reverse an int array of bases
          *
    diff --git a/public/java/src/org/broadinstitute/sting/utils/bed/BedParser.java b/public/java/src/org/broadinstitute/sting/utils/bed/BedParser.java
    deleted file mode 100644
    index b95165841..000000000
    --- a/public/java/src/org/broadinstitute/sting/utils/bed/BedParser.java
    +++ /dev/null
    @@ -1,104 +0,0 @@
    -package org.broadinstitute.sting.utils.bed;
    -
    -import org.broadinstitute.sting.utils.GenomeLoc;
    -import org.broadinstitute.sting.utils.GenomeLocParser;
    -import org.broadinstitute.sting.utils.exceptions.UserException;
    -
    -import java.io.*;
    -import java.util.ArrayList;
    -import java.util.List;
    -
    -/**
    - * Created by IntelliJ IDEA.
    - * User: aaron
    - * Date: Oct 5, 2009
    - * Time: 5:46:45 PM
    - */
    -public class BedParser {
    -    // the GATk operates as a one based location, bed files are 0 based
    -    static final int TO_ONE_BASED_ADDITION = 1;
    -
    -    // the buffered reader input
    -    private final BufferedReader mIn;
    -
    -    private GenomeLocParser genomeLocParser;
    -
    -    // our array of locations
    -    private List mLocations;
    -
    -    /**
    -     * parse a bed file, given it's location
    -     *
    -     * @param fl
    -     */
    -    public BedParser(GenomeLocParser genomeLocParser,File fl) {
    -        this.genomeLocParser = genomeLocParser;
    -        try {
    -            mIn = new BufferedReader(new FileReader(fl));
    -        } catch (FileNotFoundException e) {
    -            throw new UserException.CouldNotReadInputFile(fl, e);
    -        }
    -        mLocations = parseLocations();
    -    }
    -
    -    /**
    -     * parse a bed file, given an input reader
    -     *
    -     * @param fl the bed file
    -     */
    -    public BedParser(BufferedReader fl) {
    -        mIn = fl;
    -        mLocations = parseLocations();
    -    }
    -
    -    /**
    -     * parse out the locations
    -     *
    -     * @return a list of GenomeLocs, sorted and merged
    -     */
    -    private List parseLocations() {
    -        String line = null;
    -        List locArray = new ArrayList();
    -        try {
    -            while ((line = mIn.readLine()) != null) {
    -                locArray.add(parseLocation(genomeLocParser,line));
    -            }
    -        } catch (IOException e) {
    -            throw new UserException.MalformedFile("Unable to parse line in BED file.");
    -        }
    -        return locArray;
    -    }
    -
    -    /**
    -     * parse a single location
    -     *
    -     * @param line the line, as a string
    -     * @return a parsed genome loc
    -     */
    -    public static GenomeLoc parseLocation(GenomeLocParser genomeLocParser,String line) {
    -        String contig;
    -        int start;
    -        int stop;
    -        try {
    -            String parts[] = line.split("\\s+");
    -            contig = parts[0];
    -            start = Integer.valueOf(parts[1]) + TO_ONE_BASED_ADDITION;
    -            stop = Integer.valueOf(parts[2]); // the ending point is an open interval
    -        } catch (Exception e) {
    -            throw new UserException.MalformedFile("Unable to process bed file line = " + line, e);
    -        }
    -
    -        // we currently drop the rest of the bed record, which can contain names, scores, etc
    -        return genomeLocParser.createGenomeLoc(contig, start, stop, true);
    -
    -    }
    -
    -    /**
    -     * return the sorted, and merged (for overlapping regions)
    -     *
    -     * @return an arraylist
    -     */
    -    public List getLocations() {
    -        return mLocations;
    -    }
    -}
    diff --git a/public/java/src/org/broadinstitute/sting/utils/clipreads/ClippingOp.java b/public/java/src/org/broadinstitute/sting/utils/clipreads/ClippingOp.java
    index bc200372f..4a253b217 100644
    --- a/public/java/src/org/broadinstitute/sting/utils/clipreads/ClippingOp.java
    +++ b/public/java/src/org/broadinstitute/sting/utils/clipreads/ClippingOp.java
    @@ -4,9 +4,9 @@ import com.google.java.contract.Requires;
     import net.sf.samtools.Cigar;
     import net.sf.samtools.CigarElement;
     import net.sf.samtools.CigarOperator;
    -import net.sf.samtools.SAMRecord;
     import org.broadinstitute.sting.utils.exceptions.ReviewedStingException;
     import org.broadinstitute.sting.utils.exceptions.UserException;
    +import org.broadinstitute.sting.utils.sam.GATKSAMRecord;
     
     import java.util.Iterator;
     import java.util.Stack;
    @@ -39,14 +39,14 @@ public class ClippingOp {
          * @param algorithm
          * @param read
          */
    -    public SAMRecord apply(ClippingRepresentation algorithm, SAMRecord read) {
    +    public GATKSAMRecord apply(ClippingRepresentation algorithm, GATKSAMRecord read) {
             byte[] quals = read.getBaseQualities();
             byte[] bases = read.getReadBases();
     
             switch (algorithm) {
                 // important note:
                 //   it's not safe to call read.getReadBases()[i] = 'N' or read.getBaseQualities()[i] = 0
    -            //   because you're not guaranteed to get a pointer to the actual array of bytes in the SAMRecord
    +            //   because you're not guaranteed to get a pointer to the actual array of bytes in the GATKSAMRecord
                 case WRITE_NS:
                     for (int i = start; i <= stop; i++)
                         bases[i] = 'N';
    @@ -248,9 +248,9 @@ public class ClippingOp {
         }
     
         @Requires({"start <= stop", "start == 0 || stop == read.getReadLength() - 1", "!read.getReadUnmappedFlag()"})
    -    private SAMRecord hardClip (SAMRecord read, int start, int stop) {
    -        if (start == 0 && stop == read.getReadLength() -1)
    -            return new SAMRecord(read.getHeader());
    +    private GATKSAMRecord hardClip (GATKSAMRecord read, int start, int stop) {
    +        if (start == 0 && stop == read.getReadLength() - 1)
    +            return new GATKSAMRecord(read.getHeader());
     
             // If the read is unmapped there is no Cigar string and neither should we create a new cigar string
             CigarShift cigarShift = (read.getReadUnmappedFlag()) ? new CigarShift(new Cigar(), 0, 0) : hardClipCigar(read.getCigar(), start, stop);
    @@ -265,9 +265,9 @@ public class ClippingOp {
             System.arraycopy(read.getReadBases(), copyStart, newBases, 0, newLength);
             System.arraycopy(read.getBaseQualities(), copyStart, newQuals, 0, newLength);
     
    -        SAMRecord hardClippedRead;
    +        GATKSAMRecord hardClippedRead;
             try {
    -            hardClippedRead = (SAMRecord) read.clone();
    +            hardClippedRead = (GATKSAMRecord) read.clone();
             } catch (CloneNotSupportedException e) {
                 throw new ReviewedStingException("Where did the clone go?");
             }
    @@ -324,6 +324,8 @@ public class ClippingOp {
     
                     if (index <= stop && cigarElementIterator.hasNext())
                         cigarElement = cigarElementIterator.next();
    +                else
    +                    break;
                 }
     
                 // add the remaining cigar elements
    @@ -363,6 +365,8 @@ public class ClippingOp {
                     index += shift;
                     if (index < start && cigarElementIterator.hasNext())
                         cigarElement = cigarElementIterator.next();
    +                else
    +                    break;
                 }
     
                 // check if we are hard clipping indels
    @@ -394,7 +398,9 @@ public class ClippingOp {
     
             for (int i = 1; i <= 2; i++) {
                 int shift = 0;
    +            int totalHardClip = 0;
                 boolean readHasStarted = false;
    +            boolean addedHardClips = false;
     
                 while(!cigarStack.empty()) {
                     CigarElement cigarElement = cigarStack.pop();
    @@ -404,14 +410,33 @@ public class ClippingOp {
                             cigarElement.getOperator() != CigarOperator.DELETION &&
                             cigarElement.getOperator() != CigarOperator.HARD_CLIP)
                         readHasStarted = true;
    +
    +                else if ( !readHasStarted && cigarElement.getOperator() == CigarOperator.HARD_CLIP)
    +                    totalHardClip += cigarElement.getLength();
    +
                     else if ( !readHasStarted && cigarElement.getOperator() == CigarOperator.INSERTION)
                         shift += cigarElement.getLength();
     
    -                if (readHasStarted || cigarElement.getOperator() == CigarOperator.HARD_CLIP) {
    -                    if (i==1)
    +                else if ( !readHasStarted && cigarElement.getOperator() == CigarOperator.DELETION)
    +                    totalHardClip += cigarElement.getLength();
    +
    +                if (readHasStarted) {
    +                    if (i==1) {
    +                        if (!addedHardClips) {
    +                            if (totalHardClip > 0)
    +                                inverseCigarStack.push(new CigarElement(totalHardClip, CigarOperator.HARD_CLIP));
    +                            addedHardClips = true;
    +                        }
                             inverseCigarStack.push(cigarElement);
    -                    else
    +                    }
    +                    else {
    +                        if (!addedHardClips) {
    +                            if (totalHardClip > 0)
    +                                cleanCigar.add(new CigarElement(totalHardClip, CigarOperator.HARD_CLIP));
    +                            addedHardClips = true;
    +                        }
                             cleanCigar.add(cigarElement);
    +                    }
                     }
                 }
                 // first pass  (i=1) is from end to start of the cigar elements
    @@ -428,39 +453,35 @@ public class ClippingOp {
         }
     
         private int calculateAlignmentStartShift(Cigar oldCigar, Cigar newCigar) {
    -        int shift = 0;
    +        int newShift = 0;
    +        int oldShift = 0;
     
    -        // Rewind to previous start (by counting everything that was already clipped in this read)
    -        for (CigarElement cigarElement : oldCigar.getCigarElements()) {
    -            if (!cigarElement.getOperator().consumesReferenceBases())
    -                shift -= cigarElement.getLength();
    -            else
    -                break;
    -        }
    -
    -        // Advance to new start (by counting everything new that has been clipped )
             for (CigarElement cigarElement : newCigar.getCigarElements()) {
    -            if (!cigarElement.getOperator().consumesReferenceBases())
    -                shift += cigarElement.getLength();
    +            if (cigarElement.getOperator() == CigarOperator.HARD_CLIP || cigarElement.getOperator() == CigarOperator.SOFT_CLIP)
    +                newShift += cigarElement.getLength();
                 else
                     break;
             }
     
    -        return shift;
    +        for (CigarElement cigarElement : oldCigar.getCigarElements()) {
    +            if (cigarElement.getOperator() == CigarOperator.HARD_CLIP || cigarElement.getOperator() == CigarOperator.SOFT_CLIP )
    +                oldShift += Math.min(cigarElement.getLength(), newShift - oldShift);
    +            else
    +                break;
    +        }
    +        return newShift - oldShift;
         }
     
         private int calculateHardClippingAlignmentShift(CigarElement cigarElement, int clippedLength) {
    -        if (cigarElement.getOperator() == CigarOperator.INSERTION) {
    -            int cigarElementLength = cigarElement.getLength();
    -            if (clippedLength >= cigarElementLength)
    -                return -cigarElement.getLength();
    -            else
    -                return -clippedLength;
    -        }
    +        // Insertions should be discounted from the total hard clip count
    +        if (cigarElement.getOperator() == CigarOperator.INSERTION)
    +            return -clippedLength;
     
    -        if (cigarElement.getOperator() == CigarOperator.DELETION)
    +        // Deletions should be added to the total hard clip count
    +        else if (cigarElement.getOperator() == CigarOperator.DELETION)
                 return cigarElement.getLength();
     
    +        // There is no shift if we are not clipping an indel
             return 0;
         }
     
    diff --git a/public/java/src/org/broadinstitute/sting/utils/clipreads/ReadClipper.java b/public/java/src/org/broadinstitute/sting/utils/clipreads/ReadClipper.java
    index 26c25850a..a6df986ba 100644
    --- a/public/java/src/org/broadinstitute/sting/utils/clipreads/ReadClipper.java
    +++ b/public/java/src/org/broadinstitute/sting/utils/clipreads/ReadClipper.java
    @@ -1,8 +1,10 @@
     package org.broadinstitute.sting.utils.clipreads;
     
     import com.google.java.contract.Requires;
    -import net.sf.samtools.SAMRecord;
    +import net.sf.samtools.CigarElement;
    +import net.sf.samtools.CigarOperator;
     import org.broadinstitute.sting.utils.exceptions.ReviewedStingException;
    +import org.broadinstitute.sting.utils.sam.GATKSAMRecord;
     import org.broadinstitute.sting.utils.sam.ReadUtils;
     
     import java.util.ArrayList;
    @@ -12,7 +14,7 @@ import java.util.List;
      * A simple collection of the clipping operations to apply to a read along with its read
      */
     public class ReadClipper {
    -    SAMRecord read;
    +    GATKSAMRecord read;
         boolean wasClipped;
         List ops = null;
     
    @@ -21,7 +23,7 @@ public class ReadClipper {
          *
          * @param read
          */
    -    public ReadClipper(final SAMRecord read) {
    +    public ReadClipper(final GATKSAMRecord read) {
             this.read = read;
             this.wasClipped = false;
         }
    @@ -44,50 +46,64 @@ public class ReadClipper {
             return wasClipped;
         }
     
    -    public SAMRecord getRead() {
    +    public GATKSAMRecord getRead() {
             return read;
         }
     
    -    public SAMRecord hardClipByReferenceCoordinatesLeftTail(int refStop) {
    +    public GATKSAMRecord hardClipByReferenceCoordinatesLeftTail(int refStop) {
             return hardClipByReferenceCoordinates(-1, refStop);
         }
     
    -    public SAMRecord hardClipByReferenceCoordinatesRightTail(int refStart) {
    +    public GATKSAMRecord hardClipByReferenceCoordinatesRightTail(int refStart) {
             return hardClipByReferenceCoordinates(refStart, -1);
         }
     
    -    private SAMRecord hardClipByReferenceCoordinates(int refStart, int refStop) {
    -        int start = (refStart < 0) ? 0 : ReadUtils.getReadCoordinateForReferenceCoordinate(read, refStart);
    -        int stop =  (refStop  < 0) ? read.getReadLength() - 1 : ReadUtils.getReadCoordinateForReferenceCoordinate(read, refStop);
    +    private int numDeletions(GATKSAMRecord read) {
    +        int result = 0;
    +        for (CigarElement e: read.getCigar().getCigarElements()) {
    +            if ( e.getOperator() == CigarOperator.DELETION || e.getOperator() == CigarOperator.D )
     +                result += e.getLength();
    +        }
    +        return result;
    +    }
    +
    +    protected GATKSAMRecord hardClipByReferenceCoordinates(int refStart, int refStop) {
    +        int start = (refStart < 0) ? 0 : ReadUtils.getReadCoordinateForReferenceCoordinate(read, refStart, ReadUtils.ClippingTail.RIGHT_TAIL);
    +        int stop =  (refStop  < 0) ? read.getReadLength() - 1 : ReadUtils.getReadCoordinateForReferenceCoordinate(read, refStop, ReadUtils.ClippingTail.LEFT_TAIL);
     
             if (start < 0 || stop > read.getReadLength() - 1)
                 throw new ReviewedStingException("Trying to clip before the start or after the end of a read");
     
    -        // TODO add requires statement/check in the Hardclip function
             if ( start > stop )
    -            stop = ReadUtils.getReadCoordinateForReferenceCoordinate(read, ReadUtils.getRefCoordSoftUnclippedEnd(read));
    +            throw new ReviewedStingException("START > STOP -- this should never happen -- call Mauricio!");
     
    -        //System.out.println("Clipping start/stop: " + start + "/" + stop);
             this.addOp(new ClippingOp(start, stop));
    -        SAMRecord clippedRead = clipRead(ClippingRepresentation.HARDCLIP_BASES);
    +        GATKSAMRecord clippedRead = clipRead(ClippingRepresentation.HARDCLIP_BASES);
             this.ops = null;
             return clippedRead;
         }
     
    -    public SAMRecord hardClipByReadCoordinates(int start, int stop) {
    +    public GATKSAMRecord hardClipByReadCoordinates(int start, int stop) {
             this.addOp(new ClippingOp(start, stop));
             return clipRead(ClippingRepresentation.HARDCLIP_BASES);
         }
     
         @Requires("left <= right")
    -    public SAMRecord hardClipBothEndsByReferenceCoordinates(int left, int right) {
    +    public GATKSAMRecord hardClipBothEndsByReferenceCoordinates(int left, int right) {
             if (left == right)
    -            return new SAMRecord(read.getHeader());
    -        this.read = hardClipByReferenceCoordinates(right, -1);
    -        return hardClipByReferenceCoordinates(-1, left);
    +            return new GATKSAMRecord(read.getHeader());
    +        GATKSAMRecord leftTailRead = hardClipByReferenceCoordinates(right, -1);
    +
    +        // after clipping one tail, it is possible that the consequent hard clipping of adjacent deletions
    +        // make the left cut index no longer part of the read. In that case, clip the read entirely.
    +        if (left > leftTailRead.getAlignmentEnd())
    +            return new GATKSAMRecord(read.getHeader());
    +
    +        ReadClipper clipper = new ReadClipper(leftTailRead);
    +        return clipper.hardClipByReferenceCoordinatesLeftTail(left);
         }
     
    -    public SAMRecord hardClipLowQualEnds(byte lowQual) {
    +    public GATKSAMRecord hardClipLowQualEnds(byte lowQual) {
             byte [] quals = read.getBaseQualities();
             int leftClipIndex = 0;
             int rightClipIndex = read.getReadLength() - 1;
    @@ -98,7 +114,7 @@ public class ReadClipper {
     
             // if the entire read should be clipped, then return an empty read. (--todo: maybe null is better? testing this for now)
             if (leftClipIndex > rightClipIndex)
    -            return (new SAMRecord(read.getHeader()));
    +            return (new GATKSAMRecord(read.getHeader()));
     
             if (rightClipIndex < read.getReadLength() - 1) {
                 this.addOp(new ClippingOp(rightClipIndex + 1, read.getReadLength() - 1));
    @@ -109,18 +125,51 @@ public class ReadClipper {
             return this.clipRead(ClippingRepresentation.HARDCLIP_BASES);
         }
     
    +    public GATKSAMRecord hardClipSoftClippedBases () {
    +        int readIndex = 0;
     +        int cutLeft = -1;            // last position to hard clip on the left tail (inclusive)
    +        int cutRight = -1;           // first position to hard clip (inclusive)
    +        boolean rightTail = false;   // trigger to stop clipping the left tail and start cutting the right tail
    +
    +        for (CigarElement cigarElement : read.getCigar().getCigarElements()) {
    +            if (cigarElement.getOperator() == CigarOperator.SOFT_CLIP) {
    +                if (rightTail) {
    +                    cutRight = readIndex;
    +                }
    +                else {
    +                    cutLeft = readIndex + cigarElement.getLength() - 1;
    +                }
    +            }
    +            else if (cigarElement.getOperator() != CigarOperator.HARD_CLIP)
    +                rightTail = true;
    +
    +            if (cigarElement.getOperator().consumesReadBases())
    +                readIndex += cigarElement.getLength();
    +        }
    +
    +        // It is extremely important that we cut the end first otherwise the read coordinates change.
    +        if (cutRight >= 0)
    +            this.addOp(new ClippingOp(cutRight, read.getReadLength() - 1));
    +        if (cutLeft >= 0)
    +            this.addOp(new ClippingOp(0, cutLeft));
    +
    +        return clipRead(ClippingRepresentation.HARDCLIP_BASES);
    +    }
    +
    +
    +
         /**
          * Return a new read corresponding to this.read that's been clipped according to ops, if any are present.
          *
          * @param algorithm
          * @return
          */
    -    public SAMRecord clipRead(ClippingRepresentation algorithm) {
    +    public GATKSAMRecord clipRead(ClippingRepresentation algorithm) {
             if (ops == null)
                 return getRead();
             else {
                 try {
    -                SAMRecord clippedRead = (SAMRecord) read.clone();
    +                GATKSAMRecord clippedRead = (GATKSAMRecord) read.clone();
                     for (ClippingOp op : getOps()) {
                         clippedRead = op.apply(algorithm, clippedRead);
                     }
    @@ -131,4 +180,21 @@ public class ReadClipper {
                 }
             }
         }
    +
    +    public GATKSAMRecord hardClipLeadingInsertions() {
    +        for(CigarElement cigarElement : read.getCigar().getCigarElements()) {
    +            if (cigarElement.getOperator() != CigarOperator.HARD_CLIP && cigarElement.getOperator() != CigarOperator.SOFT_CLIP &&
    +                cigarElement.getOperator() != CigarOperator.INSERTION && cigarElement.getOperator() != CigarOperator.DELETION)
    +                break;
    +
    +            else if (cigarElement.getOperator() == CigarOperator.INSERTION) {
    +                this.addOp(new ClippingOp(0, cigarElement.getLength() - 1));
    +            }
    +
    +            else if (cigarElement.getOperator() == CigarOperator.DELETION) {
    +                throw new ReviewedStingException("No read should start with a deletion. Aligner bug?");
    +            }
    +        }
    +        return clipRead(ClippingRepresentation.HARDCLIP_BASES);
    +    }
     }
    diff --git a/public/java/src/org/broadinstitute/sting/utils/codecs/table/TableCodec.java b/public/java/src/org/broadinstitute/sting/utils/codecs/table/TableCodec.java
    index 1919ccbf0..4082a5597 100755
    --- a/public/java/src/org/broadinstitute/sting/utils/codecs/table/TableCodec.java
    +++ b/public/java/src/org/broadinstitute/sting/utils/codecs/table/TableCodec.java
    @@ -86,7 +86,13 @@ public class TableCodec implements ReferenceDependentFeatureCodec {
         public Object readHeader(LineReader reader) {
             String line = "";
             try {
    +            boolean isFirst = true;
                 while ((line = reader.readLine()) != null) {
    +                System.out.println(line);
    +                if ( isFirst && ! line.startsWith(headerDelimiter) && ! line.startsWith(commentDelimiter)) {
    +                    throw new UserException.MalformedFile("TableCodec file does not have a header");
    +                }
    +		isFirst &= line.startsWith(commentDelimiter);
                     if (line.startsWith(headerDelimiter)) {
                         if (header.size() > 0) throw new IllegalStateException("Input table file seems to have two header lines.  The second is = " + line);
                         String spl[] = line.split(delimiterRegex);
    diff --git a/public/java/src/org/broadinstitute/sting/utils/codecs/table/TableFeature.java b/public/java/src/org/broadinstitute/sting/utils/codecs/table/TableFeature.java
    index a85849f0b..4b5c51bd4 100755
    --- a/public/java/src/org/broadinstitute/sting/utils/codecs/table/TableFeature.java
    +++ b/public/java/src/org/broadinstitute/sting/utils/codecs/table/TableFeature.java
    @@ -1,7 +1,9 @@
     package org.broadinstitute.sting.utils.codecs.table;
     
    +
     import org.broad.tribble.Feature;
     import org.broadinstitute.sting.utils.GenomeLoc;
    +import org.broadinstitute.sting.utils.Utils;
     
     import java.util.List;
     
    @@ -44,6 +46,10 @@ public class TableFeature implements Feature {
             return values.get(columnPosition);
         }
     
    +    public String toString() {
    +        return String.format("%s\t%s",position.toString(), Utils.join("\t",values));
    +    }
    +
         public String get(String columnName) {
             int position = keys.indexOf(columnName);
             if (position < 0) throw new IllegalArgumentException("We don't have a column named " + columnName);
    diff --git a/public/java/src/org/broadinstitute/sting/utils/codecs/vcf/AbstractVCFCodec.java b/public/java/src/org/broadinstitute/sting/utils/codecs/vcf/AbstractVCFCodec.java
    index bb212e128..0e0cb14bf 100755
    --- a/public/java/src/org/broadinstitute/sting/utils/codecs/vcf/AbstractVCFCodec.java
    +++ b/public/java/src/org/broadinstitute/sting/utils/codecs/vcf/AbstractVCFCodec.java
    @@ -6,6 +6,7 @@ import org.broad.tribble.FeatureCodec;
     import org.broad.tribble.NameAwareCodec;
     import org.broad.tribble.TribbleException;
     import org.broad.tribble.readers.LineReader;
    +import org.broad.tribble.util.BlockCompressedInputStream;
     import org.broad.tribble.util.ParsingUtils;
     import org.broadinstitute.sting.gatk.refdata.SelfScopingFeatureCodec;
     import org.broadinstitute.sting.utils.exceptions.ReviewedStingException;
    @@ -35,6 +36,7 @@ public abstract class AbstractVCFCodec implements FeatureCodec, NameAwareCodec,
         // for ParsingUtils.split
         protected String[] GTValueArray = new String[100];
         protected String[] genotypeKeyArray = new String[100];
    +    protected String[] infoFieldArray = new String[1000];
         protected String[] infoValueArray = new String[1000];
     
         // for performance testing purposes
    @@ -114,15 +116,21 @@ public abstract class AbstractVCFCodec implements FeatureCodec, NameAwareCodec,
                         }
                         arrayIndex++;
                     }
    +
    +                boolean sawFormatTag = false;
                     if ( arrayIndex < strings.length ) {
                         if ( !strings[arrayIndex].equals("FORMAT") )
                             throw new TribbleException.InvalidHeader("we were expecting column name 'FORMAT' but we saw '" + strings[arrayIndex] + "'");
    +                    sawFormatTag = true;
                         arrayIndex++;
                     }
     
    -                while (arrayIndex < strings.length)
    +                while ( arrayIndex < strings.length )
                         auxTags.add(strings[arrayIndex++]);
     
    +                if ( sawFormatTag && auxTags.size() == 0 )
    +                    throw new UserException.MalformedVCFHeader("The FORMAT field was provided but there is no genotype/sample data");
    +
                 } else {
                     if ( str.startsWith("##INFO=") ) {
                         VCFInfoHeaderLine info = new VCFInfoHeaderLine(str.substring(7),version);
    @@ -154,16 +162,27 @@ public abstract class AbstractVCFCodec implements FeatureCodec, NameAwareCodec,
          * @return a feature, (not guaranteed complete) that has the correct start and stop
          */
         public Feature decodeLoc(String line) {
    -        String[] locParts = new String[6];
    -        ParsingUtils.split(line, locParts, VCFConstants.FIELD_SEPARATOR_CHAR, true);
    +        lineNo++;
    +
    +        // the same line reader is not used for parsing the header and parsing lines; if we see a '#', we have hit a header line
    +        if (line.startsWith(VCFHeader.HEADER_INDICATOR)) return null;
    +
    +        // our header cannot be null, we need the genotype sample names and counts
    +        if (header == null) throw new ReviewedStingException("VCF Header cannot be null when decoding a record");
    +
    +        final String[] locParts = new String[6];
    +        int nParts = ParsingUtils.split(line, locParts, VCFConstants.FIELD_SEPARATOR_CHAR, true);
    +
    +        if ( nParts != 6 )
    +            throw new UserException.MalformedVCF("there aren't enough columns for line " + line, lineNo);
     
             // get our alleles (because the end position depends on them)
    -        String ref = getCachedString(locParts[3].toUpperCase());
    -        String alts = getCachedString(locParts[4].toUpperCase());
    -        List alleles = parseAlleles(ref, alts, lineNo);
    +        final String ref = getCachedString(locParts[3].toUpperCase());
    +        final String alts = getCachedString(locParts[4].toUpperCase());
    +        final List alleles = parseAlleles(ref, alts, lineNo);
     
             // find out our location
    -        int start = Integer.valueOf(locParts[1]);
    +        final int start = Integer.valueOf(locParts[1]);
             int stop = start;
     
             // ref alleles don't need to be single bases for monomorphic sites
    @@ -199,35 +218,31 @@ public abstract class AbstractVCFCodec implements FeatureCodec, NameAwareCodec,
          * @return a VariantContext
          */
         public Feature decode(String line) {
    -        return reallyDecode(line);
    -    }
    +        // the same line reader is not used for parsing the header and parsing lines; if we see a '#', we have hit a header line
    +        if (line.startsWith(VCFHeader.HEADER_INDICATOR)) return null;
     
    -    private Feature reallyDecode(String line) {
    -            // the same line reader is not used for parsing the header and parsing lines, if we see a #, we've seen a header line
    -            if (line.startsWith(VCFHeader.HEADER_INDICATOR)) return null;
    +        // our header cannot be null, we need the genotype sample names and counts
    +        if (header == null) throw new ReviewedStingException("VCF Header cannot be null when decoding a record");
     
    -            // our header cannot be null, we need the genotype sample names and counts
    -            if (header == null) throw new ReviewedStingException("VCF Header cannot be null when decoding a record");
    +        if (parts == null)
    +            parts = new String[Math.min(header.getColumnCount(), NUM_STANDARD_FIELDS+1)];
     
    -            if (parts == null)
    -                parts = new String[Math.min(header.getColumnCount(), NUM_STANDARD_FIELDS+1)];
    +        int nParts = ParsingUtils.split(line, parts, VCFConstants.FIELD_SEPARATOR_CHAR, true);
     
    -            int nParts = ParsingUtils.split(line, parts, VCFConstants.FIELD_SEPARATOR_CHAR, true);
    +        // if we don't have a header, or we have a header with no genotyping data, check that we have eight columns.  Otherwise check that we have nine (normal columns + genotyping data)
    +        if (( (header == null || !header.hasGenotypingData()) && nParts != NUM_STANDARD_FIELDS) ||
    +             (header != null && header.hasGenotypingData() && nParts != (NUM_STANDARD_FIELDS + 1)) )
    +            throw new UserException.MalformedVCF("there aren't enough columns for line " + line + " (we expected " + (header == null ? NUM_STANDARD_FIELDS : NUM_STANDARD_FIELDS + 1) +
    +                    " tokens, and saw " + nParts + " )", lineNo);
     
    -            // if we have don't have a header, or we have a header with no genotyping data check that we have eight columns.  Otherwise check that we have nine (normal colummns + genotyping data)
    -            if (( (header == null || (header != null && !header.hasGenotypingData())) && nParts != NUM_STANDARD_FIELDS) ||
    -                 (header != null && header.hasGenotypingData() && nParts != (NUM_STANDARD_FIELDS + 1)) )
    -                throw new UserException.MalformedVCF("there aren't enough columns for line " + line + " (we expected " + (header == null ? NUM_STANDARD_FIELDS : NUM_STANDARD_FIELDS + 1) +
    -                        " tokens, and saw " + nParts + " )", lineNo);
    -
    -            return parseVCFLine(parts);
    +        return parseVCFLine(parts);
         }
     
         protected void generateException(String message) {
             throw new UserException.MalformedVCF(message, lineNo);
         }
     
    -    private static void generateException(String message, int lineNo) {
    +    protected static void generateException(String message, int lineNo) {
             throw new UserException.MalformedVCF(message, lineNo);
         }
     
    @@ -345,23 +360,31 @@ public abstract class AbstractVCFCodec implements FeatureCodec, NameAwareCodec,
                 generateException("The VCF specification requires a valid info field");
     
             if ( !infoField.equals(VCFConstants.EMPTY_INFO_FIELD) ) {
    -            int infoValueSplitSize = ParsingUtils.split(infoField, infoValueArray, VCFConstants.INFO_FIELD_SEPARATOR_CHAR);
    -            for (int i = 0; i < infoValueSplitSize; i++) {
    +            if ( infoField.indexOf("\t") != -1 || infoField.indexOf(" ") != -1 )
    +                generateException("The VCF specification does not allow for whitespace in the INFO field");
    +
    +            int infoFieldSplitSize = ParsingUtils.split(infoField, infoFieldArray, VCFConstants.INFO_FIELD_SEPARATOR_CHAR, false);
    +            for (int i = 0; i < infoFieldSplitSize; i++) {
                     String key;
                     Object value;
     
    -                int eqI = infoValueArray[i].indexOf("=");
    +                int eqI = infoFieldArray[i].indexOf("=");
                     if ( eqI != -1 ) {
    -                    key = infoValueArray[i].substring(0, eqI);
    -                    String str = infoValueArray[i].substring(eqI+1, infoValueArray[i].length());
    +                    key = infoFieldArray[i].substring(0, eqI);
    +                    String str = infoFieldArray[i].substring(eqI+1);
     
    -                    // lets see if the string contains a , separator
    -                    if ( str.contains(",") )
    -                        value = Arrays.asList(str.split(","));
    -                    else
    -                        value = str;
    +                    // split on the INFO field separator
    +                    int infoValueSplitSize = ParsingUtils.split(str, infoValueArray, VCFConstants.INFO_FIELD_ARRAY_SEPARATOR_CHAR, false);
    +                    if ( infoValueSplitSize == 1 ) {
    +                        value = infoValueArray[0];
    +                    } else {
    +                        ArrayList valueList = new ArrayList(infoValueSplitSize);
    +                        for ( int j = 0; j < infoValueSplitSize; j++ )
    +                            valueList.add(infoValueArray[j]);
    +                        value = valueList;
    +                    }
                     } else {
    -                    key = infoValueArray[i];
    +                    key = infoFieldArray[i];
                         value = true;
                     }
     
    @@ -369,7 +392,8 @@ public abstract class AbstractVCFCodec implements FeatureCodec, NameAwareCodec,
                 }
             }
     
    -        attributes.put(VariantContext.ID_KEY, id);
    +        if ( ! id.equals(VCFConstants.EMPTY_ID_FIELD) )
    +            attributes.put(VariantContext.ID_KEY, id);
             return attributes;
         }
     
    @@ -587,7 +611,8 @@ public abstract class AbstractVCFCodec implements FeatureCodec, NameAwareCodec,
         public final static boolean canDecodeFile(final File potentialInput, final String MAGIC_HEADER_LINE) {
             try {
                 return isVCFStream(new FileInputStream(potentialInput), MAGIC_HEADER_LINE) ||
    -                    isVCFStream(new GZIPInputStream(new FileInputStream(potentialInput)), MAGIC_HEADER_LINE);
    +                    isVCFStream(new GZIPInputStream(new FileInputStream(potentialInput)), MAGIC_HEADER_LINE) ||
    +                    isVCFStream(new BlockCompressedInputStream(new FileInputStream(potentialInput)), MAGIC_HEADER_LINE);
             } catch ( FileNotFoundException e ) {
                 return false;
             } catch ( IOException e ) {
    @@ -598,12 +623,17 @@ public abstract class AbstractVCFCodec implements FeatureCodec, NameAwareCodec,
         private final static boolean isVCFStream(final InputStream stream, final String MAGIC_HEADER_LINE) {
             try {
                 byte[] buff = new byte[MAGIC_HEADER_LINE.length()];
    -            stream.read(buff, 0, MAGIC_HEADER_LINE.length());
    -            String firstLine = new String(buff);
    -            stream.close();
    -            return firstLine.startsWith(MAGIC_HEADER_LINE);
    +            int nread = stream.read(buff, 0, MAGIC_HEADER_LINE.length());
    +            boolean eq = Arrays.equals(buff, MAGIC_HEADER_LINE.getBytes());
    +            return eq;
    +//            String firstLine = new String(buff);
    +//            return firstLine.startsWith(MAGIC_HEADER_LINE);
             } catch ( IOException e ) {
                 return false;
    +        } catch ( RuntimeException e ) {
    +            return false;
    +        } finally {
    +            try { stream.close(); } catch ( IOException e ) {}
             }
         }
     }
    diff --git a/public/java/src/org/broadinstitute/sting/utils/codecs/vcf/IndexingVCFWriter.java b/public/java/src/org/broadinstitute/sting/utils/codecs/vcf/IndexingVCFWriter.java
    new file mode 100644
    index 000000000..71ec4ce1b
    --- /dev/null
    +++ b/public/java/src/org/broadinstitute/sting/utils/codecs/vcf/IndexingVCFWriter.java
    @@ -0,0 +1,144 @@
    +/*
    + * Copyright (c) 2011, The Broad Institute
    + *
    + * Permission is hereby granted, free of charge, to any person
    + * obtaining a copy of this software and associated documentation
    + * files (the "Software"), to deal in the Software without
    + * restriction, including without limitation the rights to use,
    + * copy, modify, merge, publish, distribute, sublicense, and/or sell
    + * copies of the Software, and to permit persons to whom the
    + * Software is furnished to do so, subject to the following
    + * conditions:
    + *
    + * The above copyright notice and this permission notice shall be
    + * included in all copies or substantial portions of the Software.
    + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
    + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
    + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
    + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
    + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
    + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
    + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
    + * OTHER DEALINGS IN THE SOFTWARE.
    + */
    +
    +package org.broadinstitute.sting.utils.codecs.vcf;
    +
    +import com.google.java.contract.Ensures;
    +import com.google.java.contract.Requires;
    +import net.sf.samtools.SAMSequenceDictionary;
    +import org.broad.tribble.Tribble;
    +import org.broad.tribble.TribbleException;
    +import org.broad.tribble.index.DynamicIndexCreator;
    +import org.broad.tribble.index.Index;
    +import org.broad.tribble.index.IndexFactory;
    +import org.broad.tribble.util.LittleEndianOutputStream;
    +import org.broad.tribble.util.PositionalStream;
    +import org.broadinstitute.sting.gatk.refdata.tracks.IndexDictionaryUtils;
    +import org.broadinstitute.sting.utils.exceptions.ReviewedStingException;
    +import org.broadinstitute.sting.utils.exceptions.UserException;
    +import org.broadinstitute.sting.utils.variantcontext.VariantContext;
    +
    +import java.io.*;
    +
    +/**
    + * this class writes VCF files
    + */
    +public abstract class IndexingVCFWriter implements VCFWriter {
    +    final private String name;
    +    private final SAMSequenceDictionary refDict;
    +
    +    private OutputStream outputStream;
    +    private PositionalStream positionalStream = null;
    +    private DynamicIndexCreator indexer = null;
    +    private LittleEndianOutputStream idxStream = null;
    +
    +    @Requires({"name != null",
    +            "! ( location == null && output == null )",
    +            "! ( enableOnTheFlyIndexing && location == null )"})
    +    protected IndexingVCFWriter(final String name, final File location, final OutputStream output, final SAMSequenceDictionary refDict, final boolean enableOnTheFlyIndexing) {
    +        outputStream = output;
    +        this.name = name;
    +        this.refDict = refDict;
    +
    +        if ( enableOnTheFlyIndexing ) {
    +            try {
    +                idxStream = new LittleEndianOutputStream(new FileOutputStream(Tribble.indexFile(location)));
    +                //System.out.println("Creating index on the fly for " + location);
    +                indexer = new DynamicIndexCreator(IndexFactory.IndexBalanceApproach.FOR_SEEK_TIME);
    +                indexer.initialize(location, indexer.defaultBinSize());
    +                positionalStream = new PositionalStream(output);
    +                outputStream = positionalStream;
    +            } catch ( IOException ex ) {
    +                // No matter what we keep going, since we don't care if we can't create the index file
    +                idxStream = null;
    +                indexer = null;
    +                positionalStream = null;
    +            }
    +        }
    +    }
    +
    +    @Ensures("result != null")
    +    public OutputStream getOutputStream() {
    +        return outputStream;
    +    }
    +
    +    @Ensures("result != null")
    +    public String getStreamName() {
    +        return name;
    +    }
    +
    +    public abstract void writeHeader(VCFHeader header);
    +
    +    /**
    +     * attempt to close the VCF file
    +     */
    +    public void close() {
    +        // try to close the index stream (keep it separate to help debugging efforts)
    +        if ( indexer != null ) {
    +            try {
    +                Index index = indexer.finalizeIndex(positionalStream.getPosition());
    +                IndexDictionaryUtils.setIndexSequenceDictionary(index, refDict);
    +                index.write(idxStream);
    +                idxStream.close();
    +            } catch (IOException e) {
    +                throw new ReviewedStingException("Unable to close index for " + getStreamName(), e);
    +            }
    +        }
    +    }
    +
    +    /**
    +     * add a record to the file
    +     *
    +     * @param vc      the Variant Context object
    +     */
    +    public void add(VariantContext vc) {
    +        // if we are doing on the fly indexing, add the record ***before*** we write any bytes
    +        if ( indexer != null )
    +            indexer.addFeature(vc, positionalStream.getPosition());
    +    }
    +
    +    /**
    +     * Returns a reasonable "name" for this writer, to display to the user if something goes wrong
    +     *
    +     * @param location
    +     * @param stream
    +     * @return
    +     */
    +    protected static final String writerName(final File location, final OutputStream stream) {
    +        return location == null ? stream.toString() : location.getAbsolutePath();
    +    }
    +
    +    /**
    +     * Returns a output stream writing to location, or throws a UserException if this fails
    +     * @param location
    +     * @return
    +     */
    +    protected static OutputStream openOutputStream(final File location) {
    +        try {
    +            return new FileOutputStream(location);
    +        } catch (FileNotFoundException e) {
    +            throw new UserException.CouldNotCreateOutputFile(location, "Unable to create VCF writer", e);
    +        }
    +    }
    +}
    diff --git a/public/java/src/org/broadinstitute/sting/utils/codecs/vcf/StandardVCFWriter.java b/public/java/src/org/broadinstitute/sting/utils/codecs/vcf/StandardVCFWriter.java
    index d3705813c..0da7a100f 100755
    --- a/public/java/src/org/broadinstitute/sting/utils/codecs/vcf/StandardVCFWriter.java
    +++ b/public/java/src/org/broadinstitute/sting/utils/codecs/vcf/StandardVCFWriter.java
    @@ -24,6 +24,7 @@
     
     package org.broadinstitute.sting.utils.codecs.vcf;
     
    +import net.sf.samtools.SAMSequenceDictionary;
     import org.broad.tribble.Tribble;
     import org.broad.tribble.TribbleException;
     import org.broad.tribble.index.DynamicIndexCreator;
    @@ -44,46 +45,30 @@ import java.util.*;
     /**
      * this class writes VCF files
      */
    -public class StandardVCFWriter implements VCFWriter {
    +public class StandardVCFWriter extends IndexingVCFWriter {
    +    // the print stream we're writing to
    +    final protected BufferedWriter mWriter;
    +
    +    // should we write genotypes or just sites?
    +    final protected boolean doNotWriteGenotypes;
     
         // the VCF header we're storing
         protected VCFHeader mHeader = null;
     
    -    // the print stream we're writing to
    -    protected BufferedWriter mWriter;
    -    protected PositionalStream positionalStream = null;
    -
         // were filters applied?
         protected boolean filtersWereAppliedToContext = false;
     
    -    // should we write genotypes or just sites?
    -    protected boolean doNotWriteGenotypes = false;
    -
    -    protected DynamicIndexCreator indexer = null;
    -    protected File indexFile = null;
    -    LittleEndianOutputStream idxStream = null;
    -    File location = null;
    -
         /**         
          * create a VCF writer, given a file to write to
          *
          * @param location the file location to write to
          */
    -    public StandardVCFWriter(File location) {
    -        this(location, openOutputStream(location), true, false);
    +    public StandardVCFWriter(final File location, final SAMSequenceDictionary refDict) {
    +        this(location, openOutputStream(location), refDict, true, false);
         }
     
    -    public StandardVCFWriter(File location, boolean enableOnTheFlyIndexing) {
    -        this(location, openOutputStream(location), enableOnTheFlyIndexing, false);
    -    }
    -
    -    /**
    -     * create a VCF writer, given a stream to write to
    -     *
    -     * @param output   the file location to write to
    -     */
    -    public StandardVCFWriter(OutputStream output) {
    -        this(output, false);
    +    public StandardVCFWriter(File location, final SAMSequenceDictionary refDict, boolean enableOnTheFlyIndexing) {
    +        this(location, openOutputStream(location), refDict, enableOnTheFlyIndexing, false);
         }
     
         /**
    @@ -92,33 +77,23 @@ public class StandardVCFWriter implements VCFWriter {
          * @param output   the file location to write to
          * @param doNotWriteGenotypes   do not write genotypes
          */
    -    public StandardVCFWriter(OutputStream output, boolean doNotWriteGenotypes) {
    -        mWriter = new BufferedWriter(new OutputStreamWriter(output));
    +    public StandardVCFWriter(final OutputStream output, final SAMSequenceDictionary refDict, final boolean doNotWriteGenotypes) {
    +        this(null, output, refDict, false, doNotWriteGenotypes);
    +    }
    +
    +    public StandardVCFWriter(final File location, final OutputStream output, final SAMSequenceDictionary refDict, final boolean enableOnTheFlyIndexing, boolean doNotWriteGenotypes) {
    +        super(writerName(location, output), location, output, refDict, enableOnTheFlyIndexing);
    +        mWriter = new BufferedWriter(new OutputStreamWriter(getOutputStream())); // todo -- fix buffer size
             this.doNotWriteGenotypes = doNotWriteGenotypes;
         }
     
    -    public StandardVCFWriter(File location, OutputStream output, boolean enableOnTheFlyIndexing, boolean doNotWriteGenotypes) {
    -        this.location = location;
    -
    -        if ( enableOnTheFlyIndexing ) {
    -            indexFile = Tribble.indexFile(location);
    -            try {
    -                idxStream = new LittleEndianOutputStream(new FileOutputStream(indexFile));
    -                //System.out.println("Creating index on the fly for " + location);
    -                indexer = new DynamicIndexCreator(IndexFactory.IndexBalanceApproach.FOR_SEEK_TIME);
    -                indexer.initialize(location, indexer.defaultBinSize());
    -                positionalStream = new PositionalStream(output);
    -                output = positionalStream;
    -            } catch ( IOException ex ) {
    -                // No matter what we keep going, since we don't care if we can't create the index file
    -            }
    -        }
    -
    -        //mWriter = new BufferedWriter(new OutputStreamWriter(new PositionalStream(output)));
    -        mWriter = new BufferedWriter(new OutputStreamWriter(output));
    -        this.doNotWriteGenotypes = doNotWriteGenotypes;
    -    }
    +    // --------------------------------------------------------------------------------
    +    //
    +    // VCFWriter interface functions
    +    //
    +    // --------------------------------------------------------------------------------
     
    +    @Override
         public void writeHeader(VCFHeader header) {
             mHeader = doNotWriteGenotypes ? new VCFHeader(header.getMetaData()) : header;
             
    @@ -158,44 +133,24 @@ public class StandardVCFWriter implements VCFWriter {
                 mWriter.flush();  // necessary so that writing to an output stream will work
             }
             catch (IOException e) {
    -            throw new TribbleException("IOException writing the VCF header to " + locationString(), e);
    +            throw new ReviewedStingException("IOException writing the VCF header to " + getStreamName(), e);
             }
         }
     
    -    private String locationString() {
    -        return location == null ? mWriter.toString() : location.getAbsolutePath();
    -    }
    -
         /**
          * attempt to close the VCF file
          */
    +    @Override
         public void close() {
             // try to close the vcf stream
             try {
                 mWriter.flush();
                 mWriter.close();
             } catch (IOException e) {
    -            throw new TribbleException("Unable to close " + locationString() + " because of " + e.getMessage());
    +            throw new ReviewedStingException("Unable to close " + getStreamName(), e);
             }
     
    -        // try to close the index stream (keep it separate to help debugging efforts)
    -        if ( indexer != null ) {
    -            try {
    -                Index index = indexer.finalizeIndex(positionalStream.getPosition());
    -                index.write(idxStream);
    -                idxStream.close();
    -            } catch (IOException e) {
    -                throw new TribbleException("Unable to close index for " + locationString() + " because of " + e.getMessage());
    -            }
    -        }
    -    }
    -
    -    protected static OutputStream openOutputStream(File location) {
    -        try {
    -            return new FileOutputStream(location);
    -        } catch (FileNotFoundException e) {
    -            throw new TribbleException("Unable to create VCF file at location: " + location);
    -        }
    +        super.close();
         }
     
         /**
    @@ -203,28 +158,17 @@ public class StandardVCFWriter implements VCFWriter {
          *
          * @param vc      the Variant Context object
          */
    +    @Override
         public void add(VariantContext vc) {
    -        add(vc, false);
    -    }
    -
    -    /**
    -     * add a record to the file
    -     *
    -     * @param vc      the Variant Context object
    -     * @param refBaseShouldBeAppliedToEndOfAlleles *** THIS SHOULD BE FALSE EXCEPT FOR AN INDEL AT THE EXTREME BEGINNING OF A CONTIG (WHERE THERE IS NO PREVIOUS BASE, SO WE USE THE BASE AFTER THE EVENT INSTEAD)
    -     */
    -    public void add(VariantContext vc, boolean refBaseShouldBeAppliedToEndOfAlleles) {
             if ( mHeader == null )
    -            throw new IllegalStateException("The VCF Header must be written before records can be added: " + locationString());
    +            throw new IllegalStateException("The VCF Header must be written before records can be added: " + getStreamName());
     
             if ( doNotWriteGenotypes )
                 vc = VariantContext.modifyGenotypes(vc, null);
     
             try {
    -            vc = VariantContext.createVariantContextWithPaddedAlleles(vc, refBaseShouldBeAppliedToEndOfAlleles);
    -
    -            // if we are doing on the fly indexing, add the record ***before*** we write any bytes 
    -            if ( indexer != null ) indexer.addFeature(vc, positionalStream.getPosition());
    +            vc = VariantContext.createVariantContextWithPaddedAlleles(vc, false);
    +            super.add(vc);
     
                 Map alleleMap = new HashMap(vc.getAlleles().size());
                 alleleMap.put(Allele.NO_CALL, VCFConstants.EMPTY_ALLELE); // convenience for lookup
    @@ -275,7 +219,7 @@ public class StandardVCFWriter implements VCFWriter {
                 mWriter.write(VCFConstants.FIELD_SEPARATOR);
     
                 // FILTER
    -            String filters = vc.isFiltered() ? ParsingUtils.join(";", ParsingUtils.sortList(vc.getFilters())) : (filtersWereAppliedToContext || vc.filtersWereApplied() ? VCFConstants.PASSES_FILTERS_v4 : VCFConstants.UNFILTERED);
    +            String filters = getFilterString(vc, filtersWereAppliedToContext);
                 mWriter.write(filters);
                 mWriter.write(VCFConstants.FIELD_SEPARATOR);
     
    @@ -317,9 +261,22 @@ public class StandardVCFWriter implements VCFWriter {
                 mWriter.write("\n");
                 mWriter.flush();  // necessary so that writing to an output stream will work
             } catch (IOException e) {
    -            throw new RuntimeException("Unable to write the VCF object to " + locationString());
    +            throw new RuntimeException("Unable to write the VCF object to " + getStreamName());
             }
    +    }
     
    +    // --------------------------------------------------------------------------------
    +    //
    +    // implementation functions
    +    //
    +    // --------------------------------------------------------------------------------
    +
    +    public static final String getFilterString(final VariantContext vc) {
    +        return getFilterString(vc, false);
    +    }
    +
    +    public static final String getFilterString(final VariantContext vc, boolean forcePASS) {
    +        return vc.isFiltered() ? ParsingUtils.join(";", ParsingUtils.sortList(vc.getFilters())) : (forcePASS || vc.filtersWereApplied() ? VCFConstants.PASSES_FILTERS_v4 : VCFConstants.UNFILTERED);
         }
     
         private String getQualValue(double qual) {
    @@ -462,7 +419,7 @@ public class StandardVCFWriter implements VCFWriter {
             mWriter.write(encoding);
         }
     
    -    private static String formatVCFField(Object val) {
    +    public static String formatVCFField(Object val) {
             String result;
             if ( val == null )
                 result = VCFConstants.MISSING_VALUE_v4;
    @@ -524,12 +481,11 @@ public class StandardVCFWriter implements VCFWriter {
         }
     
     
    -    public static int countOccurrences(char c, String s) {
    +    private static int countOccurrences(char c, String s) {
                int count = 0;
                for (int i = 0; i < s.length(); i++) {
                    count += s.charAt(i) == c ? 1 : 0;
                }
                return count;
         }
    -
     }
    diff --git a/public/java/src/org/broadinstitute/sting/utils/codecs/vcf/VCFCodec.java b/public/java/src/org/broadinstitute/sting/utils/codecs/vcf/VCFCodec.java
    index fa030ef5f..42ea05355 100755
    --- a/public/java/src/org/broadinstitute/sting/utils/codecs/vcf/VCFCodec.java
    +++ b/public/java/src/org/broadinstitute/sting/utils/codecs/vcf/VCFCodec.java
    @@ -105,34 +105,37 @@ public class VCFCodec extends AbstractVCFCodec {
          * @return a set of the filters applied or null if filters were not applied to the record (e.g. as per the missing value in a VCF)
          */
         protected Set parseFilters(String filterString) {
    +        return parseFilters(filterHash, lineNo, filterString);
    +    }
     
    +    public static Set parseFilters(final Map> cache, final int lineNo, final String filterString) {
             // null for unfiltered
             if ( filterString.equals(VCFConstants.UNFILTERED) )
                 return null;
     
    -        // empty set for passes filters
    -        LinkedHashSet fFields = new LinkedHashSet();
    -
             if ( filterString.equals(VCFConstants.PASSES_FILTERS_v4) )
    -            return fFields;
    +            return Collections.emptySet();
             if ( filterString.equals(VCFConstants.PASSES_FILTERS_v3) )
    -            generateException(VCFConstants.PASSES_FILTERS_v3 + " is an invalid filter name in vcf4");
    +            generateException(VCFConstants.PASSES_FILTERS_v3 + " is an invalid filter name in vcf4", lineNo);
             if ( filterString.length() == 0 )
    -            generateException("The VCF specification requires a valid filter status");
    +            generateException("The VCF specification requires a valid filter status: filter was " + filterString, lineNo);
     
             // do we have the filter string cached?
    -        if ( filterHash.containsKey(filterString) )
    -            return filterHash.get(filterString);
    +        if ( cache != null && cache.containsKey(filterString) )
    +            return Collections.unmodifiableSet(cache.get(filterString));
     
    +        // empty set for passes filters
    +        LinkedHashSet fFields = new LinkedHashSet();
             // otherwise we have to parse and cache the value
             if ( filterString.indexOf(VCFConstants.FILTER_CODE_SEPARATOR) == -1 )
                 fFields.add(filterString);
             else
                 fFields.addAll(Arrays.asList(filterString.split(VCFConstants.FILTER_CODE_SEPARATOR)));
     
    -        filterHash.put(filterString, fFields);
    +        fFields = fFields;
    +        if ( cache != null ) cache.put(filterString, fFields);
     
    -        return fFields;
    +        return Collections.unmodifiableSet(fFields);
         }
     
     
    diff --git a/public/java/src/org/broadinstitute/sting/utils/codecs/vcf/VCFConstants.java b/public/java/src/org/broadinstitute/sting/utils/codecs/vcf/VCFConstants.java
    index 91cf86c70..8e9d989cc 100755
    --- a/public/java/src/org/broadinstitute/sting/utils/codecs/vcf/VCFConstants.java
    +++ b/public/java/src/org/broadinstitute/sting/utils/codecs/vcf/VCFConstants.java
    @@ -71,6 +71,7 @@ public final class VCFConstants {
         public static final char   FIELD_SEPARATOR_CHAR = '\t';
         public static final String FILTER_CODE_SEPARATOR = ";";
         public static final String INFO_FIELD_ARRAY_SEPARATOR = ",";
    +    public static final char INFO_FIELD_ARRAY_SEPARATOR_CHAR = ',';
         public static final String ID_FIELD_SEPARATOR = ";";
         public static final String INFO_FIELD_SEPARATOR = ";";
         public static final char INFO_FIELD_SEPARATOR_CHAR = ';';
    diff --git a/public/java/src/org/broadinstitute/sting/utils/codecs/vcf/VCFHeader.java b/public/java/src/org/broadinstitute/sting/utils/codecs/vcf/VCFHeader.java
    index fd1c74993..66e11bc1e 100755
    --- a/public/java/src/org/broadinstitute/sting/utils/codecs/vcf/VCFHeader.java
    +++ b/public/java/src/org/broadinstitute/sting/utils/codecs/vcf/VCFHeader.java
    @@ -35,9 +35,6 @@ public class VCFHeader {
         // the header string indicator
         public static final String HEADER_INDICATOR = "#";
     
    -    /** do we have genotying data? */
    -    private boolean hasGenotypingData = false;
    -
         // were the input samples sorted originally (or are we sorting them)?
         private boolean samplesWereAlreadySorted = true;
     
    @@ -57,17 +54,15 @@ public class VCFHeader {
          * create a VCF header, given a list of meta data and auxillary tags
          *
          * @param metaData            the meta data associated with this header
    -     * @param genotypeSampleNames the genotype format field, and the sample names
    +     * @param genotypeSampleNames the sample names
          */
         public VCFHeader(Set metaData, Set genotypeSampleNames) {
             mMetaData = new TreeSet();
             if ( metaData != null )
                 mMetaData.addAll(metaData);
    -        for (String col : genotypeSampleNames) {
    -            if (!col.equals("FORMAT"))
    -                mGenotypeSampleNames.add(col);
    -        }
    -        if (genotypeSampleNames.size() > 0) hasGenotypingData = true;
    +
    +        mGenotypeSampleNames.addAll(genotypeSampleNames);
    +
             loadVCFVersion();
             loadMetaDataMaps();
     
    @@ -157,7 +152,7 @@ public class VCFHeader {
          * @return true if we have genotyping columns, false otherwise
          */
         public boolean hasGenotypingData() {
    -        return hasGenotypingData;
    +        return mGenotypeSampleNames.size() > 0;
         }
     
         /**
    @@ -171,7 +166,7 @@ public class VCFHeader {
     
         /** @return the column count */
         public int getColumnCount() {
    -        return HEADER_FIELDS.values().length + ((hasGenotypingData) ? mGenotypeSampleNames.size() + 1 : 0);
    +        return HEADER_FIELDS.values().length + (hasGenotypingData() ? mGenotypeSampleNames.size() + 1 : 0);
         }
     
         /**
    diff --git a/public/java/src/org/broadinstitute/sting/utils/duplicates/DupUtils.java b/public/java/src/org/broadinstitute/sting/utils/duplicates/DupUtils.java
    index bba47c76c..7ae575534 100644
    --- a/public/java/src/org/broadinstitute/sting/utils/duplicates/DupUtils.java
    +++ b/public/java/src/org/broadinstitute/sting/utils/duplicates/DupUtils.java
    @@ -25,7 +25,6 @@
     
     package org.broadinstitute.sting.utils.duplicates;
     
    -import net.sf.samtools.SAMRecord;
     import org.broadinstitute.sting.utils.BaseUtils;
     import org.broadinstitute.sting.utils.GenomeLoc;
     import org.broadinstitute.sting.utils.GenomeLocParser;
    @@ -35,27 +34,28 @@ import org.broadinstitute.sting.utils.exceptions.ReviewedStingException;
     import org.broadinstitute.sting.utils.pileup.PileupElement;
     import org.broadinstitute.sting.utils.pileup.ReadBackedPileup;
     import org.broadinstitute.sting.utils.pileup.ReadBackedPileupImpl;
    +import org.broadinstitute.sting.utils.sam.GATKSAMRecord;
     
     import java.util.Arrays;
     import java.util.List;
     
     public class DupUtils {
    -    private static SAMRecord tmpCopyRead(SAMRecord read) {
    +    private static GATKSAMRecord tmpCopyRead(GATKSAMRecord read) {
             try {
    -            return (SAMRecord)read.clone();
    +            return (GATKSAMRecord)read.clone();
             } catch ( CloneNotSupportedException e ) {
                 throw new ReviewedStingException("Unexpected Clone failure!");
             }
         }
     
    -    public static SAMRecord combineDuplicates(GenomeLocParser genomeLocParser,List duplicates, int maxQScore) {
    +    public static GATKSAMRecord combineDuplicates(GenomeLocParser genomeLocParser,List duplicates, int maxQScore) {
             if ( duplicates.size() == 0 )
                 return null;
     
             // make the combined read by copying the first read and setting the
             // bases and quals to new arrays
    -        SAMRecord comb = tmpCopyRead(duplicates.get(0));
    -        //SAMRecord comb = tmpCopyRead(duplicates.get(0));
    +        GATKSAMRecord comb = tmpCopyRead(duplicates.get(0));
    +        //GATKSAMRecord comb = tmpCopyRead(duplicates.get(0));
             comb.setDuplicateReadFlag(false);
             int readLen = comb.getReadBases().length;
             byte[] bases = new byte[readLen];
    @@ -63,7 +63,7 @@ public class DupUtils {
     
             for ( int i = 0; i < readLen; i++ ) {
                 //System.out.printf("I is %d%n", i);
    -            //for ( SAMRecord read : duplicates ) {
    +            //for ( GATKSAMRecord read : duplicates ) {
                 //    System.out.printf("dup base %c %d%n", (char)read.getReadBases()[i], read.getBaseQualities()[i]);
                 //}
                 Pair baseAndQual = combineBaseProbs(genomeLocParser,duplicates, i, maxQScore);
    @@ -117,7 +117,7 @@ public class DupUtils {
             System.out.printf("%n");
         }
     
    -    private static Pair combineBaseProbs(GenomeLocParser genomeLocParser,List duplicates, int readOffset, int maxQScore) {
    +    private static Pair combineBaseProbs(GenomeLocParser genomeLocParser,List duplicates, int readOffset, int maxQScore) {
             GenomeLoc loc = genomeLocParser.createGenomeLoc(duplicates.get(0));
             ReadBackedPileup pileup = new ReadBackedPileupImpl(loc, duplicates, readOffset);
     
    diff --git a/public/java/src/org/broadinstitute/sting/utils/exceptions/UserException.java b/public/java/src/org/broadinstitute/sting/utils/exceptions/UserException.java
    index 9d131ae0c..a208d2dc0 100755
    --- a/public/java/src/org/broadinstitute/sting/utils/exceptions/UserException.java
    +++ b/public/java/src/org/broadinstitute/sting/utils/exceptions/UserException.java
    @@ -164,7 +164,15 @@ public class UserException extends ReviewedStingException {
     
         public static class MalformedBAM extends UserException {
             public MalformedBAM(SAMRecord read, String message) {
    -            super(String.format("SAM/BAM file %s is malformed: %s", read.getFileSource() != null ? read.getFileSource().getReader() : "(none)", message));
    +            this(read.getFileSource() != null ? read.getFileSource().getReader().toString() : "(none)", message);
    +        }
    +
    +        public MalformedBAM(File file, String message) {
    +            this(file.toString(), message);
    +        }
    +
    +        public MalformedBAM(String source, String message) {
    +            super(String.format("SAM/BAM file %s is malformed: %s", source, message));
             }
         }
     
    @@ -178,6 +186,12 @@ public class UserException extends ReviewedStingException {
             }
         }
     
    +    public static class MalformedVCFHeader extends UserException {
    +        public MalformedVCFHeader(String message) {
    +            super(String.format("The provided VCF file has a malformed header: %s", message));
    +        }
    +    }
    +
         public static class ReadMissingReadGroup extends MalformedBAM {
             public ReadMissingReadGroup(SAMRecord read) {
                 super(read, String.format("Read %s is either missing the read group or its read group is not defined in the BAM header, both of which are required by the GATK.  Please use http://www.broadinstitute.org/gsa/wiki/index.php/ReplaceReadGroups to fix this problem", read.getReadName()));
    @@ -213,12 +227,19 @@ public class UserException extends ReviewedStingException {
                 super(String.format("File %s is malformed: %s caused by %s", f.getAbsolutePath(), message, e.getMessage()));
             }
     
    +        public MalformedFile(String name, String message) {
    +            super(String.format("File associated with name %s is malformed: %s", name, message));
    +        }
    +
             public MalformedFile(String name, String message, Exception e) {
                 super(String.format("File associated with name %s is malformed: %s caused by %s", name, message, e.getMessage()));
             }
          }
     
         public static class CannotExecuteRScript extends UserException {
    +        public CannotExecuteRScript(String message) {
    +            super(String.format("Unable to execute RScript command: " + message));
    +        }
             public CannotExecuteRScript(String message, Exception e) {
                 super(String.format("Unable to execute RScript command: " + message), e);
             }
    diff --git a/public/java/src/org/broadinstitute/sting/utils/fragments/FragmentCollection.java b/public/java/src/org/broadinstitute/sting/utils/fragments/FragmentCollection.java
    new file mode 100644
    index 000000000..3261e8d2e
    --- /dev/null
    +++ b/public/java/src/org/broadinstitute/sting/utils/fragments/FragmentCollection.java
    @@ -0,0 +1,66 @@
    +/*
    + * Copyright (c) 2011, The Broad Institute
    + *
    + * Permission is hereby granted, free of charge, to any person
    + * obtaining a copy of this software and associated documentation
    + * files (the "Software"), to deal in the Software without
    + * restriction, including without limitation the rights to use,
    + * copy, modify, merge, publish, distribute, sublicense, and/or sell
    + * copies of the Software, and to permit persons to whom the
    + * Software is furnished to do so, subject to the following
    + * conditions:
    + *
    + * The above copyright notice and this permission notice shall be
    + * included in all copies or substantial portions of the Software.
    + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
    + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
    + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
    + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
    + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
    + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
    + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
    + * OTHER DEALINGS IN THE SOFTWARE.
    + */
    +
    +package org.broadinstitute.sting.utils.fragments;
    +
    +import java.util.Collection;
    +import java.util.Collections;
    +import java.util.List;
    +
    +/**
    + * Useful helper class to represent the results of the reads -> fragment calculation.
    + *
    + * Contains singleton -- objects whose underlying reads do not overlap their mate pair
    + * Contains overlappingPairs -- objects whose underlying reads do overlap their mate pair
    + *
    + * User: ebanks, depristo
    + * Date: Jan 10, 2011
    + */
    +public class FragmentCollection {
    +    Collection singletons;
    +    Collection> overlappingPairs;
    +
    +    public FragmentCollection(final Collection singletons, final Collection> overlappingPairs) {
    +        this.singletons = singletons == null ? Collections.emptyList() : singletons;
    +        this.overlappingPairs = overlappingPairs == null ? Collections.>emptyList() : overlappingPairs;
    +    }
    +
    +    /**
    +     * Gets the T elements not containing overlapping elements, in no particular order
    +     *
    +     * @return
    +     */
    +    public Collection getSingletonReads() {
    +        return singletons;
    +    }
    +
    +    /**
    +     * Gets the T elements containing overlapping elements, in no particular order
    +     *
    +     * @return
    +     */
    +    public Collection> getOverlappingPairs() {
    +        return overlappingPairs;
    +    }
    +}
    diff --git a/public/java/src/org/broadinstitute/sting/utils/fragments/FragmentUtils.java b/public/java/src/org/broadinstitute/sting/utils/fragments/FragmentUtils.java
    new file mode 100644
    index 000000000..e5500ca21
    --- /dev/null
    +++ b/public/java/src/org/broadinstitute/sting/utils/fragments/FragmentUtils.java
    @@ -0,0 +1,124 @@
    +package org.broadinstitute.sting.utils.fragments;
    +
    +import net.sf.samtools.SAMRecord;
    +import org.broadinstitute.sting.utils.pileup.PileupElement;
    +import org.broadinstitute.sting.utils.pileup.ReadBackedPileup;
    +import org.broadinstitute.sting.utils.sam.GATKSAMRecord;
    +
    +import java.util.*;
    +
    +/**
    + * An easy to access fragment-based pileup, which contains two separate pileups.  The first
    + * is a regular collection of PileupElements containing all of the reads in the original RBP
    + * that uniquely info about a fragment.  The second are TwoReadPileupElements that, as the
    + * name suggests, contain two reads that are sequenced from the same underlying fragment.
    + *
    + * Based on the original code by E. Banks
    + *
    + * Oct 21: note that the order of the oneReadPileup and twoReadPileups are not
    + * defined.  The algorithms that produce these lists are in fact producing
    + * lists of Pileup elements *NOT* sorted by alignment start position of the underlying
    + * reads.
    + *
    + * User: depristo
    + * Date: 3/26/11
    + * Time: 10:09 PM
    + */
    +public class FragmentUtils {
    +    private FragmentUtils() {} // private constructor
    +
    +    /**
    +     * A getter function that takes an Object of type T and returns its associated SAMRecord.
    +     *
    +     * Allows us to write a generic T -> Fragment algorithm that works with any object containing
    +     * a read.
    +     *
    +     * @param 
    +     */
    +    public interface ReadGetter {
    +        public GATKSAMRecord get(T object);
    +    }
    +
    +    /** Identify getter for SAMRecords themselves */
    +    private final static ReadGetter SamRecordGetter = new ReadGetter() {
    +        @Override public GATKSAMRecord get(final GATKSAMRecord object) { return object; }
    +    };
    +
    +    /** Gets the SAMRecord in a PileupElement */
    +    private final static ReadGetter PileupElementGetter = new ReadGetter() {
    +        @Override public GATKSAMRecord get(final PileupElement object) { return object.getRead(); }
    +    };
    +
    +
    +    /**
    +     * Generic algorithm that takes an iterable over T objects, a getter routine to extract the reads in T,
    +     * and returns a FragmentCollection that contains the T objects whose underlying reads either overlap (or
    +     * not) with their mate pairs.
    +     *
    +     * @param readContainingObjects
    +     * @param nElements
    +     * @param getter
    +     * @param 
    +     * @return
    +     */
    +    private final static  FragmentCollection create(Iterable readContainingObjects, int nElements, ReadGetter getter) {
    +        Collection singletons = null;
    +        Collection> overlapping = null;
    +        Map nameMap = null;
    +
    +        int lastStart = -1;
    +
    +        // build an initial map, grabbing all of the multi-read fragments
    +        for ( final T p : readContainingObjects ) {
    +            final SAMRecord read = getter.get(p);
    +
    +            if ( read.getAlignmentStart() < lastStart ) {
    +                throw new IllegalArgumentException(String.format(
    +                        "FragmentUtils.create assumes that the incoming objects are ordered by " +
    +                                "SAMRecord alignment start, but saw a read %s with alignment start " +
    +                                "%d before the previous start %d", read.getSAMString(), read.getAlignmentStart(), lastStart));
    +            }
    +            lastStart = read.getAlignmentStart();
    +
    +            final int mateStart = read.getMateAlignmentStart();
    +            if ( mateStart == 0 || mateStart > read.getAlignmentEnd() ) {
    +                // if we know that this read won't overlap its mate, or doesn't have one, jump out early
    +                if ( singletons == null ) singletons = new ArrayList(nElements); // lazy init
    +                singletons.add(p);
    +            } else {
    +                // the read might overlap it's mate, or is the rightmost read of a pair
    +                final String readName = read.getReadName();
    +                final T pe1 = nameMap == null ? null : nameMap.get(readName);
    +                if ( pe1 != null ) {
    +                    // assumes we have at most 2 reads per fragment
    +                    if ( overlapping == null ) overlapping = new ArrayList>(); // lazy init
    +                    overlapping.add(Arrays.asList(pe1, p));
    +                    nameMap.remove(readName);
    +                } else {
    +                    if ( nameMap == null ) nameMap = new HashMap(nElements); // lazy init
    +                    nameMap.put(readName, p);
    +                }
    +            }
    +        }
    +
    +        // add all of the reads that are potentially overlapping but whose mate never showed
    +        // up to the oneReadPile
    +        if ( nameMap != null && ! nameMap.isEmpty() ) {
    +            if ( singletons == null )
    +                singletons = nameMap.values();
    +            else
    +                singletons.addAll(nameMap.values());
    +        }
    +
    +        return new FragmentCollection(singletons, overlapping);
    +    }
    +
    +    public final static FragmentCollection create(ReadBackedPileup rbp) {
    +        return create(rbp, rbp.getNumberOfElements(), PileupElementGetter);
    +    }
    +
    +    public final static FragmentCollection create(List reads) {
    +        return create(reads, reads.size(), SamRecordGetter);
    +    }
    +
    +}
    diff --git a/public/java/src/org/broadinstitute/sting/utils/gcf/GCF.java b/public/java/src/org/broadinstitute/sting/utils/gcf/GCF.java
    new file mode 100644
    index 000000000..ef0d9ca42
    --- /dev/null
    +++ b/public/java/src/org/broadinstitute/sting/utils/gcf/GCF.java
    @@ -0,0 +1,256 @@
    +/*
    + * Copyright (c) 2011, The Broad Institute
    + *
    + * Permission is hereby granted, free of charge, to any person
    + * obtaining a copy of this software and associated documentation
    + * files (the "Software"), to deal in the Software without
    + * restriction, including without limitation the rights to use,
    + * copy, modify, merge, publish, distribute, sublicense, and/or sell
    + * copies of the Software, and to permit persons to whom the
    + * Software is furnished to do so, subject to the following
    + * conditions:
    + *
    + * The above copyright notice and this permission notice shall be
    + * included in all copies or substantial portions of the Software.
    + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
    + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
    + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
    + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
    + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
    + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
    + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
    + * OTHER DEALINGS IN THE SOFTWARE.
    + */
    +
    +package org.broadinstitute.sting.utils.gcf;
    +
    +import org.broadinstitute.sting.utils.codecs.vcf.StandardVCFWriter;
    +import org.broadinstitute.sting.utils.exceptions.UserException;
    +import org.broadinstitute.sting.utils.variantcontext.Allele;
    +import org.broadinstitute.sting.utils.variantcontext.Genotype;
    +import org.broadinstitute.sting.utils.variantcontext.VariantContext;
    +
    +import java.io.*;
    +import java.util.*;
    +
    +/**
    + * GATK binary VCF record
    + *
    + * @author Your Name
    + * @since Date created
    + */
    +public class GCF {
    +    private final static int RECORD_TERMINATOR = 123456789;
    +    private int chromOffset;
    +    private int start, stop;
    +    private String id;
    +    private List alleleMap;
    +    private int alleleOffsets[];
    +    private float qual;
    +    private byte refPad;
    +    private String info;
    +    private int filterOffset;
    +
    +    private List genotypes = Collections.emptyList();
    +
    +    public GCF(final GCFHeaderBuilder GCFHeaderBuilder, final VariantContext vc, boolean skipGenotypes) {
    +        chromOffset = GCFHeaderBuilder.encodeString(vc.getChr());
    +        start = vc.getStart();
    +        stop = vc.getEnd();
    +        refPad = vc.hasReferenceBaseForIndel() ? vc.getReferenceBaseForIndel() : 0;
    +        id = vc.getID();
    +
    +        // encode alleles
    +        alleleMap = new ArrayList(vc.getNAlleles());
    +        alleleOffsets = new int[vc.getNAlleles()];
    +        alleleMap.add(vc.getReference());
    +        alleleOffsets[0] = GCFHeaderBuilder.encodeAllele(vc.getReference());
    +        for ( int i = 0; i < vc.getAlternateAlleles().size(); i++ ) {
    +            alleleMap.add(vc.getAlternateAllele(i));
    +            alleleOffsets[i+1] = GCFHeaderBuilder.encodeAllele(vc.getAlternateAllele(i));
    +        }
    +
    +        qual = (float)vc.getNegLog10PError(); //qualToByte(vc.getPhredScaledQual());
    +        info = infoFieldString(vc, GCFHeaderBuilder);
    +        filterOffset = GCFHeaderBuilder.encodeString(StandardVCFWriter.getFilterString(vc));
    +
    +        if ( ! skipGenotypes ) {
    +            genotypes = encodeGenotypes(GCFHeaderBuilder, vc);
    +        }
    +    }
    +
    +    public GCF(DataInputStream inputStream, boolean skipGenotypes) throws IOException, EOFException {
    +        chromOffset = inputStream.readInt();
    +
    +        // have we reached the footer?
    +        if ( chromOffset == GCFHeader.FOOTER_START_MARKER )
    +            throw new EOFException();
    +
    +        start = inputStream.readInt();
    +        stop = inputStream.readInt();
    +        id = inputStream.readUTF();
    +        refPad = inputStream.readByte();
    +        alleleOffsets = readIntArray(inputStream);
    +        qual = inputStream.readFloat();
    +        info = inputStream.readUTF();
    +        filterOffset = inputStream.readInt();
    +
    +        int nGenotypes = inputStream.readInt();
    +        int sizeOfGenotypes = inputStream.readInt();
    +        if ( skipGenotypes ) {
    +            genotypes = Collections.emptyList();
    +            inputStream.skipBytes(sizeOfGenotypes);
    +        } else {
    +            genotypes = new ArrayList(nGenotypes);
    +            for ( int i = 0; i < nGenotypes; i++ )
    +                genotypes.add(new GCFGenotype(this, inputStream));
    +        }
    +
    +        int recordDone = inputStream.readInt();
    +        if ( recordDone != RECORD_TERMINATOR )
    +            throw new UserException.MalformedFile("Record not terminated by RECORD_TERMINATOR key");
    +    }
    +
    +    public int write(DataOutputStream outputStream) throws IOException {
    +        int startSize = outputStream.size();
    +        outputStream.writeInt(chromOffset);
    +        outputStream.writeInt(start);
    +        outputStream.writeInt(stop);
    +        outputStream.writeUTF(id);
    +        outputStream.writeByte(refPad);
    +        writeIntArray(alleleOffsets, outputStream, true);
    +        outputStream.writeFloat(qual);
    +        outputStream.writeUTF(info);
    +        outputStream.writeInt(filterOffset);
    +
    +        int nGenotypes = genotypes.size();
    +        int expectedSizeOfGenotypes = nGenotypes == 0 ? 0 : genotypes.get(0).sizeInBytes() * nGenotypes;
    +        outputStream.writeInt(nGenotypes);
    +        outputStream.writeInt(expectedSizeOfGenotypes);
    +        int obsSizeOfGenotypes = 0;
    +        for ( GCFGenotype g : genotypes )
    +            obsSizeOfGenotypes += g.write(outputStream);
    +        if ( obsSizeOfGenotypes != expectedSizeOfGenotypes )
    +            throw new RuntimeException("Expect and observed genotype sizes disagree! expect = " + expectedSizeOfGenotypes + " obs =" + obsSizeOfGenotypes);
    +
    +        outputStream.writeInt(RECORD_TERMINATOR);
    +        return outputStream.size() - startSize;
    +    }
    +
    +    public VariantContext decode(final String source, final GCFHeader header) {
    +        final String contig = header.getString(chromOffset);
    +        alleleMap = header.getAlleles(alleleOffsets);
    +        double negLog10PError = qual; // QualityUtils.qualToErrorProb(qual);
    +        Set filters = header.getFilters(filterOffset);
    +        Map attributes = new HashMap();
    +        attributes.put("INFO", info);
    +        Byte refPadByte = refPad == 0 ? null : refPad;
    +        Map genotypes = decodeGenotypes(header);
    +
    +        return new VariantContext(source, contig, start, stop, alleleMap, genotypes, negLog10PError, filters, attributes, refPadByte);
    +    }
    +
    +    private Map decodeGenotypes(final GCFHeader header) {
    +        if ( genotypes.isEmpty() )
    +            return VariantContext.NO_GENOTYPES;
    +        else {
    +            Map map = new TreeMap();
    +
    +            for ( int i = 0; i < genotypes.size(); i++ ) {
    +                final String sampleName = header.getSample(i);
    +                final Genotype g = genotypes.get(i).decode(sampleName, header, this, alleleMap);
    +                map.put(sampleName, g);
    +            }
    +
    +            return map;
    +        }
    +    }
    +
    +    private List encodeGenotypes(final GCFHeaderBuilder GCFHeaderBuilder, final VariantContext vc) {
    +        int nGenotypes = vc.getNSamples();
    +        if ( nGenotypes > 0 ) {
    +            List genotypes = new ArrayList(nGenotypes);
    +            for ( int i = 0; i < nGenotypes; i++ ) genotypes.add(null);
    +
    +            for ( Genotype g : vc.getGenotypes().values() ) {
    +                int i = GCFHeaderBuilder.encodeSample(g.getSampleName());
    +                genotypes.set(i, new GCFGenotype(GCFHeaderBuilder, alleleMap, g));
    +            }
    +
    +            return genotypes;
    +        } else {
    +            return Collections.emptyList();
    +        }
    +    }
    +
    +    public int getNAlleles() { return alleleOffsets.length; }
    +
    +
    +    private final String infoFieldString(VariantContext vc, final GCFHeaderBuilder GCFHeaderBuilder) {
    +        StringBuilder s = new StringBuilder();
    +
    +        boolean first = true;
    +        for ( Map.Entry field : vc.getAttributes().entrySet() ) {
    +            String key = field.getKey();
    +            if ( key.equals(VariantContext.ID_KEY) || key.equals(VariantContext.UNPARSED_GENOTYPE_MAP_KEY) || key.equals(VariantContext.UNPARSED_GENOTYPE_PARSER_KEY) )
    +                continue;
    +            int stringIndex = GCFHeaderBuilder.encodeString(key);
    +            String outputValue = StandardVCFWriter.formatVCFField(field.getValue());
    +            if ( outputValue != null ) {
    +                if ( ! first ) s.append(";");
    +                s.append(stringIndex).append("=").append(outputValue);
    +                first = false;
    +            }
    +        }
    +
    +        return s.toString();
    +    }
    +
    +    protected final static int BUFFER_SIZE = 1048576; // 2**20
    +
    +    public static DataInputStream createDataInputStream(final InputStream stream) {
    +        return new DataInputStream(new BufferedInputStream(stream, BUFFER_SIZE));
    +    }
    +
    +    public static FileInputStream createFileInputStream(final File file) throws FileNotFoundException {
    +        return new FileInputStream(file);
    +    }
    +
    +    protected final static int[] readIntArray(final DataInputStream inputStream) throws IOException {
    +        return readIntArray(inputStream, inputStream.readInt());
    +    }
    +
    +    protected final static int[] readIntArray(final DataInputStream inputStream, int size) throws IOException {
    +        int[] array = new int[size];
    +        for ( int i = 0; i < array.length; i++ )
    +            array[i] = inputStream.readInt();
    +        return array;
    +    }
    +
    +    protected final static void writeIntArray(int[] array, final DataOutputStream outputStream, boolean writeSize) throws IOException {
    +        if ( writeSize ) outputStream.writeInt(array.length);
    +        for ( int i : array )
    +            outputStream.writeInt(i);
    +    }
    +
    +    protected final static byte[] readByteArray(final DataInputStream inputStream) throws IOException {
    +        return readByteArray(inputStream, inputStream.readInt());
    +    }
    +
    +    protected final static byte[] readByteArray(final DataInputStream inputStream, int size) throws IOException {
    +        byte[] array = new byte[size];
    +        for ( int i = 0; i < array.length; i++ )
    +            array[i] = inputStream.readByte();
    +        return array;
    +    }
    +
    +    protected final static void writeByteArray(byte[] array, final DataOutputStream outputStream, boolean writeSize) throws IOException {
    +        if ( writeSize ) outputStream.writeInt(array.length);
    +        for ( byte i : array )
    +            outputStream.writeByte(i);
    +    }
    +
    +    protected final static byte qualToByte(double phredScaledQual) {
    +        return (byte)Math.round(Math.min(phredScaledQual, 255));
    +    }
    +}
    diff --git a/public/java/src/org/broadinstitute/sting/utils/gcf/GCFGenotype.java b/public/java/src/org/broadinstitute/sting/utils/gcf/GCFGenotype.java
    new file mode 100644
    index 000000000..dd1fb091c
    --- /dev/null
    +++ b/public/java/src/org/broadinstitute/sting/utils/gcf/GCFGenotype.java
    @@ -0,0 +1,147 @@
    +/*
    + * Copyright (c) 2011, The Broad Institute
    + *
    + * Permission is hereby granted, free of charge, to any person
    + * obtaining a copy of this software and associated documentation
    + * files (the "Software"), to deal in the Software without
    + * restriction, including without limitation the rights to use,
    + * copy, modify, merge, publish, distribute, sublicense, and/or sell
    + * copies of the Software, and to permit persons to whom the
    + * Software is furnished to do so, subject to the following
    + * conditions:
    + *
    + * The above copyright notice and this permission notice shall be
    + * included in all copies or substantial portions of the Software.
    + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
    + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
    + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
    + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
    + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
    + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
    + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
    + * OTHER DEALINGS IN THE SOFTWARE.
    + */
    +
    +package org.broadinstitute.sting.utils.gcf;
    +
    +import org.broadinstitute.sting.utils.variantcontext.Allele;
    +import org.broadinstitute.sting.utils.variantcontext.Genotype;
    +
    +import java.io.DataInputStream;
    +import java.io.DataOutputStream;
    +import java.io.IOException;
    +import java.util.*;
    +
    +/**
    + * GATK binary VCF record
    + *
    + * @author Your Name
    + * @since Date created
    + */
    +public class GCFGenotype {
    +    private byte gq;
    +    private int gt;
    +    private int dp;
    +    private int ad[];
    +    private byte[] pl;
    +
    +    // todo -- what to do about phasing?  Perhaps we shouldn't support it
    +    // todo -- is the FL field generic or just a flag?  Should we even support per sample filtering?
    +
    +    public GCFGenotype(final GCFHeaderBuilder GCFHeaderBuilder, final List allAlleles, Genotype genotype) {
    +        gq = GCF.qualToByte(genotype.getPhredScaledQual());
    +        gt = encodeAlleles(genotype.getAlleles(), allAlleles);
    +
    +        dp = genotype.getAttributeAsInt("DP", 0);
    +
    +        int nAlleles = allAlleles.size();
    +        ad = new int[nAlleles];
    +
    +        int npls = nAllelesToNPls(nAlleles);
    +        pl = new byte[npls];
    +    }
    +
    +    private int nAllelesToNPls( int nAlleles ) {
    +        return nAlleles*(nAlleles+1) / 2;
    +    }
    +
    +    public GCFGenotype(GCF GCF, DataInputStream inputStream) throws IOException {
    +        int gqInt = inputStream.readUnsignedByte();
    +        gq = (byte)gqInt;
    +        gt = inputStream.readInt();
    +        dp = inputStream.readInt();
    +        ad = GCF.readIntArray(inputStream, GCF.getNAlleles());
    +        pl = GCF.readByteArray(inputStream, nAllelesToNPls(GCF.getNAlleles()));
    +    }
    +
    +    // 2 alleles => 1 + 8 + 8 + 3 => 20
    +    protected int sizeInBytes() {
    +        return 1 // gq
    +                + 4 * 2 // gt + dp
    +                + 4 * ad.length // ad
    +                + 1 * pl.length; // pl
    +    }
    +
    +    public Genotype decode(final String sampleName, final GCFHeader header, GCF GCF, List alleleIndex) {
    +        final List alleles = decodeAlleles(gt, alleleIndex);
    +        final double negLog10PError = gq / 10.0;
    +        final Set filters = Collections.emptySet();
    +        final Map attributes = new HashMap();
    +        attributes.put("DP", dp);
    +        attributes.put("AD", ad);
    +        attributes.put("PL", pl);
    +
    +        return new Genotype(sampleName, alleles, negLog10PError, filters, attributes, false);
    +    }
    +
    +    private static int encodeAlleles(List gtList, List allAlleles) {
    +        final int nAlleles = gtList.size();
    +        if ( nAlleles  > 4 )
    +            throw new IllegalArgumentException("encodeAlleles doesn't support more than 4 alt alleles, but I saw " + gtList);
    +
    +        int gtInt = 0;
    +        for ( int i = 0; i < nAlleles ; i++ ) {
    +            final int bitOffset = i * 8;
    +            final int allelei = getAlleleIndex(gtList.get(i), allAlleles);
    +            final int gti = (allelei + 1) << bitOffset;
    +            gtInt = gtInt | gti;
    +        }
    +
    +        return gtInt;
    +    }
    +
    +    private static int getAlleleIndex(Allele q, List allAlleles) {
    +        if ( q.isNoCall() )
    +            return 254;
    +        for ( int i = 0; i < allAlleles.size(); i++ )
    +            if ( q.equals(allAlleles.get(i)) )
    +                return i;
    +        throw new IllegalStateException("getAlleleIndex passed allele not in map! allele " + q + " allAlleles " + allAlleles);
    +    }
    +
    +    private static List decodeAlleles(int gtInt, List alleleIndex) {
    +        List alleles = new ArrayList(4);
    +
    +        for ( int i = 0; i < 32; i += 8 ) {
    +            final int gi = (gtInt & (0x000000FF << i)) >> i;
    +            if ( gi != 0 ) {
    +                final int allelei = gi - 1;
    +                alleles.add( allelei == 254 ? Allele.NO_CALL : alleleIndex.get(allelei) );
    +            } else {
    +                break;
    +            }
    +        }
    +
    +        return alleles;
    +    }
    +
    +    public int write(DataOutputStream outputStream) throws IOException {
    +        int startSize = outputStream.size();
    +        outputStream.writeByte(gq);
    +        outputStream.writeInt(gt);
    +        outputStream.writeInt(dp);
    +        GCF.writeIntArray(ad, outputStream, false);
    +        GCF.writeByteArray(pl, outputStream, false);
    +        return outputStream.size() - startSize;
    +    }
    +}
    diff --git a/public/java/src/org/broadinstitute/sting/utils/gcf/GCFHeader.java b/public/java/src/org/broadinstitute/sting/utils/gcf/GCFHeader.java
    new file mode 100644
    index 000000000..6d96eda56
    --- /dev/null
    +++ b/public/java/src/org/broadinstitute/sting/utils/gcf/GCFHeader.java
    @@ -0,0 +1,205 @@
    +/*
    + * Copyright (c) 2011, The Broad Institute
    + *
    + * Permission is hereby granted, free of charge, to any person
    + * obtaining a copy of this software and associated documentation
    + * files (the "Software"), to deal in the Software without
    + * restriction, including without limitation the rights to use,
    + * copy, modify, merge, publish, distribute, sublicense, and/or sell
    + * copies of the Software, and to permit persons to whom the
    + * Software is furnished to do so, subject to the following
    + * conditions:
    + *
    + * The above copyright notice and this permission notice shall be
    + * included in all copies or substantial portions of the Software.
    + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND,
    + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES
    + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND
    + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT
    + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
    + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
    + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR
    + * OTHER DEALINGS IN THE SOFTWARE.
    + */
    +
    +package org.broadinstitute.sting.utils.gcf;
    +
    +import org.apache.log4j.Logger;
    +import org.broadinstitute.sting.utils.codecs.vcf.VCFCodec;
    +import org.broadinstitute.sting.utils.codecs.vcf.VCFConstants;
    +import org.broadinstitute.sting.utils.exceptions.UserException;
    +import org.broadinstitute.sting.utils.variantcontext.Allele;
    +
    +import java.io.*;
    +import java.util.*;
    +
    +/**
    + * [Short one sentence description of this walker]
    + * 

    + *

    + * [Functionality of this walker] + *

    + *

    + *

    Input

    + *

    + * [Input description] + *

    + *

    + *

    Output

    + *

    + * [Output description] + *

    + *

    + *

    Examples

    + *
    + *    java
    + *      -jar GenomeAnalysisTK.jar
    + *      -T $WalkerName
    + *  
    + * + * @author Your Name + * @since Date created + */ +public class GCFHeader { + final protected static Logger logger = Logger.getLogger(GCFHeader.class); + + public final static int GCF_VERSION = 1; + public final static byte[] GCF_FILE_START_MARKER = "GCF\1".getBytes(); + public final static int FOOTER_START_MARKER = -1; + public final static long HEADER_FORWARD_REFERENCE_OFFSET = GCF_FILE_START_MARKER.length + 4; // for the version + + final int version; + long footerPosition; + final List alleles; + final List strings; + final List samples; + final List> filters; + + public GCFHeader(final Map allelesIn, final Map stringIn, final Map samplesIn) { + version = GCF_VERSION; + footerPosition = 0; + this.alleles = linearize(allelesIn); + this.strings = linearize(stringIn); + this.samples = linearize(samplesIn); + this.filters = null; // not used with this constructor + } + + public GCFHeader(FileInputStream fileInputStream) throws IOException { + DataInputStream inputStream = new DataInputStream(fileInputStream); + byte[] headerTest = new byte[GCF_FILE_START_MARKER.length]; + inputStream.read(headerTest); + if ( ! Arrays.equals(headerTest, GCF_FILE_START_MARKER) ) { + throw new UserException("Could not read GVCF file. GCF_FILE_START_MARKER missing. 
Saw " + new String(headerTest)); + } else { + version = inputStream.readInt(); + logger.info("Read GCF version " + version); + footerPosition = inputStream.readLong(); + logger.info("Read footer position of " + footerPosition); + long lastPos = fileInputStream.getChannel().position(); + logger.info(" Last position is " + lastPos); + + // seek to the footer + fileInputStream.getChannel().position(footerPosition); + if ( inputStream.readInt() != FOOTER_START_MARKER ) + throw new UserException.MalformedFile("Malformed GCF file: couldn't find the footer marker"); + alleles = stringsToAlleles(readStrings(inputStream)); + strings = readStrings(inputStream); + samples = readStrings(inputStream); + logger.info(String.format("Allele map of %d elements", alleles.size())); + logger.info(String.format("String map of %d elements", strings.size())); + logger.info(String.format("Sample map of %d elements", samples.size())); + filters = initializeFilterCache(); + fileInputStream.getChannel().position(lastPos); + } + } + + public static int writeHeader(final DataOutputStream outputStream) throws IOException { + int startBytes = outputStream.size(); + outputStream.write(GCF_FILE_START_MARKER); + outputStream.writeInt(GCF_VERSION); + outputStream.writeLong(0); + return outputStream.size() - startBytes; + } + + public int writeFooter(final DataOutputStream outputStream) throws IOException { + int startBytes = outputStream.size(); + outputStream.writeInt(FOOTER_START_MARKER); // has to be the same as chrom encoding + write(outputStream, allelesToStrings(alleles)); + write(outputStream, strings); + write(outputStream, samples); + return outputStream.size() - startBytes; + } + + private void write(DataOutputStream outputStream, List l) throws IOException { + outputStream.writeInt(l.size()); + for ( String elt : l ) outputStream.writeUTF(elt); + } + + private List allelesToStrings(List alleles) { + List strings = new ArrayList(alleles.size()); + for ( Allele allele : alleles ) 
strings.add(allele.toString()); + return strings; + } + + private List> initializeFilterCache() { + // required to allow offset -> set lookup + List> l = new ArrayList>(strings.size()); + for ( int i = 0; i < strings.size(); i++ ) l.add(null); + return l; + } + + private static List stringsToAlleles(final List strings) { + final List alleles = new ArrayList(strings.size()); + for ( String string : strings ) { + boolean isRef = string.endsWith("*"); + if ( isRef ) string = string.substring(0, string.length() - 1); + alleles.add(Allele.create(string, isRef)); + } + return alleles; + } + + private static List readStrings(final DataInputStream inputStream) throws IOException { + final int nStrings = inputStream.readInt(); + + final List strings = new ArrayList(nStrings); + for ( int i = 0; i < nStrings; i++ ) { + strings.add(inputStream.readUTF()); + } + + return strings; + } + + private static List linearize(final Map map) { + final ArrayList l = new ArrayList(map.size()); + for ( int i = 0; i < map.size(); i++ ) l.add(null); + for ( final Map.Entry elt : map.entrySet() ) + l.set(elt.getValue(), elt.getKey()); + return l; + } + + public String getSample(final int offset) { return samples.get(offset); } + public String getString(final int offset) { return strings.get(offset); } + public Allele getAllele(final int offset) { return alleles.get(offset); } + public List getAlleles(final int[] offsets) { + final List alleles = new ArrayList(offsets.length); + for ( int i : offsets ) alleles.add(getAllele(i)); + return alleles; + } + + public Set getFilters(final int offset) { + Set cached = filters.get(offset); + + if ( cached != null ) + return cached; + else { + final String filterString = getString(offset); + if ( filterString.equals(VCFConstants.UNFILTERED) ) + return null; // UNFILTERED records are represented by null + else { + Set set = VCFCodec.parseFilters(null, -1, filterString); + filters.set(offset, set); // remember the result + return set; + } + } + } +} diff 
--git a/public/java/src/org/broadinstitute/sting/utils/gcf/GCFHeaderBuilder.java b/public/java/src/org/broadinstitute/sting/utils/gcf/GCFHeaderBuilder.java new file mode 100644 index 000000000..40e01ec72 --- /dev/null +++ b/public/java/src/org/broadinstitute/sting/utils/gcf/GCFHeaderBuilder.java @@ -0,0 +1,80 @@ +/* + * Copyright (c) 2011, The Broad Institute + * + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The above copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * OTHER DEALINGS IN THE SOFTWARE. + */ + +package org.broadinstitute.sting.utils.gcf; + +import org.broadinstitute.sting.utils.variantcontext.Allele; + +import java.util.HashMap; +import java.util.Map; + +/** + * [Short one sentence description of this walker] + *

    + *

    + * [Functionality of this walker] + *

    + *

    + *

    Input

    + *

    + * [Input description] + *

    + *

    + *

    Output

    + *

    + * [Output description] + *

    + *

    + *

    Examples

    + *
    + *    java
    + *      -jar GenomeAnalysisTK.jar
    + *      -T $WalkerName
    + *  
    + * + * @author Your Name + * @since Date created + */ +public class GCFHeaderBuilder { + Map alleles = new HashMap(); + Map strings = new HashMap(); + Map samples = new HashMap(); + + public GCFHeader createHeader() { + return new GCFHeader(alleles, strings, samples); + } + + public int encodeString(final String chr) { return encode(strings, chr); } + public int encodeAllele(final Allele allele) { return encode(alleles, allele); } + public int encodeSample(final String sampleName) { return encode(samples, sampleName); } + + private int encode(Map map, T key) { + Integer v = map.get(key); + if ( v == null ) { + v = map.size(); + map.put(key, v); + } + return v; + } +} diff --git a/public/java/src/org/broadinstitute/sting/utils/gcf/GCFWriter.java b/public/java/src/org/broadinstitute/sting/utils/gcf/GCFWriter.java new file mode 100644 index 000000000..18fae18c4 --- /dev/null +++ b/public/java/src/org/broadinstitute/sting/utils/gcf/GCFWriter.java @@ -0,0 +1,123 @@ +/* + * Copyright (c) 2011, The Broad Institute + * + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The above copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. 
IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * OTHER DEALINGS IN THE SOFTWARE. + */ + +package org.broadinstitute.sting.utils.gcf; + +import net.sf.samtools.SAMSequenceDictionary; +import org.broadinstitute.sting.utils.codecs.vcf.IndexingVCFWriter; +import org.broadinstitute.sting.utils.codecs.vcf.VCFHeader; +import org.broadinstitute.sting.utils.exceptions.ReviewedStingException; +import org.broadinstitute.sting.utils.exceptions.UserException; +import org.broadinstitute.sting.utils.variantcontext.VariantContext; + +import java.io.*; + +/** + * GCFWriter implementing the VCFWriter interface + * @author Your Name + * @since Date created + */ +public class GCFWriter extends IndexingVCFWriter { + final boolean skipGenotypes; + final FileOutputStream fileOutputStream; + final DataOutputStream dataOutputStream; + final GCFHeaderBuilder gcfHeaderBuilder; + int nbytes = 0; + VCFHeader header = null; + File location; + + // -------------------------------------------------------------------------------- + // + // Constructors + // + // -------------------------------------------------------------------------------- + + public GCFWriter(final File location, final SAMSequenceDictionary refDict, boolean enableOnTheFlyIndexing, boolean doNotWriteGenotypes) { + super(writerName(location, null), location, null, refDict, enableOnTheFlyIndexing); + this.location = location; + this.skipGenotypes = doNotWriteGenotypes; + + // write the output + try { + fileOutputStream = new FileOutputStream(location); + dataOutputStream = createDataOutputStream(fileOutputStream); + gcfHeaderBuilder = new GCFHeaderBuilder(); + } catch ( FileNotFoundException e ) { + throw new UserException.CouldNotCreateOutputFile(location, e); + } + } + + // 
-------------------------------------------------------------------------------- + // + // VCFWriter interface functions + // + // -------------------------------------------------------------------------------- + + @Override + public void writeHeader(VCFHeader header) { + this.header = header; + try { + nbytes += GCFHeader.writeHeader(dataOutputStream); + } catch ( IOException e ) { + throw new UserException.CouldNotCreateOutputFile(getStreamName(), "Couldn't write header", e); + } + } + + @Override + public void add(VariantContext vc) { + super.add(vc); + GCF gcf = new GCF(gcfHeaderBuilder, vc, skipGenotypes); + try { + nbytes += gcf.write(dataOutputStream); + } catch ( IOException e ) { + throw new UserException.CouldNotCreateOutputFile(getStreamName(), "Failed to add gcf record " + gcf + " to stream " + getStreamName(), e); + } + } + + @Override + public void close() { + // todo -- write out VCF header lines + GCFHeader gcfHeader = gcfHeaderBuilder.createHeader(); + try { + long headerPosition = nbytes; + nbytes += gcfHeader.writeFooter(dataOutputStream); + dataOutputStream.close(); + //System.out.println("Writing forward reference to " + headerPosition); + + RandomAccessFile raFile = new RandomAccessFile(location, "rw"); + raFile.seek(GCFHeader.HEADER_FORWARD_REFERENCE_OFFSET); + raFile.writeLong(headerPosition); + raFile.close(); + } catch ( IOException e ) { + throw new ReviewedStingException("Failed to close GCFWriter " + getStreamName(), e); + } + + super.close(); + } + + private static final DataOutputStream createDataOutputStream(final OutputStream stream) { + return new DataOutputStream(new BufferedOutputStream(stream, GCF.BUFFER_SIZE)); + } + +} diff --git a/public/java/src/org/broadinstitute/sting/utils/help/HelpFormatter.java b/public/java/src/org/broadinstitute/sting/utils/help/HelpFormatter.java index a9d71ef98..25ef8ccd2 100755 --- a/public/java/src/org/broadinstitute/sting/utils/help/HelpFormatter.java +++ 
b/public/java/src/org/broadinstitute/sting/utils/help/HelpFormatter.java @@ -29,6 +29,7 @@ import org.apache.log4j.Logger; import org.broadinstitute.sting.commandline.ArgumentDefinition; import org.broadinstitute.sting.commandline.ArgumentDefinitionGroup; import org.broadinstitute.sting.commandline.ArgumentDefinitions; +import org.broadinstitute.sting.commandline.ArgumentMatchSource; import org.broadinstitute.sting.utils.Utils; import org.broadinstitute.sting.utils.text.TextFormattingUtils; @@ -47,6 +48,7 @@ public class HelpFormatter { /** * Prints the help, given a collection of argument definitions. + * @param applicationDetails Application details * @param argumentDefinitions Argument definitions for which help should be printed. */ public void printHelp( ApplicationDetails applicationDetails, ArgumentDefinitions argumentDefinitions ) { @@ -233,7 +235,7 @@ public class HelpFormatter { private List prepareArgumentGroups( ArgumentDefinitions argumentDefinitions ) { // Sort the list of argument definitions according to how they should be shown. // Put the sorted results into a new cloned data structure. 
- Comparator definitionComparator = new Comparator() { + Comparator definitionComparator = new Comparator() { public int compare( ArgumentDefinition lhs, ArgumentDefinition rhs ) { if( lhs.required && rhs.required ) return 0; if( lhs.required ) return -1; @@ -242,15 +244,15 @@ public class HelpFormatter { } }; - List argumentGroups = new ArrayList(); + List argumentGroups = new ArrayList(); for( ArgumentDefinitionGroup argumentGroup: argumentDefinitions.getArgumentDefinitionGroups() ) { - List sortedDefinitions = new ArrayList( argumentGroup.argumentDefinitions ); + List sortedDefinitions = new ArrayList( argumentGroup.argumentDefinitions ); Collections.sort( sortedDefinitions, definitionComparator ); argumentGroups.add( new ArgumentDefinitionGroup(argumentGroup.groupName,sortedDefinitions) ); } // Sort the argument groups themselves with main arguments first, followed by plugins sorted in name order. - Comparator groupComparator = new Comparator() { + Comparator groupComparator = new Comparator() { public int compare( ArgumentDefinitionGroup lhs, ArgumentDefinitionGroup rhs ) { if( lhs.groupName == null && rhs.groupName == null ) return 0; if( lhs.groupName == null ) return -1; @@ -271,9 +273,9 @@ public class HelpFormatter { * Generate a standard header for the logger * * @param applicationDetails details of the application to run. 
- * @param args the command line arguments passed in + * @param parsedArgs the command line arguments passed in */ - public static void generateHeaderInformation(ApplicationDetails applicationDetails, String[] args) { + public static void generateHeaderInformation(ApplicationDetails applicationDetails, Map> parsedArgs) { DateFormat dateFormat = new SimpleDateFormat("yyyy/MM/dd HH:mm:ss"); java.util.Date date = new java.util.Date(); @@ -283,11 +285,22 @@ public class HelpFormatter { logger.info(barrier); for (String headerLine : applicationDetails.applicationHeader) logger.info(headerLine); - String output = ""; - for (String str : args) { - output = output + str + " "; + logger.debug("Current directory: " + System.getProperty("user.dir")); + for (Map.Entry> entry: parsedArgs.entrySet()) { + ArgumentMatchSource matchSource = entry.getKey(); + final String sourceName; + switch (matchSource.getType()) { + case CommandLine: sourceName = "Program"; break; + case File: sourceName = matchSource.getFile().getPath(); break; + default: throw new RuntimeException("Unexpected argument match source type: " + matchSource.getType()); + } + + String output = sourceName + " Args:"; + for (String str : entry.getValue()) { + output = output + " " + str; + } + logger.info(output); } - logger.info("Program Args: " + output); logger.info("Date/Time: " + dateFormat.format(date)); logger.info(barrier); diff --git a/public/java/src/org/broadinstitute/sting/utils/interval/IntervalFileMergingIterator.java b/public/java/src/org/broadinstitute/sting/utils/interval/IntervalFileMergingIterator.java deleted file mode 100644 index 2bc3fa284..000000000 --- a/public/java/src/org/broadinstitute/sting/utils/interval/IntervalFileMergingIterator.java +++ /dev/null @@ -1,116 +0,0 @@ -/* - * Copyright (c) 2010 The Broad Institute - * - * Permission is hereby granted, free of charge, to any person - * obtaining a copy of this software and associated documentation - * files (the "Software"), to deal in the 
Software without - * restriction, including without limitation the rights to use, - * copy, modify, merge, publish, distribute, sublicense, and/or sell - * copies of the Software, and to permit persons to whom the - * Software is furnished to do so, subject to the following - * conditions: - * - * The above copyright notice and this permission notice shall be - * included in all copies or substantial portions of the Software. - * - * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, - * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES - * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND - * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT - * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, - * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING - * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR - * OTHER DEALINGS IN THE SOFTWARE. - */ - -package org.broadinstitute.sting.utils.interval; - -import org.broadinstitute.sting.gatk.iterators.PushbackIterator; -import org.broadinstitute.sting.utils.GenomeLoc; -import org.broadinstitute.sting.utils.GenomeLocParser; -import org.broadinstitute.sting.utils.exceptions.UserException; -import org.broadinstitute.sting.utils.text.XReadLines; - -import java.io.File; -import java.io.FileNotFoundException; -import java.util.Iterator; - -/** - * Created by IntelliJ IDEA. - * User: asivache - * Date: Jun 11, 2010 - * Time: 2:56:29 PM - * To change this template use File | Settings | File Templates. - */ - -/** This iterator reads intervals from interval file (can be gatk-style - * interval list or a bed file) and merges them on the fly. Very much alike - * IntervalUtils.sortAndMergeIntervals() but the list is read sequentially - * from a file upon request instead of loading the whole list into memory. - * Intervals in the underlying file MUST be - * pre-sorted into the reference order (they can overlap though, as this - * iterator is a merging one). 
- */ -public class IntervalFileMergingIterator implements Iterator { - private PushbackIterator it ; - private IntervalMergingRule myRule; - private File myFile; - - public IntervalFileMergingIterator(GenomeLocParser genomeLocParser,File f, IntervalMergingRule rule) { - myFile = f; - - try { - XReadLines reader = new XReadLines(f); - - if (f.getName().toUpperCase().endsWith(".BED")) { - it = new PushbackIterator( new StringToGenomeLocIteratorAdapter( genomeLocParser,reader.iterator(), - StringToGenomeLocIteratorAdapter.FORMAT.BED ) ) ; - } else { - it = new PushbackIterator( new StringToGenomeLocIteratorAdapter( genomeLocParser,reader.iterator(), - StringToGenomeLocIteratorAdapter.FORMAT.GATK ) ) ; - } - } catch ( FileNotFoundException e ) { - throw new UserException.CouldNotReadInputFile(f, e); - } - myRule = rule; - } - - public boolean hasNext() { - return it.hasNext(); - } - - /** Returns next merged interval from the underlying interval file. In other words, keeps reading intervals - * for as long as they overlap and returns a single merged interval encompassing the set of overlapping - * intervals read from the file. Non-overlapping intervals are returned as is. This method will throw an - * exception if it runs into an interval that is out of order. 
- * @return - */ - public GenomeLoc next() { - - GenomeLoc current = it.next(); - - while ( it.hasNext() ) { - GenomeLoc next = it.next(); - - if ( next.isBefore(current)) { - throw new UserException.MalformedFile(myFile, "Interval "+next+" in the interval file is out of order."); - } - - if (current.overlapsP(next)) { - current = current.merge(next); - } else if (current.contiguousP(next) && myRule == IntervalMergingRule.ALL) { - current = current.merge(next); - } else { - it.pushback(next); - break; - } - } - - return current; - } - - public void remove() { - throw new UnsupportedOperationException("method 'remove' is not supported by this iterator"); - } - -} diff --git a/public/java/src/org/broadinstitute/sting/utils/interval/IntervalSetRule.java b/public/java/src/org/broadinstitute/sting/utils/interval/IntervalSetRule.java index eae4f8db5..f31c0a5a0 100644 --- a/public/java/src/org/broadinstitute/sting/utils/interval/IntervalSetRule.java +++ b/public/java/src/org/broadinstitute/sting/utils/interval/IntervalSetRule.java @@ -4,6 +4,8 @@ package org.broadinstitute.sting.utils.interval; * set operators for combining lists of intervals */ public enum IntervalSetRule { + /** Take the union of all intervals */ UNION, + /** Take the intersection of intervals (the subset that overlaps all intervals specified) */ INTERSECTION; } diff --git a/public/java/src/org/broadinstitute/sting/utils/interval/IntervalUtils.java b/public/java/src/org/broadinstitute/sting/utils/interval/IntervalUtils.java index f551e1368..f0e164c87 100644 --- a/public/java/src/org/broadinstitute/sting/utils/interval/IntervalUtils.java +++ b/public/java/src/org/broadinstitute/sting/utils/interval/IntervalUtils.java @@ -1,5 +1,7 @@ package org.broadinstitute.sting.utils.interval; +import com.google.java.contract.Ensures; +import com.google.java.contract.Requires; import net.sf.picard.util.Interval; import net.sf.picard.util.IntervalList; import net.sf.samtools.SAMFileHeader; @@ -8,8 +10,9 @@ import 
org.broadinstitute.sting.gatk.datasources.reference.ReferenceDataSource; import org.broadinstitute.sting.utils.GenomeLoc; import org.broadinstitute.sting.utils.GenomeLocParser; import org.broadinstitute.sting.utils.GenomeLocSortedSet; -import org.broadinstitute.sting.utils.bed.BedParser; +import org.broadinstitute.sting.utils.Utils; import org.broadinstitute.sting.utils.collections.Pair; +import org.broadinstitute.sting.utils.exceptions.ReviewedStingException; import org.broadinstitute.sting.utils.exceptions.UserException; import org.broadinstitute.sting.utils.text.XReadLines; @@ -35,70 +38,68 @@ public class IntervalUtils { * * @param parser Genome loc parser. * @param argList A list of strings containing interval data. - * @param allowEmptyIntervalList If false instead of an empty interval list will return null. - * @return an unsorted, unmerged representation of the given intervals. Null is used to indicate that all intervals should be used. + * @return an unsorted, unmerged representation of the given intervals. Null is used to indicate that all intervals should be used. */ - public static List parseIntervalArguments(GenomeLocParser parser, List argList, boolean allowEmptyIntervalList) { + public static List parseIntervalArguments(GenomeLocParser parser, List argList) { List rawIntervals = new ArrayList(); // running list of raw GenomeLocs if (argList != null) { // now that we can be in this function if only the ROD-to-Intervals was provided, we need to // ensure that the arg list isn't null before looping. 
for (String argument : argList) { - - // separate argument on semicolon first - for (String fileOrInterval : argument.split(";")) { - // if any interval argument is '-L all', consider all loci by returning no intervals - if (fileOrInterval.trim().toLowerCase().equals("all")) { - if (argList.size() != 1) { - // throw error if '-L all' is not only interval - potentially conflicting commands - throw new UserException.CommandLineException(String.format("Conflicting arguments: Intervals given along with \"-L all\"")); - } - return null; - } - // if any argument is 'unmapped', "parse" it to a null entry. A null in this case means 'all the intervals with no alignment data'. - else if (isUnmapped(fileOrInterval)) - rawIntervals.add(GenomeLoc.UNMAPPED); - // if it's a file, add items to raw interval list - else if (isIntervalFile(fileOrInterval)) { - try { - rawIntervals.addAll(intervalFileToList(parser, fileOrInterval, allowEmptyIntervalList)); - } - catch ( UserException.MalformedGenomeLoc e ) { - throw e; - } - catch ( Exception e ) { - throw new UserException.MalformedFile(fileOrInterval, "Interval file could not be parsed in any supported format.", e); - } - } - - // otherwise treat as an interval -> parse and add to raw interval list - else { - rawIntervals.add(parser.parseGenomeLoc(fileOrInterval)); - } - } + rawIntervals.addAll(parseIntervalArguments(parser, argument)); } } return rawIntervals; } - /** + public static List parseIntervalArguments(GenomeLocParser parser, String arg) { + List rawIntervals = new ArrayList(); // running list of raw GenomeLocs + + // separate argument on semicolon first + for (String fileOrInterval : arg.split(";")) { + // if any argument is 'unmapped', "parse" it to a null entry. A null in this case means 'all the intervals with no alignment data'. 
+ if (isUnmapped(fileOrInterval)) + rawIntervals.add(GenomeLoc.UNMAPPED); + // if it's a file, add items to raw interval list + else if (isIntervalFile(fileOrInterval)) { + try { + rawIntervals.addAll(intervalFileToList(parser, fileOrInterval)); + } + catch ( UserException.MalformedGenomeLoc e ) { + throw e; + } + catch ( Exception e ) { + throw new UserException.MalformedFile(fileOrInterval, "Interval file could not be parsed in any supported format.", e); + } + } + + // otherwise treat as an interval -> parse and add to raw interval list + else { + rawIntervals.add(parser.parseGenomeLoc(fileOrInterval)); + } + } + + return rawIntervals; + } + + /** * Read a file of genome locations to process. The file may be in BED, Picard, * or GATK interval format. * - * @param file_name interval file - * @param allowEmptyIntervalList if false an exception will be thrown for files that contain no intervals + * @param glParser GenomeLocParser + * @param file_name interval file * @return List List of Genome Locs that have been parsed from file */ - public static List intervalFileToList(final GenomeLocParser glParser, final String file_name, boolean allowEmptyIntervalList) { + public static List intervalFileToList(final GenomeLocParser glParser, final String file_name) { // try to open file File inputFile = new File(file_name); List ret = new ArrayList(); // case: BED file - if (file_name.toUpperCase().endsWith(".BED")) { - BedParser parser = new BedParser(glParser,inputFile); - ret.addAll(parser.getLocations()); + if ( file_name.toUpperCase().endsWith(".BED") ) { + // this is now supported in Tribble + throw new ReviewedStingException("BED files must be parsed through Tribble; parsing them as intervals through the GATK engine is no longer supported"); } else { /** @@ -145,12 +146,6 @@ public class IntervalUtils { } } - if ( ret.isEmpty() && ! 
allowEmptyIntervalList ) { - throw new UserException("The interval file " + inputFile.getAbsolutePath() + " contains no intervals " + - "that could be parsed, and the unsafe operation ALLOW_EMPTY_INTERVAL_LIST has " + - "not been enabled"); - } - return ret; } @@ -204,7 +199,7 @@ public class IntervalUtils { //if we have an empty list, throw an exception. If they specified intersection and there are no items, this is bad. if (retList.size() == 0) - throw new UserException.BadInput("The INTERSECTION of your -BTI and -L options produced no intervals."); + throw new UserException.BadInput("The INTERSECTION of your -L options produced no intervals."); // we don't need to add the rest of remaining locations, since we know they don't overlap. return what we have return retList; @@ -229,6 +224,44 @@ public class IntervalUtils { return GenomeLocSortedSet.createSetFromList(parser,intervals); } + /** + * computes whether the test interval list is equivalent to master. To be equivalent, test must + * contain GenomeLocs covering every base in master, exactly once. Note that this algorithm + * assumes that master genomelocs are all discontiguous (i.e., we don't have locs like 1-3 and 4-6 but + * rather just 1-6). In order to use this algorithm with contiguous genomelocs first merge them. The algorithm + * doesn't assume that test has discontinuous genomelocs. + * + * Returns a null string if there are no differences, otherwise returns a string describing the difference + * (useful for UnitTests). Assumes both lists are sorted + */ + public static final String equateIntervals(List masterArg, List testArg) { + LinkedList master = new LinkedList(masterArg); + LinkedList test = new LinkedList(testArg); + + while ( ! 
master.isEmpty() ) { // there's still unchecked bases in master + final GenomeLoc masterHead = master.pop(); + final GenomeLoc testHead = test.pop(); + + if ( testHead.overlapsP(masterHead) ) { + // remove the parts of test that overlap master, and push the remaining + // parts onto master for further comparison. + for ( final GenomeLoc masterPart : Utils.reverse(masterHead.subtract(testHead)) ) { + master.push(masterPart); + } + } else { + // testHead is incompatible with masterHead, so we must have extra bases in testHead + // that aren't in master + return "Incompatible locs detected masterHead=" + masterHead + ", testHead=" + testHead; + } + } + + if ( test.isEmpty() ) // everything is equal + return null; // no differences + else + return "Remaining elements found in test: first=" + test.peek(); + } + + /** * Check if string argument was intented as a file * Accepted file extensions: .bed .list, .picard, .interval_list, .intervals. @@ -334,24 +367,44 @@ public class IntervalUtils { } /** - * Splits an interval list into multiple files. - * @param fileHeader The sam file header. + * Splits an interval list into multiple sublists. * @param locs The genome locs to split. * @param splits The stop points for the genome locs returned by splitFixedIntervals. - * @param scatterParts The output interval lists to write to. 
+ * @return A list of lists of genome locs, split according to splits */ - public static void scatterFixedIntervals(SAMFileHeader fileHeader, List locs, List splits, List scatterParts) { - if (splits.size() != scatterParts.size()) - throw new UserException.BadArgumentValue("splits", String.format("Split points %d does not equal the number of scatter parts %d.", splits.size(), scatterParts.size())); - int fileIndex = 0; + public static List> splitIntervalsToSubLists(List locs, List splits) { int locIndex = 1; int start = 0; + List> sublists = new ArrayList>(splits.size()); for (Integer stop: splits) { - IntervalList intervalList = new IntervalList(fileHeader); + List curList = new ArrayList(); for (int i = start; i < stop; i++) - intervalList.add(toInterval(locs.get(i), locIndex++)); - intervalList.write(scatterParts.get(fileIndex++)); + curList.add(locs.get(i)); start = stop; + sublists.add(curList); + } + + return sublists; + } + + + /** + * Splits an interval list into multiple files. + * @param fileHeader The sam file header. + * @param splits Pre-divided genome locs returned by splitFixedIntervals. + * @param scatterParts The output interval lists to write to. + */ + public static void scatterFixedIntervals(SAMFileHeader fileHeader, List> splits, List scatterParts) { + if (splits.size() != scatterParts.size()) + throw new UserException.BadArgumentValue("splits", String.format("Split points %d does not equal the number of scatter parts %d.", splits.size(), scatterParts.size())); + + int fileIndex = 0; + int locIndex = 1; + for (final List split : splits) { + IntervalList intervalList = new IntervalList(fileHeader); + for (final GenomeLoc loc : split) + intervalList.add(toInterval(loc, locIndex++)); + intervalList.write(scatterParts.get(fileIndex++)); } } @@ -361,17 +414,101 @@ public class IntervalUtils { * @param numParts Number of parts to split the locs into. * @return The stop points to split the genome locs. 
*/ - public static List splitFixedIntervals(List locs, int numParts) { + public static List> splitFixedIntervals(List locs, int numParts) { if (locs.size() < numParts) throw new UserException.BadArgumentValue("scatterParts", String.format("Cannot scatter %d locs into %d parts.", locs.size(), numParts)); - long locsSize = 0; - for (GenomeLoc loc: locs) - locsSize += loc.size(); - List splitPoints = new ArrayList(); + final long locsSize = intervalSize(locs); + final List splitPoints = new ArrayList(); addFixedSplit(splitPoints, locs, locsSize, 0, locs.size(), numParts); Collections.sort(splitPoints); splitPoints.add(locs.size()); - return splitPoints; + return splitIntervalsToSubLists(locs, splitPoints); + } + + @Requires({"locs != null", "numParts > 0"}) + @Ensures("result != null") + public static List> splitLocusIntervals(List locs, int numParts) { + // the ideal size of each split + final long bp = IntervalUtils.intervalSize(locs); + final long idealSplitSize = Math.max((long)Math.floor(bp / (1.0*numParts)), 1); + + // algorithm: + // split = () + // set size = 0 + // pop the head H off locs. + // If size + size(H) < splitSize: + // add H to split, continue + // If size + size(H) == splitSize: + // done with split, put in splits, restart + // if size + size(H) > splitSize: + // cut H into two pieces, first of which has splitSize - size bp + // push both pieces onto locs, continue + // The last split is special -- when you have only one split left, it gets all of the remaining locs + // to deal with rounding issues + final List> splits = new ArrayList>(numParts); + + LinkedList locsLinkedList = new LinkedList(locs); + while ( ! 
locsLinkedList.isEmpty() ) { + if ( splits.size() + 1 == numParts ) { + // the last one gets all of the remaining parts + splits.add(new ArrayList(locsLinkedList)); + locsLinkedList.clear(); + } else { + final SplitLocusRecursive one = splitLocusIntervals1(locsLinkedList, idealSplitSize); + splits.add(one.split); + locsLinkedList = one.remaining; + } + } + + return splits; + } + + @Requires({"remaining != null", "!remaining.isEmpty()", "idealSplitSize > 0"}) + @Ensures({"result != null"}) + final static SplitLocusRecursive splitLocusIntervals1(LinkedList remaining, long idealSplitSize) { + final List split = new ArrayList(); + long size = 0; + + while ( ! remaining.isEmpty() ) { + GenomeLoc head = remaining.pop(); + final long newSize = size + head.size(); + + if ( newSize == idealSplitSize ) { + split.add(head); + break; // we are done + } else if ( newSize > idealSplitSize ) { + final long remainingBp = idealSplitSize - size; + final long cutPoint = head.getStart() + remainingBp; + GenomeLoc[] parts = head.split((int)cutPoint); + remaining.push(parts[1]); + remaining.push(parts[0]); + // when we go around, head.size' = idealSplitSize - size + // so newSize' = splitSize + head.size' = size + (idealSplitSize - size) = idealSplitSize + } else { + split.add(head); + size = newSize; + } + } + + return new SplitLocusRecursive(split, remaining); + } + + private final static class SplitLocusRecursive { + final List split; + final LinkedList remaining; + + @Requires({"split != null", "remaining != null"}) + private SplitLocusRecursive(final List split, final LinkedList remaining) { + this.split = split; + this.remaining = remaining; + } + } + + public static List flattenSplitIntervals(List> splits) { + final List locs = new ArrayList(); + for ( final List split : splits ) + locs.addAll(split); + return locs; } private static void addFixedSplit(List splitPoints, List locs, long locsSize, int startIndex, int stopIndex, int numParts) { @@ -441,4 +578,11 @@ public class 
IntervalUtils { return merged; } } + + public static final long intervalSize(final List locs) { + long size = 0; + for ( final GenomeLoc loc : locs ) + size += loc.size(); + return size; + } } diff --git a/public/java/src/org/broadinstitute/sting/utils/interval/NwayIntervalMergingIterator.java b/public/java/src/org/broadinstitute/sting/utils/interval/NwayIntervalMergingIterator.java deleted file mode 100644 index 7e87ce8b5..000000000 --- a/public/java/src/org/broadinstitute/sting/utils/interval/NwayIntervalMergingIterator.java +++ /dev/null @@ -1,201 +0,0 @@ -/* - * Copyright (c) 2010 The Broad Institute - * - * Permission is hereby granted, free of charge, to any person - * obtaining a copy of this software and associated documentation - * files (the "Software"), to deal in the Software without - * restriction, including without limitation the rights to use, - * copy, modify, merge, publish, distribute, sublicense, and/or sell - * copies of the Software, and to permit persons to whom the - * Software is furnished to do so, subject to the following - * conditions: - * - * The above copyright notice and this permission notice shall be - * included in all copies or substantial portions of the Software. - * - * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, - * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES - * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND - * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT - * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, - * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING - * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR - * OTHER DEALINGS IN THE SOFTWARE. - */ - -package org.broadinstitute.sting.utils.interval; - -import org.broadinstitute.sting.utils.GenomeLoc; -import org.broadinstitute.sting.utils.exceptions.UserException; - -import java.util.Iterator; -import java.util.PriorityQueue; - -/** - * Created by IntelliJ IDEA. 
- * User: asivache - * Date: Oct 28, 2010 - * Time: 12:06:23 PM - * To change this template use File | Settings | File Templates. - */ - -/** - * An adapter over a collection of underlying Iterator objects (a single underlying iterator is allowed). Each - * individual underlying iterator must serve its intervals in coordinate-sorted order or an exception will be thrown. - * Intervals from individual underlying streams (iterators) are 1) merged into a single ordered stream; 2) each group of - * overlapping intervals from that merged stream are merged into a single interval; each call to next() returns such - * merged interval guaranteed to have no overlaps with the previous or next interval. - * - */ -public class NwayIntervalMergingIterator implements Iterator, Iterable { - - private PriorityQueue queue = null; - private IntervalMergingRule myRule; - - public NwayIntervalMergingIterator(IntervalMergingRule rule) { - myRule = rule; - queue = new PriorityQueue(); - } - - public void add(Iterator it) { - Element e = new Element(it); - if ( ! e.isEmpty() ) queue.add(e); - } - - public Iterator iterator() { - return this; - } - - /** - * Returns true if the iteration has more elements. (In other - * words, returns true if next would return an element - * rather than throwing an exception.) - * - * @return true if the iterator has more elements. - */ - public boolean hasNext() { - return ! queue.isEmpty(); //To change body of implemented methods use File | Settings | File Templates. - } - - /** - * Returns the next element in the iteration. - * - * @return the next element in the iteration. - * @throws java.util.NoSuchElementException - * iteration has no more elements. - */ - public GenomeLoc next() { - Element e = queue.poll(); - GenomeLoc result = e.current; - - // advance element (i.e. its underlying iterator) and reinsert into the queue - e.advance(); - if ( ! e.isEmpty() ) queue.add(e); - - while ( ! 
queue.isEmpty () ) { - e = queue.peek(); - - if (result.overlapsP(e.current) || myRule == IntervalMergingRule.ALL && result.contiguousP(e.current)) { - // we need to merge: - result = result.merge(e.current); - - // remove current head of the queue that we just merged into the result: - e = queue.poll(); - // advance element we just merged into the result and reinsert it into the queue (if it has any data left): - e.advance(); - if ( ! e.isEmpty() ) queue.add(e); - - } else { - // next element does not overlap with current result; we are done: return the result and that - // next element will wait for next call to next() - break; - } - - } - return result; //To change body of implemented methods use File | Settings | File Templates. - } - - /** - * Removes from the underlying collection the last element returned by the - * iterator (optional operation). This method can be called only once per - * call to next. The behavior of an iterator is unspecified if - * the underlying collection is modified while the iteration is in - * progress in any way other than by calling this method. - * - * @throws UnsupportedOperationException if the remove - * operation is not supported by this Iterator. - * @throws IllegalStateException if the next method has not - * yet been called, or the remove method has already - * been called after the last call to the next - * method. 
- */ - public void remove() { - throw new UnsupportedOperationException("remove() method not supported by this iterator"); - } - - private class Element implements Comparable { - private Iterator it; - private GenomeLoc current = null; - - private void advance() { - if ( it.hasNext() ) { - GenomeLoc next = it.next(); - if ( next.isBefore(current) ) { - throw new UserException("Interval list provided by underlying iterator "+it.getClass().getName() +" is out of order"); - } - current = next; - } - else current = null; - } - - public boolean isEmpty() { return current == null; } - - public Element(Iterator it) { - this.it = it; - if ( this.it.hasNext() ) current = this.it.next(); - } - - /** - * Compares this object with the specified object for order. Returns a - * negative integer, zero, or a positive integer as this object is less - * than, equal to, or greater than the specified object. - *

    - *

    The implementor must ensure sgn(x.compareTo(y)) == - * -sgn(y.compareTo(x)) for all x and y. (This - * implies that x.compareTo(y) must throw an exception iff - * y.compareTo(x) throws an exception.) - *

    - *

    The implementor must also ensure that the relation is transitive: - * (x.compareTo(y)>0 && y.compareTo(z)>0) implies - * x.compareTo(z)>0. - *

    - *

    Finally, the implementor must ensure that x.compareTo(y)==0 - * implies that sgn(x.compareTo(z)) == sgn(y.compareTo(z)), for - * all z. - *

    - *

    It is strongly recommended, but not strictly required that - * (x.compareTo(y)==0) == (x.equals(y)). Generally speaking, any - * class that implements the Comparable interface and violates - * this condition should clearly indicate this fact. The recommended - * language is "Note: this class has a natural ordering that is - * inconsistent with equals." - *

    - *

    In the foregoing description, the notation - * sgn(expression) designates the mathematical - * signum function, which is defined to return one of -1, - * 0, or 1 according to whether the value of - * expression is negative, zero or positive. - * - * @param o the object to be compared. - * @return a negative integer, zero, or a positive integer as this object - * is less than, equal to, or greater than the specified object. - * @throws ClassCastException if the specified object's type prevents it - * from being compared to this object. - */ - public int compareTo(Element o) { - if ( current == null ) return 1; - if ( o.current == null ) return -1; - return current.compareTo(o.current); //To change body of implemented methods use File | Settings | File Templates. - } - } -} diff --git a/public/java/src/org/broadinstitute/sting/utils/interval/StringToGenomeLocIteratorAdapter.java b/public/java/src/org/broadinstitute/sting/utils/interval/StringToGenomeLocIteratorAdapter.java deleted file mode 100644 index 659260345..000000000 --- a/public/java/src/org/broadinstitute/sting/utils/interval/StringToGenomeLocIteratorAdapter.java +++ /dev/null @@ -1,94 +0,0 @@ -/* - * Copyright (c) 2010 The Broad Institute - * - * Permission is hereby granted, free of charge, to any person - * obtaining a copy of this software and associated documentation - * files (the "Software"), to deal in the Software without - * restriction, including without limitation the rights to use, - * copy, modify, merge, publish, distribute, sublicense, and/or sell - * copies of the Software, and to permit persons to whom the - * Software is furnished to do so, subject to the following - * conditions: - * - * The above copyright notice and this permission notice shall be - * included in all copies or substantial portions of the Software. 
- * - * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, - * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES - * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND - * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT - * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, - * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING - * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR - * OTHER DEALINGS IN THE SOFTWARE. - */ - -package org.broadinstitute.sting.utils.interval; - -import org.broadinstitute.sting.gatk.iterators.PushbackIterator; -import org.broadinstitute.sting.utils.GenomeLoc; -import org.broadinstitute.sting.utils.GenomeLocParser; -import org.broadinstitute.sting.utils.bed.BedParser; - -import java.util.Iterator; - -/** - * Created by IntelliJ IDEA. -* User: asivache -* Date: Jun 11, 2010 -* Time: 2:25:42 PM -* To change this template use File | Settings | File Templates. -*/ - -/** - * Wrap this adapter around Iterator to get Iterator. Each string coming from the underlying - * iterator is parsed and converted to GenomeLoc on the fly and the latter is returned on each call to next(). - * This adaptor silently skips empty lines received from the underlying string iterator. - * Two string formats are currently supported: BED and GATK. This iterator will throw an exception if it fails - * to parse a string. 
- */ -public class StringToGenomeLocIteratorAdapter implements Iterator { - private GenomeLocParser genomeLocParser; - - private PushbackIterator it = null; - - public enum FORMAT { BED, GATK }; - - FORMAT myFormat = FORMAT.GATK; - - public StringToGenomeLocIteratorAdapter(GenomeLocParser genomeLocParser,Iterator it, FORMAT format) { - this.genomeLocParser = genomeLocParser; - this.it = new PushbackIterator(it); - myFormat = format; - } - - public StringToGenomeLocIteratorAdapter(GenomeLocParser genomeLocParser,Iterator it ) { - this(genomeLocParser,it,FORMAT.GATK); - } - - public boolean hasNext() { - String s = null; - boolean success = false; - - // skip empty lines: - while ( it.hasNext() ) { - s = it.next(); - if ( s.length() != 0 && ! s.matches("^\\s+$")) { - success = true; - it.pushback(s); - break; - } - } - return success; - } - - public GenomeLoc next() { - - if ( myFormat == FORMAT.GATK ) return genomeLocParser.parseGenomeLoc(it.next()); - return BedParser.parseLocation( genomeLocParser,it.next() ); - } - - public void remove() { - throw new UnsupportedOperationException("method 'remove' is not supported by this iterator"); - } -} diff --git a/public/java/src/org/broadinstitute/sting/utils/io/FileExtension.java b/public/java/src/org/broadinstitute/sting/utils/io/FileExtension.java new file mode 100644 index 000000000..cd69ee126 --- /dev/null +++ b/public/java/src/org/broadinstitute/sting/utils/io/FileExtension.java @@ -0,0 +1,36 @@ +/* + * Copyright (c) 2011, The Broad Institute + * + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The 
above copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * OTHER DEALINGS IN THE SOFTWARE. + */ + +package org.broadinstitute.sting.utils.io; + +import java.io.File; + +public interface FileExtension { + /** + * Returns a clone of the FileExtension with a new path. + * @param path New path. + * @return New FileExtension + */ + public File withPath(String path); +} diff --git a/public/java/src/org/broadinstitute/sting/utils/io/HardThresholdingOutputStream.java b/public/java/src/org/broadinstitute/sting/utils/io/HardThresholdingOutputStream.java new file mode 100755 index 000000000..26b5ae6fd --- /dev/null +++ b/public/java/src/org/broadinstitute/sting/utils/io/HardThresholdingOutputStream.java @@ -0,0 +1,54 @@ +/* + * Copyright (c) 2011, The Broad Institute + * + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The above copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. 
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * OTHER DEALINGS IN THE SOFTWARE. + */ +package org.broadinstitute.sting.utils.io; + +import org.apache.commons.io.output.ThresholdingOutputStream; + +import java.io.IOException; + +/** + * An output stream which stops at the threshold + * instead of potentially triggering early. + */ +public abstract class HardThresholdingOutputStream extends ThresholdingOutputStream { + protected HardThresholdingOutputStream(int threshold) { + super(threshold); + } + + @Override + public void write(byte[] b) throws IOException { + write(b, 0, b.length); + } + + @Override + public void write(byte[] b, int off, int len) throws IOException { + int remaining = this.getThreshold() - (int)this.getByteCount(); + if (!isThresholdExceeded() && len > remaining) { + super.write(b, off, remaining); + super.write(b, off + remaining, len - remaining); + } else { + super.write(b, off, len); + } + } +} diff --git a/public/java/src/org/broadinstitute/sting/utils/io/IOUtils.java b/public/java/src/org/broadinstitute/sting/utils/io/IOUtils.java new file mode 100644 index 000000000..94c2d4c0b --- /dev/null +++ b/public/java/src/org/broadinstitute/sting/utils/io/IOUtils.java @@ -0,0 +1,365 @@ +/* + * Copyright (c) 2011, The Broad Institute + * + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, 
and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The above copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * OTHER DEALINGS IN THE SOFTWARE. + */ + +package org.broadinstitute.sting.utils.io; + +import org.apache.commons.io.FileUtils; +import org.apache.commons.io.FilenameUtils; +import org.apache.commons.io.LineIterator; +import org.apache.commons.lang.StringUtils; +import org.apache.log4j.Logger; +import org.broadinstitute.sting.utils.exceptions.StingException; +import org.broadinstitute.sting.utils.exceptions.UserException; + +import java.io.*; +import java.util.*; + +public class IOUtils { + private static Logger logger = Logger.getLogger(IOUtils.class); + + /** + * Checks if the temp directory has been setup and throws an exception if they user hasn't set it correctly. + * + * @param tempDir Temporary directory. + */ + public static void checkTempDir(File tempDir) { + String tempDirPath = tempDir.getAbsolutePath(); + // Keeps the user from leaving the temp directory as the default, and on Macs from having pluses + // in the path which can cause problems with the Google Reflections library. 
+ // see also: http://benjchristensen.com/2009/09/22/mac-osx-10-6-java-java-io-tmpdir/ + if (tempDirPath.startsWith("/var/folders/") || (tempDirPath.equals("/tmp")) || (tempDirPath.equals("/tmp/"))) + throw new UserException.BadTmpDir("java.io.tmpdir must be explicitly set"); + if (!tempDir.exists() && !tempDir.mkdirs()) + throw new UserException.BadTmpDir("Could not create directory: " + tempDir.getAbsolutePath()); + } + + /** + * Creates a temp directory with the prefix and optional suffix. + * + * @param prefix Prefix for the directory name. + * @param suffix Optional suffix for the directory name. + * @return The created temporary directory. + */ + public static File tempDir(String prefix, String suffix) { + return tempDir(prefix, suffix, null); + } + + /** + * Creates a temp directory with the prefix and optional suffix. + * + * @param prefix Prefix for the directory name. + * @param suffix Optional suffix for the directory name. + * @param tempDirParent Parent directory for the temp directory. + * @return The created temporary directory. + */ + public static File tempDir(String prefix, String suffix, File tempDirParent) { + try { + if (tempDirParent == null) + tempDirParent = FileUtils.getTempDirectory(); + if (!tempDirParent.exists() && !tempDirParent.mkdirs()) + throw new UserException.BadTmpDir("Could not create temp directory: " + tempDirParent); + File temp = File.createTempFile(prefix + "-", suffix, tempDirParent); + if (!temp.delete()) + throw new UserException.BadTmpDir("Could not delete sub file: " + temp.getAbsolutePath()); + if (!temp.mkdir()) + throw new UserException.BadTmpDir("Could not create sub directory: " + temp.getAbsolutePath()); + return absolute(temp); + } catch (IOException e) { + throw new UserException.BadTmpDir(e.getMessage()); + } + } + + /** + * Writes content to a temp file and returns the path to the temporary file. + * + * @param content to write. + * @param prefix Prefix for the temp file. 
+ * @param suffix Suffix for the temp file. + * @return the path to the temp file. + */ + public static File writeTempFile(String content, String prefix, String suffix) { + return writeTempFile(content, prefix, suffix, null); + } + + /** + * Writes content to a temp file and returns the path to the temporary file. + * + * @param content to write. + * @param prefix Prefix for the temp file. + * @param suffix Suffix for the temp file. + * @param directory Directory for the temp file. + * @return the path to the temp file. + */ + public static File writeTempFile(String content, String prefix, String suffix, File directory) { + try { + File tempFile = absolute(File.createTempFile(prefix, suffix, directory)); + FileUtils.writeStringToFile(tempFile, content); + return tempFile; + } catch (IOException e) { + throw new UserException.BadTmpDir(e.getMessage()); + } + } + + /** + * Waits for NFS to propagate a file creation, imposing a timeout. + * + * Based on Apache Commons IO FileUtils.waitFor() + * + * @param file The file to wait for. + * @param seconds The maximum time in seconds to wait. + * @return true if the file exists + */ + public static boolean waitFor(File file, int seconds) { + return waitFor(Collections.singletonList(file), seconds).isEmpty(); + } + + /** + * Waits for NFS to propagate a file creation, imposing a timeout. + * + * Based on Apache Commons IO FileUtils.waitFor() + * + * @param files The list of files to wait for. + * @param seconds The maximum time in seconds to wait. + * @return Files that still do not exists at the end of the timeout, or a empty list if all files exists. 
+ */ + public static List waitFor(Collection files, int seconds) { + long timeout = 0; + long tick = 0; + List missingFiles = new ArrayList(); + for (File file : files) + if (!file.exists()) + missingFiles.add(file); + + while (!missingFiles.isEmpty() && timeout <= seconds) { + if (tick >= 10) { + tick = 0; + timeout++; + } + tick++; + try { + Thread.sleep(100); + } catch (InterruptedException ignore) { + } + List newMissingFiles = new ArrayList(); + for (File file : missingFiles) + if (!file.exists()) + newMissingFiles.add(file); + missingFiles = newMissingFiles; + } + return missingFiles; + } + + /** + * Returns the directory at the number of levels deep. + * For example 2 levels of /path/to/dir will return /path/to + * + * @param dir Directory path. + * @param level how many levels deep from the root. + * @return The path to the parent directory that is level-levels deep. + */ + public static File dirLevel(File dir, int level) { + List directories = new ArrayList(); + File parentDir = absolute(dir); + while (parentDir != null) { + directories.add(0, parentDir); + parentDir = parentDir.getParentFile(); + } + if (directories.size() <= level) + return directories.get(directories.size() - 1); + else + return directories.get(level); + } + + /** + * Returns the sub path rooted at the parent. + * + * @param parent The parent directory. + * @param path The sub path to append to the parent, if the path is not absolute. + * @return The absolute path to the file in the parent dir if the path was not absolute, otherwise the original path. + */ + public static File absolute(File parent, String path) { + return absolute(parent, new File(path)); + } + + /** + * Returns the sub path rooted at the parent. + * + * @param parent The parent directory. + * @param file The sub path to append to the parent, if the path is not absolute. + * @return The absolute path to the file in the parent dir if the path was not absolute, otherwise the original path. 
+ */ + public static File absolute(File parent, File file) { + String newPath; + if (file.isAbsolute()) + newPath = absolutePath(file); + else + newPath = absolutePath(new File(parent, file.getPath())); + return replacePath(file, newPath); + } + + /** + * A mix of getCanonicalFile and getAbsoluteFile that returns the + * absolute path to the file without deferencing symbolic links. + * + * @param file the file. + * @return the absolute path to the file. + */ + public static File absolute(File file) { + return replacePath(file, absolutePath(file)); + } + + private static String absolutePath(File file) { + File fileAbs = file.getAbsoluteFile(); + LinkedList names = new LinkedList(); + while (fileAbs != null) { + String name = fileAbs.getName(); + fileAbs = fileAbs.getParentFile(); + + if (".".equals(name)) { + /* skip */ + + /* TODO: What do we do for ".."? + } else if (name == "..") { + + CentOS tcsh says use getCanonicalFile: + ~ $ mkdir -p test1/test2 + ~ $ ln -s test1/test2 test3 + ~ $ cd test3/.. + ~/test1 $ + + Mac bash says keep going with getAbsoluteFile: + ~ $ mkdir -p test1/test2 + ~ $ ln -s test1/test2 test3 + ~ $ cd test3/.. + ~ $ + + For now, leave it and let the shell figure it out. + */ + } else { + names.add(0, name); + } + } + + return ("/" + StringUtils.join(names, "/")); + } + + private static File replacePath(File file, String path) { + if (file instanceof FileExtension) + return ((FileExtension)file).withPath(path); + if (!File.class.equals(file.getClass())) + throw new StingException("Sub classes of java.io.File must also implement FileExtension"); + return new File(path); + } + + /** + * Returns the last lines of the file. + * NOTE: This is only safe to run on smaller files! + * + * @param file File to read. + * @param count Maximum number of lines to return. + * @return The last count lines from file. + * @throws IOException When unable to read the file. 
+ */ + public static List tail(File file, int count) throws IOException { + LinkedList tailLines = new LinkedList(); + FileReader reader = new FileReader(file); + try { + LineIterator iterator = org.apache.commons.io.IOUtils.lineIterator(reader); + int lineCount = 0; + while (iterator.hasNext()) { + String line = iterator.nextLine(); + lineCount++; + if (lineCount > count) + tailLines.removeFirst(); + tailLines.offer(line); + } + } finally { + org.apache.commons.io.IOUtils.closeQuietly(reader); + } + return tailLines; + } + + /** + * Tries to delete a file. Emits a warning if the file was unable to be deleted. + * + * @param file File to delete. + * @return true if the file was deleted. + */ + public static boolean tryDelete(File file) { + boolean deleted = FileUtils.deleteQuietly(file); + if (deleted) + logger.debug("Deleted " + file); + else if (file.exists()) + logger.warn("Unable to delete " + file); + return deleted; + } + + /** + * Writes the an embedded resource to a temp file. + * File is not scheduled for deletion and must be cleaned up by the caller. + * @param resource Embedded resource. + * @return Path to the temp file with the contents of the resource. + */ + public static File writeTempResource(Resource resource) { + File temp; + try { + temp = File.createTempFile(FilenameUtils.getBaseName(resource.getPath()) + ".", "." + FilenameUtils.getExtension(resource.getPath())); + } catch (IOException e) { + throw new UserException.BadTmpDir(e.getMessage()); + } + writeResource(resource, temp); + return temp; + } + + /** + * Writes the an embedded resource to a file. + * File is not scheduled for deletion and must be cleaned up by the caller. + * @param resource Embedded resource. + * @param file File path to write. 
+ */ + public static void writeResource(Resource resource, File file) { + String path = resource.getPath(); + Class clazz = resource.getRelativeClass(); + InputStream inputStream = null; + OutputStream outputStream = null; + try { + if (clazz == null) { + inputStream = ClassLoader.getSystemResourceAsStream(path); + if (inputStream == null) + throw new IllegalArgumentException("Resource not found: " + path); + } else { + inputStream = clazz.getResourceAsStream(path); + if (inputStream == null) + throw new IllegalArgumentException("Resource not found relative to " + clazz + ": " + path); + } + outputStream = FileUtils.openOutputStream(file); + org.apache.commons.io.IOUtils.copy(inputStream, outputStream); + } catch (IOException e) { + throw new StingException(String.format("Unable to copy resource '%s' to '%s'", path, file), e); + } finally { + org.apache.commons.io.IOUtils.closeQuietly(inputStream); + org.apache.commons.io.IOUtils.closeQuietly(outputStream); + } + } +} diff --git a/public/java/src/org/broadinstitute/sting/utils/io/Resource.java b/public/java/src/org/broadinstitute/sting/utils/io/Resource.java new file mode 100644 index 000000000..895fb9731 --- /dev/null +++ b/public/java/src/org/broadinstitute/sting/utils/io/Resource.java @@ -0,0 +1,66 @@ +/* + * Copyright (c) 2011, The Broad Institute + * + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The above copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. 
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * OTHER DEALINGS IN THE SOFTWARE. + */ + +package org.broadinstitute.sting.utils.io; + +import java.io.File; + +/** + * Stores a resource by path and a relative class. + */ +public class Resource { + private final String path; + private final Class relativeClass; + + /** + * Create a resource with a path and a relative class. + * @param path Relative or absolute path to the class. + * @param relativeClass Relative class to use as a class loader and for a relative package. + * + * If the relative class is null then the system classloader will be used and the path must be absolute. 
+ */ + public Resource(String path, Class relativeClass) { + this.path = path; + this.relativeClass = relativeClass; + } + + public Class getRelativeClass() { + return relativeClass; + } + + public String getPath() { + return path; + } + + public String getFullPath() { + if (relativeClass == null) + return path; + if (new File(path).isAbsolute()) + return path; + return String.format("%s%s%s", + relativeClass.getPackage().getName().replace('.', File.separatorChar), + File.separator, + path); + } +} diff --git a/public/java/src/org/broadinstitute/sting/utils/pileup/AbstractReadBackedPileup.java b/public/java/src/org/broadinstitute/sting/utils/pileup/AbstractReadBackedPileup.java index 3821c9c8a..18051ce92 100644 --- a/public/java/src/org/broadinstitute/sting/utils/pileup/AbstractReadBackedPileup.java +++ b/public/java/src/org/broadinstitute/sting/utils/pileup/AbstractReadBackedPileup.java @@ -24,13 +24,13 @@ package org.broadinstitute.sting.utils.pileup; -import net.sf.samtools.SAMRecord; import org.broadinstitute.sting.gatk.GenomeAnalysisEngine; -import org.broadinstitute.sting.gatk.datasources.sample.Sample; import org.broadinstitute.sting.utils.BaseUtils; import org.broadinstitute.sting.utils.GenomeLoc; import org.broadinstitute.sting.utils.exceptions.ReviewedStingException; -import org.broadinstitute.sting.utils.exceptions.StingException; +import org.broadinstitute.sting.utils.fragments.FragmentCollection; +import org.broadinstitute.sting.utils.fragments.FragmentUtils; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; import java.util.*; @@ -45,6 +45,7 @@ public abstract class AbstractReadBackedPileup pileupElementTracker; protected int size = 0; // cached value of the size of the pileup + protected int abstractSize = -1; // cached value of the abstract size of the pileup protected int nDeletions = 0; // cached value of the number of deletions protected int nMQ0Reads = 0; // cached value of the number of MQ0 reads @@ -58,12 +59,12 @@ public abstract 
class AbstractReadBackedPileup reads, List offsets ) { + public AbstractReadBackedPileup(GenomeLoc loc, List reads, List offsets ) { this.loc = loc; this.pileupElementTracker = readsOffsets2Pileup(reads,offsets); } - public AbstractReadBackedPileup(GenomeLoc loc, List reads, int offset ) { + public AbstractReadBackedPileup(GenomeLoc loc, List reads, int offset ) { this.loc = loc; this.pileupElementTracker = readsOffsets2Pileup(reads,offset); } @@ -114,10 +115,10 @@ public abstract class AbstractReadBackedPileup> pileupsBySample) { + protected AbstractReadBackedPileup(GenomeLoc loc, Map> pileupsBySample) { this.loc = loc; PerSamplePileupElementTracker tracker = new PerSamplePileupElementTracker(); - for(Map.Entry> pileupEntry: pileupsBySample.entrySet()) { + for(Map.Entry> pileupEntry: pileupsBySample.entrySet()) { tracker.addElements(pileupEntry.getKey(),pileupEntry.getValue().pileupElementTracker); addPileupToCumulativeStats(pileupEntry.getValue()); } @@ -145,8 +146,16 @@ public abstract class AbstractReadBackedPileup pileup) { - size += pileup.size(); + size += pileup.getNumberOfElements(); + abstractSize += pileup.depthOfCoverage(); nDeletions += pileup.getNumberOfDeletions(); nMQ0Reads += pileup.getNumberOfMappingQualityZeroReads(); } @@ -158,7 +167,7 @@ public abstract class AbstractReadBackedPileup readsOffsets2Pileup(List reads, List offsets ) { + private PileupElementTracker readsOffsets2Pileup(List reads, List offsets ) { if ( reads == null ) throw new ReviewedStingException("Illegal null read list in UnifiedReadBackedPileup"); if ( offsets == null ) throw new ReviewedStingException("Illegal null offsets list in UnifiedReadBackedPileup"); if ( reads.size() != offsets.size() ) throw new ReviewedStingException("Reads and offset lists have different sizes!"); @@ -178,7 +187,7 @@ public abstract class AbstractReadBackedPileup readsOffsets2Pileup(List reads, int offset ) { + private PileupElementTracker readsOffsets2Pileup(List reads, int offset ) { if ( reads 
== null ) throw new ReviewedStingException("Illegal null read list in UnifiedReadBackedPileup"); if ( offset < 0 ) throw new ReviewedStingException("Illegal offset < 0 UnifiedReadBackedPileup"); @@ -191,7 +200,7 @@ public abstract class AbstractReadBackedPileup createNewPileup(GenomeLoc loc, PileupElementTracker pileupElementTracker); - protected abstract PE createNewPileupElement(SAMRecord read, int offset); + protected abstract PE createNewPileupElement(GATKSAMRecord read, int offset); // -------------------------------------------------------- // @@ -213,7 +222,7 @@ public abstract class AbstractReadBackedPileup tracker = (PerSamplePileupElementTracker)pileupElementTracker; PerSamplePileupElementTracker filteredTracker = new PerSamplePileupElementTracker(); - for(Sample sample: tracker.getSamples()) { + for(final String sample: tracker.getSamples()) { PileupElementTracker perSampleElements = tracker.getElements(sample); AbstractReadBackedPileup pileup = createNewPileup(loc,perSampleElements).getPileupWithoutDeletions(); filteredTracker.addElements(sample,pileup.pileupElementTracker); @@ -251,7 +260,7 @@ public abstract class AbstractReadBackedPileup tracker = (PerSamplePileupElementTracker)pileupElementTracker; PerSamplePileupElementTracker filteredTracker = new PerSamplePileupElementTracker(); - for(Sample sample: tracker.getSamples()) { + for(final String sample: tracker.getSamples()) { PileupElementTracker perSampleElements = tracker.getElements(sample); AbstractReadBackedPileup pileup = createNewPileup(loc,perSampleElements).getOverlappingFragmentFilteredPileup(); filteredTracker.addElements(sample,pileup.pileupElementTracker); @@ -305,7 +314,7 @@ public abstract class AbstractReadBackedPileup tracker = (PerSamplePileupElementTracker)pileupElementTracker; PerSamplePileupElementTracker filteredTracker = new PerSamplePileupElementTracker(); - for(Sample sample: tracker.getSamples()) { + for(final String sample: tracker.getSamples()) { PileupElementTracker 
perSampleElements = tracker.getElements(sample); AbstractReadBackedPileup pileup = createNewPileup(loc,perSampleElements).getPileupWithoutMappingQualityZeroReads(); filteredTracker.addElements(sample,pileup.pileupElementTracker); @@ -334,7 +343,7 @@ public abstract class AbstractReadBackedPileup tracker = (PerSamplePileupElementTracker)pileupElementTracker; PerSamplePileupElementTracker filteredTracker = new PerSamplePileupElementTracker(); - for(Sample sample: tracker.getSamples()) { + for(final String sample: tracker.getSamples()) { PileupElementTracker perSampleElements = tracker.getElements(sample); AbstractReadBackedPileup pileup = createNewPileup(loc,perSampleElements).getPositiveStrandPileup(); filteredTracker.addElements(sample,pileup.pileupElementTracker); @@ -363,7 +372,7 @@ public abstract class AbstractReadBackedPileup tracker = (PerSamplePileupElementTracker)pileupElementTracker; PerSamplePileupElementTracker filteredTracker = new PerSamplePileupElementTracker(); - for(Sample sample: tracker.getSamples()) { + for(final String sample: tracker.getSamples()) { PileupElementTracker perSampleElements = tracker.getElements(sample); AbstractReadBackedPileup pileup = createNewPileup(loc,perSampleElements).getNegativeStrandPileup(); filteredTracker.addElements(sample,pileup.pileupElementTracker); @@ -393,7 +402,7 @@ public abstract class AbstractReadBackedPileup tracker = (PerSamplePileupElementTracker)pileupElementTracker; PerSamplePileupElementTracker filteredTracker = new PerSamplePileupElementTracker(); - for(Sample sample: tracker.getSamples()) { + for(final String sample: tracker.getSamples()) { PileupElementTracker perSampleElements = tracker.getElements(sample); AbstractReadBackedPileup pileup = createNewPileup(loc,perSampleElements).getFilteredPileup(filter); filteredTracker.addElements(sample,pileup.pileupElementTracker); @@ -425,7 +434,7 @@ public abstract class AbstractReadBackedPileup tracker = (PerSamplePileupElementTracker)pileupElementTracker; 
PerSamplePileupElementTracker filteredTracker = new PerSamplePileupElementTracker(); - for(Sample sample: tracker.getSamples()) { + for(final String sample: tracker.getSamples()) { PileupElementTracker perSampleElements = tracker.getElements(sample); AbstractReadBackedPileup pileup = createNewPileup(loc,perSampleElements).getBaseAndMappingFilteredPileup(minBaseQ,minMapQ); filteredTracker.addElements(sample,pileup.pileupElementTracker); @@ -492,7 +501,7 @@ public abstract class AbstractReadBackedPileup tracker = (PerSamplePileupElementTracker)pileupElementTracker; PerSamplePileupElementTracker filteredTracker = new PerSamplePileupElementTracker(); - for(Sample sample: tracker.getSamples()) { + for(final String sample: tracker.getSamples()) { PileupElementTracker perSampleElements = tracker.getElements(sample); AbstractReadBackedPileup pileup = createNewPileup(loc,perSampleElements).getPileupForReadGroup(targetReadGroupId); if(pileup != null) @@ -503,7 +512,7 @@ public abstract class AbstractReadBackedPileup filteredTracker = new UnifiedPileupElementTracker(); for(PE p: pileupElementTracker) { - SAMRecord read = p.getRead(); + GATKSAMRecord read = p.getRead(); if(targetReadGroupId != null) { if(read.getReadGroup() != null && targetReadGroupId.equals(read.getReadGroup().getReadGroupId())) filteredTracker.add(p); @@ -523,7 +532,7 @@ public abstract class AbstractReadBackedPileup tracker = (PerSamplePileupElementTracker)pileupElementTracker; PerSamplePileupElementTracker filteredTracker = new PerSamplePileupElementTracker(); - for(Sample sample: tracker.getSamples()) { + for(final String sample: tracker.getSamples()) { PileupElementTracker perSampleElements = tracker.getElements(sample); AbstractReadBackedPileup pileup = createNewPileup(loc,perSampleElements).getPileupForLane(laneID); if(pileup != null) @@ -534,7 +543,7 @@ public abstract class AbstractReadBackedPileup filteredTracker = new UnifiedPileupElementTracker(); for(PE p: pileupElementTracker) { - SAMRecord 
read = p.getRead(); + GATKSAMRecord read = p.getRead(); if(laneID != null) { if(read.getReadGroup() != null && (read.getReadGroup().getReadGroupId().startsWith(laneID + ".")) || // lane is the same, but sample identifier is different @@ -550,19 +559,15 @@ public abstract class AbstractReadBackedPileup getSampleNames() { + public Collection getSamples() { if(pileupElementTracker instanceof PerSamplePileupElementTracker) { PerSamplePileupElementTracker tracker = (PerSamplePileupElementTracker)pileupElementTracker; - Collection sampleNames = new HashSet(); - for (Sample sample : tracker.getSamples()) { - sampleNames.add(sample.getId()); - } - return sampleNames; + return new HashSet(tracker.getSamples()); } else { Collection sampleNames = new HashSet(); for(PileupElement p: this) { - SAMRecord read = p.getRead(); + GATKSAMRecord read = p.getRead(); String sampleName = read.getReadGroup() != null ? read.getReadGroup().getSample() : null; sampleNames.add(sampleName); } @@ -570,16 +575,6 @@ public abstract class AbstractReadBackedPileup getSamples() { - if(!(pileupElementTracker instanceof PerSamplePileupElementTracker)) { - throw new StingException("Must be an instance of PerSampleElementTracker"); - } - PerSamplePileupElementTracker tracker = (PerSamplePileupElementTracker)pileupElementTracker; - return tracker.getSamples(); - } - - /** * Returns a pileup randomly downsampled to the desiredCoverage. 
* @@ -588,7 +583,7 @@ public abstract class AbstractReadBackedPileup perSampleElements = tracker.getElements(sample); List filteredPileup = new ArrayList(); @@ -639,7 +634,7 @@ public abstract class AbstractReadBackedPileup sampleNames) { + public RBP getPileupForSamples(Collection sampleNames) { if(pileupElementTracker instanceof PerSamplePileupElementTracker) { PerSamplePileupElementTracker tracker = (PerSamplePileupElementTracker)pileupElementTracker; PileupElementTracker filteredElements = tracker.getElements(sampleNames); @@ -649,7 +644,7 @@ public abstract class AbstractReadBackedPileup hashSampleNames = new HashSet(sampleNames); // to speed up the "contains" access in the for loop UnifiedPileupElementTracker filteredTracker = new UnifiedPileupElementTracker(); for(PE p: pileupElementTracker) { - SAMRecord read = p.getRead(); + GATKSAMRecord read = p.getRead(); if(sampleNames != null) { // still checking on sampleNames because hashSampleNames will never be null. And empty means something else. if(read.getReadGroup() != null && hashSampleNames.contains(read.getReadGroup().getSample())) filteredTracker.add(p); @@ -665,7 +660,7 @@ public abstract class AbstractReadBackedPileup tracker = (PerSamplePileupElementTracker)pileupElementTracker; PileupElementTracker filteredElements = tracker.getElements(sampleName); @@ -674,7 +669,7 @@ public abstract class AbstractReadBackedPileup filteredTracker = new UnifiedPileupElementTracker(); for(PE p: pileupElementTracker) { - SAMRecord read = p.getRead(); + GATKSAMRecord read = p.getRead(); if(sampleName != null) { if(read.getReadGroup() != null && sampleName.equals(read.getReadGroup().getSample())) filteredTracker.add(p); @@ -688,30 +683,6 @@ public abstract class AbstractReadBackedPileup tracker = (PerSamplePileupElementTracker)pileupElementTracker; - PileupElementTracker filteredElements = tracker.getElements(sample); - return filteredElements != null ? 
(RBP)createNewPileup(loc,filteredElements) : null; - } - else { - UnifiedPileupElementTracker filteredTracker = new UnifiedPileupElementTracker(); - for(PE p: pileupElementTracker) { - SAMRecord read = p.getRead(); - if(sample != null) { - if(read.getReadGroup() != null && sample.getId().equals(read.getReadGroup().getSample())) - filteredTracker.add(p); - } - else { - if(read.getReadGroup() == null || read.getReadGroup().getSample() == null) - filteredTracker.add(p); - } - } - return filteredTracker.size()>0 ? (RBP)createNewPileup(loc,filteredTracker) : null; - } - } - // -------------------------------------------------------- // // iterators @@ -765,13 +736,23 @@ public abstract class AbstractReadBackedPileup tracker = (PerSamplePileupElementTracker)pileupElementTracker; - for(Sample sample: tracker.getSamples()) { + for(final String sample: tracker.getSamples()) { int[] countsBySample = createNewPileup(loc,tracker.getElements(sample)).getBaseCounts(); for(int i = 0; i < counts.length; i++) counts[i] += countsBySample[i]; @@ -843,8 +824,8 @@ public abstract class AbstractReadBackedPileup getReads() { - List reads = new ArrayList(size()); + public List getReads() { + List reads = new ArrayList(getNumberOfElements()); for ( PileupElement pile : this ) { reads.add(pile.getRead()); } return reads; } @@ -855,7 +836,7 @@ public abstract class AbstractReadBackedPileup getOffsets() { - List offsets = new ArrayList(size()); + List offsets = new ArrayList(getNumberOfElements()); for ( PileupElement pile : this ) { offsets.add(pile.getOffset()); } return offsets; } @@ -866,7 +847,7 @@ public abstract class AbstractReadBackedPileup toFragments() { + return FragmentUtils.create(this); + } } + diff --git a/public/java/src/org/broadinstitute/sting/utils/pileup/ExtendedEventPileupElement.java b/public/java/src/org/broadinstitute/sting/utils/pileup/ExtendedEventPileupElement.java index 26e66014c..1e5e4d4e5 100644 --- 
a/public/java/src/org/broadinstitute/sting/utils/pileup/ExtendedEventPileupElement.java +++ b/public/java/src/org/broadinstitute/sting/utils/pileup/ExtendedEventPileupElement.java @@ -1,131 +1,132 @@ -package org.broadinstitute.sting.utils.pileup; - -import net.sf.samtools.SAMRecord; - -import java.util.Arrays; - -/** - * In the "standard" locus traversal mode, - * the traversal is performed striclty over the reference bases. Thus, only pileups of bases (and hence local events - * such as point mutations) are "seen" at every invocation of the walker's map() function at every (genomic) locus. Deletions - * are seen on the base-by-base basis (i.e. the pileup does keep the information about the current reference base being deleted - * in some reads), but the information about the extended event (deletion length, string of all deleted bases) is not kept. - * The insertions that may be present in some reads are not seen at all in such strict reference traversal mode. - * - * By convention, any extended event (indel) is mapped onto the reference at the last base prior to the event (i.e. - * last base before the insertion or deletion). If the special "extended" traversal mode is turned on and there is - * an indel in at least one read that maps onto the reference position Z, the walker's map function will be called twice: - * first call will be performed in a "standard" mode, with a pileup of bases over the position Z, and then the additional - * call will be made at the same position with a pileup of event/noevent calls, where events are extended and contain - * full information about insertions/deletions. Then the next, "standard", call to map() will be performed at the next - * (covered) reference position. Note that if the extended event at Z was a deletion, the "standard" base pileup at - * Z+1 and following bases may still contain deleted bases. However the fully extended event call will be performed - * only once, at the position where the indel maps (starts). 
- * - * This class wraps an "extended" event (indel) so that in can be added to a pileup of events at a given location. - * - * Created by IntelliJ IDEA. - * User: asivache - * Date: Dec 21, 2009 - * Time: 2:57:55 PM - * To change this template use File | Settings | File Templates. - */ -public class ExtendedEventPileupElement extends PileupElement { - public enum Type { - NOEVENT, DELETION, INSERTION - } - - private Type type = null; - private int eventLength = -1; - private String eventBases = null; // if it is a deletion, we do not have information about the actual deleted bases - // in the read itself, so we fill the string with D's; for insertions we keep actual inserted bases - private SAMRecord read; - private int offset; // position in the read immediately BEFORE the event - // This is broken! offset is always zero because these member variables are shadowed by base class - - /** Constructor for extended pileup element (indel). - * - * @param read the read, in which the indel is observed - * @param offset position in the read immediately before the indel (can be -1 if read starts with an insertion) - * @param length length of the indel (number of inserted or deleted bases); length <=0 indicates that the read has no indel (NOEVENT) - * @param eventBases inserted bases. 
null indicates that the event is a deletion; ignored if length<=0 (noevent) - */ - public ExtendedEventPileupElement( SAMRecord read, int offset, int length, byte[] eventBases ) { - super(read, offset); - this.eventLength = length; - if ( length <= 0 ) type = Type.NOEVENT; - else { - if ( eventBases != null ) { - this.eventBases = new String(eventBases).toUpperCase(); - type = Type.INSERTION; - } else { - type = Type.DELETION; - } - } - } - - /** Constructor for deletion or noevent calls - does not take event bases as an argument (as those should - * be null or are ignored in these cases anyway) - * @param read - * @param offset - * @param length - */ - public ExtendedEventPileupElement( SAMRecord read, int offset, int length ) { - this(read,offset, length, null); - } - - public boolean isDeletion() { - return type == Type.DELETION; - } - - public boolean isInsertion() { - return type == Type.INSERTION; - } - - public boolean isIndel() { - return isDeletion() || isInsertion(); - } - - public Type getType() { return type; } - - // The offset can be negative with insertions at the start of the read, but a valid base does exist at this position with - // a valid base quality. The following code attempts to compensate for that.' - - @Override - public byte getBase() { - return getBase(offset >= 0 ? offset : offset+eventLength); - } - - @Override - public int getBaseIndex() { - return getBaseIndex(offset >= 0 ? offset : offset+eventLength); - } - - @Override - public byte getQual() { - return getQual(offset >= 0 ? offset : offset+eventLength); - } - - /** Returns length of the event (number of inserted or deleted bases */ - public int getEventLength() { return eventLength; } - - /** Returns actual sequence of inserted bases, or a null if the event is a deletion or if there is no event in the associated read. 
- * */ - public String getEventBases() { return eventBases; } - - @Override - public String toString() { - char c = '.'; - String fillStr = null ; - if ( isDeletion() ) { - c = '-'; - char [] filler = new char[eventLength]; - Arrays.fill(filler, 'D'); - fillStr = new String(filler); - } - else if ( isInsertion() ) c = '+'; - return String.format("%s @ %d = %c%s MQ%d", getRead().getReadName(), getOffset(), c, isIndel()? - (isInsertion() ? eventBases : fillStr ): "", getMappingQual()); - } - -} +package org.broadinstitute.sting.utils.pileup; + +import net.sf.samtools.SAMRecord; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; + +import java.util.Arrays; + +/** + * In the "standard" locus traversal mode, + * the traversal is performed striclty over the reference bases. Thus, only pileups of bases (and hence local events + * such as point mutations) are "seen" at every invocation of the walker's map() function at every (genomic) locus. Deletions + * are seen on the base-by-base basis (i.e. the pileup does keep the information about the current reference base being deleted + * in some reads), but the information about the extended event (deletion length, string of all deleted bases) is not kept. + * The insertions that may be present in some reads are not seen at all in such strict reference traversal mode. + * + * By convention, any extended event (indel) is mapped onto the reference at the last base prior to the event (i.e. + * last base before the insertion or deletion). If the special "extended" traversal mode is turned on and there is + * an indel in at least one read that maps onto the reference position Z, the walker's map function will be called twice: + * first call will be performed in a "standard" mode, with a pileup of bases over the position Z, and then the additional + * call will be made at the same position with a pileup of event/noevent calls, where events are extended and contain + * full information about insertions/deletions. 
Then the next, "standard", call to map() will be performed at the next + * (covered) reference position. Note that if the extended event at Z was a deletion, the "standard" base pileup at + * Z+1 and following bases may still contain deleted bases. However the fully extended event call will be performed + * only once, at the position where the indel maps (starts). + * + * This class wraps an "extended" event (indel) so that in can be added to a pileup of events at a given location. + * + * Created by IntelliJ IDEA. + * User: asivache + * Date: Dec 21, 2009 + * Time: 2:57:55 PM + * To change this template use File | Settings | File Templates. + */ +public class ExtendedEventPileupElement extends PileupElement { + public enum Type { + NOEVENT, DELETION, INSERTION + } + + private Type type = null; + private int eventLength = -1; + private String eventBases = null; // if it is a deletion, we do not have information about the actual deleted bases + // in the read itself, so we fill the string with D's; for insertions we keep actual inserted bases + private SAMRecord read; + private int offset; // position in the read immediately BEFORE the event + // This is broken! offset is always zero because these member variables are shadowed by base class + + /** Constructor for extended pileup element (indel). + * + * @param read the read, in which the indel is observed + * @param offset position in the read immediately before the indel (can be -1 if read starts with an insertion) + * @param length length of the indel (number of inserted or deleted bases); length <=0 indicates that the read has no indel (NOEVENT) + * @param eventBases inserted bases. 
null indicates that the event is a deletion; ignored if length<=0 (noevent) + */ + public ExtendedEventPileupElement( GATKSAMRecord read, int offset, int length, byte[] eventBases ) { + super(read, offset); + this.eventLength = length; + if ( length <= 0 ) type = Type.NOEVENT; + else { + if ( eventBases != null ) { + this.eventBases = new String(eventBases).toUpperCase(); + type = Type.INSERTION; + } else { + type = Type.DELETION; + } + } + } + + /** Constructor for deletion or noevent calls - does not take event bases as an argument (as those should + * be null or are ignored in these cases anyway) + * @param read + * @param offset + * @param length + */ + public ExtendedEventPileupElement( GATKSAMRecord read, int offset, int length ) { + this(read,offset, length, null); + } + + public boolean isDeletion() { + return type == Type.DELETION; + } + + public boolean isInsertion() { + return type == Type.INSERTION; + } + + public boolean isIndel() { + return isDeletion() || isInsertion(); + } + + public Type getType() { return type; } + + // The offset can be negative with insertions at the start of the read, but a valid base does exist at this position with + // a valid base quality. The following code attempts to compensate for that.' + + @Override + public byte getBase() { + return getBase(offset >= 0 ? offset : offset+eventLength); + } + + @Override + public int getBaseIndex() { + return getBaseIndex(offset >= 0 ? offset : offset+eventLength); + } + + @Override + public byte getQual() { + return getQual(offset >= 0 ? offset : offset+eventLength); + } + + /** Returns length of the event (number of inserted or deleted bases */ + public int getEventLength() { return eventLength; } + + /** Returns actual sequence of inserted bases, or a null if the event is a deletion or if there is no event in the associated read. 
+ * */ + public String getEventBases() { return eventBases; } + + @Override + public String toString() { + char c = '.'; + String fillStr = null ; + if ( isDeletion() ) { + c = '-'; + char [] filler = new char[eventLength]; + Arrays.fill(filler, 'D'); + fillStr = new String(filler); + } + else if ( isInsertion() ) c = '+'; + return String.format("%s @ %d = %c%s MQ%d", getRead().getReadName(), getOffset(), c, isIndel()? + (isInsertion() ? eventBases : fillStr ): "", getMappingQual()); + } + +} diff --git a/public/java/src/org/broadinstitute/sting/utils/pileup/FragmentPileup.java b/public/java/src/org/broadinstitute/sting/utils/pileup/FragmentPileup.java deleted file mode 100644 index f7d237401..000000000 --- a/public/java/src/org/broadinstitute/sting/utils/pileup/FragmentPileup.java +++ /dev/null @@ -1,95 +0,0 @@ -package org.broadinstitute.sting.utils.pileup; - -import java.util.ArrayList; -import java.util.Collection; -import java.util.HashMap; -import java.util.Map; - -/** - * An easy to access fragment-based pileup, which contains two separate pileups. The first - * is a regular collection of PileupElements containing all of the reads in the original RBP - * that uniquely info about a fragment. The second are TwoReadPileupElements that, as the - * name suggests, contain two reads that are sequenced from the same underlying fragment. - * - * Based on the original code by E. 
Banks - * - * TODO -- technically we could generalize this code to support a pseudo-duplicate marking - * TODO -- algorithm that could collect all duplicates into a single super pileup element - * - * User: depristo - * Date: 3/26/11 - * Time: 10:09 PM - */ -public class FragmentPileup { - final Collection oneReadPile; - final Collection twoReadPile = new ArrayList(); - - /** - * Create a new Fragment-based pileup from the standard read-based pileup - * @param pileup - */ - public FragmentPileup(ReadBackedPileup pileup) { - Map nameMap = new HashMap(); - - // build an initial map, grabbing all of the multi-read fragments - for ( PileupElement p : pileup ) { - String readName = p.getRead().getReadName(); - - PileupElement pe1 = nameMap.get(readName); - if ( pe1 != null ) { - // assumes we have at most 2 reads per fragment - twoReadPile.add(new TwoReadPileupElement(pe1, p)); - nameMap.remove(readName); - } else { - nameMap.put(readName, p); - } - } - - // now set the one Read pile to the values in the nameMap with only a single read - oneReadPile = nameMap.values(); - } - - /** - * Gets the pileup elements containing two reads, in no particular order - * - * @return - */ - public Collection getTwoReadPileup() { - return twoReadPile; - } - - /** - * Gets the pileup elements containing one read, in no particular order - * - * @return - */ - public Collection getOneReadPileup() { - return oneReadPile; - } - - /** - * Useful helper class to represent a full read pair at a position - * - * User: ebanks, depristo - * Date: Jan 10, 2011 - */ - public static class TwoReadPileupElement { - final protected PileupElement PE1, PE2; - - /** - * Creates a fragment element that contains both ends of a paired end read - * @param PE1 - * @param PE2 - */ - public TwoReadPileupElement(PileupElement PE1, PileupElement PE2) { - this.PE1 = PE1; - this.PE2 = PE2; - } - - /** Returns the first pileup element -- never null */ - public PileupElement getFirst() { return PE1; } - - /** Returns 
the second read in this fragment element. May be null */ - public PileupElement getSecond() { return PE2; } - } -} diff --git a/public/java/src/org/broadinstitute/sting/utils/pileup/MergingPileupElementIterator.java b/public/java/src/org/broadinstitute/sting/utils/pileup/MergingPileupElementIterator.java index 7005cf869..c00ed24f2 100644 --- a/public/java/src/org/broadinstitute/sting/utils/pileup/MergingPileupElementIterator.java +++ b/public/java/src/org/broadinstitute/sting/utils/pileup/MergingPileupElementIterator.java @@ -25,7 +25,6 @@ package org.broadinstitute.sting.utils.pileup; import net.sf.picard.util.PeekableIterator; -import org.broadinstitute.sting.gatk.datasources.sample.Sample; import java.util.Comparator; import java.util.Iterator; @@ -42,7 +41,7 @@ class MergingPileupElementIterator implements Iterator public MergingPileupElementIterator(PerSamplePileupElementTracker tracker) { perSampleIterators = new PriorityQueue>(Math.max(1,tracker.getSamples().size()),new PileupElementIteratorComparator()); - for(Sample sample: tracker.getSamples()) { + for(final String sample: tracker.getSamples()) { PileupElementTracker trackerPerSample = tracker.getElements(sample); if(trackerPerSample.size() != 0) perSampleIterators.add(new PeekableIterator(trackerPerSample.iterator())); diff --git a/public/java/src/org/broadinstitute/sting/utils/pileup/PileupElement.java b/public/java/src/org/broadinstitute/sting/utils/pileup/PileupElement.java index 12899e898..daf6606ef 100755 --- a/public/java/src/org/broadinstitute/sting/utils/pileup/PileupElement.java +++ b/public/java/src/org/broadinstitute/sting/utils/pileup/PileupElement.java @@ -2,9 +2,8 @@ package org.broadinstitute.sting.utils.pileup; import com.google.java.contract.Ensures; import com.google.java.contract.Requires; -import net.sf.samtools.SAMRecord; import org.broadinstitute.sting.utils.BaseUtils; -import org.broadinstitute.sting.utils.sam.ReadUtils; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; /** 
* Created by IntelliJ IDEA. @@ -12,7 +11,7 @@ import org.broadinstitute.sting.utils.sam.ReadUtils; * Date: Apr 14, 2009 * Time: 8:54:05 AM */ -public class PileupElement { +public class PileupElement implements Comparable { public static final byte DELETION_BASE = BaseUtils.D; public static final byte DELETION_QUAL = (byte) 16; public static final byte A_FOLLOWED_BY_INSERTION_BASE = (byte) 87; @@ -20,14 +19,14 @@ public class PileupElement { public static final byte T_FOLLOWED_BY_INSERTION_BASE = (byte) 89; public static final byte G_FOLLOWED_BY_INSERTION_BASE = (byte) 90; - protected final SAMRecord read; + protected final GATKSAMRecord read; protected final int offset; @Requires({ "read != null", "offset >= -1", "offset <= read.getReadLength()"}) - public PileupElement( SAMRecord read, int offset ) { + public PileupElement( GATKSAMRecord read, int offset ) { this.read = read; this.offset = offset; } @@ -37,7 +36,7 @@ public class PileupElement { } @Ensures("result != null") - public SAMRecord getRead() { return read; } + public GATKSAMRecord getRead() { return read; } @Ensures("result == offset") public int getOffset() { return offset; } @@ -75,26 +74,32 @@ public class PileupElement { return isDeletion() ? 
DELETION_QUAL : read.getBaseQualities()[offset]; } + @Override + public int compareTo(final PileupElement pileupElement) { + if ( offset < pileupElement.offset ) + return -1; + else if ( offset > pileupElement.offset ) + return 1; + else if ( read.getAlignmentStart() < pileupElement.read.getAlignmentStart() ) + return -1; + else if ( read.getAlignmentStart() > pileupElement.read.getAlignmentStart() ) + return 1; + else + return 0; + } + // -------------------------------------------------------------------------- // // Reduced read accessors // // -------------------------------------------------------------------------- - private Integer getReducedReadQualityTagValue() { - return getRead().getIntegerAttribute(ReadUtils.REDUCED_READ_QUALITY_TAG); - } - public boolean isReducedRead() { - return getReducedReadQualityTagValue() != null; + return ((GATKSAMRecord)read).isReducedRead(); } - public int getReducedCount() { - return (int)getQual(); - } - - public byte getReducedQual() { - return (byte)(int)getReducedReadQualityTagValue(); + public int getRepresentativeCount() { + return isReducedRead() ? 
((GATKSAMRecord)read).getReducedCount(offset) : 1; } } \ No newline at end of file diff --git a/public/java/src/org/broadinstitute/sting/utils/pileup/PileupElementTracker.java b/public/java/src/org/broadinstitute/sting/utils/pileup/PileupElementTracker.java index 29e431695..09b907e00 100644 --- a/public/java/src/org/broadinstitute/sting/utils/pileup/PileupElementTracker.java +++ b/public/java/src/org/broadinstitute/sting/utils/pileup/PileupElementTracker.java @@ -24,8 +24,6 @@ package org.broadinstitute.sting.utils.pileup; -import org.broadinstitute.sting.gatk.datasources.sample.Sample; - import java.util.*; /** @@ -60,52 +58,35 @@ class UnifiedPileupElementTracker extends PileupElemen } class PerSamplePileupElementTracker extends PileupElementTracker { - private final Map> pileup; - private final Map sampleNames = new HashMap(); + private final Map> pileup; private int size = 0; public PerSamplePileupElementTracker() { - pileup = new HashMap>(); - } - - public PerSamplePileupElementTracker(Map> pileupsBySample) { - pileup = new HashMap>(); - for(Map.Entry> entry: pileupsBySample.entrySet()) { - Sample sample = entry.getKey(); - AbstractReadBackedPileup pileupBySample = entry.getValue(); - pileup.put(sample,pileupBySample.pileupElementTracker); - sampleNames.put(sample.getId(), sample); - } + pileup = new HashMap>(); } /** * Gets a list of all the samples stored in this pileup. * @return List of samples in this pileup. 
*/ - public Collection getSamples() { + public Collection getSamples() { return pileup.keySet(); } - public PileupElementTracker getElements(final Sample sample) { + public PileupElementTracker getElements(final String sample) { return pileup.get(sample); } - public PileupElementTracker getElements(final String sampleName) { - return pileup.get(sampleNames.get(sampleName)); - } - public PileupElementTracker getElements(final Collection selectSampleNames) { PerSamplePileupElementTracker result = new PerSamplePileupElementTracker(); - for (String sample : selectSampleNames) { - Sample sampleObject = sampleNames.get(sample); - result.addElements(sampleObject, pileup.get(sampleObject)); + for (final String sample : selectSampleNames) { + result.addElements(sample, pileup.get(sample)); } return result; } - public void addElements(final Sample sample, PileupElementTracker elements) { + public void addElements(final String sample, PileupElementTracker elements) { pileup.put(sample,elements); - sampleNames.put(sample.getId(), sample); size += elements.size(); } diff --git a/public/java/src/org/broadinstitute/sting/utils/pileup/ReadBackedExtendedEventPileup.java b/public/java/src/org/broadinstitute/sting/utils/pileup/ReadBackedExtendedEventPileup.java index 8d43a368a..3d872f9fb 100644 --- a/public/java/src/org/broadinstitute/sting/utils/pileup/ReadBackedExtendedEventPileup.java +++ b/public/java/src/org/broadinstitute/sting/utils/pileup/ReadBackedExtendedEventPileup.java @@ -25,9 +25,9 @@ package org.broadinstitute.sting.utils.pileup; import net.sf.samtools.SAMRecord; -import org.broadinstitute.sting.gatk.datasources.sample.Sample; import org.broadinstitute.sting.utils.GenomeLoc; import org.broadinstitute.sting.utils.collections.Pair; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; import java.util.Collection; import java.util.List; @@ -121,20 +121,7 @@ public interface ReadBackedExtendedEventPileup extends ReadBackedPileup { * Gets a list of all the samples 
stored in this pileup. * @return List of samples in this pileup. */ - public Collection getSampleNames(); - - /** - * Gets a list of all the samples stored in this pileup. - * @return List of samples in this pileup. - */ - public Collection getSamples(); - - /** - * Gets the particular subset of this pileup with the given sample name. - * @param sample Name of the sample to use. - * @return A subset of this pileup containing only reads with the given sample. - */ - public ReadBackedExtendedEventPileup getPileupForSample(Sample sample); + public Collection getSamples(); public Iterable toExtendedIterable(); @@ -169,7 +156,7 @@ public interface ReadBackedExtendedEventPileup extends ReadBackedPileup { /** * @return the number of elements in this pileup */ - public int size(); + public int getNumberOfElements(); /** * @return the location of this pileup @@ -180,7 +167,7 @@ public interface ReadBackedExtendedEventPileup extends ReadBackedPileup { * Returns a list of the reads in this pileup. Note this call costs O(n) and allocates fresh lists each time * @return */ - public List getReads(); + public List getReads(); /** * Returns a list of the offsets in this pileup. 
Note this call costs O(n) and allocates fresh lists each time diff --git a/public/java/src/org/broadinstitute/sting/utils/pileup/ReadBackedExtendedEventPileupImpl.java b/public/java/src/org/broadinstitute/sting/utils/pileup/ReadBackedExtendedEventPileupImpl.java index 31d29430a..43ad06352 100644 --- a/public/java/src/org/broadinstitute/sting/utils/pileup/ReadBackedExtendedEventPileupImpl.java +++ b/public/java/src/org/broadinstitute/sting/utils/pileup/ReadBackedExtendedEventPileupImpl.java @@ -23,11 +23,10 @@ */ package org.broadinstitute.sting.utils.pileup; -import net.sf.samtools.SAMRecord; -import org.broadinstitute.sting.gatk.datasources.sample.Sample; import org.broadinstitute.sting.utils.GenomeLoc; import org.broadinstitute.sting.utils.collections.Pair; import org.broadinstitute.sting.utils.exceptions.ReviewedStingException; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; import java.util.*; @@ -56,7 +55,7 @@ public class ReadBackedExtendedEventPileupImpl extends AbstractReadBackedPileup< } // this is the good new one - public ReadBackedExtendedEventPileupImpl(GenomeLoc loc, Map pileupElementsBySample) { + public ReadBackedExtendedEventPileupImpl(GenomeLoc loc, Map pileupElementsBySample) { super(loc,pileupElementsBySample); } @@ -96,7 +95,7 @@ public class ReadBackedExtendedEventPileupImpl extends AbstractReadBackedPileup< } @Override - protected ExtendedEventPileupElement createNewPileupElement(SAMRecord read, int offset) { + protected ExtendedEventPileupElement createNewPileupElement(GATKSAMRecord read, int offset) { throw new UnsupportedOperationException("Not enough information provided to create a new pileup element"); } @@ -134,7 +133,7 @@ public class ReadBackedExtendedEventPileupImpl extends AbstractReadBackedPileup< */ @Override public byte[] getEvents() { - byte[] v = new byte[size()]; + byte[] v = new byte[getNumberOfElements()]; int i = 0; for ( ExtendedEventPileupElement e : this.toExtendedIterable() ) { switch ( e.getType() ) { diff 
--git a/public/java/src/org/broadinstitute/sting/utils/pileup/ReadBackedPileup.java b/public/java/src/org/broadinstitute/sting/utils/pileup/ReadBackedPileup.java index 36b8a8c65..02767df7c 100644 --- a/public/java/src/org/broadinstitute/sting/utils/pileup/ReadBackedPileup.java +++ b/public/java/src/org/broadinstitute/sting/utils/pileup/ReadBackedPileup.java @@ -24,10 +24,10 @@ package org.broadinstitute.sting.utils.pileup; -import net.sf.samtools.SAMRecord; -import org.broadinstitute.sting.gatk.datasources.sample.Sample; import org.broadinstitute.sting.utils.GenomeLoc; import org.broadinstitute.sting.utils.HasGenomeLocation; +import org.broadinstitute.sting.utils.fragments.FragmentCollection; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; import java.util.Collection; import java.util.List; @@ -137,18 +137,11 @@ public interface ReadBackedPileup extends Iterable, HasGenomeLoca */ public ReadBackedPileup getPileupForLane(String laneID); - - /** - * Gets a collection of all the samples stored in this pileup. - * @return Collection of samples in this pileup. - */ - public Collection getSamples(); - /** * Gets a collection of *names* of all the samples stored in this pileup. * @return Collection of names */ - public Collection getSampleNames(); + public Collection getSamples(); /** @@ -156,7 +149,7 @@ public interface ReadBackedPileup extends Iterable, HasGenomeLoca * @param sampleNames Name of the sample to use. * @return A subset of this pileup containing only reads with the given sample. */ - public ReadBackedPileup getPileupForSampleNames(Collection sampleNames); + public ReadBackedPileup getPileupForSamples(Collection sampleNames); /** @@ -164,14 +157,7 @@ public interface ReadBackedPileup extends Iterable, HasGenomeLoca * @param sampleName Name of the sample to use. * @return A subset of this pileup containing only reads with the given sample. 
*/ - public ReadBackedPileup getPileupForSampleName(String sampleName); - - /** - * Gets the particular subset of this pileup with the given sample. - * @param sample Sample to use. - * @return A subset of this pileup containing only reads with the given sample. - */ - public ReadBackedPileup getPileupForSample(Sample sample); + public ReadBackedPileup getPileupForSample(String sampleName); /** * Simple useful routine to count the number of deletion bases in this pileup @@ -183,9 +169,14 @@ public interface ReadBackedPileup extends Iterable, HasGenomeLoca public int getNumberOfMappingQualityZeroReads(); /** - * @return the number of elements in this pileup + * @return the number of physical elements in this pileup (a reduced read is counted just once) */ - public int size(); + public int getNumberOfElements(); + + /** + * @return the number of abstract elements in this pileup (reduced reads are expanded to count all reads that they represent) + */ + public int depthOfCoverage(); /** * @return true if there are 0 elements in the pileup, false otherwise @@ -211,7 +202,7 @@ public interface ReadBackedPileup extends Iterable, HasGenomeLoca * Returns a list of the reads in this pileup. Note this call costs O(n) and allocates fresh lists each time * @return */ - public List getReads(); + public List getReads(); /** * Returns a list of the offsets in this pileup. 
Note this call costs O(n) and allocates fresh lists each time @@ -237,4 +228,9 @@ public interface ReadBackedPileup extends Iterable, HasGenomeLoca */ public byte[] getMappingQuals(); + /** + * Converts this pileup into a FragmentCollection (see FragmentUtils for documentation) + * @return + */ + public FragmentCollection toFragments(); } diff --git a/public/java/src/org/broadinstitute/sting/utils/pileup/ReadBackedPileupImpl.java b/public/java/src/org/broadinstitute/sting/utils/pileup/ReadBackedPileupImpl.java index e5b054961..b7445be8d 100644 --- a/public/java/src/org/broadinstitute/sting/utils/pileup/ReadBackedPileupImpl.java +++ b/public/java/src/org/broadinstitute/sting/utils/pileup/ReadBackedPileupImpl.java @@ -23,9 +23,8 @@ */ package org.broadinstitute.sting.utils.pileup; -import net.sf.samtools.SAMRecord; -import org.broadinstitute.sting.gatk.datasources.sample.Sample; import org.broadinstitute.sting.utils.GenomeLoc; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; import java.util.List; import java.util.Map; @@ -36,11 +35,11 @@ public class ReadBackedPileupImpl extends AbstractReadBackedPileup reads, List offsets ) { + public ReadBackedPileupImpl(GenomeLoc loc, List reads, List offsets ) { super(loc,reads,offsets); } - public ReadBackedPileupImpl(GenomeLoc loc, List reads, int offset ) { + public ReadBackedPileupImpl(GenomeLoc loc, List reads, int offset ) { super(loc,reads,offset); } @@ -48,7 +47,7 @@ public class ReadBackedPileupImpl extends AbstractReadBackedPileup pileupElementsBySample) { + public ReadBackedPileupImpl(GenomeLoc loc, Map pileupElementsBySample) { super(loc,pileupElementsBySample); } @@ -71,7 +70,7 @@ public class ReadBackedPileupImpl extends AbstractReadBackedPileup outputStreams = new EnumMap(StreamLocation.class); + + /** + * The byte stream to capture content or null if no output string content was requested. + */ + private final ByteArrayOutputStream bufferStream; + + /** + * True if the buffer is truncated. 
+ */ + private boolean bufferTruncated = false; + + /** + * @param settings Settings that define what to capture. + * @param processStream Stream to capture output. + * @param standardStream Stream to write debug output. + */ + public CapturedStreamOutput(OutputStreamSettings settings, InputStream processStream, PrintStream standardStream) { + this.processStream = processStream; + int bufferSize = settings.getBufferSize(); + this.bufferStream = (bufferSize < 0) ? new ByteArrayOutputStream() : new ByteArrayOutputStream(bufferSize); + + for (StreamLocation location : settings.getStreamLocations()) { + OutputStream outputStream; + switch (location) { + case Buffer: + if (bufferSize < 0) { + outputStream = this.bufferStream; + } else { + outputStream = new HardThresholdingOutputStream(bufferSize) { + @Override + protected OutputStream getStream() throws IOException { + return bufferTruncated ? NullOutputStream.NULL_OUTPUT_STREAM : bufferStream; + } + + @Override + protected void thresholdReached() throws IOException { + bufferTruncated = true; + } + }; + } + break; + case File: + try { + outputStream = new FileOutputStream(settings.getOutputFile(), settings.isAppendFile()); + } catch (IOException e) { + throw new UserException.BadInput(e.getMessage()); + } + break; + case Standard: + outputStream = standardStream; + break; + default: + throw new ReviewedStingException("Unexpected stream location: " + location); + } + this.outputStreams.put(location, outputStream); + } + } + + @Override + public byte[] getBufferBytes() { + return bufferStream.toByteArray(); + } + + @Override + public boolean isBufferTruncated() { + return bufferTruncated; + } + + /** + * Drain the input stream to keep the process from backing up until it's empty. + * File streams will be closed automatically when this method returns. + * + * @throws java.io.IOException When unable to read or write. 
+ */ + public void readAndClose() throws IOException { + try { + byte[] buf = new byte[4096]; + int readCount; + while ((readCount = processStream.read(buf)) >= 0) + for (OutputStream outputStream : this.outputStreams.values()) { + outputStream.write(buf, 0, readCount); + } + } finally { + for (StreamLocation location : this.outputStreams.keySet()) { + OutputStream outputStream = this.outputStreams.get(location); + outputStream.flush(); + if (location != StreamLocation.Standard) + IOUtils.closeQuietly(outputStream); + } + } + } +} diff --git a/public/java/src/org/broadinstitute/sting/utils/runtime/InputStreamSettings.java b/public/java/src/org/broadinstitute/sting/utils/runtime/InputStreamSettings.java new file mode 100755 index 000000000..dfa380a68 --- /dev/null +++ b/public/java/src/org/broadinstitute/sting/utils/runtime/InputStreamSettings.java @@ -0,0 +1,115 @@ +/* + * Copyright (c) 2011, The Broad Institute + * + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The above copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. 
IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * OTHER DEALINGS IN THE SOFTWARE. + */ + +package org.broadinstitute.sting.utils.runtime; + +import java.io.File; +import java.util.Collections; +import java.util.EnumSet; +import java.util.Set; + +/** + * Settings that define text to write to the process stdin. + */ +public class InputStreamSettings { + private final EnumSet streamLocations = EnumSet.noneOf(StreamLocation.class); + private byte[] inputBuffer; + private File inputFile; + + public InputStreamSettings() { + } + + /** + * @param inputBuffer String to write to stdin. + */ + public InputStreamSettings(String inputBuffer) { + setInputBuffer(inputBuffer); + } + + /** + * @param inputFile File to write to stdin. + */ + public InputStreamSettings(File inputFile) { + setInputFile(inputFile); + } + + /** + * @param inputBuffer String to write to stdin. + * @param inputFile File to write to stdin. 
+ */ + public InputStreamSettings(byte[] inputBuffer, File inputFile) { + setInputBuffer(inputBuffer); + setInputFile(inputFile); + } + + public Set getStreamLocations() { + return Collections.unmodifiableSet(streamLocations); + } + + public byte[] getInputBuffer() { + return inputBuffer; + } + + public void setInputBuffer(String inputBuffer) { + if (inputBuffer == null) + throw new IllegalArgumentException("inputBuffer cannot be null"); + this.streamLocations.add(StreamLocation.Buffer); + this.inputBuffer = inputBuffer.getBytes(); + } + + public void setInputBuffer(byte[] inputBuffer) { + if (inputBuffer == null) + throw new IllegalArgumentException("inputBuffer cannot be null"); + this.streamLocations.add(StreamLocation.Buffer); + this.inputBuffer = inputBuffer; + } + + public void clearInputBuffer() { + this.streamLocations.remove(StreamLocation.Buffer); + this.inputBuffer = null; + } + + public File getInputFile() { + return inputFile; + } + + public void setInputFile(File inputFile) { + if (inputFile == null) + throw new IllegalArgumentException("inputFile cannot be null"); + this.streamLocations.add(StreamLocation.File); + this.inputFile = inputFile; + } + + public void clearInputFile() { + this.streamLocations.remove(StreamLocation.File); + this.inputFile = null; + } + + public void setInputStandard(boolean inputStandard) { + if (inputStandard) + this.streamLocations.add(StreamLocation.Standard); + else + this.streamLocations.remove(StreamLocation.Standard); + } +} diff --git a/public/java/src/org/broadinstitute/sting/utils/runtime/OutputStreamSettings.java b/public/java/src/org/broadinstitute/sting/utils/runtime/OutputStreamSettings.java new file mode 100755 index 000000000..468ece178 --- /dev/null +++ b/public/java/src/org/broadinstitute/sting/utils/runtime/OutputStreamSettings.java @@ -0,0 +1,126 @@ +/* + * Copyright (c) 2011, The Broad Institute + * + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and 
associated documentation + * files (the "Software"), to deal in the Software without + * restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The above copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * OTHER DEALINGS IN THE SOFTWARE. + */ + +package org.broadinstitute.sting.utils.runtime; + +import java.io.File; +import java.util.Collections; +import java.util.EnumSet; +import java.util.Set; + +/** + * Settings that define text to capture from a process stream. + */ +public class OutputStreamSettings { + private final EnumSet streamLocations = EnumSet.noneOf(StreamLocation.class); + private int bufferSize; + private File outputFile; + private boolean appendFile; + + public OutputStreamSettings() { + } + + /** + * @param bufferSize The number of bytes to capture, or -1 for unlimited. + */ + public OutputStreamSettings(int bufferSize) { + setBufferSize(bufferSize); + } + + /** + * @param outputFile The file to write output to. + */ + public OutputStreamSettings(File outputFile) { + setOutputFile(outputFile); + } + + /** + * @param outputFile The file to write output to. + * @param append true if the output file should be appended to. 
+ */ + public OutputStreamSettings(File outputFile, boolean append) { + setOutputFile(outputFile, append); + } + + public OutputStreamSettings(int bufferSize, File outputFile, boolean appendFile) { + setBufferSize(bufferSize); + setOutputFile(outputFile, appendFile); + } + + public Set getStreamLocations() { + return Collections.unmodifiableSet(streamLocations); + } + + public int getBufferSize() { + return bufferSize; + } + + public void setBufferSize(int bufferSize) { + this.streamLocations.add(StreamLocation.Buffer); + this.bufferSize = bufferSize; + } + + public void clearBufferSize() { + this.streamLocations.remove(StreamLocation.Buffer); + this.bufferSize = 0; + } + + public File getOutputFile() { + return outputFile; + } + + public boolean isAppendFile() { + return appendFile; + } + + /** + * Overwrites the outputFile with the process output. + * + * @param outputFile File to overwrite. + */ + public void setOutputFile(File outputFile) { + setOutputFile(outputFile, false); + } + + public void setOutputFile(File outputFile, boolean append) { + if (outputFile == null) + throw new IllegalArgumentException("outputFile cannot be null"); + streamLocations.add(StreamLocation.File); + this.outputFile = outputFile; + this.appendFile = append; + } + + public void clearOutputFile() { + streamLocations.remove(StreamLocation.File); + this.outputFile = null; + this.appendFile = false; + } + + public void printStandard(boolean print) { + if (print) + this.streamLocations.add(StreamLocation.Standard); + else + this.streamLocations.remove(StreamLocation.Standard); + } +} diff --git a/public/java/src/org/broadinstitute/sting/utils/runtime/ProcessController.java b/public/java/src/org/broadinstitute/sting/utils/runtime/ProcessController.java new file mode 100755 index 000000000..6a3f9c753 --- /dev/null +++ b/public/java/src/org/broadinstitute/sting/utils/runtime/ProcessController.java @@ -0,0 +1,363 @@ +/* + * Copyright (c) 2011, The Broad Institute + * + * Permission is hereby 
granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The above copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * OTHER DEALINGS IN THE SOFTWARE. + */ + +package org.broadinstitute.sting.utils.runtime; + +import org.apache.commons.io.FileUtils; +import org.apache.commons.io.IOUtils; +import org.apache.commons.lang.StringUtils; +import org.apache.log4j.Logger; +import org.broadinstitute.sting.utils.exceptions.ReviewedStingException; +import org.broadinstitute.sting.utils.exceptions.UserException; + +import java.io.ByteArrayInputStream; +import java.io.IOException; +import java.io.InputStream; +import java.io.OutputStream; +import java.util.*; + +/** + * Facade to Runtime.exec() and java.lang.Process. Handles + * running a process to completion and returns stdout and stderr + * as strings. Creates separate threads for reading stdout and stderr, + * then reuses those threads for each process most efficient use is + * to create one of these and use it repeatedly. Instances are not + * thread-safe, however. 
+ * + * TODO: java.io sometimes zombies the backround threads locking up on read(). + * Supposedly NIO has better ways of interrupting a blocked stream but will + * require a little bit of refactoring. + * + * @author Michael Koehrsen + * @author Khalid Shakir + */ +public class ProcessController { + private static Logger logger = Logger.getLogger(ProcessController.class); + + private static enum ProcessStream {Stdout, Stderr} + + // Tracks running processes. + private static final Set running = Collections.synchronizedSet(new HashSet()); + + // Tracks this running process. + private Process process; + + // Threads that capture stdout and stderr + private final OutputCapture stdoutCapture; + private final OutputCapture stderrCapture; + + // When a caller destroyes a controller a new thread local version will be created + private boolean destroyed = false; + + // Communication channels with output capture threads + + // Holds the stdout and stderr sent to the background capture threads + private final Map toCapture = + new EnumMap(ProcessStream.class); + + // Holds the results of the capture from the background capture threads. + // May be the content via toCapture or an StreamOutput.EMPTY if the capture was interrupted. + private final Map fromCapture = + new EnumMap(ProcessStream.class); + + // Useful for debugging if background threads have shut down correctly + private static int nextControllerId = 0; + private final int controllerId; + + public ProcessController() { + // Start the background threads for this controller. + synchronized (running) { + controllerId = nextControllerId++; + } + stdoutCapture = new OutputCapture(ProcessStream.Stdout, controllerId); + stderrCapture = new OutputCapture(ProcessStream.Stderr, controllerId); + stdoutCapture.start(); + stderrCapture.start(); + } + + /** + * Returns a thread local ProcessController. + * Should NOT be closed when finished so it can be reused by the thread. + * + * @return a thread local ProcessController. 
+ */ + public static ProcessController getThreadLocal() { + // If the local controller was destroyed get a fresh instance. + if (threadProcessController.get().destroyed) + threadProcessController.remove(); + return threadProcessController.get(); + } + + /** + * Thread local process controller container. + */ + private static final ThreadLocal threadProcessController = + new ThreadLocal() { + @Override + protected ProcessController initialValue() { + return new ProcessController(); + } + }; + + /** + * Similar to Runtime.exec() but drains the output and error streams. + * + * @param command Command to run. + * @return The result code. + */ + public static int exec(String[] command) { + ProcessController controller = ProcessController.getThreadLocal(); + return controller.exec(new ProcessSettings(command)).getExitValue(); + } + + /** + * Executes a command line program with the settings and waits for it to return, + * processing the output on a background thread. + * + * @param settings Settings to be run. + * @return The output of the command. + */ + public ProcessOutput exec(ProcessSettings settings) { + if (destroyed) + throw new IllegalStateException("This controller was destroyed"); + + ProcessBuilder builder = new ProcessBuilder(settings.getCommand()); + builder.directory(settings.getDirectory()); + + Map settingsEnvironment = settings.getEnvironment(); + if (settingsEnvironment != null) { + Map builderEnvironment = builder.environment(); + builderEnvironment.clear(); + builderEnvironment.putAll(settingsEnvironment); + } + + builder.redirectErrorStream(settings.isRedirectErrorStream()); + + StreamOutput stdout = null; + StreamOutput stderr = null; + + // Start the process running. 
+ + try { + synchronized (toCapture) { + process = builder.start(); + } + running.add(this); + } catch (IOException e) { + throw new ReviewedStingException("Unable to start command: " + StringUtils.join(builder.command(), " ")); + } + + int exitCode; + + try { + // Notify the background threads to start capturing. + synchronized (toCapture) { + toCapture.put(ProcessStream.Stdout, + new CapturedStreamOutput(settings.getStdoutSettings(), process.getInputStream(), System.out)); + toCapture.put(ProcessStream.Stderr, + new CapturedStreamOutput(settings.getStderrSettings(), process.getErrorStream(), System.err)); + toCapture.notifyAll(); + } + + // Write stdin content + InputStreamSettings stdinSettings = settings.getStdinSettings(); + Set streamLocations = stdinSettings.getStreamLocations(); + if (!streamLocations.isEmpty()) { + try { + OutputStream stdinStream = process.getOutputStream(); + for (StreamLocation location : streamLocations) { + InputStream inputStream; + switch (location) { + case Buffer: + inputStream = new ByteArrayInputStream(stdinSettings.getInputBuffer()); + break; + case File: + try { + inputStream = FileUtils.openInputStream(stdinSettings.getInputFile()); + } catch (IOException e) { + throw new UserException.BadInput(e.getMessage()); + } + break; + case Standard: + inputStream = System.in; + break; + default: + throw new ReviewedStingException("Unexpected stream location: " + location); + } + try { + IOUtils.copy(inputStream, stdinStream); + } finally { + if (location != StreamLocation.Standard) + IOUtils.closeQuietly(inputStream); + } + } + stdinStream.flush(); + } catch (IOException e) { + throw new ReviewedStingException("Error writing to stdin on command: " + StringUtils.join(builder.command(), " "), e); + } + } + + // Wait for the process to complete. 
+ try { + process.getOutputStream().close(); + process.waitFor(); + } catch (IOException e) { + throw new ReviewedStingException("Unable to close stdin on command: " + StringUtils.join(builder.command(), " "), e); + } catch (InterruptedException e) { + throw new ReviewedStingException("Process interrupted", e); + } finally { + while (!destroyed && stdout == null || stderr == null) { + synchronized (fromCapture) { + if (fromCapture.containsKey(ProcessStream.Stdout)) + stdout = fromCapture.remove(ProcessStream.Stdout); + if (fromCapture.containsKey(ProcessStream.Stderr)) + stderr = fromCapture.remove(ProcessStream.Stderr); + try { + if (stdout == null || stderr == null) + fromCapture.wait(); + } catch (InterruptedException e) { + // Log the error, ignore the interrupt and wait patiently + // for the OutputCaptures to (via finally) return their + // stdout and stderr. + logger.error(e); + } + } + } + + if (destroyed) { + if (stdout == null) + stdout = StreamOutput.EMPTY; + if (stderr == null) + stderr = StreamOutput.EMPTY; + } + } + } finally { + synchronized (toCapture) { + exitCode = process.exitValue(); + process = null; + } + running.remove(this); + } + + return new ProcessOutput(exitCode, stdout, stderr); + } + + /** + * @return The set of still running processes. + */ + public static Set getRunning() { + synchronized (running) { + return new HashSet(running); + } + } + + /** + * Stops the process from running and tries to ensure process is cleaned up properly. + * NOTE: sub-processes started by process may be zombied with their parents set to pid 1. + * NOTE: capture threads may block on read. + * TODO: Try to use NIO to interrupt streams. 
+ */ + public void tryDestroy() { + destroyed = true; + synchronized (toCapture) { + if (process != null) { + process.destroy(); + IOUtils.closeQuietly(process.getInputStream()); + IOUtils.closeQuietly(process.getErrorStream()); + } + stdoutCapture.interrupt(); + stderrCapture.interrupt(); + toCapture.notifyAll(); + } + } + + @Override + protected void finalize() throws Throwable { + try { + tryDestroy(); + } catch (Exception e) { + logger.error(e); + } + super.finalize(); + } + + private class OutputCapture extends Thread { + private final int controllerId; + private final ProcessStream key; + + /** + * Reads in the output of a stream on a background thread to keep the output pipe from backing up and freezing the called process. + * + * @param key The stdout or stderr key for this output capture. + * @param controllerId Unique id of the controller. + */ + public OutputCapture(ProcessStream key, int controllerId) { + super(String.format("OutputCapture-%d-%s-%s-%d", controllerId, key.name().toLowerCase(), + Thread.currentThread().getName(), Thread.currentThread().getId())); + this.controllerId = controllerId; + this.key = key; + setDaemon(true); + } + + /** + * Runs the capture. + */ + @Override + public void run() { + while (!destroyed) { + StreamOutput processStream = StreamOutput.EMPTY; + try { + // Wait for a new input stream to be passed from this process controller. 
+ CapturedStreamOutput capturedProcessStream = null; + while (!destroyed && capturedProcessStream == null) { + synchronized (toCapture) { + if (toCapture.containsKey(key)) { + capturedProcessStream = toCapture.remove(key); + } else { + toCapture.wait(); + } + } + } + + if (!destroyed) { + // Read in the input stream + processStream = capturedProcessStream; + capturedProcessStream.readAndClose(); + } + } catch (InterruptedException e) { + logger.info("OutputCapture interrupted, exiting"); + break; + } catch (IOException e) { + logger.error("Error reading process output", e); + } finally { + // Send the string back to the process controller. + synchronized (fromCapture) { + fromCapture.put(key, processStream); + fromCapture.notify(); + } + } + } + } + } +} diff --git a/public/java/src/org/broadinstitute/sting/utils/runtime/ProcessOutput.java b/public/java/src/org/broadinstitute/sting/utils/runtime/ProcessOutput.java new file mode 100755 index 000000000..211008950 --- /dev/null +++ b/public/java/src/org/broadinstitute/sting/utils/runtime/ProcessOutput.java @@ -0,0 +1,56 @@ +/* + * Copyright (c) 2011, The Broad Institute + * + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The above copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. 
IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * OTHER DEALINGS IN THE SOFTWARE. + */ + +package org.broadinstitute.sting.utils.runtime; + +public class ProcessOutput { + private final int exitValue; + private final StreamOutput stdout; + private final StreamOutput stderr; + + /** + * The output of a process. + * + * @param exitValue The exit value. + * @param stdout The capture of stdout as defined by the stdout OutputStreamSettings. + * @param stderr The capture of stderr as defined by the stderr OutputStreamSettings. + */ + public ProcessOutput(int exitValue, StreamOutput stdout, StreamOutput stderr) { + this.exitValue = exitValue; + this.stdout = stdout; + this.stderr = stderr; + } + + public int getExitValue() { + return exitValue; + } + + public StreamOutput getStdout() { + return stdout; + } + + public StreamOutput getStderr() { + return stderr; + } +} diff --git a/public/java/src/org/broadinstitute/sting/utils/runtime/ProcessSettings.java b/public/java/src/org/broadinstitute/sting/utils/runtime/ProcessSettings.java new file mode 100755 index 000000000..b9f67f3a4 --- /dev/null +++ b/public/java/src/org/broadinstitute/sting/utils/runtime/ProcessSettings.java @@ -0,0 +1,140 @@ +/* + * Copyright (c) 2011, The Broad Institute + * + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The above copyright notice and this permission notice shall be + * included in 
all copies or substantial portions of the Software. + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * OTHER DEALINGS IN THE SOFTWARE. + */ + +package org.broadinstitute.sting.utils.runtime; + +import com.sun.corba.se.spi.orbutil.fsm.Input; + +import java.io.File; +import java.util.Map; + +public class ProcessSettings { + private String[] command; + private Map environment; + private File directory; + private boolean redirectErrorStream; + private InputStreamSettings stdinSettings; + private OutputStreamSettings stdoutSettings; + private OutputStreamSettings stderrSettings; + + /** + * @param command Command line to run. + */ + public ProcessSettings(String[] command) { + this(command, false, null, null, null, null, null); + } + + /** + * @param command Command line to run. + * @param redirectErrorStream true if stderr should be sent to stdout. + * @param environment Environment settings to override System.getEnv, or null to use System.getEnv. + * @param directory The directory to run the command in, or null to run in the current directory. + * @param stdinSettings Settings for writing to the process stdin. + * @param stdoutSettings Settings for capturing the process stdout. + * @param stderrSettings Setting for capturing the process stderr. 
+ */ + public ProcessSettings(String[] command, boolean redirectErrorStream, File directory, Map environment, + InputStreamSettings stdinSettings, OutputStreamSettings stdoutSettings, OutputStreamSettings stderrSettings) { + this.command = checkCommand(command); + this.redirectErrorStream = redirectErrorStream; + this.directory = directory; + this.environment = environment; + this.stdinSettings = checkSettings(stdinSettings); + this.stdoutSettings = checkSettings(stdoutSettings); + this.stderrSettings = checkSettings(stderrSettings); + } + + public String[] getCommand() { + return command; + } + + public void setCommand(String[] command) { + this.command = checkCommand(command); + } + + public boolean isRedirectErrorStream() { + return redirectErrorStream; + } + + public void setRedirectErrorStream(boolean redirectErrorStream) { + this.redirectErrorStream = redirectErrorStream; + } + + public File getDirectory() { + return directory; + } + + public void setDirectory(File directory) { + this.directory = directory; + } + + public Map getEnvironment() { + return environment; + } + + public void setEnvironment(Map environment) { + this.environment = environment; + } + + public InputStreamSettings getStdinSettings() { + return stdinSettings; + } + + public void setStdinSettings(InputStreamSettings stdinSettings) { + this.stdinSettings = checkSettings(stdinSettings); + } + + public OutputStreamSettings getStdoutSettings() { + return stdoutSettings; + } + + public void setStdoutSettings(OutputStreamSettings stdoutSettings) { + this.stdoutSettings = checkSettings(stdoutSettings); + } + + public OutputStreamSettings getStderrSettings() { + return stderrSettings; + } + + public void setStderrSettings(OutputStreamSettings stderrSettings) { + this.stderrSettings = checkSettings(stderrSettings); + } + + protected String[] checkCommand(String[] command) { + if (command == null) + throw new IllegalArgumentException("Command is not allowed to be null"); + for (String s: command) + 
if (s == null) + throw new IllegalArgumentException("Command is not allowed to contain nulls"); + return command; + } + + protected InputStreamSettings checkSettings(InputStreamSettings settings) { + return settings == null ? new InputStreamSettings() : settings; + } + + protected OutputStreamSettings checkSettings(OutputStreamSettings settings) { + return settings == null ? new OutputStreamSettings() : settings; + } +} diff --git a/public/java/src/org/broadinstitute/sting/utils/runtime/RuntimeUtils.java b/public/java/src/org/broadinstitute/sting/utils/runtime/RuntimeUtils.java new file mode 100644 index 000000000..b5b2cbee5 --- /dev/null +++ b/public/java/src/org/broadinstitute/sting/utils/runtime/RuntimeUtils.java @@ -0,0 +1,58 @@ +/* + * Copyright (c) 2011, The Broad Institute + * + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The above copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * OTHER DEALINGS IN THE SOFTWARE. 
+ */ + +package org.broadinstitute.sting.utils.runtime; + +import org.apache.commons.lang.StringUtils; + +import java.io.File; + +public class RuntimeUtils { + public static final String[] PATHS; + + static { + String path = System.getenv("PATH"); + if (path == null) + path = System.getenv("path"); + if (path == null) { + PATHS = new String[0]; + } else { + PATHS = StringUtils.split(path, File.pathSeparatorChar); + } + } + + /** + * Returns the path to an executable or null if it doesn't exist. + * @param executable Relative path + * @return The absolute file path. + */ + public static File which(String executable) { + for (String path: PATHS) { + File file = new File(path, executable); + if (file.exists()) + return file.getAbsoluteFile(); + } + return null; + } +} diff --git a/public/java/src/org/broadinstitute/sting/utils/runtime/StreamLocation.java b/public/java/src/org/broadinstitute/sting/utils/runtime/StreamLocation.java new file mode 100755 index 000000000..df72180f1 --- /dev/null +++ b/public/java/src/org/broadinstitute/sting/utils/runtime/StreamLocation.java @@ -0,0 +1,32 @@ +/* + * Copyright (c) 2011, The Broad Institute + * + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The above copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. 
IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * OTHER DEALINGS IN THE SOFTWARE. + */ + +package org.broadinstitute.sting.utils.runtime; + +/** + * Where to read/write a stream + */ +public enum StreamLocation { + Buffer, File, Standard +} diff --git a/public/java/src/org/broadinstitute/sting/utils/runtime/StreamOutput.java b/public/java/src/org/broadinstitute/sting/utils/runtime/StreamOutput.java new file mode 100755 index 000000000..5dc94815f --- /dev/null +++ b/public/java/src/org/broadinstitute/sting/utils/runtime/StreamOutput.java @@ -0,0 +1,68 @@ +/* + * Copyright (c) 2011, The Broad Institute + * + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The above copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * OTHER DEALINGS IN THE SOFTWARE. 
+ */ + +package org.broadinstitute.sting.utils.runtime; + +/** + * The content of stdout or stderr. + */ +public abstract class StreamOutput { + /** + * Empty stream output when no output is captured due to an error. + */ + public static final StreamOutput EMPTY = new StreamOutput() { + @Override + public byte[] getBufferBytes() { + return new byte[0]; + } + + @Override + public boolean isBufferTruncated() { + return false; + } + }; + + /** + * Returns the content as a string. + * + * @return The content as a string. + */ + public String getBufferString() { + return new String(getBufferBytes()); + } + + /** + * Returns the content as a string. + * + * @return The content as a string. + */ + public abstract byte[] getBufferBytes(); + + /** + * Returns true if the buffer was truncated. + * + * @return true if the buffer was truncated. + */ + public abstract boolean isBufferTruncated(); +} diff --git a/public/java/src/org/broadinstitute/sting/utils/sam/AlignmentStartWithNoTiesComparator.java b/public/java/src/org/broadinstitute/sting/utils/sam/AlignmentStartWithNoTiesComparator.java new file mode 100644 index 000000000..02512c8dc --- /dev/null +++ b/public/java/src/org/broadinstitute/sting/utils/sam/AlignmentStartWithNoTiesComparator.java @@ -0,0 +1,46 @@ +package org.broadinstitute.sting.utils.sam; + +import com.google.java.contract.Ensures; +import com.google.java.contract.Requires; +import net.sf.samtools.SAMRecord; + +import java.util.Comparator; + +public class AlignmentStartWithNoTiesComparator implements Comparator { + @Requires("c1 >= 0 && c2 >= 0") + @Ensures("result == 0 || result == 1 || result == -1") + private int compareContigs(int c1, int c2) { + if (c1 == c2) + return 0; + else if (c1 > c2) + return 1; + return -1; + } + + @Requires("r1 != null && r2 != null") + @Ensures("result == 0 || result == 1 || result == -1") + public int compare(SAMRecord r1, SAMRecord r2) { + int result; + + if (r1 == r2) + result = 0; + + else if (r1.getReadUnmappedFlag()) + 
result = 1; + else if (r2.getReadUnmappedFlag()) + result = -1; + else { + final int cmpContig = compareContigs(r1.getReferenceIndex(), r2.getReferenceIndex()); + + if (cmpContig != 0) + result = cmpContig; + + else { + if (r1.getAlignmentStart() < r2.getAlignmentStart()) result = -1; + else result = 1; + } + } + + return result; + } +} \ No newline at end of file diff --git a/public/java/src/org/broadinstitute/sting/utils/sam/ArtificialReadsTraversal.java b/public/java/src/org/broadinstitute/sting/utils/sam/ArtificialReadsTraversal.java index 5f7db458a..475f7de21 100644 --- a/public/java/src/org/broadinstitute/sting/utils/sam/ArtificialReadsTraversal.java +++ b/public/java/src/org/broadinstitute/sting/utils/sam/ArtificialReadsTraversal.java @@ -104,9 +104,9 @@ public class ArtificialReadsTraversal extends TraversalEngine createPair(SAMFileHeader header, String name, int readLen, int leftStart, int rightStart, boolean leftIsFirst, boolean leftIsNegative) { + GATKSAMRecord left = ArtificialSAMUtils.createArtificialRead(header, name, 0, leftStart, readLen); + GATKSAMRecord right = ArtificialSAMUtils.createArtificialRead(header, name, 0, rightStart, readLen); + + left.setReadPairedFlag(true); + right.setReadPairedFlag(true); + + left.setProperPairFlag(true); + right.setProperPairFlag(true); + + left.setFirstOfPairFlag(leftIsFirst); + right.setFirstOfPairFlag(! 
leftIsFirst); + + left.setReadNegativeStrandFlag(leftIsNegative); + left.setMateNegativeStrandFlag(!leftIsNegative); + right.setReadNegativeStrandFlag(!leftIsNegative); + right.setMateNegativeStrandFlag(leftIsNegative); + + left.setMateAlignmentStart(right.getAlignmentStart()); + right.setMateAlignmentStart(left.getAlignmentStart()); + + left.setMateReferenceIndex(0); + right.setMateReferenceIndex(0); + + int isize = rightStart + readLen - leftStart; + left.setInferredInsertSize(isize); + right.setInferredInsertSize(-isize); + + return Arrays.asList(left, right); + } + /** * create an iterator containing the specified read piles * @@ -255,4 +292,52 @@ public class ArtificialSAMUtils { return new ArtificialSAMQueryIterator(startingChr, endingChr, readCount, unmappedReadCount, header); } + + private final static int ranIntInclusive(Random ran, int start, int stop) { + final int range = stop - start; + return ran.nextInt(range) + start; + } + + /** + * Creates a read backed pileup containing up to pileupSize reads at refID 0 from header at loc with + * reads created that have readLen bases. Pairs are sampled from a gaussian distribution with mean insert + * size of insertSize and variation of insertSize / 10. The first read will be in the pileup, and the second + * may be, depending on where this sampled insertSize puts it. 
+ * @param header + * @param loc + * @param readLen + * @param insertSize + * @param pileupSize + * @return + */ + public static ReadBackedPileup createReadBackedPileup(final SAMFileHeader header, final GenomeLoc loc, final int readLen, final int insertSize, final int pileupSize) { + final Random ran = new Random(); + final boolean leftIsFirst = true; + final boolean leftIsNegative = false; + final int insertSizeVariation = insertSize / 10; + final int pos = loc.getStart(); + + final List pileupElements = new ArrayList(); + for ( int i = 0; i < pileupSize / 2; i++ ) { + final String readName = "read" + i; + final int leftStart = ranIntInclusive(ran, 1, pos); + final int fragmentSize = (int)(ran.nextGaussian() * insertSizeVariation + insertSize); + final int rightStart = leftStart + fragmentSize - readLen; + + if ( rightStart <= 0 ) continue; + + List pair = createPair(header, readName, readLen, leftStart, rightStart, leftIsFirst, leftIsNegative); + final GATKSAMRecord left = pair.get(0); + final GATKSAMRecord right = pair.get(1); + + pileupElements.add(new PileupElement(left, pos - leftStart)); + + if ( pos >= right.getAlignmentStart() && pos <= right.getAlignmentEnd() ) { + pileupElements.add(new PileupElement(right, pos - rightStart)); + } + } + + Collections.sort(pileupElements); + return new ReadBackedPileupImpl(loc, pileupElements); + } } diff --git a/public/java/src/org/broadinstitute/sting/utils/sam/GATKSAMReadGroupRecord.java b/public/java/src/org/broadinstitute/sting/utils/sam/GATKSAMReadGroupRecord.java index c7ffcab0c..ff7d12f09 100755 --- a/public/java/src/org/broadinstitute/sting/utils/sam/GATKSAMReadGroupRecord.java +++ b/public/java/src/org/broadinstitute/sting/utils/sam/GATKSAMReadGroupRecord.java @@ -1,6 +1,7 @@ package org.broadinstitute.sting.utils.sam; import net.sf.samtools.SAMReadGroupRecord; +import org.broadinstitute.sting.utils.NGSPlatform; /** * @author ebanks @@ -15,16 +16,28 @@ public class GATKSAMReadGroupRecord extends 
SAMReadGroupRecord { // the SAMReadGroupRecord data we're caching private String mSample = null; private String mPlatform = null; + private NGSPlatform mNGSPlatform = null; // because some values can be null, we don't want to duplicate effort private boolean retrievedSample = false; private boolean retrievedPlatform = false; + private boolean retrievedNGSPlatform = false; + public GATKSAMReadGroupRecord(final String id) { + super(id); + } public GATKSAMReadGroupRecord(SAMReadGroupRecord record) { super(record.getReadGroupId(), record); } + public GATKSAMReadGroupRecord(SAMReadGroupRecord record, NGSPlatform pl) { + super(record.getReadGroupId(), record); + setPlatform(pl.getDefaultPlatform()); + mNGSPlatform = pl; + retrievedPlatform = retrievedNGSPlatform = true; + } + /////////////////////////////////////////////////////////////////////////////// // *** The following methods are overloaded to cache the appropriate data ***// /////////////////////////////////////////////////////////////////////////////// @@ -55,5 +68,15 @@ public class GATKSAMReadGroupRecord extends SAMReadGroupRecord { super.setPlatform(s); mPlatform = s; retrievedPlatform = true; + retrievedNGSPlatform = false; // recalculate the NGSPlatform + } + + public NGSPlatform getNGSPlatform() { + if ( ! 
retrievedNGSPlatform ) { + mNGSPlatform = NGSPlatform.fromReadGroupPL(getPlatform()); + retrievedNGSPlatform = true; + } + + return mNGSPlatform; } } \ No newline at end of file diff --git a/public/java/src/org/broadinstitute/sting/utils/sam/GATKSAMRecord.java b/public/java/src/org/broadinstitute/sting/utils/sam/GATKSAMRecord.java index c55a462f1..ede75817a 100755 --- a/public/java/src/org/broadinstitute/sting/utils/sam/GATKSAMRecord.java +++ b/public/java/src/org/broadinstitute/sting/utils/sam/GATKSAMRecord.java @@ -1,49 +1,57 @@ +/* + * Copyright (c) 2011, The Broad Institute + * + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The above copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * OTHER DEALINGS IN THE SOFTWARE. 
+ */ + package org.broadinstitute.sting.utils.sam; import net.sf.samtools.*; -import org.broadinstitute.sting.utils.exceptions.ReviewedStingException; -import org.broadinstitute.sting.utils.exceptions.UserException; +import org.broadinstitute.sting.utils.NGSPlatform; -import java.lang.reflect.Method; import java.util.HashMap; -import java.util.List; import java.util.Map; /** - * @author ebanks + * @author ebanks, depristo * GATKSAMRecord * - * this class extends the samtools SAMRecord class and caches important + * this class extends the samtools BAMRecord class (and SAMRecord) and caches important * (and oft-accessed) data that's not already cached by the SAMRecord class * * IMPORTANT NOTE: Because ReadGroups are not set through the SAMRecord, * if they are ever modified externally then one must also invoke the * setReadGroup() method here to ensure that the cache is kept up-to-date. * - * 13 Oct 2010 - mhanna - this class is fundamentally flawed: it uses a decorator - * pattern to wrap a heavyweight object, which can lead - * to heinous side effects if the wrapping is not carefully - * done. Hopefully SAMRecord will become an interface and - * this will eventually be fixed. */ -public class GATKSAMRecord extends SAMRecord { - - // the underlying SAMRecord which we are wrapping - private final SAMRecord mRecord; - +public class GATKSAMRecord extends BAMRecord { + public static final String REDUCED_READ_QUALITY_TAG = "RR"; // the SAMRecord data we're caching private String mReadString = null; - private SAMReadGroupRecord mReadGroup = null; - private boolean mNegativeStrandFlag; - private boolean mUnmappedFlag; - private Boolean mSecondOfPairFlag = null; + private GATKSAMReadGroupRecord mReadGroup = null; + private byte[] reducedReadCounts = null; // because some values can be null, we don't want to duplicate effort private boolean retrievedReadGroup = false; - - /** A private cache for the reduced read quality. 
Null indicates the value hasn't be fetched yet or isn't available */ - private boolean lookedUpReducedReadQuality = false; - private Integer reducedReadQuality; + private boolean retrievedReduceReadCounts = false; // These temporary attributes were added here to make life easier for // certain algorithms by providing a way to label or attach arbitrary data to @@ -51,105 +59,112 @@ public class GATKSAMRecord extends SAMRecord { // These attributes exist in memory only, and are never written to disk. private Map temporaryAttributes; - public GATKSAMRecord(SAMRecord record, boolean useOriginalBaseQualities, byte defaultBaseQualities) { - super(null); // it doesn't matter - this isn't used - if ( record == null ) - throw new IllegalArgumentException("The SAMRecord argument cannot be null"); - mRecord = record; + /** + * HACK TO CREATE GATKSAMRECORD WITH ONLY A HEADER FOR TESTING PURPOSES ONLY + * @param header + */ + public GATKSAMRecord(final SAMFileHeader header) { + this(new SAMRecord(header)); + } - mNegativeStrandFlag = mRecord.getReadNegativeStrandFlag(); - mUnmappedFlag = mRecord.getReadUnmappedFlag(); + /** + * HACK TO CREATE GATKSAMRECORD BASED ONLY A SAMRECORD FOR TESTING PURPOSES ONLY + * @param read + */ + public GATKSAMRecord(final SAMRecord read) { + super(read.getHeader(), read.getMateReferenceIndex(), + read.getAlignmentStart(), + read.getReadName() != null ? 
(short)read.getReadNameLength() : 0, + (short)read.getMappingQuality(), + 0, + read.getCigarLength(), + read.getFlags(), + read.getReadLength(), + read.getMateReferenceIndex(), + read.getMateAlignmentStart(), + read.getInferredInsertSize(), + new byte[]{}); + super.clearAttributes(); + } - // because attribute methods are declared to be final (and we can't overload them), - // we need to actually set all of the attributes here - List attributes = record.getAttributes(); - for ( SAMTagAndValue attribute : attributes ) - setAttribute(attribute.tag, attribute.value); - - // if we are using default quals, check if we need them, and add if necessary. - // 1. we need if reads are lacking or have incomplete quality scores - // 2. we add if defaultBaseQualities has a positive value - if (defaultBaseQualities >= 0) { - byte reads [] = record.getReadBases(); - byte quals [] = record.getBaseQualities(); - if (quals == null || quals.length < reads.length) { - byte new_quals [] = new byte [reads.length]; - for (int i=0; i getAttributes() { return mRecord.getAttributes(); } - - public SAMFileHeader getHeader() { return mRecord.getHeader(); } - - public void setHeader(SAMFileHeader samFileHeader) { mRecord.setHeader(samFileHeader); } - - public byte[] getVariableBinaryRepresentation() { return mRecord.getVariableBinaryRepresentation(); } - - public int getAttributesBinarySize() { return mRecord.getAttributesBinarySize(); } - - public String format() { return mRecord.format(); } - - public List getAlignmentBlocks() { return mRecord.getAlignmentBlocks(); } - - public List validateCigar(long l) { return mRecord.validateCigar(l); } - @Override public boolean equals(Object o) { if (this == o) return true; - // note -- this forbids a GATKSAMRecord being equal to its underlying SAMRecord if (!(o instanceof GATKSAMRecord)) return false; // note that we do not consider the GATKSAMRecord internal state at all - return mRecord.equals(((GATKSAMRecord)o).mRecord); - } - - public int 
hashCode() { return mRecord.hashCode(); } - - public List isValid() { return mRecord.isValid(); } - - public Object clone() throws CloneNotSupportedException { return mRecord.clone(); } - - public String toString() { return mRecord.toString(); } - - public SAMFileSource getFileSource() { return mRecord.getFileSource(); } - - /** - * Sets a marker providing the source reader for this file and the position in the file from which the read originated. - * @param fileSource source of the given file. - */ - @Override - protected void setFileSource(final SAMFileSource fileSource) { - try { - Method method = SAMRecord.class.getDeclaredMethod("setFileSource",SAMFileSource.class); - method.setAccessible(true); - method.invoke(mRecord,fileSource); - } - catch(Exception ex) { - throw new ReviewedStingException("Unable to invoke setFileSource method",ex); - } + return super.equals(o); } } diff --git a/public/java/src/org/broadinstitute/sting/utils/sam/GATKSamRecordFactory.java b/public/java/src/org/broadinstitute/sting/utils/sam/GATKSamRecordFactory.java new file mode 100644 index 000000000..d96c874ea --- /dev/null +++ b/public/java/src/org/broadinstitute/sting/utils/sam/GATKSamRecordFactory.java @@ -0,0 +1,74 @@ +/* + * Copyright (c) 2011, The Broad Institute + * + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The above copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. 
+ * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * OTHER DEALINGS IN THE SOFTWARE. + */ + +package org.broadinstitute.sting.utils.sam; + +import net.sf.samtools.SAMFileHeader; +import net.sf.samtools.SAMRecord; +import net.sf.samtools.SAMRecordFactory; +import net.sf.samtools.BAMRecord; +import org.broadinstitute.sting.utils.exceptions.UserException; + +/** + * Factory interface implementation used to create GATKSamRecords + * from SAMFileReaders with SAM-JDK + * + * @author Mark DePristo + */ +public class GATKSamRecordFactory implements SAMRecordFactory { + + /** Create a new SAMRecord to be filled in */ + public SAMRecord createSAMRecord(SAMFileHeader header) { + throw new UserException.BadInput("The GATK now longer supports input SAM files"); + } + + /** Create a new BAM Record. 
*/ + public BAMRecord createBAMRecord(final SAMFileHeader header, + final int referenceSequenceIndex, + final int alignmentStart, + final short readNameLength, + final short mappingQuality, + final int indexingBin, + final int cigarLen, + final int flags, + final int readLen, + final int mateReferenceSequenceIndex, + final int mateAlignmentStart, + final int insertSize, + final byte[] variableLengthBlock) { + return new GATKSAMRecord(header, + referenceSequenceIndex, + alignmentStart, + readNameLength, + mappingQuality, + indexingBin, + cigarLen, + flags, + readLen, + mateReferenceSequenceIndex, + mateAlignmentStart, + insertSize, + variableLengthBlock); + } +} diff --git a/public/java/src/org/broadinstitute/sting/utils/sam/NWaySAMFileWriter.java b/public/java/src/org/broadinstitute/sting/utils/sam/NWaySAMFileWriter.java index 07bfc52c7..fa07523f3 100644 --- a/public/java/src/org/broadinstitute/sting/utils/sam/NWaySAMFileWriter.java +++ b/public/java/src/org/broadinstitute/sting/utils/sam/NWaySAMFileWriter.java @@ -25,18 +25,16 @@ package org.broadinstitute.sting.utils.sam; -import net.sf.samtools.SAMFileHeader; -import net.sf.samtools.SAMFileWriter; -import net.sf.samtools.SAMFileWriterFactory; -import net.sf.samtools.SAMRecord; +import net.sf.samtools.*; import org.broadinstitute.sting.gatk.GenomeAnalysisEngine; import org.broadinstitute.sting.gatk.datasources.reads.SAMReaderID; +import org.broadinstitute.sting.gatk.io.StingSAMFileWriter; import org.broadinstitute.sting.utils.exceptions.StingException; import org.broadinstitute.sting.utils.exceptions.UserException; +import org.broadinstitute.sting.utils.text.TextFormattingUtils; import java.io.File; -import java.util.HashMap; -import java.util.Map; +import java.util.*; /** * Created by IntelliJ IDEA. 
@@ -50,21 +48,35 @@ public class NWaySAMFileWriter implements SAMFileWriter { private Map writerMap = null; private boolean presorted ; GenomeAnalysisEngine toolkit; + boolean KEEP_ALL_PG_RECORDS = false; - public NWaySAMFileWriter(GenomeAnalysisEngine toolkit, Map in2out, SAMFileHeader.SortOrder order, boolean presorted, boolean indexOnTheFly, boolean generateMD5) { + public NWaySAMFileWriter(GenomeAnalysisEngine toolkit, Map in2out, SAMFileHeader.SortOrder order, + boolean presorted, boolean indexOnTheFly, boolean generateMD5, SAMProgramRecord pRecord, boolean keep_records) { this.presorted = presorted; this.toolkit = toolkit; + this.KEEP_ALL_PG_RECORDS = keep_records; writerMap = new HashMap(); - setupByReader(toolkit,in2out,order, presorted, indexOnTheFly, generateMD5); + setupByReader(toolkit,in2out,order, presorted, indexOnTheFly, generateMD5, pRecord); } - public NWaySAMFileWriter(GenomeAnalysisEngine toolkit, String ext, SAMFileHeader.SortOrder order, boolean presorted, boolean indexOnTheFly , boolean generateMD5) { + public NWaySAMFileWriter(GenomeAnalysisEngine toolkit, String ext, SAMFileHeader.SortOrder order, + boolean presorted, boolean indexOnTheFly , boolean generateMD5, SAMProgramRecord pRecord, boolean keep_records) { this.presorted = presorted; this.toolkit = toolkit; + this.KEEP_ALL_PG_RECORDS = keep_records; writerMap = new HashMap(); - setupByReader(toolkit,ext,order, presorted, indexOnTheFly, generateMD5); + setupByReader(toolkit,ext,order, presorted, indexOnTheFly, generateMD5, pRecord); } + public NWaySAMFileWriter(GenomeAnalysisEngine toolkit, Map in2out, SAMFileHeader.SortOrder order, + boolean presorted, boolean indexOnTheFly, boolean generateMD5) { + this(toolkit, in2out, order, presorted, indexOnTheFly, generateMD5, null,false); + } + + public NWaySAMFileWriter(GenomeAnalysisEngine toolkit, String ext, SAMFileHeader.SortOrder order, + boolean presorted, boolean indexOnTheFly , boolean generateMD5) { + this(toolkit, ext, order, 
presorted, indexOnTheFly, generateMD5, null,false); + } /** * Instantiates multiple underlying SAM writes, one per input SAM reader registered with GATK engine (those will be retrieved @@ -73,7 +85,8 @@ public class NWaySAMFileWriter implements SAMFileWriter { * @param toolkit * @param in2out */ - public void setupByReader(GenomeAnalysisEngine toolkit, Map in2out, SAMFileHeader.SortOrder order, boolean presorted, boolean indexOnTheFly, boolean generateMD5) { + public void setupByReader(GenomeAnalysisEngine toolkit, Map in2out, SAMFileHeader.SortOrder order, + boolean presorted, boolean indexOnTheFly, boolean generateMD5, SAMProgramRecord pRecord) { if ( in2out==null ) throw new StingException("input-output bam filename map for n-way-out writing is NULL"); for ( SAMReaderID rid : toolkit.getReadsDataSource().getReaderIDs() ) { @@ -85,9 +98,10 @@ public class NWaySAMFileWriter implements SAMFileWriter { outName = in2out.get(fName); if ( writerMap.containsKey( rid ) ) - throw new StingException("nWayOut mode: Reader id for input sam file "+fName+" is already registered"); + throw new StingException("nWayOut mode: Reader id for input sam file "+fName+" is already registered; "+ + "map file likely contains multiple entries for this input file"); - addWriter(rid,outName, order, presorted, indexOnTheFly, generateMD5); + addWriter(rid,outName, order, presorted, indexOnTheFly, generateMD5, pRecord); } } @@ -100,7 +114,8 @@ public class NWaySAMFileWriter implements SAMFileWriter { * @param toolkit * @param ext */ - public void setupByReader(GenomeAnalysisEngine toolkit, String ext, SAMFileHeader.SortOrder order, boolean presorted, boolean indexOnTheFly, boolean generateMD5) { + public void setupByReader(GenomeAnalysisEngine toolkit, String ext, SAMFileHeader.SortOrder order, + boolean presorted, boolean indexOnTheFly, boolean generateMD5, SAMProgramRecord pRecord) { for ( SAMReaderID rid : toolkit.getReadsDataSource().getReaderIDs() ) { String fName = 
toolkit.getReadsDataSource().getSAMFile(rid).getName(); @@ -117,16 +132,29 @@ public class NWaySAMFileWriter implements SAMFileWriter { if ( writerMap.containsKey( rid ) ) throw new StingException("nWayOut mode: Reader id for input sam file "+fName+" is already registered"); - - addWriter(rid,outName, order, presorted, indexOnTheFly, generateMD5); + addWriter(rid,outName, order, presorted, indexOnTheFly, generateMD5, pRecord); } } - private void addWriter(SAMReaderID id , String outName, SAMFileHeader.SortOrder order, boolean presorted, boolean indexOnTheFly, boolean generateMD5) { + private void addWriter(SAMReaderID id , String outName, SAMFileHeader.SortOrder order, boolean presorted, + boolean indexOnTheFly, boolean generateMD5, SAMProgramRecord programRecord) { File f = new File(outName); SAMFileHeader header = toolkit.getSAMFileHeader(id).clone(); header.setSortOrder(order); + + if ( programRecord != null ) { + // --->> add program record + List oldRecords = header.getProgramRecords(); + List newRecords = new ArrayList(oldRecords.size()+1); + for ( SAMProgramRecord record : oldRecords ) { + if ( !record.getId().startsWith(programRecord.getId()) || KEEP_ALL_PG_RECORDS ) + newRecords.add(record); + } + newRecords.add(programRecord); + header.setProgramRecords(newRecords); + // <-- add program record ends here + } SAMFileWriterFactory factory = new SAMFileWriterFactory(); factory.setCreateIndex(indexOnTheFly); factory.setCreateMd5File(generateMD5); @@ -134,7 +162,10 @@ public class NWaySAMFileWriter implements SAMFileWriter { writerMap.put(id,sw); } - + public Collection getWriters() { + return writerMap.values(); + } + public void addAlignment(SAMRecord samRecord) { final SAMReaderID id = toolkit.getReaderIDForRead(samRecord); String rg = samRecord.getStringAttribute("RG"); @@ -146,7 +177,7 @@ public class NWaySAMFileWriter implements SAMFileWriter { } public SAMFileHeader getFileHeader() { - return toolkit.getSAMFileHeader(); + return 
toolkit.getSAMFileHeader(); } public void close() { diff --git a/public/java/src/org/broadinstitute/sting/utils/sam/ReadUtils.java b/public/java/src/org/broadinstitute/sting/utils/sam/ReadUtils.java old mode 100644 new mode 100755 index 62bbb0307..e125b8c80 --- a/public/java/src/org/broadinstitute/sting/utils/sam/ReadUtils.java +++ b/public/java/src/org/broadinstitute/sting/utils/sam/ReadUtils.java @@ -43,10 +43,19 @@ import java.util.*; * @version 0.1 */ public class ReadUtils { - public static final String REDUCED_READ_QUALITY_TAG = "RQ"; - private ReadUtils() { } + // ---------------------------------------------------------------------------------------------------- + // + // Reduced read utilities + // + // ---------------------------------------------------------------------------------------------------- + + // ---------------------------------------------------------------------------------------------------- + // + // General utilities + // + // ---------------------------------------------------------------------------------------------------- public static SAMFileHeader copySAMFileHeader(SAMFileHeader toCopy) { SAMFileHeader copy = new SAMFileHeader(); @@ -118,37 +127,46 @@ public class ReadUtils { /** * This enum represents all the different ways in which a read can overlap an interval. * - * NO_OVERLAP: + * NO_OVERLAP_CONTIG: + * read and interval are in different contigs. + * + * NO_OVERLAP_LEFT: + * the read does not overlap the interval. + * + * |----------------| (interval) + * <----------------> (read) + * + * NO_OVERLAP_RIGHT: * the read does not overlap the interval. 
* * |----------------| (interval) * <----------------> (read) * - * LEFT_OVERLAP: + * OVERLAP_LEFT: * the read starts before the beginning of the interval but ends inside of it * * |----------------| (interval) * <----------------> (read) * - * RIGHT_OVERLAP: + * OVERLAP_RIGHT: * the read starts inside the interval but ends outside of it * * |----------------| (interval) * <----------------> (read) * - * FULL_OVERLAP: + * OVERLAP_LEFT_AND_RIGHT: * the read starts before the interval and ends after the interval * * |-----------| (interval) * <-------------------> (read) * - * CONTAINED: + * OVERLAP_CONTAINED: * the read starts and ends inside the interval * * |----------------| (interval) * <--------> (read) */ - public enum ReadAndIntervalOverlap {NO_OVERLAP_CONTIG, NO_OVERLAP_LEFT, NO_OVERLAP_RIGHT, OVERLAP_LEFT, OVERLAP_RIGHT, OVERLAP_LEFT_AND_RIGHT, OVERLAP_CONTAINED} + public enum ReadAndIntervalOverlap {NO_OVERLAP_CONTIG, NO_OVERLAP_LEFT, NO_OVERLAP_RIGHT, NO_OVERLAP_HARDCLIPPED_LEFT, NO_OVERLAP_HARDCLIPPED_RIGHT, OVERLAP_LEFT, OVERLAP_RIGHT, OVERLAP_LEFT_AND_RIGHT, OVERLAP_CONTAINED} /** * God, there's a huge information asymmetry in SAM format: @@ -170,15 +188,15 @@ public class ReadUtils { * This makes the following code a little nasty, since we can only detect if a base is in the adaptor, but not * if it overlaps the read. 
* - * @param rec + * @param read * @param basePos * @param adaptorLength * @return */ - public static OverlapType readPairBaseOverlapType(final SAMRecord rec, long basePos, final int adaptorLength) { + public static OverlapType readPairBaseOverlapType(final SAMRecord read, long basePos, final int adaptorLength) { OverlapType state = OverlapType.NOT_OVERLAPPING; - Pair adaptorBoundaries = getAdaptorBoundaries(rec, adaptorLength); + Pair adaptorBoundaries = getAdaptorBoundaries(read, adaptorLength); if ( adaptorBoundaries != null ) { // we're not an unmapped pair -- cannot filter out @@ -187,28 +205,28 @@ public class ReadUtils { if ( inAdapator ) { state = OverlapType.IN_ADAPTOR; //System.out.printf("baseOverlapState: %50s negStrand=%b base=%d start=%d stop=%d, adaptorStart=%d adaptorEnd=%d isize=%d => %s%n", - // rec.getReadName(), rec.getReadNegativeStrandFlag(), basePos, rec.getAlignmentStart(), rec.getAlignmentEnd(), adaptorBoundaries.first, adaptorBoundaries.second, rec.getInferredInsertSize(), state); + // read.getReadName(), read.getReadNegativeStrandFlag(), basePos, read.getAlignmentStart(), read.getAlignmentEnd(), adaptorBoundaries.first, adaptorBoundaries.second, read.getInferredInsertSize(), state); } } return state; } - private static Pair getAdaptorBoundaries(SAMRecord rec, int adaptorLength) { - int isize = rec.getInferredInsertSize(); + private static Pair getAdaptorBoundaries(SAMRecord read, int adaptorLength) { + int isize = read.getInferredInsertSize(); if ( isize == 0 ) return null; // don't worry about unmapped pairs int adaptorStart, adaptorEnd; - if ( rec.getReadNegativeStrandFlag() ) { + if ( read.getReadNegativeStrandFlag() ) { // we are on the negative strand, so our mate is on the positive strand - int mateStart = rec.getMateAlignmentStart(); + int mateStart = read.getMateAlignmentStart(); adaptorStart = mateStart - adaptorLength - 1; adaptorEnd = mateStart - 1; } else { // we are on the positive strand, so our mate is on the negative 
strand - int mateEnd = rec.getAlignmentStart() + isize - 1; + int mateEnd = read.getAlignmentStart() + isize - 1; adaptorStart = mateEnd + 1; adaptorEnd = mateEnd + adaptorLength; } @@ -218,47 +236,47 @@ public class ReadUtils { /** * - * @param rec original SAM record + * @param read original SAM record * @param adaptorLength length of adaptor sequence * @return a new read with adaptor sequence hard-clipped out or null if read is fully clipped */ - public static GATKSAMRecord hardClipAdaptorSequence(final SAMRecord rec, int adaptorLength) { + public static GATKSAMRecord hardClipAdaptorSequence(final GATKSAMRecord read, int adaptorLength) { - Pair adaptorBoundaries = getAdaptorBoundaries(rec, adaptorLength); - GATKSAMRecord result = (GATKSAMRecord)rec; + Pair adaptorBoundaries = getAdaptorBoundaries(read, adaptorLength); + GATKSAMRecord result = (GATKSAMRecord)read; if ( adaptorBoundaries != null ) { - if ( rec.getReadNegativeStrandFlag() && adaptorBoundaries.second >= rec.getAlignmentStart() && adaptorBoundaries.first < rec.getAlignmentEnd() ) - result = hardClipStartOfRead(rec, adaptorBoundaries.second); - else if ( !rec.getReadNegativeStrandFlag() && adaptorBoundaries.first <= rec.getAlignmentEnd() ) - result = hardClipEndOfRead(rec, adaptorBoundaries.first); + if ( read.getReadNegativeStrandFlag() && adaptorBoundaries.second >= read.getAlignmentStart() && adaptorBoundaries.first < read.getAlignmentEnd() ) + result = hardClipStartOfRead(read, adaptorBoundaries.second); + else if ( !read.getReadNegativeStrandFlag() && adaptorBoundaries.first <= read.getAlignmentEnd() ) + result = hardClipEndOfRead(read, adaptorBoundaries.first); } return result; } // return true if the read needs to be completely clipped - private static GATKSAMRecord hardClipStartOfRead(SAMRecord oldRec, int stopPosition) { + private static GATKSAMRecord hardClipStartOfRead(GATKSAMRecord oldRec, int stopPosition) { if ( stopPosition >= oldRec.getAlignmentEnd() ) { // BAM representation issue -- 
we can't clip away all bases in a read, just leave it alone and let the filter deal with it - //System.out.printf("Entire read needs to be clipped: %50s %n", rec.getReadName()); + //System.out.printf("Entire read needs to be clipped: %50s %n", read.getReadName()); return null; } - GATKSAMRecord rec; + GATKSAMRecord read; try { - rec = (GATKSAMRecord)oldRec.clone(); + read = (GATKSAMRecord)oldRec.clone(); } catch (Exception e) { return null; } //System.out.printf("Clipping start of read: %50s start=%d adaptorEnd=%d isize=%d %n", - // rec.getReadName(), rec.getAlignmentStart(), stopPosition, rec.getInferredInsertSize()); + // read.getReadName(), read.getAlignmentStart(), stopPosition, read.getInferredInsertSize()); - Cigar oldCigar = rec.getCigar(); + Cigar oldCigar = read.getCigar(); LinkedList newCigarElements = new LinkedList(); - int currentPos = rec.getAlignmentStart(); + int currentPos = read.getAlignmentStart(); int basesToClip = 0; int basesAlreadyClipped = 0; @@ -297,48 +315,48 @@ public class ReadUtils { } // copy over the unclipped bases - final byte[] bases = rec.getReadBases(); - final byte[] quals = rec.getBaseQualities(); + final byte[] bases = read.getReadBases(); + final byte[] quals = read.getBaseQualities(); int newLength = bases.length - basesToClip; byte[] newBases = new byte[newLength]; byte[] newQuals = new byte[newLength]; System.arraycopy(bases, basesToClip, newBases, 0, newLength); System.arraycopy(quals, basesToClip, newQuals, 0, newLength); - rec.setReadBases(newBases); - rec.setBaseQualities(newQuals); + read.setReadBases(newBases); + read.setBaseQualities(newQuals); // now add a CIGAR element for the clipped bases newCigarElements.addFirst(new CigarElement(basesToClip + basesAlreadyClipped, CigarOperator.H)); Cigar newCigar = new Cigar(newCigarElements); - rec.setCigar(newCigar); + read.setCigar(newCigar); // adjust the start accordingly - rec.setAlignmentStart(stopPosition + 1); + read.setAlignmentStart(stopPosition + 1); - return rec; 
+ return read; } - private static GATKSAMRecord hardClipEndOfRead(SAMRecord oldRec, int startPosition) { + private static GATKSAMRecord hardClipEndOfRead(GATKSAMRecord oldRec, int startPosition) { if ( startPosition <= oldRec.getAlignmentStart() ) { // BAM representation issue -- we can't clip away all bases in a read, just leave it alone and let the filter deal with it - //System.out.printf("Entire read needs to be clipped: %50s %n", rec.getReadName()); + //System.out.printf("Entire read needs to be clipped: %50s %n", read.getReadName()); return null; } - GATKSAMRecord rec; + GATKSAMRecord read; try { - rec = (GATKSAMRecord)oldRec.clone(); + read = (GATKSAMRecord)oldRec.clone(); } catch (Exception e) { return null; } //System.out.printf("Clipping end of read: %50s adaptorStart=%d end=%d isize=%d %n", - // rec.getReadName(), startPosition, rec.getAlignmentEnd(), rec.getInferredInsertSize()); + // read.getReadName(), startPosition, read.getAlignmentEnd(), read.getInferredInsertSize()); - Cigar oldCigar = rec.getCigar(); + Cigar oldCigar = read.getCigar(); LinkedList newCigarElements = new LinkedList(); - int currentPos = rec.getAlignmentStart(); + int currentPos = read.getAlignmentStart(); int basesToKeep = 0; int basesAlreadyClipped = 0; @@ -384,41 +402,41 @@ public class ReadUtils { } // copy over the unclipped bases - final byte[] bases = rec.getReadBases(); - final byte[] quals = rec.getBaseQualities(); + final byte[] bases = read.getReadBases(); + final byte[] quals = read.getBaseQualities(); byte[] newBases = new byte[basesToKeep]; byte[] newQuals = new byte[basesToKeep]; System.arraycopy(bases, 0, newBases, 0, basesToKeep); System.arraycopy(quals, 0, newQuals, 0, basesToKeep); - rec.setReadBases(newBases); - rec.setBaseQualities(newQuals); + read.setReadBases(newBases); + read.setBaseQualities(newQuals); // now add a CIGAR element for the clipped bases newCigarElements.add(new CigarElement((bases.length - basesToKeep) + basesAlreadyClipped, CigarOperator.H)); 
Cigar newCigar = new Cigar(newCigarElements); - rec.setCigar(newCigar); + read.setCigar(newCigar); // adjust the stop accordingly - // rec.setAlignmentEnd(startPosition - 1); + // read.setAlignmentEnd(startPosition - 1); - return rec; + return read; } /** * Hard clips away (i.e.g, removes from the read) bases that were previously soft clipped. * - * @param rec + * @param read * @return */ - @Requires("rec != null") + @Requires("read != null") @Ensures("result != null") - public static SAMRecord hardClipSoftClippedBases(SAMRecord rec) { - List cigarElts = rec.getCigar().getCigarElements(); + public static GATKSAMRecord hardClipSoftClippedBases(GATKSAMRecord read) { + List cigarElts = read.getCigar().getCigarElements(); if ( cigarElts.size() == 1 ) // can't be soft clipped, just return - return rec; + return read; - int keepStart = 0, keepEnd = rec.getReadLength() - 1; + int keepStart = 0, keepEnd = read.getReadLength() - 1; List newCigarElements = new LinkedList(); for ( int i = 0; i < cigarElts.size(); i++ ) { @@ -429,7 +447,7 @@ public class ReadUtils { if ( i == 0 ) keepStart = l; else - keepEnd = rec.getReadLength() - l - 1; + keepEnd = read.getReadLength() - l - 1; newCigarElements.add(new CigarElement(l, CigarOperator.HARD_CLIP)); break; @@ -459,54 +477,54 @@ public class ReadUtils { } mergedCigarElements.add(new CigarElement(currentOperatorLength, currentOperator)); - return hardClipBases(rec, keepStart, keepEnd, mergedCigarElements); + return hardClipBases(read, keepStart, keepEnd, mergedCigarElements); } /** - * Hard clips out the bases in rec, keeping the bases from keepStart to keepEnd, inclusive. Note these + * Hard clips out the bases in read, keeping the bases from keepStart to keepEnd, inclusive. 
Note these * are offsets, so they are 0 based * - * @param rec + * @param read * @param keepStart * @param keepEnd * @param newCigarElements * @return */ @Requires({ - "rec != null", + "read != null", "keepStart >= 0", - "keepEnd < rec.getReadLength()", - "rec.getReadUnmappedFlag() || newCigarElements != null"}) + "keepEnd < read.getReadLength()", + "read.getReadUnmappedFlag() || newCigarElements != null"}) @Ensures("result != null") - public static SAMRecord hardClipBases(SAMRecord rec, int keepStart, int keepEnd, List newCigarElements) { + public static GATKSAMRecord hardClipBases(GATKSAMRecord read, int keepStart, int keepEnd, List newCigarElements) { int newLength = keepEnd - keepStart + 1; - if ( newLength != rec.getReadLength() ) { + if ( newLength != read.getReadLength() ) { try { - rec = SimplifyingSAMFileWriter.simplifyRead((SAMRecord)rec.clone()); + read = (GATKSAMRecord)read.clone(); // copy over the unclipped bases - final byte[] bases = rec.getReadBases(); - final byte[] quals = rec.getBaseQualities(); + final byte[] bases = read.getReadBases(); + final byte[] quals = read.getBaseQualities(); byte[] newBases = new byte[newLength]; byte[] newQuals = new byte[newLength]; System.arraycopy(bases, keepStart, newBases, 0, newLength); System.arraycopy(quals, keepStart, newQuals, 0, newLength); - rec.setReadBases(newBases); - rec.setBaseQualities(newQuals); + read.setReadBases(newBases); + read.setBaseQualities(newQuals); // now add a CIGAR element for the clipped bases, if the read isn't unmapped - if ( ! rec.getReadUnmappedFlag() ) { + if ( ! 
read.getReadUnmappedFlag() ) { Cigar newCigar = new Cigar(newCigarElements); - rec.setCigar(newCigar); + read.setCigar(newCigar); } } catch ( CloneNotSupportedException e ) { throw new ReviewedStingException("WTF, where did clone go?", e); } } - return rec; + return read; } - public static SAMRecord replaceSoftClipsWithMatches(SAMRecord read) { + public static GATKSAMRecord replaceSoftClipsWithMatches(GATKSAMRecord read) { List newCigarElements = new ArrayList(); for ( CigarElement ce : read.getCigar().getCigarElements() ) { @@ -543,15 +561,15 @@ public class ReadUtils { /** * - * @param rec original SAM record + * @param read original SAM record * @return a new read with adaptor sequence hard-clipped out or null if read is fully clipped */ - public static GATKSAMRecord hardClipAdaptorSequence(final SAMRecord rec) { - return hardClipAdaptorSequence(rec, DEFAULT_ADAPTOR_SIZE); + public static GATKSAMRecord hardClipAdaptorSequence(final GATKSAMRecord read) { + return hardClipAdaptorSequence(read, DEFAULT_ADAPTOR_SIZE); } - public static OverlapType readPairBaseOverlapType(final SAMRecord rec, long basePos) { - return readPairBaseOverlapType(rec, basePos, DEFAULT_ADAPTOR_SIZE); + public static OverlapType readPairBaseOverlapType(final SAMRecord read, long basePos) { + return readPairBaseOverlapType(read, basePos, DEFAULT_ADAPTOR_SIZE); } public static boolean is454Read(SAMRecord read) { @@ -583,10 +601,10 @@ public class ReadUtils { readFlagNames.put(0x400, "Duplicate"); } - public static String readFlagsAsString(SAMRecord rec) { + public static String readFlagsAsString(GATKSAMRecord read) { String flags = ""; for (int flag : readFlagNames.keySet()) { - if ((rec.getFlags() & flag) != 0) { + if ((read.getFlags() & flag) != 0) { flags += readFlagNames.get(flag) + " "; } } @@ -600,7 +618,7 @@ public class ReadUtils { * @param reads * @return */ - public final static List coordinateSortReads(List reads) { + public final static List coordinateSortReads(List reads) { final 
SAMRecordComparator comparer = new SAMRecordCoordinateComparator(); Collections.sort(reads, comparer); return reads; @@ -629,37 +647,45 @@ public class ReadUtils { * @param interval the interval * @return the overlap type as described by ReadAndIntervalOverlap enum (see above) */ - public static ReadAndIntervalOverlap getReadAndIntervalOverlapType(SAMRecord read, GenomeLoc interval) { + public static ReadAndIntervalOverlap getReadAndIntervalOverlapType(GATKSAMRecord read, GenomeLoc interval) { - int start = getRefCoordSoftUnclippedStart(read); - int stop = getRefCoordSoftUnclippedEnd(read); + int sStart = getRefCoordSoftUnclippedStart(read); + int sStop = getRefCoordSoftUnclippedEnd(read); + int uStart = read.getUnclippedStart(); + int uStop = read.getUnclippedEnd(); if ( !read.getReferenceName().equals(interval.getContig()) ) return ReadAndIntervalOverlap.NO_OVERLAP_CONTIG; - else if ( stop < interval.getStart() ) + else if ( uStop < interval.getStart() ) return ReadAndIntervalOverlap.NO_OVERLAP_LEFT; - else if ( start > interval.getStop() ) + else if ( uStart > interval.getStop() ) return ReadAndIntervalOverlap.NO_OVERLAP_RIGHT; - else if ( (start >= interval.getStart()) && - (stop <= interval.getStop()) ) + else if ( sStop < interval.getStart() ) + return ReadAndIntervalOverlap.NO_OVERLAP_HARDCLIPPED_LEFT; + + else if ( sStart > interval.getStop() ) + return ReadAndIntervalOverlap.NO_OVERLAP_HARDCLIPPED_RIGHT; + + else if ( (sStart >= interval.getStart()) && + (sStop <= interval.getStop()) ) return ReadAndIntervalOverlap.OVERLAP_CONTAINED; - else if ( (start < interval.getStart()) && - (stop > interval.getStop()) ) + else if ( (sStart < interval.getStart()) && + (sStop > interval.getStop()) ) return ReadAndIntervalOverlap.OVERLAP_LEFT_AND_RIGHT; - else if ( (start < interval.getStart()) ) + else if ( (sStart < interval.getStart()) ) return ReadAndIntervalOverlap.OVERLAP_LEFT; else return ReadAndIntervalOverlap.OVERLAP_RIGHT; } - @Ensures({"result >= 
read.getUnclippedStart()", "result <= read.getUnclippedEnd()"}) - public static int getRefCoordSoftUnclippedStart(SAMRecord read) { + @Ensures({"result >= read.getUnclippedStart()", "result <= read.getUnclippedEnd() || readIsEntirelyInsertion(read)"}) + public static int getRefCoordSoftUnclippedStart(GATKSAMRecord read) { int start = read.getUnclippedStart(); for (CigarElement cigarElement : read.getCigar().getCigarElements()) { if (cigarElement.getOperator() == CigarOperator.HARD_CLIP) @@ -670,9 +696,13 @@ public class ReadUtils { return start; } - @Ensures({"result >= read.getUnclippedStart()", "result <= read.getUnclippedEnd()"}) - public static int getRefCoordSoftUnclippedEnd(SAMRecord read) { + @Ensures({"result >= read.getUnclippedStart()", "result <= read.getUnclippedEnd() || readIsEntirelyInsertion(read)"}) + public static int getRefCoordSoftUnclippedEnd(GATKSAMRecord read) { int stop = read.getUnclippedStart(); + + if (readIsEntirelyInsertion(read)) + return stop; + int shift = 0; CigarOperator lastOperator = null; for (CigarElement cigarElement : read.getCigar().getCigarElements()) { @@ -686,85 +716,198 @@ public class ReadUtils { return (lastOperator == CigarOperator.HARD_CLIP) ? stop-1 : stop+shift-1 ; } + private static boolean readIsEntirelyInsertion(GATKSAMRecord read) { + for (CigarElement cigarElement : read.getCigar().getCigarElements()) { + if (cigarElement.getOperator() != CigarOperator.INSERTION) + return false; + } + return true; + } + + public enum ClippingTail { + LEFT_TAIL, + RIGHT_TAIL + } + /** - * Looks for a read coordinate that corresponds to the reference coordinate in the soft clipped region before - * the alignment start of the read. + * Pre-processes the results of getReadCoordinateForReferenceCoordinate(GATKSAMRecord, int) in case it falls in + * a deletion following the typical clipping needs. If clipping the left tail (beginning of the read) returns + * the base prior to the deletion. 
If clipping the right tail (end of the read) returns the base after the + * deletion. * * @param read * @param refCoord - * @return the corresponding read coordinate or -1 if it failed to find it (it has been hard clipped before) + * @param tail + * @return the read coordinate corresponding to the requested reference coordinate for clipping. */ - @Requires({"refCoord >= read.getUnclippedStart()", "refCoord < read.getAlignmentStart()"}) - private static int getReadCoordinateForReferenceCoordinateBeforeAlignmentStart(SAMRecord read, int refCoord) { - if (getRefCoordSoftUnclippedStart(read) <= refCoord) - return refCoord - getRefCoordSoftUnclippedStart(read) + 1; - return -1; - } - - - /** - * Looks for a read coordinate that corresponds to the reference coordinate in the soft clipped region after - * the alignment end of the read. - * - * @param read - * @param refCoord - * @return the corresponding read coordinate or -1 if it failed to find it (it has been hard clipped before) - */ - @Requires({"refCoord <= read.getUnclippedEnd()", "refCoord > read.getAlignmentEnd()"}) - private static int getReadCoordinateForReferenceCoordinateBeforeAlignmentEnd(SAMRecord read, int refCoord) { - if (getRefCoordSoftUnclippedEnd(read) >= refCoord) - return refCoord - getRefCoordSoftUnclippedStart(read) + 1; - return -1; - } - - @Requires({"refCoord >= read.getUnclippedStart()", "refCoord <= read.getUnclippedEnd()"}) @Ensures({"result >= 0", "result < read.getReadLength()"}) - public static int getReadCoordinateForReferenceCoordinate(SAMRecord read, int refCoord) { + public static int getReadCoordinateForReferenceCoordinate(GATKSAMRecord read, int refCoord, ClippingTail tail) { + Pair result = getReadCoordinateForReferenceCoordinate(read, refCoord); + int readCoord = result.getFirst(); + + if (result.getSecond() && tail == ClippingTail.RIGHT_TAIL) + readCoord++; + + return readCoord; + } + + /** + * Returns the read coordinate corresponding to the requested reference coordinate. 
+ * + * WARNING: if the requested reference coordinate happens to fall inside a deletion in the read, this function + * will return the last read base before the deletion. This function returns a + * Pair(int readCoord, boolean fallsInsideDeletion) so you can choose which readCoordinate to use when faced with + * a deletion. + * + * SUGGESTION: Use getReadCoordinateForReferenceCoordinate(GATKSAMRecord, int, ClippingTail) instead to get a + * pre-processed result according to normal clipping needs. Or you can use this function and tailor the + * behavior to your needs. + * + * @param read + * @param refCoord + * @return the read coordinate corresponding to the requested reference coordinate. (see warning!) + */ + @Requires({"refCoord >= getRefCoordSoftUnclippedStart(read)", "refCoord <= getRefCoordSoftUnclippedEnd(read)"}) + @Ensures({"result.getFirst() >= 0", "result.getFirst() < read.getReadLength()"}) + public static Pair getReadCoordinateForReferenceCoordinate(GATKSAMRecord read, int refCoord) { int readBases = 0; int refBases = 0; + boolean fallsInsideDeletion = false; - if (refCoord < read.getAlignmentStart()) { - readBases = getReadCoordinateForReferenceCoordinateBeforeAlignmentStart(read, refCoord); - if (readBases < 0) - throw new ReviewedStingException("Requested a coordinate in a hard clipped area of the read. No equivalent read coordinate."); - } - else if (refCoord > read.getAlignmentEnd()) { - readBases = getReadCoordinateForReferenceCoordinateBeforeAlignmentEnd(read, refCoord); - if (readBases < 0) - throw new ReviewedStingException("Requested a coordinate in a hard clipped area of the read. 
No equivalent read coordinate."); - } - else { - int goal = refCoord - read.getAlignmentStart(); // The goal is to move this many reference bases - boolean goalReached = refBases == goal; + int goal = refCoord - getRefCoordSoftUnclippedStart(read); // The goal is to move this many reference bases + boolean goalReached = refBases == goal; - Iterator cigarElementIterator = read.getCigar().getCigarElements().iterator(); - while (!goalReached && cigarElementIterator.hasNext()) { - CigarElement cigarElement = cigarElementIterator.next(); - int shift = 0; + Iterator cigarElementIterator = read.getCigar().getCigarElements().iterator(); + while (!goalReached && cigarElementIterator.hasNext()) { + CigarElement cigarElement = cigarElementIterator.next(); + int shift = 0; - if (cigarElement.getOperator().consumesReferenceBases()) { - if (refBases + cigarElement.getLength() < goal) { - shift = cigarElement.getLength(); + if (cigarElement.getOperator().consumesReferenceBases() || cigarElement.getOperator() == CigarOperator.SOFT_CLIP) { + if (refBases + cigarElement.getLength() < goal) + shift = cigarElement.getLength(); + else + shift = goal - refBases; + + refBases += shift; + } + goalReached = refBases == goal; + + if (!goalReached && cigarElement.getOperator().consumesReadBases()) + readBases += cigarElement.getLength(); + + if (goalReached) { + // Is this base's reference position within this cigar element? Or did we use it all? + boolean endsWithinCigar = shift < cigarElement.getLength(); + + // If it isn't, we need to check the next one. There should *ALWAYS* be a next one + // since we checked if the goal coordinate is within the read length, so this is just a sanity check. + if (!endsWithinCigar && !cigarElementIterator.hasNext()) + throw new ReviewedStingException("Reference coordinate corresponds to a non-existent base in the read. 
This should never happen -- call Mauricio"); + + CigarElement nextCigarElement; + + // if we end inside the current cigar element, we just have to check if it is a deletion + if (endsWithinCigar) + fallsInsideDeletion = cigarElement.getOperator() == CigarOperator.DELETION; + + // if we end outside the current cigar element, we need to check if the next element is an insertion or deletion. + else { + nextCigarElement = cigarElementIterator.next(); + + // if it's an insertion, we need to clip the whole insertion before looking at the next element + if (nextCigarElement.getOperator() == CigarOperator.INSERTION) { + readBases += nextCigarElement.getLength(); + if (!cigarElementIterator.hasNext()) + throw new ReviewedStingException("Reference coordinate corresponds to a non-existent base in the read. This should never happen -- call Mauricio"); + + nextCigarElement = cigarElementIterator.next(); } - else { - shift = goal - refBases; - } - refBases += shift; + + // if it's a deletion, we will pass the information on to be handled downstream. + fallsInsideDeletion = nextCigarElement.getOperator() == CigarOperator.DELETION; } - goalReached = refBases == goal; - if (cigarElement.getOperator().consumesReadBases()) { - readBases += goalReached ? 
shift : cigarElement.getLength(); + // If we reached our goal outside a deletion, add the shift + if (!fallsInsideDeletion && cigarElement.getOperator().consumesReadBases()) + readBases += shift; + + // If we reached our goal inside a deletion, but the deletion is the next cigar element then we need + // to add the shift of the current cigar element but go back to it's last element to return the last + // base before the deletion (see warning in function contracts) + else if (fallsInsideDeletion && !endsWithinCigar) + readBases += shift - 1; + + // If we reached our goal inside a deletion then we must backtrack to the last base before the deletion + else if (fallsInsideDeletion && endsWithinCigar) + readBases--; } } if (!goalReached) throw new ReviewedStingException("Somehow the requested coordinate is not covered by the read. Too many deletions?"); - } + - return readBases; + return new Pair(readBases, fallsInsideDeletion); } + public static GATKSAMRecord unclipSoftClippedBases(GATKSAMRecord read) { + int newReadStart = read.getAlignmentStart(); + int newReadEnd = read.getAlignmentEnd(); + List newCigarElements = new ArrayList(read.getCigar().getCigarElements().size()); + int heldOver = -1; + boolean sSeen = false; + for ( CigarElement e : read.getCigar().getCigarElements() ) { + if ( e.getOperator().equals(CigarOperator.S) ) { + newCigarElements.add(new CigarElement(e.getLength(),CigarOperator.M)); + if ( sSeen ) { + newReadEnd += e.getLength(); + sSeen = true; + } else { + newReadStart -= e.getLength(); + } + } else { + newCigarElements.add(e); + } + } + // merge duplicate operators together + int idx = 0; + List finalCigarElements = new ArrayList(read.getCigar().getCigarElements().size()); + while ( idx < newCigarElements.size() -1 ) { + if ( newCigarElements.get(idx).getOperator().equals(newCigarElements.get(idx+1).getOperator()) ) { + int combSize = newCigarElements.get(idx).getLength(); + int offset = 0; + while ( idx + offset < newCigarElements.size()-1 && 
newCigarElements.get(idx+offset).getOperator().equals(newCigarElements.get(idx+1+offset).getOperator()) ) { + combSize += newCigarElements.get(idx+offset+1).getLength(); + offset++; + } + finalCigarElements.add(new CigarElement(combSize,newCigarElements.get(idx).getOperator())); + idx = idx + offset -1; + } else { + finalCigarElements.add(newCigarElements.get(idx)); + } + idx++; + } + + read.setCigar(new Cigar(finalCigarElements)); + read.setAlignmentStart(newReadStart); + + return read; + } + + /** + * Compares two SAMRecords only the basis on alignment start. Note that + * comparisons are performed ONLY on the basis of alignment start; any + * two SAM records with the same alignment start will be considered equal. + * + * Unmapped alignments will all be considered equal. + */ + + @Requires({"read1 != null", "read2 != null"}) + @Ensures("result == 0 || result == 1 || result == -1") + public static int compareSAMRecords(GATKSAMRecord read1, GATKSAMRecord read2) { + AlignmentStartComparator comp = new AlignmentStartComparator(); + return comp.compare(read1, read2); + } } diff --git a/public/java/src/org/broadinstitute/sting/utils/text/ListFileUtils.java b/public/java/src/org/broadinstitute/sting/utils/text/ListFileUtils.java index 9d4b23a8b..c146bf4d4 100644 --- a/public/java/src/org/broadinstitute/sting/utils/text/ListFileUtils.java +++ b/public/java/src/org/broadinstitute/sting/utils/text/ListFileUtils.java @@ -80,7 +80,7 @@ public class ListFileUtils { unpackedReads.add(new SAMReaderID(inputFileName,inputFileNameTags)); } else { - throw new UserException.CommandLineException(String.format("The GATK reads argument (-I) supports only BAM files with the .bam extension and lists of BAM files " + + throw new UserException.CommandLineException(String.format("The GATK reads argument (-I, --input_file) supports only BAM files with the .bam extension and lists of BAM files " + "with the .list extension, but the file %s has neither extension. 
Please ensure that your BAM file or list " + "of BAM files is in the correct format, update the extension, and try again.",inputFileName)); } diff --git a/public/java/src/org/broadinstitute/sting/utils/text/XReadLines.java b/public/java/src/org/broadinstitute/sting/utils/text/XReadLines.java index 52b6f3b01..49e9ddf52 100644 --- a/public/java/src/org/broadinstitute/sting/utils/text/XReadLines.java +++ b/public/java/src/org/broadinstitute/sting/utils/text/XReadLines.java @@ -99,9 +99,9 @@ public class XReadLines implements Iterator, Iterable { * * @param reader */ - public XReadLines(final BufferedReader reader, final boolean trimWhitespace) { + public XReadLines(final Reader reader, final boolean trimWhitespace) { try { - this.in = reader; + this.in = new BufferedReader(reader); nextline = readNextLine(); this.trimWhitespace = trimWhitespace; } catch(IOException e) { @@ -109,7 +109,7 @@ public class XReadLines implements Iterator, Iterable { } } - public XReadLines(final BufferedReader reader) throws FileNotFoundException { + public XReadLines(final Reader reader) { this(reader, true); } diff --git a/public/java/src/org/broadinstitute/sting/utils/variantcontext/Genotype.java b/public/java/src/org/broadinstitute/sting/utils/variantcontext/Genotype.java index fdf3d97db..e2e44e2b9 100755 --- a/public/java/src/org/broadinstitute/sting/utils/variantcontext/Genotype.java +++ b/public/java/src/org/broadinstitute/sting/utils/variantcontext/Genotype.java @@ -26,14 +26,31 @@ public class Genotype { protected boolean filtersWereAppliedToContext; public Genotype(String sampleName, List alleles, double negLog10PError, Set filters, Map attributes, boolean isPhased) { + this(sampleName, alleles, negLog10PError, filters, attributes, isPhased, null); + } + + public Genotype(String sampleName, List alleles, double negLog10PError, Set filters, Map attributes, boolean isPhased, double[] log10Likelihoods) { if ( alleles != null ) this.alleles = Collections.unmodifiableList(alleles); 
commonInfo = new InferredGeneticContext(sampleName, negLog10PError, filters, attributes); + if ( log10Likelihoods != null ) + commonInfo.putAttribute(VCFConstants.PHRED_GENOTYPE_LIKELIHOODS_KEY, GenotypeLikelihoods.fromLog10Likelihoods(log10Likelihoods)); filtersWereAppliedToContext = filters != null; this.isPhased = isPhased; validate(); } + /** + * Creates a new Genotype for sampleName with genotype according to alleles. + * @param sampleName + * @param alleles + * @param negLog10PError the confidence in these alleles + * @param log10Likelihoods a log10 likelihoods for each of the genotype combinations possible for alleles, in the standard VCF ordering, or null if not known + */ + public Genotype(String sampleName, List alleles, double negLog10PError, double[] log10Likelihoods) { + this(sampleName, alleles, negLog10PError, null, null, false, log10Likelihoods); + } + public Genotype(String sampleName, List alleles, double negLog10PError) { this(sampleName, alleles, negLog10PError, null, null, false); } @@ -57,13 +74,6 @@ public class Genotype { return new Genotype(g.getSampleName(), g.getAlleles(), g.getNegLog10PError(), g.filtersWereApplied() ? g.getFilters() : null, attributes, g.isPhased()); } - public static Genotype removePLs(Genotype g) { - Map attrs = new HashMap(g.getAttributes()); - attrs.remove(VCFConstants.PHRED_GENOTYPE_LIKELIHOODS_KEY); - attrs.remove(VCFConstants.GENOTYPE_LIKELIHOODS_KEY); - return new Genotype(g.getSampleName(), g.getAlleles(), g.getNegLog10PError(), g.filtersWereApplied() ? g.getFilters() : null, attrs, g.isPhased()); - } - public static Genotype modifyAlleles(Genotype g, List alleles) { return new Genotype(g.getSampleName(), alleles, g.getNegLog10PError(), g.filtersWereApplied() ? 
g.getFilters() : null, g.getAttributes(), g.isPhased()); } @@ -98,14 +108,19 @@ public class Genotype { /** * @return the ploidy of this genotype */ - public int getPloidy() { return alleles.size(); } + public int getPloidy() { + if ( alleles == null ) + throw new ReviewedStingException("Requesting ploidy for an UNAVAILABLE genotype"); + return alleles.size(); + } public enum Type { NO_CALL, HOM_REF, HET, HOM_VAR, - UNAVAILABLE + UNAVAILABLE, + MIXED // no-call and call in the same genotype } public Type getType() { @@ -119,36 +134,68 @@ public class Genotype { if ( alleles == null ) return Type.UNAVAILABLE; - Allele firstAllele = alleles.get(0); + boolean sawNoCall = false, sawMultipleAlleles = false; + Allele observedAllele = null; - if ( firstAllele.isNoCall() ) { - return Type.NO_CALL; + for ( Allele allele : alleles ) { + if ( allele.isNoCall() ) + sawNoCall = true; + else if ( observedAllele == null ) + observedAllele = allele; + else if ( !allele.equals(observedAllele) ) + sawMultipleAlleles = true; } - for (Allele a : alleles) { - if ( ! firstAllele.equals(a) ) - return Type.HET; + if ( sawNoCall ) { + if ( observedAllele == null ) + return Type.NO_CALL; + return Type.MIXED; } - return firstAllele.isReference() ? Type.HOM_REF : Type.HOM_VAR; + + if ( observedAllele == null ) + throw new ReviewedStingException("BUG: there are no alleles present in this genotype but the alleles list is not null"); + + return sawMultipleAlleles ? Type.HET : observedAllele.isReference() ? Type.HOM_REF : Type.HOM_VAR; } /** - * @return true if all observed alleles are the same (regardless of whether they are ref or alt) + * @return true if all observed alleles are the same (regardless of whether they are ref or alt); if any alleles are no-calls, this method will return false. */ public boolean isHom() { return isHomRef() || isHomVar(); } + + /** + * @return true if all observed alleles are ref; if any alleles are no-calls, this method will return false. 
+ */ public boolean isHomRef() { return getType() == Type.HOM_REF; } + + /** + * @return true if all observed alleles are alt; if any alleles are no-calls, this method will return false. + */ public boolean isHomVar() { return getType() == Type.HOM_VAR; } /** - * @return true if we're het (observed alleles differ) + * @return true if we're het (observed alleles differ); if the ploidy is less than 2 or if any alleles are no-calls, this method will return false. */ public boolean isHet() { return getType() == Type.HET; } /** - * @return true if this genotype is not actually a genotype but a "no call" (e.g. './.' in VCF) + * @return true if this genotype is not actually a genotype but a "no call" (e.g. './.' in VCF); if any alleles are not no-calls (even if some are), this method will return false. */ public boolean isNoCall() { return getType() == Type.NO_CALL; } + + /** + * @return true if this genotype is comprised of any alleles that are not no-calls (even if some are). + */ public boolean isCalled() { return getType() != Type.NO_CALL && getType() != Type.UNAVAILABLE; } + + /** + * @return true if this genotype is comprised of both calls and no-calls. + */ + public boolean isMixed() { return getType() == Type.MIXED; } + + /** + * @return true if the type of this genotype is set. + */ public boolean isAvailable() { return getType() != Type.UNAVAILABLE; } // @@ -187,14 +234,16 @@ public class Genotype { if ( alleles == null ) return; if ( alleles.size() == 0) throw new IllegalArgumentException("BUG: alleles cannot be of size 0"); - int nNoCalls = 0; + // int nNoCalls = 0; for ( Allele allele : alleles ) { if ( allele == null ) throw new IllegalArgumentException("BUG: allele cannot be null in Genotype"); - nNoCalls += allele.isNoCall() ? 1 : 0; + // nNoCalls += allele.isNoCall() ? 
1 : 0; } - if ( nNoCalls > 0 && nNoCalls != alleles.size() ) - throw new IllegalArgumentException("BUG: alleles include some No Calls and some Calls, an illegal state " + this); + + // Technically, the spec does allow for the below case so this is not an illegal state + //if ( nNoCalls > 0 && nNoCalls != alleles.size() ) + // throw new IllegalArgumentException("BUG: alleles include some No Calls and some Calls, an illegal state " + this); } public String getGenotypeString() { @@ -258,7 +307,8 @@ public class Genotype { * @param the value type * @return a sting, enclosed in {}, with comma seperated key value pairs in order of the keys */ - public static , V> String sortedString(Map c) { + private static , V> String sortedString(Map c) { + // NOTE -- THIS IS COPIED FROM GATK UTILS TO ALLOW US TO KEEP A SEPARATION BETWEEN THE GATK AND VCF CODECS List t = new ArrayList(c.keySet()); Collections.sort(t); @@ -293,17 +343,8 @@ public class Genotype { return commonInfo.getAttribute(key, defaultValue); } - public String getAttributeAsString(String key) { return commonInfo.getAttributeAsString(key); } public String getAttributeAsString(String key, String defaultValue) { return commonInfo.getAttributeAsString(key, defaultValue); } - public int getAttributeAsInt(String key) { return commonInfo.getAttributeAsInt(key); } public int getAttributeAsInt(String key, int defaultValue) { return commonInfo.getAttributeAsInt(key, defaultValue); } - public double getAttributeAsDouble(String key) { return commonInfo.getAttributeAsDouble(key); } public double getAttributeAsDouble(String key, double defaultValue) { return commonInfo.getAttributeAsDouble(key, defaultValue); } - public boolean getAttributeAsBoolean(String key) { return commonInfo.getAttributeAsBoolean(key); } public boolean getAttributeAsBoolean(String key, boolean defaultValue) { return commonInfo.getAttributeAsBoolean(key, defaultValue); } - - public Integer getAttributeAsIntegerNoException(String key) { return 
commonInfo.getAttributeAsIntegerNoException(key); } - public Double getAttributeAsDoubleNoException(String key) { return commonInfo.getAttributeAsDoubleNoException(key); } - public String getAttributeAsStringNoException(String key) { return commonInfo.getAttributeAsStringNoException(key); } - public Boolean getAttributeAsBooleanNoException(String key) { return commonInfo.getAttributeAsBooleanNoException(key); } } \ No newline at end of file diff --git a/public/java/src/org/broadinstitute/sting/utils/variantcontext/InferredGeneticContext.java b/public/java/src/org/broadinstitute/sting/utils/variantcontext/InferredGeneticContext.java index 3d162adb0..bf16cd1cf 100755 --- a/public/java/src/org/broadinstitute/sting/utils/variantcontext/InferredGeneticContext.java +++ b/public/java/src/org/broadinstitute/sting/utils/variantcontext/InferredGeneticContext.java @@ -1,6 +1,8 @@ package org.broadinstitute.sting.utils.variantcontext; +import org.broadinstitute.sting.utils.codecs.vcf.VCFConstants; + import java.util.*; @@ -204,27 +206,40 @@ public final class InferredGeneticContext { return defaultValue; } -// public AttributedObject getAttributes(Collection keys) { -// AttributedObject selected = new AttributedObject(); -// -// for ( Object key : keys ) -// selected.putAttribute(key, this.getAttribute(key)); -// -// return selected; -// } + public String getAttributeAsString(String key, String defaultValue) { + Object x = getAttribute(key); + if ( x == null ) return defaultValue; + if ( x instanceof String ) return (String)x; + return String.valueOf(x); // throws an exception if this isn't a string + } - public String getAttributeAsString(String key) { return (String.valueOf(getAttribute(key))); } // **NOTE**: will turn a null Object into the String "null" - public int getAttributeAsInt(String key) { Object x = getAttribute(key); return x instanceof Integer ? 
(Integer)x : Integer.valueOf((String)x); } - public double getAttributeAsDouble(String key) { Object x = getAttribute(key); return x instanceof Double ? (Double)x : Double.valueOf((String)x); } - public boolean getAttributeAsBoolean(String key) { Object x = getAttribute(key); return x instanceof Boolean ? (Boolean)x : Boolean.valueOf((String)x); } + public int getAttributeAsInt(String key, int defaultValue) { + Object x = getAttribute(key); + if ( x == null || x == VCFConstants.MISSING_VALUE_v4 ) return defaultValue; + if ( x instanceof Integer ) return (Integer)x; + return Integer.valueOf((String)x); // throws an exception if this isn't a string + } - public String getAttributeAsString(String key, String defaultValue) { return (String)getAttribute(key, defaultValue); } - public int getAttributeAsInt(String key, int defaultValue) { return (Integer)getAttribute(key, defaultValue); } - public double getAttributeAsDouble(String key, double defaultValue) { return (Double)getAttribute(key, defaultValue); } - public boolean getAttributeAsBoolean(String key, boolean defaultValue){ return (Boolean)getAttribute(key, defaultValue); } + public double getAttributeAsDouble(String key, double defaultValue) { + Object x = getAttribute(key); + if ( x == null ) return defaultValue; + if ( x instanceof Double ) return (Double)x; + return Double.valueOf((String)x); // throws an exception if this isn't a string + } - public Integer getAttributeAsIntegerNoException(String key) { try {return getAttributeAsInt(key);} catch (Exception e) {return null;} } - public Double getAttributeAsDoubleNoException(String key) { try {return getAttributeAsDouble(key);} catch (Exception e) {return null;} } - public String getAttributeAsStringNoException(String key) { if (getAttribute(key) == null) return null; return getAttributeAsString(key); } - public Boolean getAttributeAsBooleanNoException(String key) { try {return getAttributeAsBoolean(key);} catch (Exception e) {return null;} } + public boolean 
getAttributeAsBoolean(String key, boolean defaultValue) { + Object x = getAttribute(key); + if ( x == null ) return defaultValue; + if ( x instanceof Boolean ) return (Boolean)x; + return Boolean.valueOf((String)x); // throws an exception if this isn't a string + } + +// public String getAttributeAsString(String key) { return (String.valueOf(getAttribute(key))); } // **NOTE**: will turn a null Object into the String "null" +// public int getAttributeAsInt(String key) { Object x = getAttribute(key); return x instanceof Integer ? (Integer)x : Integer.valueOf((String)x); } +// public double getAttributeAsDouble(String key) { Object x = getAttribute(key); return x instanceof Double ? (Double)x : Double.valueOf((String)x); } +// public boolean getAttributeAsBoolean(String key) { Object x = getAttribute(key); return x instanceof Boolean ? (Boolean)x : Boolean.valueOf((String)x); } +// public Integer getAttributeAsIntegerNoException(String key) { try {return getAttributeAsInt(key);} catch (Exception e) {return null;} } +// public Double getAttributeAsDoubleNoException(String key) { try {return getAttributeAsDouble(key);} catch (Exception e) {return null;} } +// public String getAttributeAsStringNoException(String key) { if (getAttribute(key) == null) return null; return getAttributeAsString(key); } +// public Boolean getAttributeAsBooleanNoException(String key) { try {return getAttributeAsBoolean(key);} catch (Exception e) {return null;} } } \ No newline at end of file diff --git a/public/java/src/org/broadinstitute/sting/utils/variantcontext/MutableGenotype.java b/public/java/src/org/broadinstitute/sting/utils/variantcontext/MutableGenotype.java index 0cd684cb6..14419a2a0 100755 --- a/public/java/src/org/broadinstitute/sting/utils/variantcontext/MutableGenotype.java +++ b/public/java/src/org/broadinstitute/sting/utils/variantcontext/MutableGenotype.java @@ -40,19 +40,7 @@ public class MutableGenotype extends Genotype { */ public void setAlleles(List alleles) { 
this.alleles = new ArrayList(alleles); - - // todo -- add validation checking here - - if ( alleles == null ) throw new IllegalArgumentException("BUG: alleles cannot be null in setAlleles"); - if ( alleles.size() == 0) throw new IllegalArgumentException("BUG: alleles cannot be of size 0 in setAlleles"); - - int nNoCalls = 0; - for ( Allele allele : alleles ) { nNoCalls += allele.isNoCall() ? 1 : 0; } - if ( nNoCalls > 0 && nNoCalls != alleles.size() ) - throw new IllegalArgumentException("BUG: alleles include some No Calls and some Calls, an illegal state " + this); - - for ( Allele allele : alleles ) - if ( allele == null ) throw new IllegalArgumentException("BUG: Cannot add a null allele to a genotype"); + validate(); } public void setPhase(boolean isPhased) { diff --git a/public/java/src/org/broadinstitute/sting/utils/variantcontext/VariantContext.java b/public/java/src/org/broadinstitute/sting/utils/variantcontext/VariantContext.java index cfd59b504..f52a7087b 100755 --- a/public/java/src/org/broadinstitute/sting/utils/variantcontext/VariantContext.java +++ b/public/java/src/org/broadinstitute/sting/utils/variantcontext/VariantContext.java @@ -132,7 +132,7 @@ import java.util.*; * vc.hasGenotypes() * vc.isMonomorphic() * vc.isPolymorphic() - * vc.getSampleNames().size() + * vc.getSamples().size() * * vc.getGenotypes() * vc.getGenotypes().get("g1") @@ -181,7 +181,7 @@ public class VariantContext implements Feature { // to enable tribble intergrati protected Type type = null; /** A set of the alleles segregating in this context */ - protected LinkedHashSet alleles = null; + final protected List alleles; /** A mapping from sampleName -> genotype objects for all genotypes associated with this context */ protected Map genotypes = null; @@ -355,7 +355,7 @@ public class VariantContext implements Feature { // to enable tribble intergrati if ( alleles == null ) { throw new IllegalArgumentException("Alleles cannot be null"); } // we need to make this a LinkedHashSet in 
case the user prefers a given ordering of alleles - this.alleles = alleleCollectionToSet(new LinkedHashSet(), alleles); + this.alleles = makeAlleles(alleles); if ( genotypes == null ) { genotypes = NO_GENOTYPES; } @@ -445,7 +445,7 @@ public class VariantContext implements Feature { // to enable tribble intergrati * @param alleles the set of allele segregating alleles at this site. Must include those in genotypes, but may be more * @return vc subcontext */ - public VariantContext subContextFromGenotypes(Collection genotypes, Set alleles) { + public VariantContext subContextFromGenotypes(Collection genotypes, Collection alleles) { return new VariantContext(getSource(), contig, start, stop, alleles, genotypes != null ? genotypeCollectionToMap(new TreeMap(), genotypes) : null, getNegLog10PError(), filtersWereApplied() ? getFilters() : null, getAttributes(), getReferenceBaseForIndel()); } @@ -666,21 +666,11 @@ public class VariantContext implements Feature { // to enable tribble intergrati return commonInfo.getAttribute(key, defaultValue); } - public String getAttributeAsString(String key) { return commonInfo.getAttributeAsString(key); } public String getAttributeAsString(String key, String defaultValue) { return commonInfo.getAttributeAsString(key, defaultValue); } - public int getAttributeAsInt(String key) { return commonInfo.getAttributeAsInt(key); } public int getAttributeAsInt(String key, int defaultValue) { return commonInfo.getAttributeAsInt(key, defaultValue); } - public double getAttributeAsDouble(String key) { return commonInfo.getAttributeAsDouble(key); } public double getAttributeAsDouble(String key, double defaultValue) { return commonInfo.getAttributeAsDouble(key, defaultValue); } - public boolean getAttributeAsBoolean(String key) { return commonInfo.getAttributeAsBoolean(key); } public boolean getAttributeAsBoolean(String key, boolean defaultValue) { return commonInfo.getAttributeAsBoolean(key, defaultValue); } - public Integer 
getAttributeAsIntegerNoException(String key) { return commonInfo.getAttributeAsIntegerNoException(key); } - public Double getAttributeAsDoubleNoException(String key) { return commonInfo.getAttributeAsDoubleNoException(key); } - public String getAttributeAsStringNoException(String key) { return commonInfo.getAttributeAsStringNoException(key); } - public Boolean getAttributeAsBooleanNoException(String key) { return commonInfo.getAttributeAsBooleanNoException(key); } - - // --------------------------------------------------------------------------------------------------------- // // Working with alleles @@ -697,17 +687,6 @@ public class VariantContext implements Feature { // to enable tribble intergrati return ref; } - /** Private helper routine that grabs the reference allele but doesn't throw an error if there's no such allele */ - -// private Allele getReferenceWithoutError() { -// for ( Allele allele : getAlleles() ) { -// if ( allele.isReference() ) { -// return allele; -// } -// } -// -// return null; -// } /** * @return true if the context is strictly bi-allelic @@ -764,7 +743,7 @@ public class VariantContext implements Feature { // to enable tribble intergrati * * @return the set of alleles */ - public Set getAlleles() { return alleles; } + public List getAlleles() { return alleles; } /** * Gets the alternate alleles. 
This method should return all the alleles present at the location, @@ -773,14 +752,8 @@ public class VariantContext implements Feature { // to enable tribble intergrati * * @return the set of alternate alleles */ - public Set getAlternateAlleles() { - LinkedHashSet altAlleles = new LinkedHashSet(); - for ( Allele allele : alleles ) { - if ( allele.isNonReference() ) - altAlleles.add(allele); - } - - return Collections.unmodifiableSet(altAlleles); + public List getAlternateAlleles() { + return alleles.subList(1, alleles.size()); } /** @@ -807,14 +780,7 @@ public class VariantContext implements Feature { // to enable tribble intergrati * @throws IllegalArgumentException if i is invalid */ public Allele getAlternateAllele(int i) { - int n = 0; - - for ( Allele allele : alleles ) { - if ( allele.isNonReference() && n++ == i ) - return allele; - } - - throw new IllegalArgumentException("Requested " + i + " alternative allele but there are only " + n + " alternative alleles " + this); + return alleles.get(i+1); } /** @@ -823,8 +789,8 @@ public class VariantContext implements Feature { // to enable tribble intergrati * regardless of ordering. Otherwise returns false. 
*/ public boolean hasSameAlternateAllelesAs ( VariantContext other ) { - Set thisAlternateAlleles = getAlternateAlleles(); - Set otherAlternateAlleles = other.getAlternateAlleles(); + List thisAlternateAlleles = getAlternateAlleles(); + List otherAlternateAlleles = other.getAlternateAlleles(); if ( thisAlternateAlleles.size() != otherAlternateAlleles.size() ) { return false; @@ -1032,7 +998,7 @@ public class VariantContext implements Feature { // to enable tribble intergrati else if ( g.isHomVar() ) genotypeCounts[Genotype.Type.HOM_VAR.ordinal()]++; else - throw new IllegalStateException("Genotype of unknown type: " + g); + genotypeCounts[Genotype.Type.MIXED.ordinal()]++; } } } @@ -1076,6 +1042,15 @@ public class VariantContext implements Feature { // to enable tribble intergrati return genotypeCounts[Genotype.Type.HOM_VAR.ordinal()]; } + /** + * Genotype-specific functions -- how many mixed calls are there in the genotypes? + * + * @return number of mixed calls + */ + public int getMixedCount() { + return genotypeCounts[Genotype.Type.MIXED.ordinal()]; + } + // --------------------------------------------------------------------------------------------------------- // // validation: extra-strict validation routines for paranoid users @@ -1131,7 +1106,7 @@ public class VariantContext implements Feature { // to enable tribble intergrati if ( !hasGenotypes() ) return; - Set reportedAlleles = getAlleles(); + List reportedAlleles = getAlleles(); Set observedAlleles = new HashSet(); observedAlleles.add(getReference()); for ( Genotype g : getGenotypes().values() ) { @@ -1381,17 +1356,34 @@ public class VariantContext implements Feature { // to enable tribble intergrati } // protected basic manipulation routines - private static LinkedHashSet alleleCollectionToSet(LinkedHashSet dest, Collection alleles) { - for ( Allele a : alleles ) { - for ( Allele b : dest ) { + private static List makeAlleles(Collection alleles) { + final List alleleList = new 
ArrayList(alleles.size()); + + boolean sawRef = false; + for ( final Allele a : alleles ) { + for ( final Allele b : alleleList ) { if ( a.equals(b, true) ) throw new IllegalArgumentException("Duplicate allele added to VariantContext: " + a); } - dest.add(a); + // deal with the case where the first allele isn't the reference + if ( a.isReference() ) { + if ( sawRef ) + throw new IllegalArgumentException("Alleles for a VariantContext must contain at most one reference allele: " + alleles); + alleleList.add(0, a); + sawRef = true; + } + else + alleleList.add(a); } - return dest; + if ( alleleList.isEmpty() ) + throw new IllegalArgumentException("Cannot create a VariantContext with an empty allele list"); + + if ( alleleList.get(0).isNonReference() ) + throw new IllegalArgumentException("Alleles for a VariantContext must contain at least one reference allele: " + alleles); + + return alleleList; } public static Map genotypeCollectionToMap(Map dest, Collection genotypes) { @@ -1505,7 +1497,7 @@ public class VariantContext implements Feature { // to enable tribble intergrati // Do not change the filter state if filters were not applied to this context Set inputVCFilters = inputVC.filtersWereAppliedToContext ? 
inputVC.getFilters() : null; - return new VariantContext(inputVC.getSource(), inputVC.getChr(), inputVC.getStart(), inputVC.getEnd(), alleles, genotypes, inputVC.getNegLog10PError(), inputVCFilters, inputVC.getAttributes()); + return new VariantContext(inputVC.getSource(), inputVC.getChr(), inputVC.getStart(), inputVC.getEnd(), alleles, genotypes, inputVC.getNegLog10PError(), inputVCFilters, inputVC.getAttributes(),refByte); } else return inputVC; diff --git a/public/java/src/org/broadinstitute/sting/utils/variantcontext/VariantContextUtils.java b/public/java/src/org/broadinstitute/sting/utils/variantcontext/VariantContextUtils.java index e0e27b4f7..43f91041f 100755 --- a/public/java/src/org/broadinstitute/sting/utils/variantcontext/VariantContextUtils.java +++ b/public/java/src/org/broadinstitute/sting/utils/variantcontext/VariantContextUtils.java @@ -29,6 +29,7 @@ import net.sf.picard.reference.ReferenceSequenceFile; import net.sf.samtools.util.StringUtil; import org.apache.commons.jexl2.Expression; import org.apache.commons.jexl2.JexlEngine; +import org.apache.log4j.Logger; import org.broad.tribble.util.popgen.HardyWeinbergCalculation; import org.broadinstitute.sting.gatk.walkers.phasing.ReadBackedPhasingWalker; import org.broadinstitute.sting.utils.BaseUtils; @@ -44,6 +45,12 @@ import java.io.Serializable; import java.util.*; public class VariantContextUtils { + private static Logger logger = Logger.getLogger(VariantContextUtils.class); + public final static String MERGE_INTERSECTION = "Intersection"; + public final static String MERGE_FILTER_IN_ALL = "FilteredInAll"; + public final static String MERGE_REF_IN_ALL = "ReferenceInAll"; + public final static String MERGE_FILTER_PREFIX = "filterIn"; + final public static JexlEngine engine = new JexlEngine(); static { engine.setSilent(false); // will throw errors now for selects that don't evaluate properly @@ -154,6 +161,13 @@ public class VariantContextUtils { return "%." 
+ precision + "f"; } + public static Genotype removePLs(Genotype g) { + Map attrs = new HashMap(g.getAttributes()); + attrs.remove(VCFConstants.PHRED_GENOTYPE_LIKELIHOODS_KEY); + attrs.remove(VCFConstants.GENOTYPE_LIKELIHOODS_KEY); + return new Genotype(g.getSampleName(), g.getAlleles(), g.getNegLog10PError(), g.filtersWereApplied() ? g.getFilters() : null, attrs, g.isPhased()); + } + /** * A simple but common wrapper for matching VariantContext objects using JEXL expressions */ @@ -499,7 +513,7 @@ public class VariantContextUtils { final String name = first.getSource(); final Allele refAllele = determineReferenceAllele(VCs); - final Set alleles = new TreeSet(); + final Set alleles = new LinkedHashSet(); final Set filters = new TreeSet(); final Map attributes = new TreeMap(); final Set inconsistentAttributes = new HashSet(); @@ -548,12 +562,10 @@ public class VariantContextUtils { // special case DP (add it up) and ID (just preserve it) // if (vc.hasAttribute(VCFConstants.DEPTH_KEY)) - depth += Integer.valueOf(vc.getAttributeAsString(VCFConstants.DEPTH_KEY)); - + depth += vc.getAttributeAsInt(VCFConstants.DEPTH_KEY, 0); if ( vc.hasID() && ! 
vc.getID().equals(VCFConstants.EMPTY_ID_FIELD) ) rsIDs.add(vc.getID()); - if (mergeInfoWithMaxAC && vc.hasAttribute(VCFConstants.ALLELE_COUNT_KEY)) { - String rawAlleleCounts = vc.getAttributeAsString(VCFConstants.ALLELE_COUNT_KEY); + String rawAlleleCounts = vc.getAttributeAsString(VCFConstants.ALLELE_COUNT_KEY, null); // lets see if the string contains a , separator if (rawAlleleCounts.contains(VCFConstants.INFO_FIELD_ARRAY_SEPARATOR)) { List alleleCountArray = Arrays.asList(rawAlleleCounts.substring(1, rawAlleleCounts.length() - 1).split(VCFConstants.INFO_FIELD_ARRAY_SEPARATOR)); @@ -594,10 +606,17 @@ public class VariantContextUtils { } } - // if we have more alternate alleles in the merged VC than in one or more of the original VCs, we need to strip out the GL/PLs (because they are no longer accurate) + // if we have more alternate alleles in the merged VC than in one or more of the + // original VCs, we need to strip out the GL/PLs (because they are no longer accurate), as well as allele-dependent attributes like AC,AF for ( VariantContext vc : VCs ) { - if ( vc.alleles.size() != alleles.size() ) { + if (vc.alleles.size() == 1) + continue; + if ( hasPLIncompatibleAlleles(alleles, vc.alleles)) { + logger.warn(String.format("Stripping PLs at %s due incompatible alleles merged=%s vs. 
single=%s", + genomeLocParser.createGenomeLoc(vc), alleles, vc.alleles)); genotypes = stripPLs(genotypes); + // this will remove stale AC,AF attributed from vc + calculateChromosomeCounts(vc, attributes, true); break; } } @@ -611,19 +630,20 @@ public class VariantContextUtils { if ( filteredRecordMergeType == FilteredRecordMergeType.KEEP_IF_ANY_UNFILTERED && nFiltered != VCs.size() ) filters.clear(); + if ( annotateOrigin ) { // we care about where the call came from String setValue; if ( nFiltered == 0 && variantSources.size() == priorityListOfVCs.size() ) // nothing was unfiltered - setValue = "Intersection"; + setValue = MERGE_INTERSECTION; else if ( nFiltered == VCs.size() ) // everything was filtered out - setValue = "FilteredInAll"; + setValue = MERGE_FILTER_IN_ALL; else if ( variantSources.isEmpty() ) // everyone was reference - setValue = "ReferenceInAll"; + setValue = MERGE_REF_IN_ALL; else { LinkedHashSet s = new LinkedHashSet(); for ( VariantContext vc : VCs ) if ( vc.isVariant() ) - s.add( vc.isFiltered() ? "filterIn" + vc.getSource() : vc.getSource() ); + s.add( vc.isFiltered() ? MERGE_FILTER_PREFIX + vc.getSource() : vc.getSource() ); setValue = Utils.join("-", s); } @@ -648,6 +668,36 @@ public class VariantContextUtils { return merged; } + private static final boolean hasPLIncompatibleAlleles(final Collection alleleSet1, final Collection alleleSet2) { + final Iterator it1 = alleleSet1.iterator(); + final Iterator it2 = alleleSet2.iterator(); + + while ( it1.hasNext() && it2.hasNext() ) { + final Allele a1 = it1.next(); + final Allele a2 = it2.next(); + if ( ! a1.equals(a2) ) + return true; + } + + // by this point, at least one of the iterators is empty. All of the elements + // we've compared are equal up until this point. But it's possible that the + // sets aren't the same size, which is indicated by the test below. 
If they + // are of the same size, though, the sets are compatible + return it1.hasNext() || it2.hasNext(); + } + + public static boolean allelesAreSubset(VariantContext vc1, VariantContext vc2) { + // if all alleles of vc1 are a contained in alleles of vc2, return true + if (!vc1.getReference().equals(vc2.getReference())) + return false; + + for (Allele a :vc1.getAlternateAlleles()) { + if (!vc2.getAlternateAlleles().contains(a)) + return false; + } + + return true; + } public static VariantContext createVariantContextWithTrimmedAlleles(VariantContext inputVC) { // see if we need to trim common reference base from all alleles boolean trimVC; @@ -724,7 +774,7 @@ public class VariantContextUtils { Map newGs = new HashMap(genotypes.size()); for ( Map.Entry g : genotypes.entrySet() ) { - newGs.put(g.getKey(), g.getValue().hasLikelihoods() ? Genotype.removePLs(g.getValue()) : g.getValue()); + newGs.put(g.getKey(), g.getValue().hasLikelihoods() ? removePLs(g.getValue()) : g.getValue()); } return newGs; @@ -733,9 +783,46 @@ public class VariantContextUtils { public static Map> separateVariantContextsByType(Collection VCs) { HashMap> mappedVCs = new HashMap>(); for ( VariantContext vc : VCs ) { - if ( !mappedVCs.containsKey(vc.getType()) ) - mappedVCs.put(vc.getType(), new ArrayList()); - mappedVCs.get(vc.getType()).add(vc); + + // look at previous variant contexts of different type. If: + // a) otherVC has alleles which are subset of vc, remove otherVC from its list and add otherVC to vc's list + // b) vc has alleles which are subset of otherVC. 
Then, add vc to otherVC's type list (rather, do nothing since vc will be added automatically to its list) + // c) neither: do nothing, just add vc to its own list + boolean addtoOwnList = true; + for (VariantContext.Type type : VariantContext.Type.values()) { + if (type.equals(vc.getType())) + continue; + + if (!mappedVCs.containsKey(type)) + continue; + + List vcList = mappedVCs.get(type); + for (int k=0; k < vcList.size(); k++) { + VariantContext otherVC = vcList.get(k); + if (allelesAreSubset(otherVC,vc)) { + // otherVC has a type different than vc and its alleles are a subset of vc: remove otherVC from its list and add it to vc's type list + vcList.remove(k); + // avoid having empty lists + if (vcList.size() == 0) + mappedVCs.remove(vcList); + if ( !mappedVCs.containsKey(vc.getType()) ) + mappedVCs.put(vc.getType(), new ArrayList()); + mappedVCs.get(vc.getType()).add(otherVC); + break; + } + else if (allelesAreSubset(vc,otherVC)) { + // vc has a type different than otherVC and its alleles are a subset of VC: add vc to otherVC's type list and don't add to its own + mappedVCs.get(type).add(vc); + addtoOwnList = false; + break; + } + } + } + if (addtoOwnList) { + if ( !mappedVCs.containsKey(vc.getType()) ) + mappedVCs.put(vc.getType(), new ArrayList()); + mappedVCs.get(vc.getType()).add(vc); + } } return mappedVCs; @@ -1132,9 +1219,7 @@ public class VariantContextUtils { for (String orAttrib : MERGE_OR_ATTRIBS) { boolean attribVal = false; for (VariantContext vc : vcList) { - Boolean val = vc.getAttributeAsBooleanNoException(orAttrib); - if (val != null) - attribVal = (attribVal || val); + attribVal = vc.getAttributeAsBoolean(orAttrib, false); if (attribVal) // already true, so no reason to continue: break; } @@ -1144,7 +1229,7 @@ public class VariantContextUtils { // Merge ID fields: String iDVal = null; for (VariantContext vc : vcList) { - String val = vc.getAttributeAsStringNoException(VariantContext.ID_KEY); + String val = 
vc.getAttributeAsString(VariantContext.ID_KEY, null); if (val != null && !val.equals(VCFConstants.EMPTY_ID_FIELD)) { if (iDVal == null) iDVal = val; @@ -1224,8 +1309,10 @@ public class VariantContextUtils { public PhaseAndQuality(Genotype gt) { this.isPhased = gt.isPhased(); - if (this.isPhased) - this.PQ = gt.getAttributeAsDoubleNoException(ReadBackedPhasingWalker.PQ_KEY); + if (this.isPhased) { + this.PQ = gt.getAttributeAsDouble(ReadBackedPhasingWalker.PQ_KEY, -1); + if ( this.PQ == -1 ) this.PQ = null; + } } } diff --git a/public/java/test/org/broadinstitute/sting/BaseTest.java b/public/java/test/org/broadinstitute/sting/BaseTest.java index 63faf1ab9..f99a105ae 100755 --- a/public/java/test/org/broadinstitute/sting/BaseTest.java +++ b/public/java/test/org/broadinstitute/sting/BaseTest.java @@ -50,6 +50,7 @@ public abstract class BaseTest { public static final String hg18Reference = "/seq/references/Homo_sapiens_assembly18/v0/Homo_sapiens_assembly18.fasta"; public static final String hg19Reference = "/seq/references/Homo_sapiens_assembly19/v1/Homo_sapiens_assembly19.fasta"; public static final String b36KGReference = "/humgen/1kg/reference/human_b36_both.fasta"; + //public static final String b37KGReference = "/Users/depristo/Desktop/broadLocal/localData/human_g1k_v37.fasta"; public static final String b37KGReference = "/humgen/1kg/reference/human_g1k_v37.fasta"; public static final String GATKDataLocation = "/humgen/gsa-hpprojects/GATK/data/"; public static final String validationDataLocation = GATKDataLocation + "Validation_Data/"; @@ -80,7 +81,8 @@ public abstract class BaseTest { public static final String networkTempDir = "/broad/shptmp/"; public static final File networkTempDirFile = new File(networkTempDir); - public static final String testDir = "public/testdata/"; + public static final File testDirFile = new File("public/testdata/"); + public static final String testDir = testDirFile.getAbsolutePath() + "/"; /** before the class starts up */ static { @@ 
-98,10 +100,10 @@ public abstract class BaseTest { logger.setLevel(Level.WARN); // find our file sources - if (!fileExist(hg18Reference) || !fileExist(hg19Reference) || !fileExist(b36KGReference)) { - logger.fatal("We can't locate the reference directories. Aborting!"); - throw new RuntimeException("BaseTest setup failed: unable to locate the reference directories"); - } +// if (!fileExist(hg18Reference) || !fileExist(hg19Reference) || !fileExist(b36KGReference)) { +// logger.fatal("We can't locate the reference directories. Aborting!"); +// throw new RuntimeException("BaseTest setup failed: unable to locate the reference directories"); +// } } /** @@ -132,15 +134,21 @@ public abstract class BaseTest { */ public static class TestDataProvider { private static final Map> tests = new HashMap>(); + private final String name; /** * Create a new TestDataProvider instance bound to the class variable C * @param c */ - public TestDataProvider(Class c) { + public TestDataProvider(Class c, String name) { if ( ! 
tests.containsKey(c) ) tests.put(c, new ArrayList()); tests.get(c).add(this); + this.name = name; + } + + public TestDataProvider(Class c) { + this(c, ""); } /** @@ -153,6 +161,11 @@ public abstract class BaseTest { for ( Object x : tests.get(c) ) params2.add(new Object[]{x}); return params2.toArray(new Object[][]{}); } + + @Override + public String toString() { + return "TestDataProvider("+name+")"; + } } /** diff --git a/public/java/test/org/broadinstitute/sting/MD5DB.java b/public/java/test/org/broadinstitute/sting/MD5DB.java index 2fd8f8b6d..c9f53c581 100644 --- a/public/java/test/org/broadinstitute/sting/MD5DB.java +++ b/public/java/test/org/broadinstitute/sting/MD5DB.java @@ -129,7 +129,7 @@ public class MD5DB { System.out.printf("##### Skipping update, cannot write file %s%n", dbFile); } } else { - System.out.printf("##### MD5 file is up to date: %s%n", dbFile.getPath()); + //System.out.printf("##### MD5 file is up to date: %s%n", dbFile.getPath()); } } @@ -170,6 +170,18 @@ public class MD5DB { return bytes; } + public static class MD5Match { + final String md5; + final String failMessage; + boolean failed; + + public MD5Match(final String md5, final String failMessage, final boolean failed) { + this.md5 = md5; + this.failMessage = failMessage; + this.failed = failed; + } + } + /** * Tests a file MD5 against an expected value, returning the MD5. NOTE: This function WILL throw an exception if the MD5s are different. * @param name Name of the test. @@ -178,18 +190,21 @@ public class MD5DB { * @param parameterize If true or if expectedMD5 is an empty string, will print out the calculated MD5 instead of error text. * @return The calculated MD5. 
*/ - public static String assertMatchingMD5(final String name, final File resultsFile, final String expectedMD5, final boolean parameterize) { - String filemd5sum = testFileMD5(name, resultsFile, expectedMD5, parameterize); + public static MD5Match assertMatchingMD5(final String name, final File resultsFile, final String expectedMD5, final boolean parameterize) { + final String filemd5sum = testFileMD5(name, resultsFile, expectedMD5, parameterize); + String failMessage = null; + boolean failed = false; if (parameterize || expectedMD5.equals("")) { // Don't assert } else if ( filemd5sum.equals(expectedMD5) ) { - System.out.println(String.format(" => %s PASSED", name)); + System.out.println(String.format(" => %s PASSED (expected=%s)", name, expectedMD5)); } else { - Assert.fail(String.format("%s has mismatching MD5s: expected=%s observed=%s", name, expectedMD5, filemd5sum)); + failed = true; + failMessage = String.format("%s has mismatching MD5s: expected=%s observed=%s", name, expectedMD5, filemd5sum); } - return filemd5sum; + return new MD5Match(filemd5sum, failMessage, failed); } @@ -218,8 +233,8 @@ public class MD5DB { System.out.println(String.format("PARAMETERIZATION[%s]: file %s has md5 = %s, stated expectation is %s, equal? = %b", name, resultsFile, filemd5sum, expectedMD5, filemd5sum.equals(expectedMD5))); } else { - System.out.println(String.format("Checking MD5 for %s [calculated=%s, expected=%s]", resultsFile, filemd5sum, expectedMD5)); - System.out.flush(); + //System.out.println(String.format("Checking MD5 for %s [calculated=%s, expected=%s]", resultsFile, filemd5sum, expectedMD5)); + //System.out.flush(); if ( ! expectedMD5.equals(filemd5sum) ) { // we are going to fail for real in assertEquals (so we are counted by the testing framework). 
diff --git a/public/java/test/org/broadinstitute/sting/WalkerTest.java b/public/java/test/org/broadinstitute/sting/WalkerTest.java index 386c17659..ca7653b58 100755 --- a/public/java/test/org/broadinstitute/sting/WalkerTest.java +++ b/public/java/test/org/broadinstitute/sting/WalkerTest.java @@ -52,7 +52,7 @@ public class WalkerTest extends BaseTest { GenomeAnalysisEngine.resetRandomGenerator(); } - public String assertMatchingMD5(final String name, final File resultsFile, final String expectedMD5) { + public MD5DB.MD5Match assertMatchingMD5(final String name, final File resultsFile, final String expectedMD5) { return MD5DB.assertMatchingMD5(name, resultsFile, expectedMD5, parameterize()); } @@ -75,7 +75,7 @@ public class WalkerTest extends BaseTest { Index indexFromOutputFile = IndexFactory.createIndex(resultFile, new VCFCodec()); Index dynamicIndex = IndexFactory.loadIndex(indexFile.getAbsolutePath()); - if ( ! indexFromOutputFile.equalsIgnoreTimestamp(dynamicIndex) ) { + if ( ! indexFromOutputFile.equalsIgnoreProperties(dynamicIndex) ) { Assert.fail(String.format("Index on disk from indexing on the fly not equal to the index created after the run completed. FileIndex %s vs. on-the-fly %s%n", indexFromOutputFile.getProperties(), dynamicIndex.getProperties())); @@ -84,10 +84,23 @@ public class WalkerTest extends BaseTest { public List assertMatchingMD5s(final String name, List resultFiles, List expectedMD5s) { List md5s = new ArrayList(); + List fails = new ArrayList(); + for (int i = 0; i < resultFiles.size(); i++) { - String md5 = assertMatchingMD5(name, resultFiles.get(i), expectedMD5s.get(i)); - maybeValidateSupplementaryFile(name, resultFiles.get(i)); - md5s.add(i, md5); + MD5DB.MD5Match result = assertMatchingMD5(name, resultFiles.get(i), expectedMD5s.get(i)); + if ( ! result.failed ) { + maybeValidateSupplementaryFile(name, resultFiles.get(i)); + md5s.add(result.md5); + } else { + fails.add(result); + } + } + + if ( ! 
fails.isEmpty() ) { + for ( final MD5DB.MD5Match fail : fails ) { + logger.warn("Fail: " + fail.failMessage); + } + Assert.fail("Test failed: " + name); } return md5s; diff --git a/public/java/test/org/broadinstitute/sting/commandline/ArgumentMatchSiteUnitTest.java b/public/java/test/org/broadinstitute/sting/commandline/ArgumentMatchSiteUnitTest.java new file mode 100644 index 000000000..99d6b88f3 --- /dev/null +++ b/public/java/test/org/broadinstitute/sting/commandline/ArgumentMatchSiteUnitTest.java @@ -0,0 +1,79 @@ +/* + * Copyright (c) 2011, The Broad Institute + * + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The above copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * OTHER DEALINGS IN THE SOFTWARE. 
+ */ + +package org.broadinstitute.sting.commandline; + +import org.testng.Assert; +import org.testng.annotations.Test; + +import java.io.File; + +public class ArgumentMatchSiteUnitTest { + @Test + public void testCommandLine() { + ArgumentMatchSite site = new ArgumentMatchSite(ArgumentMatchSource.COMMAND_LINE, 1); + Assert.assertEquals(site.getSource(), ArgumentMatchSource.COMMAND_LINE); + Assert.assertEquals(site.getIndex(), 1); + } + + @Test + public void testFile() { + ArgumentMatchSource source = new ArgumentMatchSource(new File("test")); + ArgumentMatchSite site = new ArgumentMatchSite(source, 1); + Assert.assertEquals(site.getSource(), source); + Assert.assertEquals(site.getIndex(), 1); + } + + @Test + public void testEquals() { + ArgumentMatchSource cmdLine = ArgumentMatchSource.COMMAND_LINE; + ArgumentMatchSite site1 = new ArgumentMatchSite(cmdLine, 1); + ArgumentMatchSite site2 = new ArgumentMatchSite(cmdLine, 2); + + Assert.assertFalse(site1.equals(null)); + + Assert.assertTrue(site1.equals(site1)); + Assert.assertFalse(site1.equals(site2)); + + Assert.assertFalse(site2.equals(site1)); + Assert.assertTrue(site2.equals(site2)); + } + + @Test + public void testCompareTo() { + ArgumentMatchSource cmdLine = ArgumentMatchSource.COMMAND_LINE; + ArgumentMatchSite site1 = new ArgumentMatchSite(cmdLine, 1); + ArgumentMatchSite site2 = new ArgumentMatchSite(cmdLine, 2); + + Assert.assertTrue(site1.compareTo(site1) == 0); + Assert.assertTrue(site1.compareTo(site2) < 0); + Assert.assertTrue(site2.compareTo(site1) > 0); + Assert.assertTrue(site2.compareTo(site2) == 0); + } + + @Test(expectedExceptions = NullPointerException.class) + public void testCompareToNull() { + new ArgumentMatchSite(ArgumentMatchSource.COMMAND_LINE, 0).compareTo(null); + } +} diff --git a/public/java/test/org/broadinstitute/sting/commandline/ArgumentMatchSourceUnitTest.java b/public/java/test/org/broadinstitute/sting/commandline/ArgumentMatchSourceUnitTest.java new file mode 100644 index 
000000000..4bc7eb822 --- /dev/null +++ b/public/java/test/org/broadinstitute/sting/commandline/ArgumentMatchSourceUnitTest.java @@ -0,0 +1,98 @@ +/* + * Copyright (c) 2011, The Broad Institute + * + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The above copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * OTHER DEALINGS IN THE SOFTWARE. 
+ */ + +package org.broadinstitute.sting.commandline; + +import org.broadinstitute.sting.BaseTest; +import org.testng.Assert; +import org.testng.annotations.Test; + +import java.io.File; + +public class ArgumentMatchSourceUnitTest extends BaseTest { + @Test + public void testCommandLine() { + ArgumentMatchSource source = ArgumentMatchSource.COMMAND_LINE; + Assert.assertEquals(source.getType(), ArgumentMatchSourceType.CommandLine); + Assert.assertNull(source.getFile()); + } + + @Test + public void testFile() { + File f = new File("test"); + ArgumentMatchSource source = new ArgumentMatchSource(f); + Assert.assertEquals(source.getType(), ArgumentMatchSourceType.File); + Assert.assertEquals(source.getFile(), f); + } + + @Test(expectedExceptions = IllegalArgumentException.class) + public void testNullFile() { + new ArgumentMatchSource(null); + } + + @Test + public void testEquals() { + ArgumentMatchSource cmdLine = ArgumentMatchSource.COMMAND_LINE; + ArgumentMatchSource fileA = new ArgumentMatchSource(new File("a")); + ArgumentMatchSource fileB = new ArgumentMatchSource(new File("b")); + + Assert.assertFalse(cmdLine.equals(null)); + + Assert.assertTrue(cmdLine.equals(cmdLine)); + Assert.assertFalse(cmdLine.equals(fileA)); + Assert.assertFalse(cmdLine.equals(fileB)); + + Assert.assertFalse(fileA.equals(cmdLine)); + Assert.assertTrue(fileA.equals(fileA)); + Assert.assertFalse(fileA.equals(fileB)); + + Assert.assertFalse(fileB.equals(cmdLine)); + Assert.assertFalse(fileB.equals(fileA)); + Assert.assertTrue(fileB.equals(fileB)); + } + + @Test + public void testCompareTo() { + ArgumentMatchSource cmdLine = ArgumentMatchSource.COMMAND_LINE; + ArgumentMatchSource fileA = new ArgumentMatchSource(new File("a")); + ArgumentMatchSource fileB = new ArgumentMatchSource(new File("b")); + + Assert.assertTrue(cmdLine.compareTo(cmdLine) == 0); + Assert.assertTrue(cmdLine.compareTo(fileA) < 0); + Assert.assertTrue(cmdLine.compareTo(fileB) < 0); + + 
Assert.assertTrue(fileA.compareTo(cmdLine) > 0); + Assert.assertTrue(fileA.compareTo(fileA) == 0); + Assert.assertTrue(fileA.compareTo(fileB) < 0); + + Assert.assertTrue(fileB.compareTo(cmdLine) > 0); + Assert.assertTrue(fileB.compareTo(fileA) > 0); + Assert.assertTrue(fileB.compareTo(fileB) == 0); + } + + @Test(expectedExceptions = NullPointerException.class) + public void testCompareToNull() { + ArgumentMatchSource.COMMAND_LINE.compareTo(null); + } +} diff --git a/public/java/test/org/broadinstitute/sting/commandline/ParsingEngineUnitTest.java b/public/java/test/org/broadinstitute/sting/commandline/ParsingEngineUnitTest.java index f04731214..87f0e6ff0 100755 --- a/public/java/test/org/broadinstitute/sting/commandline/ParsingEngineUnitTest.java +++ b/public/java/test/org/broadinstitute/sting/commandline/ParsingEngineUnitTest.java @@ -25,6 +25,7 @@ package org.broadinstitute.sting.commandline; +import org.apache.commons.io.FileUtils; import org.broad.tribble.Feature; import org.broadinstitute.sting.utils.exceptions.UserException; import org.broadinstitute.sting.utils.variantcontext.VariantContext; @@ -34,6 +35,8 @@ import org.broadinstitute.sting.utils.exceptions.ReviewedStingException; import org.testng.annotations.BeforeMethod; import org.testng.annotations.Test; +import java.io.File; +import java.io.IOException; import java.util.List; import java.util.EnumSet; /** @@ -493,6 +496,7 @@ public class ParsingEngineUnitTest extends BaseTest { Assert.assertNotNull(definition, "Invalid default argument name assigned"); } + @SuppressWarnings("unused") private class CamelCaseArgProvider { @Argument(doc="my arg") Integer myArg; @@ -507,6 +511,7 @@ public class ParsingEngineUnitTest extends BaseTest { parsingEngine.validate(); } + @SuppressWarnings("unused") private class BooleanArgProvider { @Argument(doc="my bool") boolean myBool; @@ -561,6 +566,7 @@ public class ParsingEngineUnitTest extends BaseTest { parsingEngine.validate(); } + @SuppressWarnings("unused") private 
class MutuallyExclusiveArgProvider { @Argument(doc="foo",exclusiveOf="bar") Integer foo; @@ -618,6 +624,7 @@ public class ParsingEngineUnitTest extends BaseTest { parsingEngine.addArgumentSource( MultipleArgumentCollectionProvider.class ); } + @SuppressWarnings("unused") private class MultipleArgumentCollectionProvider { @ArgumentCollection RequiredArgProvider rap1 = new RequiredArgProvider(); @@ -937,4 +944,23 @@ public class ParsingEngineUnitTest extends BaseTest { VariantContextRodBindingArgProvider argProvider = new VariantContextRodBindingArgProvider(); parsingEngine.loadArgumentsIntoObject( argProvider ); } + + @Test + public void argumentListTest() throws IOException { + File argsFile = BaseTest.createTempFile("args.", ".list"); + try { + FileUtils.write(argsFile, "-I na12878.bam"); + final String[] commandLine = new String[] {"-args", argsFile.getPath()}; + parsingEngine.addArgumentSource(InputFileArgProvider.class); + parsingEngine.parse(commandLine); + parsingEngine.validate(); + + InputFileArgProvider argProvider = new InputFileArgProvider(); + parsingEngine.loadArgumentsIntoObject(argProvider); + + Assert.assertEquals(argProvider.inputFile, "na12878.bam", "Argument is not correctly initialized"); + } finally { + FileUtils.deleteQuietly(argsFile); + } + } } diff --git a/public/java/test/org/broadinstitute/sting/gatk/GenomeAnalysisEngineUnitTest.java b/public/java/test/org/broadinstitute/sting/gatk/GenomeAnalysisEngineUnitTest.java index 1e4625bf0..3ce62b697 100644 --- a/public/java/test/org/broadinstitute/sting/gatk/GenomeAnalysisEngineUnitTest.java +++ b/public/java/test/org/broadinstitute/sting/gatk/GenomeAnalysisEngineUnitTest.java @@ -28,24 +28,25 @@ import net.sf.picard.reference.IndexedFastaSequenceFile; import net.sf.picard.util.Interval; import net.sf.picard.util.IntervalList; import net.sf.samtools.SAMFileHeader; +import org.broad.tribble.Feature; import org.broadinstitute.sting.BaseTest; import 
org.broadinstitute.sting.commandline.ArgumentException; +import org.broadinstitute.sting.commandline.IntervalBinding; import org.broadinstitute.sting.gatk.arguments.GATKArgumentCollection; import org.broadinstitute.sting.gatk.datasources.reads.SAMReaderID; import org.broadinstitute.sting.commandline.Tags; import org.broadinstitute.sting.gatk.walkers.PrintReadsWalker; -import org.broadinstitute.sting.utils.GenomeLoc; import org.broadinstitute.sting.utils.GenomeLocParser; import org.broadinstitute.sting.utils.GenomeLocSortedSet; import org.broadinstitute.sting.utils.exceptions.UserException; +import org.broadinstitute.sting.utils.interval.IntervalSetRule; import org.testng.annotations.DataProvider; import org.testng.annotations.Test; import java.io.File; import java.io.PrintWriter; import java.util.ArrayList; -import java.util.Arrays; import java.util.Collection; import java.util.List; @@ -72,7 +73,7 @@ public class GenomeAnalysisEngineUnitTest extends BaseTest { GenomeAnalysisEngine testEngine = new GenomeAnalysisEngine(); Collection samFiles = new ArrayList(); - samFiles.add(new SAMReaderID(new File("public/testdata/exampleBAM.bam"), new Tags())); + samFiles.add(new SAMReaderID(new File("public/testdata/exampleBAM.bam"), new Tags())); samFiles.add(new SAMReaderID(new File("public/testdata/exampleNORG.bam"), new Tags())); samFiles.add(new SAMReaderID(new File("public/testdata/exampleBAM.bam"), new Tags())); samFiles.add(new SAMReaderID(new File("public/testdata/exampleNORG.bam"), new Tags())); @@ -81,7 +82,7 @@ public class GenomeAnalysisEngineUnitTest extends BaseTest { testEngine.checkForDuplicateSamFiles(); } - @Test(expectedExceptions=ArgumentException.class) + @Test public void testEmptyIntervalSetHandling() throws Exception { GenomeAnalysisEngine testEngine = new GenomeAnalysisEngine(); @@ -108,31 +109,7 @@ public class GenomeAnalysisEngineUnitTest extends BaseTest { }; } - @Test(expectedExceptions=UserException.class, dataProvider="invalidIntervalTestData") - 
public void testInvalidRODIntervalHandling(GenomeAnalysisEngine testEngine, GenomeLocParser genomeLocParser, - String contig, int intervalStart, int intervalEnd ) throws Exception { - - List intervalArgs = new ArrayList(); - List rodIntervals = Arrays.asList(genomeLocParser.createGenomeLoc(contig, intervalStart, intervalEnd, true)); - - testEngine.loadIntervals(intervalArgs, rodIntervals); - } - - @Test(expectedExceptions=UserException.class, dataProvider="invalidIntervalTestData") - public void testInvalidBedIntervalHandling(GenomeAnalysisEngine testEngine, GenomeLocParser genomeLocParser, - String contig, int intervalStart, int intervalEnd ) throws Exception { - // We need to adjust intervalStart, since BED intervals are 0-based. We don't need to adjust intervalEnd, - // since the ending point is an open interval. - File bedFile = createTempFile("testInvalidBedIntervalHandling", ".bed", - String.format("%s %d %d", contig, intervalStart -1, intervalEnd)); - - List intervalArgs = Arrays.asList(bedFile.getAbsolutePath()); - List rodIntervals = new ArrayList(); - - testEngine.loadIntervals(intervalArgs, rodIntervals); - } - - @Test(expectedExceptions=UserException.class, dataProvider="invalidIntervalTestData") + @Test(dataProvider="invalidIntervalTestData") public void testInvalidPicardIntervalHandling(GenomeAnalysisEngine testEngine, GenomeLocParser genomeLocParser, String contig, int intervalStart, int intervalEnd ) throws Exception { @@ -144,10 +121,10 @@ public class GenomeAnalysisEngineUnitTest extends BaseTest { File picardIntervalFile = createTempFile("testInvalidPicardIntervalHandling", ".intervals"); picardIntervals.write(picardIntervalFile); - List intervalArgs = Arrays.asList(picardIntervalFile.getAbsolutePath()); - List rodIntervals = new ArrayList(); + List> intervalArgs = new ArrayList>(1); + intervalArgs.add(new IntervalBinding(picardIntervalFile.getAbsolutePath())); - testEngine.loadIntervals(intervalArgs, rodIntervals); + 
testEngine.loadIntervals(intervalArgs, IntervalSetRule.UNION); } @Test(expectedExceptions=UserException.class, dataProvider="invalidIntervalTestData") @@ -157,10 +134,10 @@ public class GenomeAnalysisEngineUnitTest extends BaseTest { File gatkIntervalFile = createTempFile("testInvalidGATKFileIntervalHandling", ".intervals", String.format("%s:%d-%d", contig, intervalStart, intervalEnd)); - List intervalArgs = Arrays.asList(gatkIntervalFile.getAbsolutePath()); - List rodIntervals = new ArrayList(); + List> intervalArgs = new ArrayList>(1); + intervalArgs.add(new IntervalBinding(gatkIntervalFile.getAbsolutePath())); - testEngine.loadIntervals(intervalArgs, rodIntervals); + testEngine.loadIntervals(intervalArgs, IntervalSetRule.UNION); } private File createTempFile( String tempFilePrefix, String tempFileExtension, String... lines ) throws Exception { diff --git a/public/java/test/org/broadinstitute/sting/gatk/arguments/GATKArgumentCollectionUnitTest.java b/public/java/test/org/broadinstitute/sting/gatk/arguments/GATKArgumentCollectionUnitTest.java deleted file mode 100755 index 3a242cb13..000000000 --- a/public/java/test/org/broadinstitute/sting/gatk/arguments/GATKArgumentCollectionUnitTest.java +++ /dev/null @@ -1,113 +0,0 @@ -package org.broadinstitute.sting.gatk.arguments; - -import org.broadinstitute.sting.BaseTest; -import org.testng.annotations.AfterMethod; -import org.testng.annotations.BeforeMethod; -import org.testng.annotations.Test; -import static org.testng.Assert.fail; - -import java.io.File; -import java.util.*; - -import net.sf.samtools.SAMFileReader; - -/* - * Copyright (c) 2009 The Broad Institute - * - * Permission is hereby granted, free of charge, to any person - * obtaining a copy of this software and associated documentation - * files (the "Software"), to deal in the Software without - * restriction, including without limitation the rights to use, - * copy, modify, merge, publish, distribute, sublicense, and/or sell - * copies of the Software, and 
to permit persons to whom the - * Software is furnished to do so, subject to the following - * conditions: - * - * The above copyright notice and this permission notice shall be - * included in all copies or substantial portions of the Software. - * - * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, - * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES - * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND - * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT - * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, - * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING - * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR - * OTHER DEALINGS IN THE SOFTWARE. - */ - -/** - * @author aaron - * @version 1.0 - * @date May 7, 2009 - *

    - * Class GATKArgumentCollection - *

    - * Test out the argument collection class - */ -public class GATKArgumentCollectionUnitTest extends BaseTest { - - // our collection of arguments - private GATKArgumentCollection collect; - - // where to write our xml file - private String xmlFileLoc = "testfile.xml"; - - /** setup our test */ - @BeforeMethod - public void setup() { - collect = new GATKArgumentCollection(); - } - - /** destroy the temp file */ - @AfterMethod - public void takedown() { - File f = new File(xmlFileLoc); - if (f.exists()) { - f.delete(); - } - } - - private void setupCollection() { - // parameters and their defaults - Map wArgs = new HashMap(); - wArgs.put("wArgType1", "Arg1"); - wArgs.put("wArgType2", "Arg2"); - wArgs.put("wArgType3", "Arg3"); - collect.walkerArgs = wArgs; - - List input = new ArrayList(); - input.add("test.file"); - collect.samFiles = input; - collect.strictnessLevel = SAMFileReader.ValidationStringency.STRICT; - collect.referenceFile = new File("referenceFile".toLowerCase()); - collect.unsafe = ValidationExclusion.TYPE.ALL; - collect.downsampleFraction = null; - collect.downsampleCoverage = null; - collect.intervals = new ArrayList(); - collect.intervals.add("intervals".toLowerCase()); - collect.excludeIntervals = new ArrayList(); - collect.numberOfThreads = 1; - } - - - /** test the output of an XML file in the arg collection */ - @Test - public void testOutput() { - setupCollection(); - - GATKArgumentCollection.marshal(collect, xmlFileLoc); - GATKArgumentCollection collection = GATKArgumentCollection.unmarshal(xmlFileLoc); - if (!collect.equals(collection)) { - fail("Collections not equal"); - } - } - - - /** test the output of an XML file in the arg collection */ - @Test - public void testInput() { - setupCollection(); - GATKArgumentCollection.marshal(collect, xmlFileLoc); - } -} diff --git a/public/java/test/org/broadinstitute/sting/gatk/datasources/providers/AllLocusViewUnitTest.java 
b/public/java/test/org/broadinstitute/sting/gatk/datasources/providers/AllLocusViewUnitTest.java index 9807cede4..ecb865f0c 100755 --- a/public/java/test/org/broadinstitute/sting/gatk/datasources/providers/AllLocusViewUnitTest.java +++ b/public/java/test/org/broadinstitute/sting/gatk/datasources/providers/AllLocusViewUnitTest.java @@ -1,11 +1,10 @@ package org.broadinstitute.sting.gatk.datasources.providers; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; import org.testng.Assert; import org.broadinstitute.sting.utils.GenomeLoc; -import org.broadinstitute.sting.utils.GenomeLocParser; import org.broadinstitute.sting.gatk.contexts.AlignmentContext; -import net.sf.samtools.SAMRecord; import java.util.List; /** @@ -38,7 +37,7 @@ public class AllLocusViewUnitTest extends LocusViewTemplate { * @param reads */ @Override - protected void testReadsInContext( LocusView view, List range, List reads ) { + protected void testReadsInContext( LocusView view, List range, List reads ) { AllLocusView allLocusView = (AllLocusView)view; // TODO: Should skip over loci not in the given range. 
@@ -52,7 +51,7 @@ public class AllLocusViewUnitTest extends LocusViewTemplate { Assert.assertEquals(locusContext.getLocation(), site, "Locus context location is incorrect"); int expectedReadsAtSite = 0; - for( SAMRecord read: reads ) { + for( GATKSAMRecord read: reads ) { if(genomeLocParser.createGenomeLoc(read).containsP(locusContext.getLocation())) { Assert.assertTrue(locusContext.getReads().contains(read),"Target locus context does not contain reads"); expectedReadsAtSite++; diff --git a/public/java/test/org/broadinstitute/sting/gatk/datasources/providers/CoveredLocusViewUnitTest.java b/public/java/test/org/broadinstitute/sting/gatk/datasources/providers/CoveredLocusViewUnitTest.java index 75716eae6..3a0caef51 100755 --- a/public/java/test/org/broadinstitute/sting/gatk/datasources/providers/CoveredLocusViewUnitTest.java +++ b/public/java/test/org/broadinstitute/sting/gatk/datasources/providers/CoveredLocusViewUnitTest.java @@ -1,11 +1,11 @@ package org.broadinstitute.sting.gatk.datasources.providers; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; import org.testng.Assert; import org.broadinstitute.sting.utils.GenomeLoc; import org.broadinstitute.sting.utils.GenomeLocParser; import org.broadinstitute.sting.gatk.contexts.AlignmentContext; -import net.sf.samtools.SAMRecord; import java.util.List; /** @@ -41,7 +41,7 @@ public class CoveredLocusViewUnitTest extends LocusViewTemplate { * @param reads */ @Override - protected void testReadsInContext( LocusView view, List range, List reads ) { + protected void testReadsInContext( LocusView view, List range, List reads ) { CoveredLocusView coveredLocusView = (CoveredLocusView)view; // TODO: Should skip over loci not in the given range. 
@@ -53,7 +53,7 @@ public class CoveredLocusViewUnitTest extends LocusViewTemplate { GenomeLoc site = genomeLocParser.createGenomeLoc("chr1",i); int expectedReadsAtSite = 0; - for( SAMRecord read: reads ) { + for( GATKSAMRecord read: reads ) { if( genomeLocParser.createGenomeLoc(read).containsP(site) ) expectedReadsAtSite++; } @@ -67,7 +67,7 @@ public class CoveredLocusViewUnitTest extends LocusViewTemplate { Assert.assertEquals(locusContext.getLocation(), site, "Target locus context location is incorrect"); Assert.assertEquals(locusContext.getReads().size(), expectedReadsAtSite, "Found wrong number of reads at site"); - for( SAMRecord read: reads ) { + for( GATKSAMRecord read: reads ) { if(genomeLocParser.createGenomeLoc(read).containsP(locusContext.getLocation())) Assert.assertTrue(locusContext.getReads().contains(read),"Target locus context does not contain reads"); } diff --git a/public/java/test/org/broadinstitute/sting/gatk/datasources/providers/LocusViewTemplate.java b/public/java/test/org/broadinstitute/sting/gatk/datasources/providers/LocusViewTemplate.java index e5cf80826..8d7dd82ac 100755 --- a/public/java/test/org/broadinstitute/sting/gatk/datasources/providers/LocusViewTemplate.java +++ b/public/java/test/org/broadinstitute/sting/gatk/datasources/providers/LocusViewTemplate.java @@ -8,13 +8,12 @@ import org.broadinstitute.sting.gatk.datasources.reads.MockLocusShard; import org.broadinstitute.sting.gatk.datasources.reads.SAMReaderID; import org.broadinstitute.sting.gatk.datasources.reads.Shard; import org.broadinstitute.sting.gatk.executive.WindowMaker; -import org.broadinstitute.sting.gatk.datasources.sample.SampleDataSource; import org.broadinstitute.sting.gatk.datasources.reads.LocusShard; import org.broadinstitute.sting.gatk.datasources.reads.SAMDataSource; import org.broadinstitute.sting.gatk.iterators.StingSAMIterator; -import org.broadinstitute.sting.gatk.iterators.LocusIteratorByState; import org.broadinstitute.sting.utils.GenomeLoc; import 
org.broadinstitute.sting.utils.GenomeLocParser; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; import org.testng.annotations.BeforeClass; import org.testng.annotations.Test; @@ -51,23 +50,23 @@ public abstract class LocusViewTemplate extends BaseTest { GenomeLoc shardBounds = genomeLocParser.createGenomeLoc("chr1", 1, 5); Shard shard = new LocusShard(genomeLocParser, new SAMDataSource(Collections.emptyList(),genomeLocParser),Collections.singletonList(shardBounds),Collections.emptyMap()); - WindowMaker windowMaker = new WindowMaker(shard,genomeLocParser,iterator,shard.getGenomeLocs(), new SampleDataSource()); + WindowMaker windowMaker = new WindowMaker(shard,genomeLocParser,iterator,shard.getGenomeLocs()); WindowMaker.WindowMakerIterator window = windowMaker.next(); LocusShardDataProvider dataProvider = new LocusShardDataProvider(shard, null, genomeLocParser, window.getLocus(), window, null, null); LocusView view = createView(dataProvider); - testReadsInContext(view, shard.getGenomeLocs(), Collections.emptyList()); + testReadsInContext(view, shard.getGenomeLocs(), Collections.emptyList()); } @Test public void singleReadTest() { - SAMRecord read = buildSAMRecord("chr1", 1, 5); + GATKSAMRecord read = buildSAMRecord("read1","chr1", 1, 5); SAMRecordIterator iterator = new SAMRecordIterator(read); GenomeLoc shardBounds = genomeLocParser.createGenomeLoc("chr1", 1, 5); Shard shard = new MockLocusShard(genomeLocParser,Collections.singletonList(shardBounds)); - WindowMaker windowMaker = new WindowMaker(shard,genomeLocParser,iterator,shard.getGenomeLocs(), new SampleDataSource()); + WindowMaker windowMaker = new WindowMaker(shard,genomeLocParser,iterator,shard.getGenomeLocs()); WindowMaker.WindowMakerIterator window = windowMaker.next(); LocusShardDataProvider dataProvider = new LocusShardDataProvider(shard, window.getSourceInfo(), genomeLocParser, window.getLocus(), window, null, null); @@ -78,11 +77,11 @@ public abstract class LocusViewTemplate extends BaseTest { 
@Test public void readCoveringFirstPartTest() { - SAMRecord read = buildSAMRecord("chr1", 1, 5); + GATKSAMRecord read = buildSAMRecord("read1","chr1", 1, 5); SAMRecordIterator iterator = new SAMRecordIterator(read); Shard shard = new MockLocusShard(genomeLocParser,Collections.singletonList(genomeLocParser.createGenomeLoc("chr1", 1, 10))); - WindowMaker windowMaker = new WindowMaker(shard,genomeLocParser,iterator,shard.getGenomeLocs(),new SampleDataSource()); + WindowMaker windowMaker = new WindowMaker(shard,genomeLocParser,iterator,shard.getGenomeLocs()); WindowMaker.WindowMakerIterator window = windowMaker.next(); LocusShardDataProvider dataProvider = new LocusShardDataProvider(shard, window.getSourceInfo(), genomeLocParser, window.getLocus(), window, null, null); LocusView view = createView(dataProvider); @@ -92,11 +91,11 @@ public abstract class LocusViewTemplate extends BaseTest { @Test public void readCoveringLastPartTest() { - SAMRecord read = buildSAMRecord("chr1", 6, 10); + GATKSAMRecord read = buildSAMRecord("read1","chr1", 6, 10); SAMRecordIterator iterator = new SAMRecordIterator(read); Shard shard = new MockLocusShard(genomeLocParser,Collections.singletonList(genomeLocParser.createGenomeLoc("chr1", 1, 10))); - WindowMaker windowMaker = new WindowMaker(shard,genomeLocParser,iterator,shard.getGenomeLocs(), new SampleDataSource()); + WindowMaker windowMaker = new WindowMaker(shard,genomeLocParser,iterator,shard.getGenomeLocs()); WindowMaker.WindowMakerIterator window = windowMaker.next(); LocusShardDataProvider dataProvider = new LocusShardDataProvider(shard, window.getSourceInfo(), genomeLocParser, window.getLocus(), window, null, null); LocusView view = createView(dataProvider); @@ -106,11 +105,11 @@ public abstract class LocusViewTemplate extends BaseTest { @Test public void readCoveringMiddleTest() { - SAMRecord read = buildSAMRecord("chr1", 3, 7); + GATKSAMRecord read = buildSAMRecord("read1","chr1", 3, 7); SAMRecordIterator iterator = new 
SAMRecordIterator(read); Shard shard = new MockLocusShard(genomeLocParser,Collections.singletonList(genomeLocParser.createGenomeLoc("chr1", 1, 10))); - WindowMaker windowMaker = new WindowMaker(shard,genomeLocParser,iterator,shard.getGenomeLocs(), new SampleDataSource()); + WindowMaker windowMaker = new WindowMaker(shard,genomeLocParser,iterator,shard.getGenomeLocs()); WindowMaker.WindowMakerIterator window = windowMaker.next(); LocusShardDataProvider dataProvider = new LocusShardDataProvider(shard, window.getSourceInfo(), genomeLocParser, window.getLocus(), window, null, null); LocusView view = createView(dataProvider); @@ -120,11 +119,11 @@ public abstract class LocusViewTemplate extends BaseTest { @Test public void readAndLocusOverlapAtLastBase() { - SAMRecord read = buildSAMRecord("chr1", 1, 5); + GATKSAMRecord read = buildSAMRecord("read1","chr1", 1, 5); SAMRecordIterator iterator = new SAMRecordIterator(read); Shard shard = new MockLocusShard(genomeLocParser,Collections.singletonList(genomeLocParser.createGenomeLoc("chr1", 5, 5))); - WindowMaker windowMaker = new WindowMaker(shard,genomeLocParser,iterator,shard.getGenomeLocs(),new SampleDataSource()); + WindowMaker windowMaker = new WindowMaker(shard,genomeLocParser,iterator,shard.getGenomeLocs()); WindowMaker.WindowMakerIterator window = windowMaker.next(); LocusShardDataProvider dataProvider = new LocusShardDataProvider(shard, window.getSourceInfo(), genomeLocParser, window.getLocus(), window, null, null); LocusView view = createView(dataProvider); @@ -134,11 +133,11 @@ public abstract class LocusViewTemplate extends BaseTest { @Test public void readOverlappingStartTest() { - SAMRecord read = buildSAMRecord("chr1", 1, 10); + GATKSAMRecord read = buildSAMRecord("read1","chr1", 1, 10); SAMRecordIterator iterator = new SAMRecordIterator(read); Shard shard = new MockLocusShard(genomeLocParser,Collections.singletonList(genomeLocParser.createGenomeLoc("chr1", 6, 15))); - WindowMaker windowMaker = new 
WindowMaker(shard,genomeLocParser,iterator,shard.getGenomeLocs(), new SampleDataSource()); + WindowMaker windowMaker = new WindowMaker(shard,genomeLocParser,iterator,shard.getGenomeLocs()); WindowMaker.WindowMakerIterator window = windowMaker.next(); LocusShardDataProvider dataProvider = new LocusShardDataProvider(shard, window.getSourceInfo(), genomeLocParser, window.getLocus(), window, null, null); LocusView view = createView(dataProvider); @@ -148,11 +147,11 @@ public abstract class LocusViewTemplate extends BaseTest { @Test public void readOverlappingEndTest() { - SAMRecord read = buildSAMRecord("chr1", 6, 15); + GATKSAMRecord read = buildSAMRecord("read1","chr1", 6, 15); SAMRecordIterator iterator = new SAMRecordIterator(read); Shard shard = new MockLocusShard(genomeLocParser,Collections.singletonList(genomeLocParser.createGenomeLoc("chr1", 1, 10))); - WindowMaker windowMaker = new WindowMaker(shard,genomeLocParser,iterator,shard.getGenomeLocs(),new SampleDataSource()); + WindowMaker windowMaker = new WindowMaker(shard,genomeLocParser,iterator,shard.getGenomeLocs()); WindowMaker.WindowMakerIterator window = windowMaker.next(); LocusShardDataProvider dataProvider = new LocusShardDataProvider(shard, window.getSourceInfo(), genomeLocParser, window.getLocus(), window, null, null); LocusView view = createView(dataProvider); @@ -162,104 +161,104 @@ public abstract class LocusViewTemplate extends BaseTest { @Test public void readsSpanningTest() { - SAMRecord read1 = buildSAMRecord("chr1", 1, 5); - SAMRecord read2 = buildSAMRecord("chr1", 6, 10); + GATKSAMRecord read1 = buildSAMRecord("read1","chr1", 1, 5); + GATKSAMRecord read2 = buildSAMRecord("read2","chr1", 6, 10); SAMRecordIterator iterator = new SAMRecordIterator(read1, read2); Shard shard = new MockLocusShard(genomeLocParser,Collections.singletonList(genomeLocParser.createGenomeLoc("chr1", 1, 10))); - WindowMaker windowMaker = new WindowMaker(shard,genomeLocParser,iterator,shard.getGenomeLocs(),new 
SampleDataSource()); + WindowMaker windowMaker = new WindowMaker(shard,genomeLocParser,iterator,shard.getGenomeLocs()); WindowMaker.WindowMakerIterator window = windowMaker.next(); LocusShardDataProvider dataProvider = new LocusShardDataProvider(shard, window.getSourceInfo(), genomeLocParser, window.getLocus(), window, null, null); LocusView view = createView(dataProvider); - List expectedReads = new ArrayList(); + List expectedReads = new ArrayList(); Collections.addAll(expectedReads, read1, read2); testReadsInContext(view, shard.getGenomeLocs(), expectedReads); } @Test public void duplicateReadsTest() { - SAMRecord read1 = buildSAMRecord("chr1", 1, 5); - SAMRecord read2 = buildSAMRecord("chr1", 1, 5); - SAMRecord read3 = buildSAMRecord("chr1", 6, 10); - SAMRecord read4 = buildSAMRecord("chr1", 6, 10); + GATKSAMRecord read1 = buildSAMRecord("read1","chr1", 1, 5); + GATKSAMRecord read2 = buildSAMRecord("read2","chr1", 1, 5); + GATKSAMRecord read3 = buildSAMRecord("read3","chr1", 6, 10); + GATKSAMRecord read4 = buildSAMRecord("read4","chr1", 6, 10); SAMRecordIterator iterator = new SAMRecordIterator(read1, read2, read3, read4); Shard shard = new MockLocusShard(genomeLocParser,Collections.singletonList(genomeLocParser.createGenomeLoc("chr1", 1, 10))); - WindowMaker windowMaker = new WindowMaker(shard,genomeLocParser,iterator,shard.getGenomeLocs(),new SampleDataSource()); + WindowMaker windowMaker = new WindowMaker(shard,genomeLocParser,iterator,shard.getGenomeLocs()); WindowMaker.WindowMakerIterator window = windowMaker.next(); LocusShardDataProvider dataProvider = new LocusShardDataProvider(shard, window.getSourceInfo(), genomeLocParser, window.getLocus(), window, null, null); LocusView view = createView(dataProvider); - List expectedReads = new ArrayList(); + List expectedReads = new ArrayList(); Collections.addAll(expectedReads, read1, read2, read3, read4); testReadsInContext(view, shard.getGenomeLocs(), expectedReads); } @Test public void 
cascadingReadsWithinBoundsTest() { - SAMRecord read1 = buildSAMRecord("chr1", 2, 6); - SAMRecord read2 = buildSAMRecord("chr1", 3, 7); - SAMRecord read3 = buildSAMRecord("chr1", 4, 8); - SAMRecord read4 = buildSAMRecord("chr1", 5, 9); + GATKSAMRecord read1 = buildSAMRecord("read1","chr1", 2, 6); + GATKSAMRecord read2 = buildSAMRecord("read2","chr1", 3, 7); + GATKSAMRecord read3 = buildSAMRecord("read3","chr1", 4, 8); + GATKSAMRecord read4 = buildSAMRecord("read4","chr1", 5, 9); SAMRecordIterator iterator = new SAMRecordIterator(read1, read2, read3, read4); Shard shard = new MockLocusShard(genomeLocParser,Collections.singletonList(genomeLocParser.createGenomeLoc("chr1", 1, 10))); - WindowMaker windowMaker = new WindowMaker(shard,genomeLocParser,iterator,shard.getGenomeLocs(),new SampleDataSource()); + WindowMaker windowMaker = new WindowMaker(shard,genomeLocParser,iterator,shard.getGenomeLocs()); WindowMaker.WindowMakerIterator window = windowMaker.next(); LocusShardDataProvider dataProvider = new LocusShardDataProvider(shard, window.getSourceInfo(), genomeLocParser, window.getLocus(), window, null, null); LocusView view = createView(dataProvider); - List expectedReads = new ArrayList(); + List expectedReads = new ArrayList(); Collections.addAll(expectedReads, read1, read2, read3, read4); testReadsInContext(view, shard.getGenomeLocs(), expectedReads); } @Test public void cascadingReadsAtBoundsTest() { - SAMRecord read1 = buildSAMRecord("chr1", 1, 5); - SAMRecord read2 = buildSAMRecord("chr1", 2, 6); - SAMRecord read3 = buildSAMRecord("chr1", 3, 7); - SAMRecord read4 = buildSAMRecord("chr1", 4, 8); - SAMRecord read5 = buildSAMRecord("chr1", 5, 9); - SAMRecord read6 = buildSAMRecord("chr1", 6, 10); + GATKSAMRecord read1 = buildSAMRecord("read1","chr1", 1, 5); + GATKSAMRecord read2 = buildSAMRecord("read2","chr1", 2, 6); + GATKSAMRecord read3 = buildSAMRecord("read3","chr1", 3, 7); + GATKSAMRecord read4 = buildSAMRecord("read4","chr1", 4, 8); + GATKSAMRecord read5 = 
buildSAMRecord("read5","chr1", 5, 9); + GATKSAMRecord read6 = buildSAMRecord("read6","chr1", 6, 10); SAMRecordIterator iterator = new SAMRecordIterator(read1, read2, read3, read4, read5, read6); Shard shard = new MockLocusShard(genomeLocParser,Collections.singletonList(genomeLocParser.createGenomeLoc("chr1", 1, 10))); - WindowMaker windowMaker = new WindowMaker(shard,genomeLocParser,iterator,shard.getGenomeLocs(), new SampleDataSource()); + WindowMaker windowMaker = new WindowMaker(shard,genomeLocParser,iterator,shard.getGenomeLocs()); WindowMaker.WindowMakerIterator window = windowMaker.next(); LocusShardDataProvider dataProvider = new LocusShardDataProvider(shard, window.getSourceInfo(), genomeLocParser, window.getLocus(), window, null, null); LocusView view = createView(dataProvider); - List expectedReads = new ArrayList(); + List expectedReads = new ArrayList(); Collections.addAll(expectedReads, read1, read2, read3, read4, read5, read6); testReadsInContext(view, shard.getGenomeLocs(), expectedReads); } @Test public void cascadingReadsOverlappingBoundsTest() { - SAMRecord read01 = buildSAMRecord("chr1", 1, 5); - SAMRecord read02 = buildSAMRecord("chr1", 2, 6); - SAMRecord read03 = buildSAMRecord("chr1", 3, 7); - SAMRecord read04 = buildSAMRecord("chr1", 4, 8); - SAMRecord read05 = buildSAMRecord("chr1", 5, 9); - SAMRecord read06 = buildSAMRecord("chr1", 6, 10); - SAMRecord read07 = buildSAMRecord("chr1", 7, 11); - SAMRecord read08 = buildSAMRecord("chr1", 8, 12); - SAMRecord read09 = buildSAMRecord("chr1", 9, 13); - SAMRecord read10 = buildSAMRecord("chr1", 10, 14); - SAMRecord read11 = buildSAMRecord("chr1", 11, 15); - SAMRecord read12 = buildSAMRecord("chr1", 12, 16); + GATKSAMRecord read01 = buildSAMRecord("read1","chr1", 1, 5); + GATKSAMRecord read02 = buildSAMRecord("read2","chr1", 2, 6); + GATKSAMRecord read03 = buildSAMRecord("read3","chr1", 3, 7); + GATKSAMRecord read04 = buildSAMRecord("read4","chr1", 4, 8); + GATKSAMRecord read05 = 
buildSAMRecord("read5","chr1", 5, 9); + GATKSAMRecord read06 = buildSAMRecord("read6","chr1", 6, 10); + GATKSAMRecord read07 = buildSAMRecord("read7","chr1", 7, 11); + GATKSAMRecord read08 = buildSAMRecord("read8","chr1", 8, 12); + GATKSAMRecord read09 = buildSAMRecord("read9","chr1", 9, 13); + GATKSAMRecord read10 = buildSAMRecord("read10","chr1", 10, 14); + GATKSAMRecord read11 = buildSAMRecord("read11","chr1", 11, 15); + GATKSAMRecord read12 = buildSAMRecord("read12","chr1", 12, 16); SAMRecordIterator iterator = new SAMRecordIterator(read01, read02, read03, read04, read05, read06, read07, read08, read09, read10, read11, read12); Shard shard = new MockLocusShard(genomeLocParser,Collections.singletonList(genomeLocParser.createGenomeLoc("chr1", 6, 15))); - WindowMaker windowMaker = new WindowMaker(shard,genomeLocParser,iterator,shard.getGenomeLocs(), new SampleDataSource()); + WindowMaker windowMaker = new WindowMaker(shard,genomeLocParser,iterator,shard.getGenomeLocs()); WindowMaker.WindowMakerIterator window = windowMaker.next(); LocusShardDataProvider dataProvider = new LocusShardDataProvider(shard, window.getSourceInfo(), genomeLocParser, window.getLocus(), window, null, null); LocusView view = createView(dataProvider); - List expectedReads = new ArrayList(); + List expectedReads = new ArrayList(); Collections.addAll(expectedReads, read01, read02, read03, read04, read05, read06, read07, read08, read09, read10, read11, read12); testReadsInContext(view, shard.getGenomeLocs(), expectedReads); @@ -279,7 +278,7 @@ public abstract class LocusViewTemplate extends BaseTest { * @param bounds * @param reads */ - protected abstract void testReadsInContext(LocusView view, List bounds, List reads); + protected abstract void testReadsInContext(LocusView view, List bounds, List reads); /** * Fake a reference sequence file. Essentially, seek a header with a bunch of dummy data. 
@@ -323,12 +322,13 @@ public abstract class LocusViewTemplate extends BaseTest { * * @return New SAM Record */ - protected SAMRecord buildSAMRecord(String contig, int alignmentStart, int alignmentEnd) { + protected GATKSAMRecord buildSAMRecord(String readName, String contig, int alignmentStart, int alignmentEnd) { SAMFileHeader header = new SAMFileHeader(); header.setSequenceDictionary(sequenceSourceFile.getSequenceDictionary()); - SAMRecord record = new SAMRecord(header); + GATKSAMRecord record = new GATKSAMRecord(header); + record.setReadName(readName); record.setReferenceIndex(sequenceSourceFile.getSequenceDictionary().getSequenceIndex(contig)); record.setAlignmentStart(alignmentStart); Cigar cigar = new Cigar(); diff --git a/public/java/test/org/broadinstitute/sting/gatk/datasources/reads/DownsamplerBenchmark.java b/public/java/test/org/broadinstitute/sting/gatk/datasources/reads/DownsamplerBenchmark.java index 2ecd75754..5ee373e4f 100644 --- a/public/java/test/org/broadinstitute/sting/gatk/datasources/reads/DownsamplerBenchmark.java +++ b/public/java/test/org/broadinstitute/sting/gatk/datasources/reads/DownsamplerBenchmark.java @@ -26,7 +26,6 @@ package org.broadinstitute.sting.gatk.datasources.reads; import com.google.caliper.Param; import net.sf.picard.filter.FilteringIterator; -import net.sf.picard.filter.SamRecordFilter; import net.sf.samtools.SAMFileReader; import net.sf.samtools.SAMRecord; import org.broadinstitute.sting.commandline.Tags; @@ -34,15 +33,12 @@ import org.broadinstitute.sting.gatk.DownsamplingMethod; import org.broadinstitute.sting.gatk.ReadProperties; import org.broadinstitute.sting.gatk.arguments.GATKArgumentCollection; import org.broadinstitute.sting.gatk.arguments.ValidationExclusion; -import org.broadinstitute.sting.gatk.datasources.reads.SAMReaderID; -import org.broadinstitute.sting.gatk.datasources.sample.SampleDataSource; import org.broadinstitute.sting.gatk.filters.ReadFilter; import 
org.broadinstitute.sting.gatk.filters.UnmappedReadFilter; import org.broadinstitute.sting.gatk.iterators.LocusIteratorByState; import org.broadinstitute.sting.utils.GenomeLocParser; import org.broadinstitute.sting.utils.baq.BAQ; -import java.io.File; import java.util.Collections; import java.util.Iterator; @@ -88,12 +84,9 @@ public class DownsamplerBenchmark extends ReadProcessingBenchmark { (byte)0); GenomeLocParser genomeLocParser = new GenomeLocParser(reader.getFileHeader().getSequenceDictionary()); - SampleDataSource sampleDataSource = new SampleDataSource(); - sampleDataSource.addSamplesFromSAMHeader(reader.getFileHeader()); - // Filter unmapped reads. TODO: is this always strictly necessary? Who in the GATK normally filters these out? Iterator readIterator = new FilteringIterator(reader.iterator(),new UnmappedReadFilter()); - LocusIteratorByState locusIteratorByState = new LocusIteratorByState(readIterator,readProperties,genomeLocParser,sampleDataSource); + LocusIteratorByState locusIteratorByState = new LocusIteratorByState(readIterator,readProperties,genomeLocParser, LocusIteratorByState.sampleListForSAMWithoutReadGroups()); while(locusIteratorByState.hasNext()) { locusIteratorByState.next().getLocation(); } diff --git a/public/java/test/org/broadinstitute/sting/gatk/datasources/reads/GATKWalkerBenchmark.java b/public/java/test/org/broadinstitute/sting/gatk/datasources/reads/GATKWalkerBenchmark.java index 31458f835..564d1e2a3 100644 --- a/public/java/test/org/broadinstitute/sting/gatk/datasources/reads/GATKWalkerBenchmark.java +++ b/public/java/test/org/broadinstitute/sting/gatk/datasources/reads/GATKWalkerBenchmark.java @@ -25,13 +25,10 @@ package org.broadinstitute.sting.gatk.datasources.reads; import com.google.caliper.Param; -import net.sf.picard.filter.SamRecordFilter; -import net.sf.samtools.SAMRecord; import org.broadinstitute.sting.commandline.Tags; import org.broadinstitute.sting.gatk.GenomeAnalysisEngine; import 
org.broadinstitute.sting.gatk.arguments.GATKArgumentCollection; import org.broadinstitute.sting.gatk.contexts.ReferenceContext; -import org.broadinstitute.sting.gatk.datasources.reads.SAMReaderID; import org.broadinstitute.sting.gatk.filters.ReadFilter; import org.broadinstitute.sting.gatk.filters.UnmappedReadFilter; import org.broadinstitute.sting.gatk.refdata.ReadMetaDataTracker; @@ -41,9 +38,9 @@ import org.broadinstitute.sting.gatk.walkers.Walker; import org.broadinstitute.sting.gatk.walkers.qc.CountLociWalker; import org.broadinstitute.sting.gatk.walkers.qc.CountReadsWalker; import org.broadinstitute.sting.utils.classloader.JVMUtils; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; import java.io.File; -import java.lang.reflect.Field; import java.util.Collections; /** @@ -126,7 +123,7 @@ class CountBasesInReadPerformanceWalker extends ReadWalker { private long Gs; private long Ts; - public Integer map(ReferenceContext ref, SAMRecord read, ReadMetaDataTracker tracker) { + public Integer map(ReferenceContext ref, GATKSAMRecord read, ReadMetaDataTracker tracker) { for(byte base: read.getReadBases()) { switch(base) { case 'A': As++; break; diff --git a/public/java/test/org/broadinstitute/sting/gatk/datasources/sample/SampleDataSourceUnitTest.java b/public/java/test/org/broadinstitute/sting/gatk/datasources/sample/SampleDataSourceUnitTest.java deleted file mode 100644 index 59405c065..000000000 --- a/public/java/test/org/broadinstitute/sting/gatk/datasources/sample/SampleDataSourceUnitTest.java +++ /dev/null @@ -1,241 +0,0 @@ -package org.broadinstitute.sting.gatk.datasources.sample; - -import net.sf.samtools.SAMFileHeader; -import org.broadinstitute.sting.utils.variantcontext.Allele; -import org.broadinstitute.sting.utils.variantcontext.Genotype; -import org.broadinstitute.sting.utils.variantcontext.VariantContext; -import org.testng.Assert; -import org.broadinstitute.sting.BaseTest; -import org.broadinstitute.sting.utils.exceptions.StingException; - 
-import org.testng.annotations.Test; - -import java.io.File; -import java.util.*; - -/** - * Created by IntelliJ IDEA. - * User: brett - * Date: Sep 9, 2010 - * Time: 8:21:00 AM - */ -public class SampleDataSourceUnitTest extends BaseTest { - - // this empty header used to instantiate sampledatasource objects - private static SAMFileHeader header = new SAMFileHeader(); - - // all the test sample files are located here - private String sampleFilesDir = validationDataLocation + "samples/"; - - // make sure samples are created from the SAM file correctly - @Test() - public void loadSAMSamplesTest() { - SampleDataSource s = new SampleDataSource(header, null); - } - - // tests that a basic sample with relationships loads correctly - // Note that this is the only test for family relationships - we may want to expand this - @Test() - public void basicLoadSampleFileTest() { - File sampleFile = new File(sampleFilesDir + "basicSampleFile.yaml"); - SampleDataSource s = new SampleDataSource(header, makeFileList(sampleFile)); - Assert.assertTrue(s.sampleCount() == 5); - Sample sampleA = s.getSampleById("sampleA"); - Sample sampleB = s.getSampleById("sampleB"); - Assert.assertTrue(sampleB.getMother() == sampleA); - Assert.assertTrue(s.getChildren(sampleA).contains(sampleB)); - Set family = s.getFamily("family1"); - Assert.assertTrue(family.size() == 2); - Assert.assertTrue(family.contains(sampleA)); - Assert.assertTrue(family.contains(sampleB)); - } - - // but that file should fail if it has an extra character in it... - @Test(expectedExceptions=StingException.class) - public void loadInvalidSampleExtraCharText() { - File sampleFile = new File(sampleFilesDir + "invalidSyntaxExtraChar.yaml"); - SampleDataSource s = new SampleDataSource(header, makeFileList(sampleFile)); - } - - // ...or a typo... 
- @Test(expectedExceptions=StingException.class) - public void loadInvalidSampleTypoText() { - File sampleFile = new File(sampleFilesDir + "invalidSyntaxTypo.yaml"); - SampleDataSource s = new SampleDataSource(header, makeFileList(sampleFile)); - - } - - // ...or an extra unrecognized array - @Test(expectedExceptions=StingException.class) - public void loadInvalidSampleExtraArrayText() { - File sampleFile = new File(sampleFilesDir + "invalidSyntaxExtraArray.yaml"); - SampleDataSource s = new SampleDataSource(header, makeFileList(sampleFile)); - } - - // make sure aliases work - @Test(expectedExceptions=StingException.class) - public void sampleAliasText() { - File sampleFile = new File(sampleFilesDir + "basicSampleFileWithAlias.yaml"); - SampleDataSource s = new SampleDataSource(header, makeFileList(sampleFile)); - // this file has two samples, but one has an alias. let's make sure that checks out... - Assert.assertTrue(s.sampleCount() == 3); - Assert.assertTrue(s.getSampleById("sampleA") == s.getSampleById("sampleC")); - } - - // error is thrown if property is included that's not in properties array - @Test(expectedExceptions=StingException.class) - public void unallowedPropertySampleTest() { - File sampleFile = new File(sampleFilesDir + "basicSampleFileUnallowedProperty.yaml"); - SampleDataSource s = new SampleDataSource(header, makeFileList(sampleFile)); - } - - // same as above, with relationship - @Test(expectedExceptions=StingException.class) - public void unallowedRelationshipSampleTest() { - File sampleFile = new File(sampleFilesDir + "basicSampleFileUnallowedRelationship.yaml"); - SampleDataSource s = new SampleDataSource(header, makeFileList(sampleFile)); - } - - // two sample files - @Test() - public void twoSampleFilesTest() { - File sampleFile = new File(sampleFilesDir + "basicSampleFile.yaml"); - File secondFile = new File(sampleFilesDir + "basicSampleFileExt.yaml"); - ArrayList files = new ArrayList(); - files.add(sampleFile); - 
files.add(secondFile); - SampleDataSource s = new SampleDataSource(header, files); - Assert.assertTrue(s.getSampleById("sampleA").getProperty("propC").equals("valC")); - Assert.assertTrue(s.getSampleById("sampleA").getProperty("propA").equals("valA")); - } - - // two sample files, with contradictory properties - @Test(expectedExceptions=StingException.class) - public void twoContradictorySampleFilesTest() { - File sampleFile = new File(sampleFilesDir + "basicSampleFile.yaml"); - File secondFile = new File(sampleFilesDir + "basicSampleFileInvalidExt.yaml"); - ArrayList files = new ArrayList(); - files.add(sampleFile); - files.add(secondFile); - SampleDataSource s = new SampleDataSource(header, files); - } - - // three sample files - @Test() - public void threeSamplesTest() { - File sampleFile = new File(sampleFilesDir + "basicSampleFile.yaml"); - ArrayList files = new ArrayList(); - files.add(sampleFile); - files.add(new File(sampleFilesDir + "basicSampleFileExt.yaml")); - files.add(new File(sampleFilesDir + "basicSampleFileExt2.yaml")); - SampleDataSource s = new SampleDataSource(header, files); - Assert.assertTrue(s.sampleCount() == 6); - Assert.assertTrue(s.getSampleById("sampleE").getProperty("propC").equals("valC")); - Assert.assertTrue(s.getSampleById("sampleA").getProperty("propA").equals("valA")); - } - - /** - * testing getSamplesWithProperty - * in this file there are 5 samples - 2 with population "CEU", 1 with population "ABC", 1 with no population, - * and then the default null sample - */ - @Test() - public void getSamplesWithPropertyTest() { - File sampleFile = new File(sampleFilesDir + "sampleFileWithProperties.yaml"); - SampleDataSource s = new SampleDataSource(header, makeFileList(sampleFile)); - Assert.assertTrue(s.sampleCount() == 5); - Set ceuSamples = s.getSamplesWithProperty("population", "CEU"); - Assert.assertTrue(ceuSamples.size() == 2); - - Iterator i = ceuSamples.iterator(); - ArrayList sampleNames = new ArrayList(); - 
sampleNames.add(i.next().getId()); - sampleNames.add(i.next().getId()); - Assert.assertTrue(sampleNames.contains("sampleA")); - Assert.assertTrue(sampleNames.contains("sampleB")); - } - - // make sure we can import data types other than Strings - @Test() - public void sampleTestPropertyType() { - File sampleFile = new File(sampleFilesDir + "sampleFileOtherTypes.yaml"); - SampleDataSource s = new SampleDataSource(header, makeFileList(sampleFile)); - Sample sample = s.getSampleById("sampleA"); - Assert.assertTrue(sample.getProperty("a").getClass() == Integer.class); - Assert.assertTrue(sample.getProperty("b").getClass() == String.class); - Assert.assertTrue(sample.getProperty("c").getClass() == Double.class); - Assert.assertTrue(sample.getProperty("b").getClass() == String.class); - } - - /** - * check that getSamplesFromVariantContext works - * create a variant context with two sample names, and make sure the right samples are there - */ - @Test() - public void variantContextTest() { - SampleDataSource s = new SampleDataSource(header, null); - List alleleCollection = new ArrayList(); - Allele a1 = Allele.create("A", true); - alleleCollection.add(a1); - - Set genotypeCollection = new HashSet(); - genotypeCollection.add(new Genotype("NA123", alleleCollection)); - genotypeCollection.add(new Genotype("NA456", alleleCollection)); - - VariantContext v = new VariantContext("contextName", "chr1", 1, 1, alleleCollection, genotypeCollection); - - // make sure the set that's returned is the right size - HashSet set = (HashSet) s.getSamplesByVariantContext(v); - Assert.assertTrue(set.size() == 2); - - // make sure both samples are included - Iterator i = set.iterator(); - ArrayList sampleNames = new ArrayList(); - sampleNames.add(i.next().getId()); - sampleNames.add(i.next().getId()); - Assert.assertTrue(sampleNames.contains("NA123")); - Assert.assertTrue(sampleNames.contains("NA456")); - } - - /** - * checking subContextFromSampleProperty - */ - - /** - * check that 
subContextFromSampleProperty works - * create a variant context with four sample names, make sure that it filters correctly to 2 - */ - @Test() - public void subContextFromSamplePropertyTest() { - - File sampleFile = new File(sampleFilesDir + "sampleFileWithProperties.yaml"); - SampleDataSource s = new SampleDataSource(header, makeFileList(sampleFile)); - Assert.assertTrue(s.sampleCount() == 5); - - List alleleCollection = new ArrayList(); - Allele a1 = Allele.create("A", true); - alleleCollection.add(a1); - - Set genotypeCollection = new HashSet(); - genotypeCollection.add(new Genotype("NA123", alleleCollection)); - genotypeCollection.add(new Genotype("sampleA", alleleCollection)); - genotypeCollection.add(new Genotype("sampleB", alleleCollection)); - genotypeCollection.add(new Genotype("sampleC", alleleCollection)); - - VariantContext v = new VariantContext("contextName", "chr1", 1, 1, alleleCollection, genotypeCollection); - VariantContext subContext = s.subContextFromSampleProperty(v, "population", "CEU"); - - Assert.assertTrue(subContext.getSampleNames().contains("sampleA")); - Assert.assertTrue(subContext.getSampleNames().contains("sampleA")); - Assert.assertTrue(subContext.getSampleNames().size() == 2); - - } - - - // we create lots of single item lists... 
- private ArrayList makeFileList(File file) { - ArrayList a = new ArrayList(); - a.add(file); - return a; - } -} diff --git a/public/java/test/org/broadinstitute/sting/gatk/datasources/sample/SampleUnitTest.java b/public/java/test/org/broadinstitute/sting/gatk/datasources/sample/SampleUnitTest.java deleted file mode 100644 index 67e84cdd8..000000000 --- a/public/java/test/org/broadinstitute/sting/gatk/datasources/sample/SampleUnitTest.java +++ /dev/null @@ -1,64 +0,0 @@ -package org.broadinstitute.sting.gatk.datasources.sample; - -import org.testng.Assert; -import org.broadinstitute.sting.BaseTest; - -import org.testng.annotations.BeforeClass; -import org.testng.annotations.Test; - -/** - * Created by IntelliJ IDEA. - * User: brett - * Date: Sep 9, 2010 - * Time: 8:21:00 AM - */ -public class SampleUnitTest extends BaseTest { - - static Sample sampleA; - static Sample sampleA1; - static Sample sampleB; - static Sample sampleC; - - @BeforeClass - public void init() { - sampleA = new Sample("sampleA"); - sampleA.setProperty("uniqueProperty", "uniqueValue"); - sampleA1 = new Sample("sampleA"); - sampleA1.setProperty("uniqueProperty", "uniqueValue"); - sampleB = new Sample("sampleB"); - sampleC = new Sample("sampleC"); - sampleC.setProperty("population", "pop1"); - sampleC.setProperty("gender", Sample.Gender.MALE); - } - - /** - * Testing equality - */ - @Test() - public void equalsTest() { - Assert.assertTrue(sampleA.equals(sampleA1)); - Assert.assertFalse(sampleA == sampleA1); - Assert.assertFalse(sampleA.equals(sampleB)); - } - - /** - * And hash - */ - @Test() - public void basicHashTest() { - Assert.assertFalse(sampleA.hashCode() == sampleB.hashCode()); - Assert.assertTrue(sampleA.hashCode() == sampleA1.hashCode()); - } - - /** - * Now test the special getter methods - */ - @Test() - public void specialGettersTest() { - Assert.assertTrue(sampleC.getId().equals("sampleC")); - Assert.assertTrue(sampleC.getPopulation().equals("pop1")); - 
Assert.assertTrue(sampleC.isMale()); - Assert.assertFalse(sampleA.isMale()); // sample A doesn't have a gender, so this should be false - } - -} diff --git a/public/java/test/org/broadinstitute/sting/gatk/iterators/LocusIteratorByStateUnitTest.java b/public/java/test/org/broadinstitute/sting/gatk/iterators/LocusIteratorByStateUnitTest.java index 32d3675b7..c9727d904 100644 --- a/public/java/test/org/broadinstitute/sting/gatk/iterators/LocusIteratorByStateUnitTest.java +++ b/public/java/test/org/broadinstitute/sting/gatk/iterators/LocusIteratorByStateUnitTest.java @@ -1,6 +1,5 @@ package org.broadinstitute.sting.gatk.iterators; -import net.sf.picard.filter.SamRecordFilter; import net.sf.samtools.SAMFileHeader; import net.sf.samtools.SAMFileReader; import net.sf.samtools.SAMRecord; @@ -8,11 +7,11 @@ import net.sf.samtools.util.CloseableIterator; import org.broadinstitute.sting.gatk.filters.ReadFilter; import org.broadinstitute.sting.utils.Utils; import org.broadinstitute.sting.utils.pileup.ReadBackedPileup; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; import org.testng.Assert; import org.broadinstitute.sting.BaseTest; import org.broadinstitute.sting.gatk.ReadProperties; import org.broadinstitute.sting.gatk.arguments.ValidationExclusion; -import org.broadinstitute.sting.gatk.datasources.sample.SampleDataSource; import org.broadinstitute.sting.gatk.datasources.reads.SAMReaderID; import org.broadinstitute.sting.gatk.contexts.AlignmentContext; import org.broadinstitute.sting.utils.GenomeLocParser; @@ -29,11 +28,8 @@ import java.util.*; * testing of the LocusIteratorByState */ public class LocusIteratorByStateUnitTest extends BaseTest { - - private final int MAX_READS = 10; private static SAMFileHeader header; private LocusIteratorByState li; - private GenomeLocParser genomeLocParser; @BeforeClass @@ -42,6 +38,10 @@ public class LocusIteratorByStateUnitTest extends BaseTest { genomeLocParser = new GenomeLocParser(header.getSequenceDictionary()); } + private 
final LocusIteratorByState makeLTBS(List reads, ReadProperties readAttributes) { + return new LocusIteratorByState(new FakeCloseableIterator(reads.iterator()), readAttributes, genomeLocParser, LocusIteratorByState.sampleListForSAMWithoutReadGroups()); + } + @Test public void testIndelBaseQualityFiltering() { final byte[] bases = new byte[] {'A','A','A','A','A','A','A','A','A','A'}; @@ -68,7 +68,7 @@ public class LocusIteratorByStateUnitTest extends BaseTest { List reads = Arrays.asList(before,during,after); // create the iterator by state with the fake reads and fake records - li = new LocusIteratorByState(new FakeCloseableIterator(reads.iterator()),readAttributes,genomeLocParser, new SampleDataSource()); + li = makeLTBS(reads,readAttributes); boolean foundExtendedEventPileup = false; while (li.hasNext()) { @@ -78,7 +78,7 @@ public class LocusIteratorByStateUnitTest extends BaseTest { ReadBackedExtendedEventPileup pileup = context.getExtendedEventPileup().getBaseFilteredPileup(10); Assert.assertEquals(pileup.getLocation().getStart(), 5, "Extended event pileup at wrong location"); - Assert.assertEquals(pileup.size(), 3, "Pileup size is incorrect"); + Assert.assertEquals(pileup.getNumberOfElements(), 3, "Pileup size is incorrect"); foundExtendedEventPileup = true; } @@ -120,7 +120,7 @@ public class LocusIteratorByStateUnitTest extends BaseTest { List reads = Arrays.asList(before,during,after); // create the iterator by state with the fake reads and fake records - li = new LocusIteratorByState(new FakeCloseableIterator(reads.iterator()),readAttributes,genomeLocParser, new SampleDataSource()); + li = makeLTBS(reads,readAttributes); boolean foundExtendedEventPileup = false; while (li.hasNext()) { @@ -154,7 +154,7 @@ public class LocusIteratorByStateUnitTest extends BaseTest { List reads = Arrays.asList(indelOnlyRead); // create the iterator by state with the fake reads and fake records - li = new LocusIteratorByState(new 
FakeCloseableIterator(reads.iterator()),readAttributes,genomeLocParser,new SampleDataSource()); + li = makeLTBS(reads, readAttributes); // Traditionally, reads that end with indels bleed into the pileup at the following locus. Verify that the next pileup contains this read // and considers it to be an indel-containing read. @@ -167,7 +167,7 @@ public class LocusIteratorByStateUnitTest extends BaseTest { // Turn on extended events, and make sure the event is found. JVMUtils.setFieldValue(JVMUtils.findField(ReadProperties.class,"generateExtendedEvents"),readAttributes,true); - li = new LocusIteratorByState(new FakeCloseableIterator(reads.iterator()),readAttributes,genomeLocParser,new SampleDataSource()); + li = makeLTBS(reads, readAttributes); Assert.assertTrue(li.hasNext(),"LocusIteratorByState with extended events should contain exactly one pileup"); alignmentContext = li.next(); @@ -203,7 +203,7 @@ public class LocusIteratorByStateUnitTest extends BaseTest { List reads = Arrays.asList(leadingRead,indelOnlyRead,fullMatchAfterIndel); // create the iterator by state with the fake reads and fake records - li = new LocusIteratorByState(new FakeCloseableIterator(reads.iterator()),createTestReadProperties(),genomeLocParser,new SampleDataSource()); + li = makeLTBS(reads, createTestReadProperties()); int currentLocus = firstLocus; int numAlignmentContextsFound = 0; @@ -212,12 +212,12 @@ public class LocusIteratorByStateUnitTest extends BaseTest { Assert.assertEquals(alignmentContext.getLocation().getStart(),currentLocus,"Current locus returned by alignment context is incorrect"); if(currentLocus == firstLocus) { - List readsAtLocus = alignmentContext.getBasePileup().getReads(); + List readsAtLocus = alignmentContext.getBasePileup().getReads(); Assert.assertEquals(readsAtLocus.size(),1,"Wrong number of reads at locus " + currentLocus); Assert.assertSame(readsAtLocus.get(0),leadingRead,"leadingRead absent from pileup at locus " + currentLocus); } else if(currentLocus == 
secondLocus) { - List readsAtLocus = alignmentContext.getBasePileup().getReads(); + List readsAtLocus = alignmentContext.getBasePileup().getReads(); Assert.assertEquals(readsAtLocus.size(),2,"Wrong number of reads at locus " + currentLocus); Assert.assertSame(readsAtLocus.get(0),indelOnlyRead,"indelOnlyRead absent from pileup at locus " + currentLocus); Assert.assertSame(readsAtLocus.get(1),fullMatchAfterIndel,"fullMatchAfterIndel absent from pileup at locus " + currentLocus); @@ -260,12 +260,12 @@ public class LocusIteratorByStateUnitTest extends BaseTest { List reads = Arrays.asList(leadingRead,indelOnlyRead,fullMatchAfterIndel); // create the iterator by state with the fake reads and fake records - li = new LocusIteratorByState(new FakeCloseableIterator(reads.iterator()),readAttributes,genomeLocParser,new SampleDataSource()); + li = makeLTBS(reads,readAttributes); Assert.assertTrue(li.hasNext(),"Missing first locus at " + firstLocus); AlignmentContext alignmentContext = li.next(); Assert.assertEquals(alignmentContext.getLocation().getStart(),firstLocus,"Incorrect locus at this position; should be " + firstLocus); - List readsAtLocus = alignmentContext.getBasePileup().getReads(); + List readsAtLocus = alignmentContext.getBasePileup().getReads(); Assert.assertEquals(readsAtLocus.size(),1,"Wrong number of reads at locus " + firstLocus); Assert.assertSame(readsAtLocus.get(0),leadingRead,"leadingRead absent from pileup at locus " + firstLocus); diff --git a/public/java/test/org/broadinstitute/sting/gatk/refdata/tracks/FeatureManagerUnitTest.java b/public/java/test/org/broadinstitute/sting/gatk/refdata/tracks/FeatureManagerUnitTest.java index bae8e99ed..e8799e2ab 100644 --- a/public/java/test/org/broadinstitute/sting/gatk/refdata/tracks/FeatureManagerUnitTest.java +++ b/public/java/test/org/broadinstitute/sting/gatk/refdata/tracks/FeatureManagerUnitTest.java @@ -56,6 +56,7 @@ public class FeatureManagerUnitTest extends BaseTest { private static final File VCF3_FILE = 
new File(validationDataLocation + "vcfexample3.vcf"); private static final File VCF4_FILE = new File(testDir + "HiSeq.10000.vcf"); private static final File VCF4_FILE_GZ = new File(testDir + "HiSeq.10000.vcf.gz"); + private static final File VCF4_FILE_BGZIP = new File(testDir + "HiSeq.10000.bgzip.vcf.gz"); private FeatureManager manager; private GenomeLocParser genomeLocParser; @@ -109,6 +110,7 @@ public class FeatureManagerUnitTest extends BaseTest { new FMTest(VariantContext.class, VCF3Codec.class, "VCF3", VCF3_FILE); new FMTest(VariantContext.class, VCFCodec.class, "VCF", VCF4_FILE); new FMTest(VariantContext.class, VCFCodec.class, "VCF", VCF4_FILE_GZ); + new FMTest(VariantContext.class, VCFCodec.class, "VCF", VCF4_FILE_BGZIP); new FMTest(TableFeature.class, BedTableCodec.class, "bedtable", null); return FMTest.getTests(FMTest.class); } diff --git a/public/java/test/org/broadinstitute/sting/gatk/refdata/tracks/RMDTrackBuilderUnitTest.java b/public/java/test/org/broadinstitute/sting/gatk/refdata/tracks/RMDTrackBuilderUnitTest.java index ae218e898..724c343e4 100644 --- a/public/java/test/org/broadinstitute/sting/gatk/refdata/tracks/RMDTrackBuilderUnitTest.java +++ b/public/java/test/org/broadinstitute/sting/gatk/refdata/tracks/RMDTrackBuilderUnitTest.java @@ -29,7 +29,6 @@ import net.sf.picard.reference.IndexedFastaSequenceFile; import net.sf.samtools.SAMSequenceDictionary; import org.broad.tribble.Tribble; import org.broad.tribble.index.Index; -import org.broadinstitute.sting.gatk.refdata.tracks.RMDTrackBuilder; import org.broadinstitute.sting.utils.codecs.vcf.VCF3Codec; import org.broadinstitute.sting.utils.codecs.vcf.VCFCodec; import org.broadinstitute.sting.utils.exceptions.UserException; @@ -45,7 +44,6 @@ import org.testng.annotations.Test; import java.io.*; import java.nio.channels.FileChannel; -import java.util.Map; /** @@ -164,7 +162,7 @@ public class RMDTrackBuilderUnitTest extends BaseTest { try { Index idx = builder.loadIndex(vcfFile, new VCFCodec()); 
// catch any exception; this call should pass correctly - SAMSequenceDictionary dict = RMDTrackBuilder.getSequenceDictionaryFromProperties(idx); + SAMSequenceDictionary dict = IndexDictionaryUtils.getSequenceDictionaryFromProperties(idx); } catch (IOException e) { e.printStackTrace(); Assert.fail("IO exception unexpected" + e.getMessage()); diff --git a/public/java/test/org/broadinstitute/sting/gatk/samples/PedReaderUnitTest.java b/public/java/test/org/broadinstitute/sting/gatk/samples/PedReaderUnitTest.java new file mode 100644 index 000000000..1601845cd --- /dev/null +++ b/public/java/test/org/broadinstitute/sting/gatk/samples/PedReaderUnitTest.java @@ -0,0 +1,353 @@ +/* + * Copyright (c) 2011, The Broad Institute + * + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The above copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * OTHER DEALINGS IN THE SOFTWARE. 
+ */ + +package org.broadinstitute.sting.gatk.samples; + +import org.apache.log4j.Logger; +import org.broadinstitute.sting.BaseTest; +import org.broadinstitute.sting.utils.Utils; +import org.broadinstitute.sting.utils.exceptions.UserException; +import org.testng.Assert; +import org.testng.annotations.DataProvider; +import org.testng.annotations.Test; + +import java.io.StringReader; +import java.util.*; + +/** + * UnitTest for PedReader + * + * @author Mark DePristo + * @since 2011 + */ +public class PedReaderUnitTest extends BaseTest { + private static Logger logger = Logger.getLogger(PedReaderUnitTest.class); + + private class PedReaderTest extends TestDataProvider { + public String fileContents; + public List expectedSamples; + EnumSet missing; + + private PedReaderTest(final String name, final List expectedSamples, final String fileContents) { + super(PedReaderTest.class, name); + this.fileContents = fileContents; + this.expectedSamples = expectedSamples; + } + } + +// Family ID +// Individual ID +// Paternal ID +// Maternal ID +// Sex (1=male; 2=female; other=unknown) +// Phenotype +// +// -9 missing +// 0 missing +// 1 unaffected +// 2 affected + + @DataProvider(name = "readerTest") + public Object[][] createPEDFiles() { + new PedReaderTest("singleRecordMale", + Arrays.asList(new Sample("kid", "fam1", null, null, Gender.MALE, Affection.UNAFFECTED)), + "fam1 kid 0 0 1 1"); + + new PedReaderTest("singleRecordFemale", + Arrays.asList(new Sample("kid", "fam1", null, null, Gender.FEMALE, Affection.UNAFFECTED)), + "fam1 kid 0 0 2 1"); + + new PedReaderTest("singleRecordMissingGender", + Arrays.asList(new Sample("kid", "fam1", null, null, Gender.UNKNOWN, Affection.UNKNOWN)), + "fam1 kid 0 0 0 0"); + + // Affection + new PedReaderTest("singleRecordAffected", + Arrays.asList(new Sample("kid", "fam1", null, null, Gender.MALE, Affection.AFFECTED)), + "fam1 kid 0 0 1 2"); + + new PedReaderTest("singleRecordUnaffected", + Arrays.asList(new Sample("kid", "fam1", null, null, 
Gender.MALE, Affection.UNAFFECTED)), + "fam1 kid 0 0 1 1"); + + new PedReaderTest("singleRecordMissingAffection-9", + Arrays.asList(new Sample("kid", "fam1", null, null, Gender.MALE, Affection.UNKNOWN)), + "fam1 kid 0 0 1 -9"); + + new PedReaderTest("singleRecordMissingAffection0", + Arrays.asList(new Sample("kid", "fam1", null, null, Gender.MALE, Affection.UNKNOWN)), + "fam1 kid 0 0 1 0"); + + new PedReaderTest("multipleUnrelated", + Arrays.asList( + new Sample("s1", "fam1", null, null, Gender.MALE, Affection.UNAFFECTED), + new Sample("s2", "fam2", null, null, Gender.FEMALE, Affection.AFFECTED)), + String.format("%s%n%s", + "fam1 s1 0 0 1 1", + "fam2 s2 0 0 2 2")); + + new PedReaderTest("multipleUnrelatedExtraLine", + Arrays.asList( + new Sample("s1", "fam1", null, null, Gender.MALE, Affection.UNAFFECTED), + new Sample("s2", "fam2", null, null, Gender.FEMALE, Affection.AFFECTED)), + String.format("%s%n%s%n %n", // note extra newlines and whitespace + "fam1 s1 0 0 1 1", + "fam2 s2 0 0 2 2")); + + new PedReaderTest("explicitTrio", + Arrays.asList( + new Sample("kid", "fam1", "dad", "mom", Gender.MALE, Affection.AFFECTED), + new Sample("dad", "fam1", null, null, Gender.MALE, Affection.UNAFFECTED), + new Sample("mom", "fam1", null, null, Gender.FEMALE, Affection.AFFECTED)), + String.format("%s%n%s%n%s", + "fam1 kid dad mom 1 2", + "fam1 dad 0 0 1 1", + "fam1 mom 0 0 2 2")); + + new PedReaderTest("implicitTrio", + Arrays.asList( + new Sample("kid", "fam1", "dad", "mom", Gender.MALE, Affection.AFFECTED), + new Sample("dad", "fam1", null, null, Gender.MALE, Affection.UNKNOWN), + new Sample("mom", "fam1", null, null, Gender.FEMALE, Affection.UNKNOWN)), + "fam1 kid dad mom 1 2"); + + new PedReaderTest("partialTrio", + Arrays.asList( + new Sample("kid", "fam1", "dad", "mom", Gender.MALE, Affection.AFFECTED), + new Sample("dad", "fam1", null, null, Gender.MALE, Affection.UNAFFECTED), + new Sample("mom", "fam1", null, null, Gender.FEMALE, Affection.UNKNOWN)), + 
String.format("%s%n%s", + "fam1 kid dad mom 1 2", + "fam1 dad 0 0 1 1")); + + new PedReaderTest("bigPedigree", + Arrays.asList( + new Sample("kid", "fam1", "dad", "mom", Gender.MALE, Affection.AFFECTED), + new Sample("dad", "fam1", "granddad1", "grandma1", Gender.MALE, Affection.UNAFFECTED), + new Sample("granddad1", "fam1", null, null, Gender.MALE, Affection.UNKNOWN), + new Sample("grandma1", "fam1", null, null, Gender.FEMALE, Affection.UNKNOWN), + new Sample("mom", "fam1", "granddad2", "grandma2", Gender.FEMALE, Affection.AFFECTED), + new Sample("granddad2", "fam1", null, null, Gender.MALE, Affection.UNKNOWN), + new Sample("grandma2", "fam1", null, null, Gender.FEMALE, Affection.UNKNOWN)), + String.format("%s%n%s%n%s", + "fam1 kid dad mom 1 2", + "fam1 dad granddad1 grandma1 1 1", + "fam1 mom granddad2 grandma2 2 2")); + + // Quantitative trait + new PedReaderTest("OtherPhenotype", + Arrays.asList( + new Sample("s1", "fam1", null, null, Gender.MALE, Affection.OTHER, "1"), + new Sample("s2", "fam2", null, null, Gender.FEMALE, Affection.OTHER, "10.0")), + String.format("%s%n%s", + "fam1 s1 0 0 1 1", + "fam2 s2 0 0 2 10.0")); + + new PedReaderTest("OtherPhenotypeWithMissing", + Arrays.asList( + new Sample("s1", "fam1", null, null, Gender.MALE, Affection.UNKNOWN, Sample.UNSET_QT), + new Sample("s2", "fam2", null, null, Gender.FEMALE, Affection.OTHER, "10.0")), + String.format("%s%n%s", + "fam1 s1 0 0 1 -9", + "fam2 s2 0 0 2 10.0")); + + new PedReaderTest("OtherPhenotypeOnlyInts", + Arrays.asList( + new Sample("s1", "fam1", null, null, Gender.MALE, Affection.OTHER, "1"), + new Sample("s2", "fam2", null, null, Gender.FEMALE, Affection.OTHER, "10")), + String.format("%s%n%s", + "fam1 s1 0 0 1 1", + "fam2 s2 0 0 2 10")); + + return PedReaderTest.getTests(PedReaderTest.class); + } + + private static final void runTest(PedReaderTest test, String myFileContents, EnumSet missing) { + logger.warn("Test " + test); + PedReader reader = new PedReader(); + SampleDB sampleDB = new 
SampleDB(); + List readSamples = reader.parse(myFileContents, missing, sampleDB); + Assert.assertEquals(new HashSet(test.expectedSamples), new HashSet(readSamples)); + } + + @Test(enabled = true, dataProvider = "readerTest") + public void testPedReader(PedReaderTest test) { + runTest(test, test.fileContents, EnumSet.noneOf(PedReader.MissingPedField.class)); + } + + @Test(enabled = true, dataProvider = "readerTest") + public void testPedReaderWithComments(PedReaderTest test) { + runTest(test, String.format("#comment%n%s", test.fileContents), EnumSet.noneOf(PedReader.MissingPedField.class)); + } + + @Test(enabled = true, dataProvider = "readerTest") + public void testPedReaderWithSemicolons(PedReaderTest test) { + runTest(test, + test.fileContents.replace(String.format("%n"), ";"), + EnumSet.noneOf(PedReader.MissingPedField.class)); + } + + // ----------------------------------------------------------------- + // missing format field tests + // ----------------------------------------------------------------- + + private class PedReaderTestMissing extends TestDataProvider { + public EnumSet missingDesc; + public EnumSet missingFields; + public final String fileContents; + public Sample expected; + + + private PedReaderTestMissing(final String name, final String fileContents, + EnumSet missingDesc, + EnumSet missingFields, + final Sample expected) { + super(PedReaderTestMissing.class, name); + this.fileContents = fileContents; + this.missingDesc = missingDesc; + this.missingFields = missingFields; + this.expected = expected; + } + } + + @DataProvider(name = "readerTestMissing") + public Object[][] createPEDFilesWithMissing() { + new PedReaderTestMissing("missingFam", + "fam1 kid dad mom 1 2", + EnumSet.of(PedReader.MissingPedField.NO_FAMILY_ID), + EnumSet.of(PedReader.Field.FAMILY_ID), + new Sample("kid", null, "dad", "mom", Gender.MALE, Affection.AFFECTED)); + + new PedReaderTestMissing("missingParents", + "fam1 kid dad mom 1 2", + 
EnumSet.of(PedReader.MissingPedField.NO_PARENTS), + EnumSet.of(PedReader.Field.PATERNAL_ID, PedReader.Field.MATERNAL_ID), + new Sample("kid", "fam1", null, null, Gender.MALE, Affection.AFFECTED)); + + new PedReaderTestMissing("missingSex", + "fam1 kid dad mom 1 2", + EnumSet.of(PedReader.MissingPedField.NO_SEX), + EnumSet.of(PedReader.Field.GENDER), + new Sample("kid", "fam1", "dad", "mom", Gender.UNKNOWN, Affection.AFFECTED)); + + new PedReaderTestMissing("missingPhenotype", + "fam1 kid dad mom 1 2", + EnumSet.of(PedReader.MissingPedField.NO_PHENOTYPE), + EnumSet.of(PedReader.Field.PHENOTYPE), + new Sample("kid", "fam1", "dad", "mom", Gender.MALE, Affection.UNKNOWN)); + + new PedReaderTestMissing("missingEverythingButGender", + "fam1 kid dad mom 1 2", + EnumSet.of(PedReader.MissingPedField.NO_PHENOTYPE, PedReader.MissingPedField.NO_PARENTS, PedReader.MissingPedField.NO_FAMILY_ID), + EnumSet.of(PedReader.Field.FAMILY_ID, PedReader.Field.PATERNAL_ID, PedReader.Field.MATERNAL_ID, PedReader.Field.PHENOTYPE), + new Sample("kid", null, null, null, Gender.MALE, Affection.UNKNOWN)); + + + return PedReaderTestMissing.getTests(PedReaderTestMissing.class); + } + + @Test(enabled = true, dataProvider = "readerTestMissing") + public void testPedReaderWithMissing(PedReaderTestMissing test) { + final String contents = sliceContents(test.missingFields, test.fileContents); + logger.warn("Test " + test); + PedReader reader = new PedReader(); + SampleDB sampleDB = new SampleDB(); + reader.parse(new StringReader(contents), test.missingDesc, sampleDB); + final Sample missingSample = sampleDB.getSample("kid"); + Assert.assertEquals(test.expected, missingSample, "Missing field value not expected value for " + test); + } + + private final static String sliceContents(EnumSet missingFieldsSet, String full) { + List parts = new ArrayList(Arrays.asList(full.split("\\s+"))); + final List missingFields = new ArrayList(missingFieldsSet); + Collections.reverse(missingFields); + for ( 
PedReader.Field field : missingFields ) + parts.remove(field.ordinal()); + return Utils.join("\t", parts); + } + + // ----------------------------------------------------------------- + // parsing tags + // ----------------------------------------------------------------- + + private class PedReaderTestTagParsing extends TestDataProvider { + public EnumSet expected; + public final List tags; + + private PedReaderTestTagParsing(final List tags, EnumSet missingDesc) { + super(PedReaderTestTagParsing.class); + this.tags = tags; + this.expected = missingDesc; + } + } + + @DataProvider(name = "readerTestTagParsing") + public Object[][] createReaderTestTagParsing() { + new PedReaderTestTagParsing( + Collections.emptyList(), + EnumSet.noneOf(PedReader.MissingPedField.class)); + + new PedReaderTestTagParsing( + Arrays.asList("NO_FAMILY_ID"), + EnumSet.of(PedReader.MissingPedField.NO_FAMILY_ID)); + + new PedReaderTestTagParsing( + Arrays.asList("NO_PARENTS"), + EnumSet.of(PedReader.MissingPedField.NO_PARENTS)); + + new PedReaderTestTagParsing( + Arrays.asList("NO_PHENOTYPE"), + EnumSet.of(PedReader.MissingPedField.NO_PHENOTYPE)); + + new PedReaderTestTagParsing( + Arrays.asList("NO_SEX"), + EnumSet.of(PedReader.MissingPedField.NO_SEX)); + + new PedReaderTestTagParsing( + Arrays.asList("NO_SEX", "NO_PHENOTYPE"), + EnumSet.of(PedReader.MissingPedField.NO_SEX, PedReader.MissingPedField.NO_PHENOTYPE)); + + new PedReaderTestTagParsing( + Arrays.asList("NO_SEX", "NO_PHENOTYPE", "NO_PARENTS"), + EnumSet.of(PedReader.MissingPedField.NO_SEX, PedReader.MissingPedField.NO_PHENOTYPE, PedReader.MissingPedField.NO_PARENTS)); + + return PedReaderTestTagParsing.getTests(PedReaderTestTagParsing.class); + } + + @Test(enabled = true, dataProvider = "readerTestTagParsing") + public void testPedReaderTagParsing(PedReaderTestTagParsing test) { + EnumSet parsed = PedReader.parseMissingFieldTags("test", test.tags); + Assert.assertEquals(test.expected, parsed, "Failed to properly parse tags " + 
test.tags); + } + + @Test(enabled = true, expectedExceptions = UserException.class) + public void testPedReaderTagParsing1() { + EnumSet parsed = PedReader.parseMissingFieldTags("test", Arrays.asList("XXX")); + } + + @Test(enabled = true, expectedExceptions = UserException.class) + public void testPedReaderTagParsing2() { + EnumSet parsed = PedReader.parseMissingFieldTags("test", Arrays.asList("NO_SEX", "XXX")); + } +} \ No newline at end of file diff --git a/public/java/test/org/broadinstitute/sting/gatk/samples/SampleDBUnitTest.java b/public/java/test/org/broadinstitute/sting/gatk/samples/SampleDBUnitTest.java new file mode 100644 index 000000000..d498ee61a --- /dev/null +++ b/public/java/test/org/broadinstitute/sting/gatk/samples/SampleDBUnitTest.java @@ -0,0 +1,157 @@ +package org.broadinstitute.sting.gatk.samples; + +import net.sf.samtools.SAMFileHeader; +import org.broadinstitute.sting.BaseTest; +import org.broadinstitute.sting.utils.exceptions.UserException; +import org.broadinstitute.sting.utils.sam.ArtificialSAMUtils; +import org.testng.Assert; +import org.testng.annotations.BeforeMethod; +import org.testng.annotations.Test; + +import java.io.File; +import java.util.*; + +/** + * Created by IntelliJ IDEA. 
+ * User: brett + * Date: Sep 9, 2010 + * Time: 8:21:00 AM + */ +public class SampleDBUnitTest extends BaseTest { + private static SampleDBBuilder builder; + // all the test sample files are located here + private File testPED = new File(testDir + "ceutrio.ped"); + + private static final Set testPEDSamples = new HashSet(Arrays.asList( + new Sample("kid", "fam1", "dad", "mom", Gender.MALE, Affection.AFFECTED), + new Sample("dad", "fam1", null, null, Gender.MALE, Affection.UNAFFECTED), + new Sample("mom", "fam1", null, null, Gender.FEMALE, Affection.AFFECTED))); + + private static final Set testSAMSamples = new HashSet(Arrays.asList( + new Sample("kid", null, null, null, Gender.UNKNOWN, Affection.UNKNOWN), + new Sample("mom", null, null, null, Gender.UNKNOWN, Affection.UNKNOWN), + new Sample("dad", null, null, null, Gender.UNKNOWN, Affection.UNKNOWN))); + + private static final String testPEDString = + String.format("%s%n%s%n%s", + "fam1 kid dad mom 1 2", + "fam1 dad 0 0 1 1", + "fam1 mom 0 0 2 2"); + + private static final String testPEDMultipleFamilies = + String.format("%s%n%s%n%s%n%s%n%s", + "fam1 kid dad mom 1 2", + "fam1 dad 0 0 1 1", + "fam1 mom 0 0 2 2", + "fam3 s1 d1 m1 2 2", + "fam2 s2 d2 m2 2 2"); + + private static final String testPEDStringInconsistentGender = + "fam1 kid 0 0 2 2"; + + private static final Set testPEDSamplesAsSet = + new HashSet(testPEDSamples); + + + @BeforeMethod + public void before() { + builder = new SampleDBBuilder(PedigreeValidationType.STRICT); + } + + @Test() + public void loadPEDFile() { + builder.addSamplesFromPedigreeFiles(Arrays.asList(testPED)); + SampleDB db = builder.getFinalSampleDB(); + Assert.assertEquals(testPEDSamplesAsSet, db.getSamples()); + } + + @Test() + public void loadPEDString() { + builder.addSamplesFromPedigreeStrings(Arrays.asList(testPEDString)); + SampleDB db = builder.getFinalSampleDB(); + Assert.assertEquals(testPEDSamplesAsSet, db.getSamples()); + } + + private static final void addSAMHeader() { + 
SAMFileHeader header = ArtificialSAMUtils.createArtificialSamHeader(1, 1, 10); + ArtificialSAMUtils.createEnumeratedReadGroups(header, Arrays.asList("1", "2", "3"), + Arrays.asList("kid", "mom", "dad")); + builder.addSamplesFromSAMHeader(header); + } + + @Test() + public void loadSAMHeader() { + addSAMHeader(); + SampleDB db = builder.getFinalSampleDB(); + Assert.assertEquals(testSAMSamples, db.getSamples()); + } + + @Test() + public void loadSAMHeaderPlusPED() { + addSAMHeader(); + builder.addSamplesFromPedigreeFiles(Arrays.asList(testPED)); + SampleDB db = builder.getFinalSampleDB(); + Assert.assertEquals(testPEDSamples, db.getSamples()); + } + + @Test() + public void loadDuplicateData() { + builder.addSamplesFromPedigreeFiles(Arrays.asList(testPED)); + builder.addSamplesFromPedigreeFiles(Arrays.asList(testPED)); + SampleDB db = builder.getFinalSampleDB(); + Assert.assertEquals(testPEDSamples, db.getSamples()); + } + + @Test(expectedExceptions = UserException.class) + public void loadNonExistentFile() { + builder.addSamplesFromPedigreeFiles(Arrays.asList(new File("non-existence-file.txt"))); + SampleDB db = builder.getFinalSampleDB(); + Assert.assertEquals(testSAMSamples, db.getSamples()); + } + + @Test(expectedExceptions = UserException.class) + public void loadInconsistentData() { + builder = new SampleDBBuilder(PedigreeValidationType.STRICT); + builder.addSamplesFromPedigreeFiles(Arrays.asList(testPED)); + builder.addSamplesFromPedigreeStrings(Arrays.asList(testPEDStringInconsistentGender)); + builder.getFinalSampleDB(); + } + + @Test(expectedExceptions = UserException.class) + public void sampleInSAMHeaderNotInSamplesDB() { + addSAMHeader(); + builder.addSamplesFromPedigreeStrings(Arrays.asList(testPEDStringInconsistentGender)); + builder.getFinalSampleDB(); + } + + @Test() + public void getFamilyIDs() { + builder.addSamplesFromPedigreeStrings(Arrays.asList(testPEDMultipleFamilies)); + SampleDB db = builder.getFinalSampleDB(); + 
Assert.assertEquals(db.getFamilyIDs(), new TreeSet(Arrays.asList("fam1", "fam2", "fam3"))); + } + + @Test() + public void getFamily() { + builder.addSamplesFromPedigreeStrings(Arrays.asList(testPEDMultipleFamilies)); + SampleDB db = builder.getFinalSampleDB(); + Assert.assertEquals(db.getFamily("fam1"), testPEDSamplesAsSet); + } + + @Test() + public void loadFamilyIDs() { + builder.addSamplesFromPedigreeStrings(Arrays.asList(testPEDMultipleFamilies)); + SampleDB db = builder.getFinalSampleDB(); + Map> families = db.getFamilies(); + Assert.assertEquals(families.size(), 3); + Assert.assertEquals(families.keySet(), new TreeSet(Arrays.asList("fam1", "fam2", "fam3"))); + + for ( final String famID : families.keySet() ) { + final Set fam = families.get(famID); + Assert.assertEquals(fam.size(), 3); + for ( final Sample sample : fam ) { + Assert.assertEquals(sample.getFamilyID(), famID); + } + } + } +} diff --git a/public/java/test/org/broadinstitute/sting/gatk/samples/SampleUnitTest.java b/public/java/test/org/broadinstitute/sting/gatk/samples/SampleUnitTest.java new file mode 100644 index 000000000..3af40adbe --- /dev/null +++ b/public/java/test/org/broadinstitute/sting/gatk/samples/SampleUnitTest.java @@ -0,0 +1,64 @@ +package org.broadinstitute.sting.gatk.samples; + +import org.broadinstitute.sting.BaseTest; +import org.testng.Assert; +import org.testng.annotations.BeforeClass; +import org.testng.annotations.Test; + +/** + * + */ +public class SampleUnitTest extends BaseTest { + SampleDB db; + static Sample fam1A, fam1B, fam1C; + static Sample s1, s2; + static Sample trait1, trait2, trait3, trait4, trait5; + + @BeforeClass + public void init() { + db = new SampleDB(); + + fam1A = new Sample("1A", db, "fam1", "1B", "1C", Gender.UNKNOWN); + fam1B = new Sample("1B", db, "fam1", null, null, Gender.MALE); + fam1C = new Sample("1C", db, "fam1", null, null, Gender.FEMALE); + + s1 = new Sample("s1", db); + s2 = new Sample("s2", db); + + trait1 = new Sample("t1", db, 
Affection.AFFECTED, Sample.UNSET_QT); + trait2 = new Sample("t2", db, Affection.UNAFFECTED, Sample.UNSET_QT); + trait3 = new Sample("t3", db, Affection.UNKNOWN, Sample.UNSET_QT); + trait4 = new Sample("t4", db, Affection.OTHER, "1.0"); + trait5 = new Sample("t4", db, Affection.OTHER, "CEU"); + } + + /** + * Now basic getters + */ + @Test() + public void normalGettersTest() { + Assert.assertEquals("1A", fam1A.getID()); + Assert.assertEquals("fam1", fam1A.getFamilyID()); + Assert.assertEquals("1B", fam1A.getPaternalID()); + Assert.assertEquals("1C", fam1A.getMaternalID()); + Assert.assertEquals(null, fam1B.getPaternalID()); + Assert.assertEquals(null, fam1B.getMaternalID()); + + Assert.assertEquals(Affection.AFFECTED, trait1.getAffection()); + Assert.assertEquals(Sample.UNSET_QT, trait1.getOtherPhenotype()); + Assert.assertEquals(Affection.UNAFFECTED, trait2.getAffection()); + Assert.assertEquals(Sample.UNSET_QT, trait2.getOtherPhenotype()); + Assert.assertEquals(Affection.UNKNOWN, trait3.getAffection()); + Assert.assertEquals(Sample.UNSET_QT, trait3.getOtherPhenotype()); + Assert.assertEquals(Affection.OTHER, trait4.getAffection()); + Assert.assertEquals("1.0", trait4.getOtherPhenotype()); + Assert.assertEquals("CEU", trait5.getOtherPhenotype()); + } + + @Test() + public void testGenders() { + Assert.assertTrue(fam1A.getGender() == Gender.UNKNOWN); + Assert.assertTrue(fam1B.getGender() == Gender.MALE); + Assert.assertTrue(fam1C.getGender() == Gender.FEMALE); + } +} diff --git a/public/java/test/org/broadinstitute/sting/gatk/walkers/BAQIntegrationTest.java b/public/java/test/org/broadinstitute/sting/gatk/walkers/BAQIntegrationTest.java index 702ba9f4f..c7eb4d88b 100755 --- a/public/java/test/org/broadinstitute/sting/gatk/walkers/BAQIntegrationTest.java +++ b/public/java/test/org/broadinstitute/sting/gatk/walkers/BAQIntegrationTest.java @@ -18,7 +18,7 @@ public class BAQIntegrationTest extends WalkerTest { // 
-------------------------------------------------------------------------------------------------------------- @Test public void testPrintReadsNoBAQ() { - WalkerTestSpec spec = new WalkerTestSpec( baseCommand +" -baq OFF", 1, Arrays.asList("902197bf77ed5a828d50e08771685928")); + WalkerTestSpec spec = new WalkerTestSpec( baseCommand +" -baq OFF", 1, Arrays.asList("d97340a2bba2c6320d1ebeb86024a27c")); executeTest(String.format("testPrintReadsNoBAQ"), spec); } diff --git a/public/java/test/org/broadinstitute/sting/gatk/walkers/ClipReadsWalkersIntegrationTest.java b/public/java/test/org/broadinstitute/sting/gatk/walkers/ClipReadsWalkersIntegrationTest.java index 1565c419b..216026a52 100755 --- a/public/java/test/org/broadinstitute/sting/gatk/walkers/ClipReadsWalkersIntegrationTest.java +++ b/public/java/test/org/broadinstitute/sting/gatk/walkers/ClipReadsWalkersIntegrationTest.java @@ -36,7 +36,7 @@ public class ClipReadsWalkersIntegrationTest extends WalkerTest { WalkerTestSpec spec = new WalkerTestSpec( "-R " + hg18Reference + " -T ClipReads " + - "-I " + validationDataLocation + "clippingReadsTest.bam " + + "-I " + validationDataLocation + "clippingReadsTest.withRG.bam " + "-os %s " + "-o %s " + args, 2, // just one output file @@ -46,23 +46,22 @@ public class ClipReadsWalkersIntegrationTest extends WalkerTest { } final static String Q10ClipOutput = "b29c5bc1cb9006ed9306d826a11d444f"; - @Test public void testQClip0() { testClipper("clipQSum0", "-QT 0", "117a4760b54308f81789c39b1c9de578", "4deca83d80dfa3f093e0dc27d27d1352"); } - @Test public void testQClip2() { testClipper("clipQSum2", "-QT 2", Q10ClipOutput, "1e123233ebd2f35ac3f41b1b7d2c8199"); } - @Test public void testQClip10() { testClipper("clipQSum10", "-QT 10", "b29c5bc1cb9006ed9306d826a11d444f", "1e123233ebd2f35ac3f41b1b7d2c8199"); } - @Test public void testQClip20() { testClipper("clipQSum20", "-QT 20", "6c3434dce66ae5c9eeea502f10fb9bee", "b950538d2d8fac1bcee11850c452bd6a"); } - @Test public void 
testQClip30() { testClipper("clipQSum30", "-QT 20", "6c3434dce66ae5c9eeea502f10fb9bee", "b950538d2d8fac1bcee11850c452bd6a"); } + @Test public void testQClip0() { testClipper("clipQSum0", "-QT 0", "117a4760b54308f81789c39b1c9de578", "33e781084379aae538954e30919e8fd3"); } + @Test public void testQClip2() { testClipper("clipQSum2", "-QT 2", Q10ClipOutput, "57c05b6241db7110148a91fde2d431d0"); } + @Test public void testQClip10() { testClipper("clipQSum10", "-QT 10", "b29c5bc1cb9006ed9306d826a11d444f", "57c05b6241db7110148a91fde2d431d0"); } + @Test public void testQClip20() { testClipper("clipQSum20", "-QT 20", "6c3434dce66ae5c9eeea502f10fb9bee", "67263a39d5127f2660a5b638ff32056a"); } - @Test public void testClipRange1() { testClipper("clipRange1", "-CT 1-5", "b5acd753226e25b1e088838c1aab9117", "9f70540b795f227668dcf78edcb35c09"); } - @Test public void testClipRange2() { testClipper("clipRange2", "-CT 1-5,11-15", "be4fcad5b666a5540028b774169cbad7", "a22347a741640fc6df92700e0e8d6f61"); } + @Test public void testClipRange1() { testClipper("clipRange1", "-CT 1-5", "b5acd753226e25b1e088838c1aab9117", "764846d0592f346a33525af674fd7a10"); } + @Test public void testClipRange2() { testClipper("clipRange2", "-CT 1-5,11-15", "be4fcad5b666a5540028b774169cbad7", "3061cf742f9e5526a61130128ae761a3"); } - @Test public void testClipSeq() { testClipper("clipSeqX", "-X CCCCC", "db199bd06561c9f2122f6ffb07941fbc", "f49e9e61a44115e2be59330259966f53"); } - @Test public void testClipSeqFile() { testClipper("clipSeqXF", "-XF " + validationDataLocation + "seqsToClip.fasta", "d011a3152b31822475afbe0281491f8d", "5c977f261442ab6122d5198fa4086e67"); } + @Test public void testClipSeq() { testClipper("clipSeqX", "-X CCCCC", "db199bd06561c9f2122f6ffb07941fbc", "b89459f373e40f0b835c1faff2208839"); } + @Test public void testClipSeqFile() { testClipper("clipSeqXF", "-XF " + validationDataLocation + "seqsToClip.fasta", "d011a3152b31822475afbe0281491f8d", "24e19116ef16a37a6d095ed5c22c2466"); } - @Test 
public void testClipMulti() { testClipper("clipSeqMulti", "-QT 10 -CT 1-5 -XF " + validationDataLocation + "seqsToClip.fasta -X CCCCC", "a23187bd9bfb06557f799706d98441de", "38d5f33d198aeee7eebec9feb7b11199"); } + @Test public void testClipMulti() { testClipper("clipSeqMulti", "-QT 10 -CT 1-5 -XF " + validationDataLocation + "seqsToClip.fasta -X CCCCC", "a23187bd9bfb06557f799706d98441de", "ad8d30300cb43d5e300fcc4d2450da8e"); } - @Test public void testClipNs() { testClipper("testClipNs", "-QT 10 -CR WRITE_NS", Q10ClipOutput, "1e123233ebd2f35ac3f41b1b7d2c8199"); } - @Test public void testClipQ0s() { testClipper("testClipQs", "-QT 10 -CR WRITE_Q0S", Q10ClipOutput, "d44cab2e3b70f5492a0f5b59f0b80043"); } - @Test public void testClipSoft() { testClipper("testClipSoft", "-QT 10 -CR SOFTCLIP_BASES", Q10ClipOutput, "b86374a7e6f59e3dd35781e9e8006702"); } + @Test public void testClipNs() { testClipper("testClipNs", "-QT 10 -CR WRITE_NS", Q10ClipOutput, "57c05b6241db7110148a91fde2d431d0"); } + @Test public void testClipQ0s() { testClipper("testClipQs", "-QT 10 -CR WRITE_Q0S", Q10ClipOutput, "2a1a3153e0942ab355fd8a6e082b30e0"); } + @Test public void testClipSoft() { testClipper("testClipSoft", "-QT 10 -CR SOFTCLIP_BASES", Q10ClipOutput, "50d43d63d8e39f67a87a6359963c6f52"); } @Test public void testUseOriginalQuals() { diff --git a/public/java/test/org/broadinstitute/sting/gatk/walkers/PrintReadsWalkerUnitTest.java b/public/java/test/org/broadinstitute/sting/gatk/walkers/PrintReadsWalkerUnitTest.java index 5990f1a06..8cd10048a 100644 --- a/public/java/test/org/broadinstitute/sting/gatk/walkers/PrintReadsWalkerUnitTest.java +++ b/public/java/test/org/broadinstitute/sting/gatk/walkers/PrintReadsWalkerUnitTest.java @@ -10,6 +10,8 @@ import net.sf.samtools.SAMFileHeader; import static org.testng.Assert.assertEquals; import static org.testng.Assert.assertTrue; + +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; import org.testng.annotations.BeforeMethod; import 
org.testng.annotations.Test; @@ -94,8 +96,8 @@ public class PrintReadsWalkerUnitTest extends BaseTest { walker.out = writer; SAMFileHeader head = ArtificialSAMUtils.createArtificialSamHeader(3,1,1000); - SAMRecord rec = ArtificialSAMUtils.createArtificialRead(head, "FakeRead", 1, 1, 50); - SAMRecord ret = walker.map(bases, rec,null); + GATKSAMRecord rec = ArtificialSAMUtils.createArtificialRead(head, "FakeRead", 1, 1, 50); + SAMRecord ret = walker.map(bases, rec, null); assertTrue(ret == rec); assertTrue(ret.getReadName().equals(rec.getReadName())); } diff --git a/public/java/test/org/broadinstitute/sting/gatk/walkers/annotator/VariantAnnotatorIntegrationTest.java b/public/java/test/org/broadinstitute/sting/gatk/walkers/annotator/VariantAnnotatorIntegrationTest.java index 04bff8d41..8e887c32a 100755 --- a/public/java/test/org/broadinstitute/sting/gatk/walkers/annotator/VariantAnnotatorIntegrationTest.java +++ b/public/java/test/org/broadinstitute/sting/gatk/walkers/annotator/VariantAnnotatorIntegrationTest.java @@ -31,7 +31,7 @@ public class VariantAnnotatorIntegrationTest extends WalkerTest { @Test public void testHasAnnotsAsking1() { WalkerTestSpec spec = new WalkerTestSpec( - baseTestString() + " -G \"Standard\" --variant:VCF3 " + validationDataLocation + "vcfexample2.vcf -I " + validationDataLocation + "low_coverage_CEU.chr1.10k-11k.bam -L 1:10,020,000-10,021,000", 1, + baseTestString() + " -G Standard --variant:VCF3 " + validationDataLocation + "vcfexample2.vcf -I " + validationDataLocation + "low_coverage_CEU.chr1.10k-11k.bam -L 1:10,020,000-10,021,000", 1, Arrays.asList("8e7de435105499cd71ffc099e268a83e")); executeTest("test file has annotations, asking for annotations, #1", spec); } @@ -39,7 +39,7 @@ public class VariantAnnotatorIntegrationTest extends WalkerTest { @Test public void testHasAnnotsAsking2() { WalkerTestSpec spec = new WalkerTestSpec( - baseTestString() + " -G \"Standard\" --variant:VCF3 " + validationDataLocation + "vcfexample3.vcf -I " + 
validationDataLocation + "NA12878.1kg.p2.chr1_10mb_11_mb.SLX.bam -L 1:10,000,000-10,050,000", 1, + baseTestString() + " -G Standard --variant:VCF3 " + validationDataLocation + "vcfexample3.vcf -I " + validationDataLocation + "NA12878.1kg.p2.chr1_10mb_11_mb.SLX.bam -L 1:10,000,000-10,050,000", 1, Arrays.asList("64b6804cb1e27826e3a47089349be581")); executeTest("test file has annotations, asking for annotations, #2", spec); } @@ -63,7 +63,7 @@ public class VariantAnnotatorIntegrationTest extends WalkerTest { @Test public void testNoAnnotsAsking1() { WalkerTestSpec spec = new WalkerTestSpec( - baseTestString() + " -G \"Standard\" --variant:VCF3 " + validationDataLocation + "vcfexample2empty.vcf -I " + validationDataLocation + "low_coverage_CEU.chr1.10k-11k.bam -L 1:10,020,000-10,021,000", 1, + baseTestString() + " -G Standard --variant:VCF3 " + validationDataLocation + "vcfexample2empty.vcf -I " + validationDataLocation + "low_coverage_CEU.chr1.10k-11k.bam -L 1:10,020,000-10,021,000", 1, Arrays.asList("fd1ffb669800c2e07df1e2719aa38e49")); executeTest("test file doesn't have annotations, asking for annotations, #1", spec); } @@ -71,15 +71,23 @@ public class VariantAnnotatorIntegrationTest extends WalkerTest { @Test public void testNoAnnotsAsking2() { WalkerTestSpec spec = new WalkerTestSpec( - baseTestString() + " -G \"Standard\" --variant:VCF3 " + validationDataLocation + "vcfexample3empty.vcf -I " + validationDataLocation + "NA12878.1kg.p2.chr1_10mb_11_mb.SLX.bam -L 1:10,000,000-10,050,000", 1, + baseTestString() + " -G Standard --variant:VCF3 " + validationDataLocation + "vcfexample3empty.vcf -I " + validationDataLocation + "NA12878.1kg.p2.chr1_10mb_11_mb.SLX.bam -L 1:10,000,000-10,050,000", 1, Arrays.asList("09f8e840770a9411ff77508e0ed0837f")); executeTest("test file doesn't have annotations, asking for annotations, #2", spec); } + @Test + public void testExcludeAnnotations() { + WalkerTestSpec spec = new WalkerTestSpec( + baseTestString() + " -G Standard -XA 
FisherStrand -XA ReadPosRankSumTest --variant:VCF3 " + validationDataLocation + "vcfexample2empty.vcf -I " + validationDataLocation + "low_coverage_CEU.chr1.10k-11k.bam -L 1:10,020,000-10,021,000", 1, + Arrays.asList("b49fe03aa4b675db80a9db38a3552c95")); + executeTest("test exclude annotations", spec); + } + @Test public void testOverwritingHeader() { WalkerTestSpec spec = new WalkerTestSpec( - baseTestString() + " -G \"Standard\" --variant:VCF " + validationDataLocation + "vcfexample4.vcf -I " + validationDataLocation + "NA12878.1kg.p2.chr1_10mb_11_mb.SLX.bam -L 1:10,001,292", 1, + baseTestString() + " -G Standard --variant " + validationDataLocation + "vcfexample4.vcf -I " + validationDataLocation + "NA12878.1kg.p2.chr1_10mb_11_mb.SLX.bam -L 1:10,001,292", 1, Arrays.asList("78d2c19f8107d865970dbaf3e12edd92")); executeTest("test overwriting header", spec); } @@ -87,7 +95,7 @@ public class VariantAnnotatorIntegrationTest extends WalkerTest { @Test public void testNoReads() { WalkerTestSpec spec = new WalkerTestSpec( - baseTestString() + " -G \"Standard\" --variant:VCF3 " + validationDataLocation + "vcfexample3empty.vcf -BTI variant", 1, + baseTestString() + " -G Standard --variant " + validationDataLocation + "vcfexample3empty.vcf -L " + validationDataLocation + "vcfexample3empty.vcf", 1, Arrays.asList("16e3a1403fc376320d7c69492cad9345")); executeTest("not passing it any reads", spec); } @@ -95,7 +103,7 @@ public class VariantAnnotatorIntegrationTest extends WalkerTest { @Test public void testDBTagWithDbsnp() { WalkerTestSpec spec = new WalkerTestSpec( - baseTestString() + " --dbsnp " + b36dbSNP129 + " -G \"Standard\" --variant:VCF3 " + validationDataLocation + "vcfexample3empty.vcf -BTI variant", 1, + baseTestString() + " --dbsnp " + b36dbSNP129 + " -G Standard --variant " + validationDataLocation + "vcfexample3empty.vcf -L " + validationDataLocation + "vcfexample3empty.vcf", 1, Arrays.asList("3da8ca2b6bdaf6e92d94a8c77a71313d")); executeTest("getting DB tag with 
dbSNP", spec); } @@ -103,7 +111,7 @@ public class VariantAnnotatorIntegrationTest extends WalkerTest { @Test public void testDBTagWithHapMap() { WalkerTestSpec spec = new WalkerTestSpec( - baseTestString() + " --comp:H3 " + validationDataLocation + "fakeHM3.vcf -G \"Standard\" --variant:VCF3 " + validationDataLocation + "vcfexample3empty.vcf -BTI variant", 1, + baseTestString() + " --comp:H3 " + validationDataLocation + "fakeHM3.vcf -G Standard --variant " + validationDataLocation + "vcfexample3empty.vcf -L " + validationDataLocation + "vcfexample3empty.vcf", 1, Arrays.asList("1bc01c5b3bd0b7aef75230310c3ce688")); executeTest("getting DB tag with HM3", spec); } @@ -111,8 +119,8 @@ public class VariantAnnotatorIntegrationTest extends WalkerTest { @Test public void testUsingExpression() { WalkerTestSpec spec = new WalkerTestSpec( - baseTestString() + " --resource:foo " + validationDataLocation + "targetAnnotations.vcf -G \"Standard\" --variant:VCF3 " + validationDataLocation + "vcfexample3empty.vcf -E foo.AF -BTI variant", 1, - Arrays.asList("e9c0d832dc6b4ed06c955060f830c140")); + baseTestString() + " --resource:foo " + validationDataLocation + "targetAnnotations.vcf -G Standard --variant:VCF3 " + validationDataLocation + "vcfexample3empty.vcf -E foo.AF -L " + validationDataLocation + "vcfexample3empty.vcf", 1, + Arrays.asList("ae30a1ac7bfbc3d22a327f8b689cad31")); executeTest("using expression", spec); } @@ -121,7 +129,7 @@ public class VariantAnnotatorIntegrationTest extends WalkerTest { final String MD5 = "13269d5a2e16f06fd755cc0fb9271acf"; for ( String file : Arrays.asList("CEU.exon.2010_03.sites.vcf", "CEU.exon.2010_03.sites.vcf.gz")) { WalkerTestSpec spec = new WalkerTestSpec( - baseTestString() + " -A HomopolymerRun --variant:VCF " + validationDataLocation + "/" + file + " -BTI variant -NO_HEADER", 1, + baseTestString() + " -A HomopolymerRun --variant:vcf " + validationDataLocation + file + " -L " + validationDataLocation + "CEU.exon.2010_03.sites.vcf 
-NO_HEADER", 1, Arrays.asList(MD5)); executeTest("Testing lookup vcf tabix vs. vcf tribble", spec); } diff --git a/public/java/test/org/broadinstitute/sting/gatk/walkers/coverage/DepthOfCoverageIntegrationTest.java b/public/java/test/org/broadinstitute/sting/gatk/walkers/coverage/DepthOfCoverageIntegrationTest.java index 59ac1a41e..646fb5e77 100644 --- a/public/java/test/org/broadinstitute/sting/gatk/walkers/coverage/DepthOfCoverageIntegrationTest.java +++ b/public/java/test/org/broadinstitute/sting/gatk/walkers/coverage/DepthOfCoverageIntegrationTest.java @@ -57,11 +57,11 @@ public class DepthOfCoverageIntegrationTest extends WalkerTest { // now add the expected files that get generated spec.addAuxFile("423571e4c05e7934322172654ac6dbb7", baseOutputFile); spec.addAuxFile("9df5e7e07efeb34926c94a724714c219", createTempFileFromBase(baseOutputFile.getAbsolutePath()+".library_cumulative_coverage_counts")); - spec.addAuxFile("b9a7748e5aec4dc06daed893c901c00d", createTempFileFromBase(baseOutputFile.getAbsolutePath()+".library_cumulative_coverage_proportions")); + spec.addAuxFile("229b9b5bc2141c86dbc69c8acc9eba6a", createTempFileFromBase(baseOutputFile.getAbsolutePath()+".library_cumulative_coverage_proportions")); spec.addAuxFile("9cd395f47b329b9dd00ad024fcac9929", createTempFileFromBase(baseOutputFile.getAbsolutePath()+".library_interval_statistics")); - spec.addAuxFile("aec669d64d9dd652dd088a5341835ea5", createTempFileFromBase(baseOutputFile.getAbsolutePath()+".library_interval_summary")); - spec.addAuxFile("f6dbd74d32a48abe71ce08d300bce983", createTempFileFromBase(baseOutputFile.getAbsolutePath()+".library_statistics")); - spec.addAuxFile("e3a3467ed259ee3680f8d01980f525b7", createTempFileFromBase(baseOutputFile.getAbsolutePath()+".library_summary")); + spec.addAuxFile("471c34ad2e4f7228efd20702d5941ba9", createTempFileFromBase(baseOutputFile.getAbsolutePath()+".library_interval_summary")); + spec.addAuxFile("9667c77284c2c08e647b162d0e9652d4", 
createTempFileFromBase(baseOutputFile.getAbsolutePath()+".library_statistics")); + spec.addAuxFile("5a96c75f96d6fa6ee617451d731dae37", createTempFileFromBase(baseOutputFile.getAbsolutePath()+".library_summary")); spec.addAuxFile("b82846df660f0aac8429aec57c2a62d6", createTempFileFromBase(baseOutputFile.getAbsolutePath()+".read_group_cumulative_coverage_counts")); spec.addAuxFile("d32a8c425fadcc4c048bd8b48d0f61e5", createTempFileFromBase(baseOutputFile.getAbsolutePath()+".read_group_cumulative_coverage_proportions")); spec.addAuxFile("7b9d0e93bf5b5313995be7010ef1f528", createTempFileFromBase(baseOutputFile.getAbsolutePath()+".read_group_interval_statistics")); @@ -69,11 +69,11 @@ public class DepthOfCoverageIntegrationTest extends WalkerTest { spec.addAuxFile("e70952f241eebb9b5448f2e7cb288131", createTempFileFromBase(baseOutputFile.getAbsolutePath()+".read_group_statistics")); spec.addAuxFile("054ed1e184f46d6a170dc9bf6524270c", createTempFileFromBase(baseOutputFile.getAbsolutePath()+".read_group_summary")); spec.addAuxFile("d53431022f7387fe9ac47814ab1fcd88", createTempFileFromBase(baseOutputFile.getAbsolutePath()+".sample_cumulative_coverage_counts")); - spec.addAuxFile("650ee3714da7fbad7832c9d4ad49eb51", createTempFileFromBase(baseOutputFile.getAbsolutePath()+".sample_cumulative_coverage_proportions")); + spec.addAuxFile("a395dafde101971d2b9e5ddb6cd4b7d0", createTempFileFromBase(baseOutputFile.getAbsolutePath()+".sample_cumulative_coverage_proportions")); spec.addAuxFile("df0ba76e0e6082c0d29fcfd68efc6b77", createTempFileFromBase(baseOutputFile.getAbsolutePath()+".sample_interval_statistics")); - spec.addAuxFile("7dcac2e8962c778081486332a4576dc3", createTempFileFromBase(baseOutputFile.getAbsolutePath()+".sample_interval_summary")); - spec.addAuxFile("a50011571334f17e950ad3ed1149e350", createTempFileFromBase(baseOutputFile.getAbsolutePath()+".sample_statistics")); - spec.addAuxFile("6f3260504295695d765af639539585c9", 
createTempFileFromBase(baseOutputFile.getAbsolutePath()+".sample_summary")); + spec.addAuxFile("e013cb5b11b0321a81c8dbd7c1863787", createTempFileFromBase(baseOutputFile.getAbsolutePath()+".sample_interval_summary")); + spec.addAuxFile("661160f571def8c323345b5859cfb9da", createTempFileFromBase(baseOutputFile.getAbsolutePath()+".sample_statistics")); + spec.addAuxFile("c95a7a6840334cadd0e520939615c77b", createTempFileFromBase(baseOutputFile.getAbsolutePath()+".sample_summary")); execute("testBaseOutputNoFiltering",spec); } @@ -90,7 +90,7 @@ public class DepthOfCoverageIntegrationTest extends WalkerTest { spec.setOutputFileLocation(baseOutputFile); spec.addAuxFile("6ccd7d8970ba98cb95fe41636a070c1c",baseOutputFile); - spec.addAuxFile("0ee40f3e5091536c14e077b77557083a",createTempFileFromBase(baseOutputFile.getAbsolutePath()+".library_interval_summary")); + spec.addAuxFile("7d87783b3d98b928cac16d383ceca807",createTempFileFromBase(baseOutputFile.getAbsolutePath()+".library_interval_summary")); execute("testNoCoverageDueToFiltering",spec); } diff --git a/public/java/test/org/broadinstitute/sting/gatk/walkers/diffengine/DiffObjectsIntegrationTest.java b/public/java/test/org/broadinstitute/sting/gatk/walkers/diffengine/DiffObjectsIntegrationTest.java index 1f11b5886..c8a25c97b 100644 --- a/public/java/test/org/broadinstitute/sting/gatk/walkers/diffengine/DiffObjectsIntegrationTest.java +++ b/public/java/test/org/broadinstitute/sting/gatk/walkers/diffengine/DiffObjectsIntegrationTest.java @@ -50,8 +50,8 @@ public class DiffObjectsIntegrationTest extends WalkerTest { @DataProvider(name = "data") public Object[][] createData() { - new TestParams(testDir + "diffTestMaster.vcf", testDir + "diffTestTest.vcf", "dc1ca75c6ecf32641967d61e167acfff"); - new TestParams(testDir + "exampleBAM.bam", testDir + "exampleBAM.simple.bam", "df0fcb568a3a49fc74830103b2e26f6c"); + new TestParams(testDir + "diffTestMaster.vcf", testDir + "diffTestTest.vcf", "ed377322c615abc7dceb97025076078d"); + new 
TestParams(testDir + "exampleBAM.bam", testDir + "exampleBAM.simple.bam", "02e46f5d2ebb3d49570850595b3f792e"); return TestParams.getTests(TestParams.class); } diff --git a/public/java/test/org/broadinstitute/sting/gatk/walkers/diffengine/DiffableReaderUnitTest.java b/public/java/test/org/broadinstitute/sting/gatk/walkers/diffengine/DiffableReaderUnitTest.java index dee7bbd88..46b0df5b4 100644 --- a/public/java/test/org/broadinstitute/sting/gatk/walkers/diffengine/DiffableReaderUnitTest.java +++ b/public/java/test/org/broadinstitute/sting/gatk/walkers/diffengine/DiffableReaderUnitTest.java @@ -70,7 +70,7 @@ public class DiffableReaderUnitTest extends BaseTest { private static void testLeaf(DiffNode rec, String field, Object expected) { DiffElement value = rec.getElement(field); Assert.assertNotNull(value, "Expected to see leaf named " + field + " in rec " + rec); - Assert.assertEquals(value.getValue().getValue(), expected, "Expected to leaf named " + field + " to have value " + expected + " in rec " + rec); + Assert.assertEquals(value.getValue().getValue(), expected, "Expected to see leaf named " + field + " to have value " + expected + " in rec " + rec + " but got instead " + value.getValue().getValue()); } @Test(enabled = true, dependsOnMethods = "testPluggableDiffableReaders") @@ -95,7 +95,7 @@ public class DiffableReaderUnitTest extends BaseTest { testLeaf(rec1, "POS", 2646); testLeaf(rec1, "ID", "rs62635284"); testLeaf(rec1, "REF", Allele.create("G", true)); - testLeaf(rec1, "ALT", new HashSet(Arrays.asList(Allele.create("A")))); + testLeaf(rec1, "ALT", Arrays.asList(Allele.create("A"))); testLeaf(rec1, "QUAL", 0.15); testLeaf(rec1, "FILTER", Collections.emptySet()); testLeaf(rec1, "AC", "2"); diff --git a/public/java/test/org/broadinstitute/sting/utils/genotype/DiploidGenotypeUnitTest.java b/public/java/test/org/broadinstitute/sting/gatk/walkers/genotyper/DiploidGenotypeUnitTest.java similarity index 95% rename from 
public/java/test/org/broadinstitute/sting/utils/genotype/DiploidGenotypeUnitTest.java rename to public/java/test/org/broadinstitute/sting/gatk/walkers/genotyper/DiploidGenotypeUnitTest.java index e4f8b12e3..4e72b37a4 100644 --- a/public/java/test/org/broadinstitute/sting/utils/genotype/DiploidGenotypeUnitTest.java +++ b/public/java/test/org/broadinstitute/sting/gatk/walkers/genotyper/DiploidGenotypeUnitTest.java @@ -1,5 +1,6 @@ -package org.broadinstitute.sting.utils.genotype; +package org.broadinstitute.sting.gatk.walkers.genotyper; +import org.broadinstitute.sting.gatk.walkers.genotyper.DiploidGenotype; import org.testng.Assert; import org.broadinstitute.sting.BaseTest; diff --git a/public/java/test/org/broadinstitute/sting/gatk/walkers/genotyper/GenotypeLikelihoodsUnitTest.java b/public/java/test/org/broadinstitute/sting/gatk/walkers/genotyper/GenotypeLikelihoodsUnitTest.java index 9882ce869..425b969e2 100755 --- a/public/java/test/org/broadinstitute/sting/gatk/walkers/genotyper/GenotypeLikelihoodsUnitTest.java +++ b/public/java/test/org/broadinstitute/sting/gatk/walkers/genotyper/GenotypeLikelihoodsUnitTest.java @@ -1,7 +1,6 @@ package org.broadinstitute.sting.gatk.walkers.genotyper; import org.testng.Assert; -import org.broadinstitute.sting.utils.genotype.DiploidGenotype; import org.broadinstitute.sting.BaseTest; import org.testng.annotations.Test; diff --git a/public/java/test/org/broadinstitute/sting/gatk/walkers/genotyper/UnifiedGenotyperIntegrationTest.java b/public/java/test/org/broadinstitute/sting/gatk/walkers/genotyper/UnifiedGenotyperIntegrationTest.java index 7ef75ec53..b80f214b1 100755 --- a/public/java/test/org/broadinstitute/sting/gatk/walkers/genotyper/UnifiedGenotyperIntegrationTest.java +++ b/public/java/test/org/broadinstitute/sting/gatk/walkers/genotyper/UnifiedGenotyperIntegrationTest.java @@ -18,8 +18,8 @@ import java.util.Map; public class UnifiedGenotyperIntegrationTest extends WalkerTest { private final static String baseCommand = "-T 
UnifiedGenotyper -R " + b36KGReference + " -NO_HEADER -glm BOTH --dbsnp " + b36dbSNP129; - private final static String baseCommandIndels = "-T UnifiedGenotyper -R " + b36KGReference + " -NO_HEADER -glm INDEL --dbsnp " + b36dbSNP129; - private final static String baseCommandIndelsb37 = "-T UnifiedGenotyper -R " + b37KGReference + " -NO_HEADER -glm INDEL --dbsnp " + b37dbSNP132; + private final static String baseCommandIndels = "-T UnifiedGenotyper -R " + b36KGReference + " -NO_HEADER -glm INDEL -mbq 20 --dbsnp " + b36dbSNP129; + private final static String baseCommandIndelsb37 = "-T UnifiedGenotyper -R " + b37KGReference + " -NO_HEADER -glm INDEL -mbq 20 --dbsnp " + b37dbSNP132; // -------------------------------------------------------------------------------------------------------------- // @@ -30,7 +30,7 @@ public class UnifiedGenotyperIntegrationTest extends WalkerTest { public void testMultiSamplePilot1() { WalkerTest.WalkerTestSpec spec = new WalkerTest.WalkerTestSpec( baseCommand + " -I " + validationDataLocation + "low_coverage_CEU.chr1.10k-11k.bam -o %s -L 1:10,022,000-10,025,000", 1, - Arrays.asList("e6639ea2dc81635c706e6c35921406d7")); + Arrays.asList("b27939251539439a382538e507e03507")); executeTest("test MultiSample Pilot1", spec); } @@ -43,7 +43,7 @@ public class UnifiedGenotyperIntegrationTest extends WalkerTest { WalkerTest.WalkerTestSpec spec2 = new WalkerTest.WalkerTestSpec( baseCommand + " --output_mode EMIT_ALL_SITES --genotyping_mode GENOTYPE_GIVEN_ALLELES -alleles " + validationDataLocation + "allelesForUG.vcf -I " + validationDataLocation + "pilot2_daughters.chr20.10k-11k.bam -o %s -L 20:10,000,000-10,025,000", 1, - Arrays.asList("ec43daadfb15b00b41aeb0017a45df0b")); + Arrays.asList("6458f3b8fe4954e2ffc2af972aaab19e")); executeTest("test MultiSample Pilot2 with alleles passed in and emitting all sites", spec2); } @@ -51,7 +51,7 @@ public class UnifiedGenotyperIntegrationTest extends WalkerTest { public void testSingleSamplePilot2() { 
WalkerTest.WalkerTestSpec spec = new WalkerTest.WalkerTestSpec( baseCommand + " -I " + validationDataLocation + "NA12878.1kg.p2.chr1_10mb_11_mb.SLX.bam -o %s -L 1:10,000,000-10,100,000", 1, - Arrays.asList("d1cbd1fb9f3f7323941a95bc2def7e5a")); + Arrays.asList("6762b72ae60155ad71738d7c76b80e4b")); executeTest("test SingleSample Pilot2", spec); } @@ -61,7 +61,7 @@ public class UnifiedGenotyperIntegrationTest extends WalkerTest { // // -------------------------------------------------------------------------------------------------------------- - private final static String COMPRESSED_OUTPUT_MD5 = "2732b169cdccb21eb3ea00429619de79"; + private final static String COMPRESSED_OUTPUT_MD5 = "bc71dba7bbdb23e7d5cc60461fdd897b"; @Test public void testCompressedOutput() { @@ -82,7 +82,7 @@ public class UnifiedGenotyperIntegrationTest extends WalkerTest { // Note that we need to turn off any randomization for this to work, so no downsampling and no annotations - String md5 = "cbac3960bbcb9d6192c57549208c182c"; + String md5 = "b9504e446b9313559c3ed97add7e8dc1"; WalkerTest.WalkerTestSpec spec1 = new WalkerTest.WalkerTestSpec( baseCommand + " -dt NONE -G none -I " + validationDataLocation + "NA12878.1kg.p2.chr1_10mb_11_mb.SLX.bam -o %s -L 1:10,000,000-10,075,000", 1, @@ -113,9 +113,8 @@ public class UnifiedGenotyperIntegrationTest extends WalkerTest { @Test public void testCallingParameters() { HashMap e = new HashMap(); - e.put( "--min_base_quality_score 26", "531966aee1cd5dced61c96c4fedb59a9" ); - e.put( "--min_mapping_quality_score 26", "c71ca370947739cb7d87b59452be7a07" ); - e.put( "--computeSLOD", "1a5648f26c18ced27df4be031b44e72d" ); + e.put( "--min_base_quality_score 26", "bb3f294eab3e2cf52c70e63b23aac5ee" ); + e.put( "--computeSLOD", "eb34979efaadba1e34bd82bcacf5c722" ); for ( Map.Entry entry : e.entrySet() ) { WalkerTest.WalkerTestSpec spec = new WalkerTest.WalkerTestSpec( @@ -161,8 +160,8 @@ public class UnifiedGenotyperIntegrationTest extends WalkerTest { @Test public 
void testHeterozyosity() { HashMap e = new HashMap(); - e.put( 0.01, "aed69402ddffe7f2ed5ca98563bfba02" ); - e.put( 1.0 / 1850, "fa94a059f08c1821b721335d93ed2ea5" ); + e.put( 0.01, "f84da90c310367bd51f2ab6e346fa3d8" ); + e.put( 1.0 / 1850, "5791e7fef40d4412b6d8f84e0a809c6c" ); for ( Map.Entry entry : e.entrySet() ) { WalkerTest.WalkerTestSpec spec = new WalkerTest.WalkerTestSpec( @@ -186,7 +185,7 @@ public class UnifiedGenotyperIntegrationTest extends WalkerTest { " -o %s" + " -L 1:10,000,000-10,100,000", 1, - Arrays.asList("1c080e6596d4c830bb5d147b04e2a82c")); + Arrays.asList("9cc9538ac83770e12bd0830d285bfbd0")); executeTest(String.format("test multiple technologies"), spec); } @@ -205,7 +204,7 @@ public class UnifiedGenotyperIntegrationTest extends WalkerTest { " -L 1:10,000,000-10,100,000" + " -baq CALCULATE_AS_NECESSARY", 1, - Arrays.asList("9129ad748ca3be2d3b321d2d7e83ae5b")); + Arrays.asList("eaf8043edb46dfbe9f97ae03baa797ed")); executeTest(String.format("test calling with BAQ"), spec); } @@ -224,7 +223,7 @@ public class UnifiedGenotyperIntegrationTest extends WalkerTest { " -o %s" + " -L 1:10,000,000-10,500,000", 1, - Arrays.asList("0bece77ce6bc447438ef9b2921b2dc41")); + Arrays.asList("eeba568272f9b42d5450da75c7cc6d2d")); executeTest(String.format("test indel caller in SLX"), spec); } @@ -241,7 +240,7 @@ public class UnifiedGenotyperIntegrationTest extends WalkerTest { 1, Arrays.asList("5fe98ee853586dc9db58f0bc97daea63")); - executeTest(String.format("test indel caller in SLX witn low min allele count"), spec); + executeTest(String.format("test indel caller in SLX with low min allele count"), spec); } @Test @@ -252,38 +251,47 @@ public class UnifiedGenotyperIntegrationTest extends WalkerTest { " -o %s" + " -L 1:10,000,000-10,500,000", 1, - Arrays.asList("790b1a1d6ab79eee8c24812bb8ca6fae")); + Arrays.asList("19ff9bd3139480bdf79dcbf117cf2b24")); executeTest(String.format("test indel calling, multiple technologies"), spec); } @Test - public void 
testWithIndelAllelesPassedIn() { + public void testWithIndelAllelesPassedIn1() { WalkerTest.WalkerTestSpec spec1 = new WalkerTest.WalkerTestSpec( baseCommandIndels + " --genotyping_mode GENOTYPE_GIVEN_ALLELES -alleles " + validationDataLocation + "indelAllelesForUG.vcf -I " + validationDataLocation + "pilot2_daughters.chr20.10k-11k.bam -o %s -L 20:10,000,000-10,100,000", 1, - Arrays.asList("408d3aba4d094c067fc00a43992c2292")); + Arrays.asList("118918f2e9e56a3cfc5ccb2856d529c8")); executeTest("test MultiSample Pilot2 indels with alleles passed in", spec1); + } + @Test + public void testWithIndelAllelesPassedIn2() { WalkerTest.WalkerTestSpec spec2 = new WalkerTest.WalkerTestSpec( baseCommandIndels + " --output_mode EMIT_ALL_SITES --genotyping_mode GENOTYPE_GIVEN_ALLELES -alleles " + validationDataLocation + "indelAllelesForUG.vcf -I " + validationDataLocation + "pilot2_daughters.chr20.10k-11k.bam -o %s -L 20:10,000,000-10,100,000", 1, - Arrays.asList("94977d6e42e764280e9deaf4e3ac8c80")); + Arrays.asList("a20799237accd52c1b8c2ac096309c8f")); executeTest("test MultiSample Pilot2 indels with alleles passed in and emitting all sites", spec2); + } + + @Test + public void testWithIndelAllelesPassedIn3() { WalkerTest.WalkerTestSpec spec3 = new WalkerTest.WalkerTestSpec( baseCommandIndels + " --genotyping_mode GENOTYPE_GIVEN_ALLELES -alleles " + validationDataLocation + "ALL.wgs.union_v2.20101123.indels.sites.vcf -I " + validationDataLocation + "pilot2_daughters.chr20.10k-11k.bam -o %s -L 20:10,000,000-10,080,000", 1, - Arrays.asList("e66b7321e2ac91742ad3ef91040daafd")); + Arrays.asList("18ef8181157b4ac3eb8492f538467f92")); executeTest("test MultiSample Pilot2 indels with complicated records", spec3); + } + @Test + public void testWithIndelAllelesPassedIn4() { WalkerTest.WalkerTestSpec spec4 = new WalkerTest.WalkerTestSpec( baseCommandIndelsb37 + " --genotyping_mode GENOTYPE_GIVEN_ALLELES -alleles " + validationDataLocation + 
"ALL.wgs.union_v2_chr20_100_110K.20101123.indels.sites.vcf -I " + validationDataLocation + "phase1_GBR_realigned.chr20.100K-110K.bam -o %s -L 20:100,000-110,000", 1, - Arrays.asList("4be308fd9e8167ebee677f62a7a753b7")); + Arrays.asList("ad884e511a751b05e64db5314314365a")); executeTest("test MultiSample 1000G Phase1 indels with complicated records emitting all sites", spec4); - } @Test diff --git a/public/java/test/org/broadinstitute/sting/gatk/walkers/indels/RealignerTargetCreatorIntegrationTest.java b/public/java/test/org/broadinstitute/sting/gatk/walkers/indels/RealignerTargetCreatorIntegrationTest.java index 1873ccbe2..26e23e016 100755 --- a/public/java/test/org/broadinstitute/sting/gatk/walkers/indels/RealignerTargetCreatorIntegrationTest.java +++ b/public/java/test/org/broadinstitute/sting/gatk/walkers/indels/RealignerTargetCreatorIntegrationTest.java @@ -8,22 +8,43 @@ import java.util.Arrays; public class RealignerTargetCreatorIntegrationTest extends WalkerTest { @Test - public void testIntervals() { + public void testIntervals1() { + String md5 = "3f0b63a393104d0c4158c7d1538153b8"; WalkerTest.WalkerTestSpec spec1 = new WalkerTest.WalkerTestSpec( "-T RealignerTargetCreator -R " + b36KGReference + " -I " + validationDataLocation + "NA12878.1kg.p2.chr1_10mb_11_mb.SLX.bam --mismatchFraction 0.15 -L 1:10,000,000-10,050,000 -o %s", 1, - Arrays.asList("e7accfa58415d6da80383953b1a3a986")); - executeTest("test standard", spec1); + Arrays.asList(md5)); + executeTest("test standard nt=1", spec1); WalkerTest.WalkerTestSpec spec2 = new WalkerTest.WalkerTestSpec( - "-T RealignerTargetCreator --known " + b36dbSNP129 + " -R " + b36KGReference + " -I " + validationDataLocation + "NA12878.1kg.p2.chr1_10mb_11_mb.SLX.bam -L 1:10,000,000-10,050,000 -o %s", + "-nt 4 -T RealignerTargetCreator -R " + b36KGReference + " -I " + validationDataLocation + "NA12878.1kg.p2.chr1_10mb_11_mb.SLX.bam --mismatchFraction 0.15 -L 1:10,000,000-10,050,000 -o %s", 1, - 
Arrays.asList("0367d39a122c8ac0899fb868a82ef728")); - executeTest("test dbsnp", spec2); + Arrays.asList(md5)); + executeTest("test standard nt=4", spec2); + } + @Test + public void testIntervals2() { + String md5 = "e0f745b79b679c225314a2abef4919ff"; + + WalkerTest.WalkerTestSpec spec1 = new WalkerTest.WalkerTestSpec( + "-T RealignerTargetCreator --known " + b36dbSNP129 + " -R " + b36KGReference + " -I " + validationDataLocation + "NA12878.1kg.p2.chr1_10mb_11_mb.SLX.bam -L 1:10,000,000-10,200,000 -o %s", + 1, + Arrays.asList(md5)); + executeTest("test with dbsnp nt=1", spec1); + + WalkerTest.WalkerTestSpec spec2 = new WalkerTest.WalkerTestSpec( + "-nt 4 -T RealignerTargetCreator --known " + b36dbSNP129 + " -R " + b36KGReference + " -I " + validationDataLocation + "NA12878.1kg.p2.chr1_10mb_11_mb.SLX.bam -L 1:10,000,000-10,200,000 -o %s", + 1, + Arrays.asList(md5)); + executeTest("test with dbsnp nt=4", spec2); + } + + @Test + public void testKnownsOnly() { WalkerTest.WalkerTestSpec spec3 = new WalkerTest.WalkerTestSpec( - "-T RealignerTargetCreator -R " + b36KGReference + " --known " + validationDataLocation + "NA12878.chr1_10mb_11mb.slx.indels.vcf4 -BTI known -o %s", + "-T RealignerTargetCreator -R " + b36KGReference + " --known " + validationDataLocation + "NA12878.chr1_10mb_11mb.slx.indels.vcf4 -L " + validationDataLocation + "NA12878.chr1_10mb_11mb.slx.indels.vcf4 -o %s", 1, Arrays.asList("5206cee6c01b299417bf2feeb8b3dc96")); executeTest("test rods only", spec3); diff --git a/public/java/test/org/broadinstitute/sting/gatk/walkers/validation/ValidationAmpliconsIntegrationTest.java b/public/java/test/org/broadinstitute/sting/gatk/walkers/validation/ValidationAmpliconsIntegrationTest.java index 0a0d8c5b2..155d3c4db 100755 --- a/public/java/test/org/broadinstitute/sting/gatk/walkers/validation/ValidationAmpliconsIntegrationTest.java +++ b/public/java/test/org/broadinstitute/sting/gatk/walkers/validation/ValidationAmpliconsIntegrationTest.java @@ -20,7 +20,7 @@ 
public class ValidationAmpliconsIntegrationTest extends WalkerTest { String maskVCF = validationDataLocation + "amplicon_mask_sites.vcf"; String intervalTable = validationDataLocation + "amplicon_interval_table1.table"; String testArgs = "-R " + b37KGReference + " -T ValidationAmplicons --ValidateAlleles:VCF "+siteVCF+" -o %s"; - testArgs += " --ProbeIntervals:table "+intervalTable+" -BTI ProbeIntervals --MaskAlleles:VCF "+maskVCF; + testArgs += " --ProbeIntervals:table "+intervalTable+" -L:table "+intervalTable+" --MaskAlleles:VCF "+maskVCF; testArgs += " --virtualPrimerSize 30"; WalkerTestSpec spec = new WalkerTestSpec(testArgs, 1, Arrays.asList("27f9450afa132888a8994167f0035fd7")); @@ -33,7 +33,7 @@ public class ValidationAmpliconsIntegrationTest extends WalkerTest { String maskVCF = validationDataLocation + "amplicon_mask_sites.vcf"; String intervalTable = validationDataLocation + "amplicon_interval_table1.table"; String testArgs = "-R " + b37KGReference + " -T ValidationAmplicons --ValidateAlleles:VCF "+siteVCF+" -o %s"; - testArgs += " --ProbeIntervals:table "+intervalTable+" -BTI ProbeIntervals --MaskAlleles:VCF "+maskVCF; + testArgs += " --ProbeIntervals:table "+intervalTable+" -L:table "+intervalTable+" --MaskAlleles:VCF "+maskVCF; testArgs += " --virtualPrimerSize 30 --doNotUseBWA"; WalkerTestSpec spec = new WalkerTestSpec(testArgs, 1, Arrays.asList("f2611ff1d9cd5bedaad003251fed8bc1")); @@ -46,7 +46,7 @@ public class ValidationAmpliconsIntegrationTest extends WalkerTest { String maskVCF = validationDataLocation + "amplicon_mask_sites.vcf"; String intervalTable = validationDataLocation + "amplicon_interval_table1.table"; String testArgs = "-R " + b37KGReference + " -T ValidationAmplicons --ValidateAlleles:VCF "+siteVCF+" -o %s"; - testArgs += " --ProbeIntervals:table "+intervalTable+" -BTI ProbeIntervals --MaskAlleles:VCF "+maskVCF; + testArgs += " --ProbeIntervals:table "+intervalTable+" -L:table "+intervalTable+" --MaskAlleles:VCF "+maskVCF; testArgs += 
" --virtualPrimerSize 30 --filterMonomorphic"; WalkerTestSpec spec = new WalkerTestSpec(testArgs, 1, Arrays.asList("77b3f30e38fedad812125bdf6cf3255f")); diff --git a/public/java/test/org/broadinstitute/sting/gatk/walkers/varianteval/VariantEvalIntegrationTest.java b/public/java/test/org/broadinstitute/sting/gatk/walkers/varianteval/VariantEvalIntegrationTest.java index 9fe253ecb..cd2493dde 100755 --- a/public/java/test/org/broadinstitute/sting/gatk/walkers/varianteval/VariantEvalIntegrationTest.java +++ b/public/java/test/org/broadinstitute/sting/gatk/walkers/varianteval/VariantEvalIntegrationTest.java @@ -26,7 +26,7 @@ public class VariantEvalIntegrationTest extends WalkerTest { "-EV TiTvVariantEvaluator", "-noST", "-ST FunctionalClass", - "-BTI eval", + "-L " + validationDataLocation + "snpEff.AFR.unfiltered.VariantAnnotator.output.vcf", "-o %s" ), 1, @@ -46,7 +46,7 @@ public class VariantEvalIntegrationTest extends WalkerTest { "-noEV", "-EV TiTvVariantEvaluator", "-ST Sample", - "-BTI eval", + "-L " + variantEvalTestDataRoot + "/CEU.trio.callsForVE.vcf", "-o %s" ), 1, @@ -66,7 +66,7 @@ public class VariantEvalIntegrationTest extends WalkerTest { "-noEV", "-EV CountVariants", "-noST", - "-BTI eval", + "-L " + fundamentalTestVCF, "-o %s" ), 1, @@ -87,7 +87,7 @@ public class VariantEvalIntegrationTest extends WalkerTest { "-EV CountVariants", "-noST", "-ST Novelty", - "-BTI eval", + "-L " + fundamentalTestVCF, "-o %s" ), 1, @@ -109,7 +109,7 @@ public class VariantEvalIntegrationTest extends WalkerTest { "-noST", "-ST Novelty", "-ST Filter", - "-BTI eval", + "-L " + fundamentalTestVCF, "-o %s" ), 1, @@ -130,7 +130,7 @@ public class VariantEvalIntegrationTest extends WalkerTest { "-EV CountVariants", "-noST", "-ST CpG", - "-BTI eval", + "-L " + fundamentalTestVCF, "-o %s" ), 1, @@ -151,7 +151,7 @@ public class VariantEvalIntegrationTest extends WalkerTest { "-EV CountVariants", "-noST", "-ST FunctionalClass", - "-BTI eval", + "-L " + fundamentalTestVCF, "-o %s" ), 
1, @@ -172,7 +172,7 @@ public class VariantEvalIntegrationTest extends WalkerTest { "-EV CountVariants", "-noST", "-ST Degeneracy", - "-BTI eval", + "-L " + fundamentalTestVCF, "-o %s" ), 1, @@ -193,7 +193,7 @@ public class VariantEvalIntegrationTest extends WalkerTest { "-EV CountVariants", "-noST", "-ST Sample", - "-BTI eval", + "-L " + fundamentalTestVCF, "-o %s" ), 1, @@ -216,7 +216,7 @@ public class VariantEvalIntegrationTest extends WalkerTest { "-ST JexlExpression", "-select 'DP < 20'", "-selectName DepthSelect", - "-BTI eval", + "-L " + fundamentalTestVCF, "-o %s" ), 1, @@ -241,7 +241,7 @@ public class VariantEvalIntegrationTest extends WalkerTest { "-selectName DepthLt20", "-select 'DP > 20'", "-selectName DepthGt20", - "-BTI eval", + "-L " + fundamentalTestVCF, "-o %s" ), 1, @@ -260,7 +260,7 @@ public class VariantEvalIntegrationTest extends WalkerTest { "-noEV", "-EV CountVariants", "-noST", - "-BTI eval", + "-L " + fundamentalTestVCF, "-o %s" ), 1, @@ -371,7 +371,7 @@ public class VariantEvalIntegrationTest extends WalkerTest { "-EV CompOverlap", "-sn HG00625", "-noST", - "-BTI eval", + "-L " + fundamentalTestSNPsVCF, "-o %s" ), 1, @@ -388,7 +388,7 @@ public class VariantEvalIntegrationTest extends WalkerTest { "-noEV", "-EV CompOverlap", "-noST", - "-BTI eval", + "-L " + fundamentalTestSNPsOneSampleVCF, "-o %s" ), 1, @@ -410,7 +410,7 @@ public class VariantEvalIntegrationTest extends WalkerTest { "-EV CountVariants", "-noST", "-ST AlleleCount", - "-BTI eval", + "-L " + fundamentalTestSNPsVCF, "-o %s" ), 1, diff --git a/public/java/test/org/broadinstitute/sting/gatk/walkers/variantutils/CombineVariantsIntegrationTest.java b/public/java/test/org/broadinstitute/sting/gatk/walkers/variantutils/CombineVariantsIntegrationTest.java index b65de9d36..5a4d6e6a1 100755 --- a/public/java/test/org/broadinstitute/sting/gatk/walkers/variantutils/CombineVariantsIntegrationTest.java +++ 
b/public/java/test/org/broadinstitute/sting/gatk/walkers/variantutils/CombineVariantsIntegrationTest.java @@ -78,26 +78,26 @@ public class CombineVariantsIntegrationTest extends WalkerTest { executeTest("combine PLs 1:" + new File(file1).getName() + " 2:" + new File(file2).getName(), spec); } - @Test public void test1SNP() { test1InOut("pilot2.snps.vcf4.genotypes.vcf", "c608b9fc1e36dba6cebb4f259883f9f0"); } - @Test public void test2SNP() { test1InOut("pilot2.snps.vcf4.genotypes.vcf", "20caad94411d6ab48153b214de916df8", " -setKey foo"); } - @Test public void test3SNP() { test1InOut("pilot2.snps.vcf4.genotypes.vcf", "004f3065cb1bc2ce2f9afd695caf0b48", " -setKey null"); } + @Test public void test1SNP() { test1InOut("pilot2.snps.vcf4.genotypes.vcf", "ea0a660cd04101ce7b534aba0310721d"); } + @Test public void test2SNP() { test1InOut("pilot2.snps.vcf4.genotypes.vcf", "cb0350e7a9d2483993482b69f5432b64", " -setKey foo"); } + @Test public void test3SNP() { test1InOut("pilot2.snps.vcf4.genotypes.vcf", "0571c48cc59cf244779caae52d562e79", " -setKey null"); } @Test public void testOfficialCEUPilotCalls() { test1InOut("CEU.trio.2010_03.genotypes.vcf.gz", "c9c901ff9ef2a982624b203a8086dff0"); } // official project VCF files in tabix format - @Test public void test1Indel1() { test1InOut("CEU.dindel.vcf4.trio.2010_06.indel.genotypes.vcf", "7593be578d4274d672fc22fced38012b"); } + @Test public void test1Indel1() { test1InOut("CEU.dindel.vcf4.trio.2010_06.indel.genotypes.vcf", "75901304abc1daa41b1906f881aa7bbc"); } @Test public void test1Indel2() { test1InOut("CEU.dindel.vcf4.low_coverage.2010_06.indel.genotypes.vcf", "1cd467863c4e948fadd970681552d57e"); } - @Test public void combineWithPLs() { combinePLs("combine.3.vcf", "combine.4.vcf", "0f873fed02aa99db5b140bcd6282c10a"); } + @Test public void combineWithPLs() { combinePLs("combine.3.vcf", "combine.4.vcf", "d08e933b6c81246e998d3ece50ddfdcc"); } - @Test public void combineTrioCalls() { combine2("CEU.trio.2010_03.genotypes.vcf.gz", 
"YRI.trio.2010_03.genotypes.vcf.gz", "", "1d5a021387a8a86554db45a29f66140f"); } // official project VCF files in tabix format - @Test public void combineTrioCallsMin() { combine2("CEU.trio.2010_03.genotypes.vcf.gz", "YRI.trio.2010_03.genotypes.vcf.gz", " -minimalVCF", "96941ee177b0614a9879af0ac3218963"); } // official project VCF files in tabix format - @Test public void combine2Indels() { combine2("CEU.dindel.vcf4.trio.2010_06.indel.genotypes.vcf", "CEU.dindel.vcf4.low_coverage.2010_06.indel.genotypes.vcf", "", "a8a6e7589f22e0b6c5d222066b9a2093"); } + @Test public void combineTrioCalls() { combine2("CEU.trio.2010_03.genotypes.vcf.gz", "YRI.trio.2010_03.genotypes.vcf.gz", "", "01967686e0e02dbccd2590b70f2d049b"); } // official project VCF files in tabix format + @Test public void combineTrioCallsMin() { combine2("CEU.trio.2010_03.genotypes.vcf.gz", "YRI.trio.2010_03.genotypes.vcf.gz", " -minimalVCF", "8c113199c4a93a4a408104b735d59044"); } // official project VCF files in tabix format + @Test public void combine2Indels() { combine2("CEU.dindel.vcf4.trio.2010_06.indel.genotypes.vcf", "CEU.dindel.vcf4.low_coverage.2010_06.indel.genotypes.vcf", "", "30e96a0cb614cd5bc056e1f7ec6d10bd"); } @Test public void combineSNPsAndIndels() { combine2("CEU.trio.2010_03.genotypes.vcf.gz", "CEU.dindel.vcf4.low_coverage.2010_06.indel.genotypes.vcf", "", "e144b6283765494bfe8189ac59965083"); } - @Test public void uniqueSNPs() { combine2("pilot2.snps.vcf4.genotypes.vcf", "yri.trio.gatk_glftrio.intersection.annotated.filtered.chr1.vcf", "", "89f55abea8f59e39d1effb908440548c"); } + @Test public void uniqueSNPs() { combine2("pilot2.snps.vcf4.genotypes.vcf", "yri.trio.gatk_glftrio.intersection.annotated.filtered.chr1.vcf", "", "78a49597f1abf1c738e67d50c8fbed2b"); } - @Test public void omniHM3Union() { combineSites(" -filteredRecordsMergeType KEEP_IF_ANY_UNFILTERED", "c6adeda751cb2a08690dd9202356629f"); } - @Test public void omniHM3Intersect() { combineSites(" -filteredRecordsMergeType 
KEEP_IF_ALL_UNFILTERED", "3a08fd5ee18993dfc8882156ccf5d2e9"); } + @Test public void omniHM3Union() { combineSites(" -filteredRecordsMergeType KEEP_IF_ANY_UNFILTERED", "4c63bfa5f73793aaca42e130ec49f238"); } + @Test public void omniHM3Intersect() { combineSites(" -filteredRecordsMergeType KEEP_IF_ALL_UNFILTERED", "86e326acbd8d2af8a6040eb146d92fc6"); } @Test public void threeWayWithRefs() { WalkerTestSpec spec = new WalkerTestSpec( @@ -110,7 +110,7 @@ public class CombineVariantsIntegrationTest extends WalkerTest { " -priority NA19240_BGI,NA19240_ILLUMINA,NA19240_WUGSC,denovoInfo" + " -genotypeMergeOptions UNIQUIFY -L 1"), 1, - Arrays.asList("212d9d3df10bb29e2c7fb226da422dc0")); + Arrays.asList("b14f8cbb5d03a2e613b12da4da9efd9a")); executeTest("threeWayWithRefs", spec); } @@ -127,17 +127,17 @@ public class CombineVariantsIntegrationTest extends WalkerTest { executeTest("combineComplexSites 1:" + new File(file1).getName() + " 2:" + new File(file2).getName() + " args = " + args, spec); } - @Test public void complexTestFull() { combineComplexSites("", "b5a53ee92bdaacd2bb3327e9004ae058"); } - @Test public void complexTestMinimal() { combineComplexSites(" -minimalVCF", "df96cb3beb2dbb5e02f80abec7d3571e"); } - @Test public void complexTestSitesOnly() { combineComplexSites(" -sites_only", "f704caeaaaed6711943014b847fe381a"); } - @Test public void complexTestSitesOnlyMinimal() { combineComplexSites(" -sites_only -minimalVCF", "f704caeaaaed6711943014b847fe381a"); } + @Test public void complexTestFull() { combineComplexSites("", "2842337e9943366f7a4d5f148f701b8c"); } + @Test public void complexTestMinimal() { combineComplexSites(" -minimalVCF", "39724318e6265d0318a3fe4609612785"); } + @Test public void complexTestSitesOnly() { combineComplexSites(" -sites_only", "fe9bb02ab8b3d0dd2ad6373ebdb6d915"); } + @Test public void complexTestSitesOnlyMinimal() { combineComplexSites(" -sites_only -minimalVCF", "fe9bb02ab8b3d0dd2ad6373ebdb6d915"); } @Test public void 
combineDBSNPDuplicateSites() { WalkerTestSpec spec = new WalkerTestSpec( "-T CombineVariants -NO_HEADER -L 1:902000-903000 -o %s -R " + b37KGReference + " -V:v1 " + b37dbSNP132, 1, - Arrays.asList("")); + Arrays.asList("5969446769cb8377daa2db29304ae6b5")); executeTest("combineDBSNPDuplicateSites:", spec); } } \ No newline at end of file diff --git a/public/java/test/org/broadinstitute/sting/gatk/walkers/variantutils/SelectVariantsIntegrationTest.java b/public/java/test/org/broadinstitute/sting/gatk/walkers/variantutils/SelectVariantsIntegrationTest.java index 20409d4ca..6e994be3a 100755 --- a/public/java/test/org/broadinstitute/sting/gatk/walkers/variantutils/SelectVariantsIntegrationTest.java +++ b/public/java/test/org/broadinstitute/sting/gatk/walkers/variantutils/SelectVariantsIntegrationTest.java @@ -16,7 +16,7 @@ public class SelectVariantsIntegrationTest extends WalkerTest { String samplesFile = validationDataLocation + "SelectVariants.samples.txt"; WalkerTestSpec spec = new WalkerTestSpec( - baseTestString(" -sn A -se '[CDH]' -sf " + samplesFile + " -env -ef -select 'DP < 250' --variant:VCF3 " + testfile), + baseTestString(" -sn A -se '[CDH]' -sf " + samplesFile + " -env -ef -select 'DP < 250' --variant " + testfile), 1, Arrays.asList("d18516c1963802e92cb9e425c0b75fd6") ); @@ -30,7 +30,7 @@ public class SelectVariantsIntegrationTest extends WalkerTest { String samplesFile = validationDataLocation + "SelectVariants.samples.txt"; WalkerTestSpec spec = new WalkerTestSpec( - "-T SelectVariants -R " + b36KGReference + " -L 1:1-1000000 -o %s -NO_HEADER -xl_sn A -xl_sf " + samplesFile + " --variant:VCF3 " + testfile, + "-T SelectVariants -R " + b36KGReference + " -L 1:1-1000000 -o %s -NO_HEADER -xl_sn A -xl_sf " + samplesFile + " --variant " + testfile, 1, Arrays.asList("730f021fd6ecf1d195dabbee2e233bfd") ); @@ -43,7 +43,7 @@ public class SelectVariantsIntegrationTest extends WalkerTest { String testfile = validationDataLocation + "test.dup.vcf"; WalkerTestSpec 
spec = new WalkerTestSpec( - baseTestString(" -sn A -sn B -sn C --variant:VCF3 " + testfile), + baseTestString(" -sn A -sn B -sn C --variant " + testfile), 1, Arrays.asList("b74038779fe6485dbb8734ae48178356") ); @@ -56,7 +56,7 @@ public class SelectVariantsIntegrationTest extends WalkerTest { String testFile = validationDataLocation + "NA12878.hg19.example1.vcf"; WalkerTestSpec spec = new WalkerTestSpec( - "-T SelectVariants -R " + hg19Reference + " -sn NA12878 -L 20:1012700-1020000 --variant:VCF " + b37hapmapGenotypes + " -disc:VCF " + testFile + " -o %s -NO_HEADER", + "-T SelectVariants -R " + hg19Reference + " -sn NA12878 -L 20:1012700-1020000 --variant " + b37hapmapGenotypes + " -disc " + testFile + " -o %s -NO_HEADER", 1, Arrays.asList("78e6842325f1f1bc9ab30d5e7737ee6e") ); @@ -64,12 +64,25 @@ public class SelectVariantsIntegrationTest extends WalkerTest { executeTest("testDiscordance--" + testFile, spec); } + @Test + public void testDiscordanceNoSampleSpecified() { + String testFile = validationDataLocation + "NA12878.hg19.example1.vcf"; + + WalkerTestSpec spec = new WalkerTestSpec( + "-T SelectVariants -R " + hg19Reference + " -L 20:1012700-1020000 --variant " + b37hapmapGenotypes + " -disc " + testFile + " -o %s -NO_HEADER", + 1, + Arrays.asList("5d7d899c0c4954ec59104aebfe4addd5") + ); + + executeTest("testDiscordanceNoSampleSpecified--" + testFile, spec); + } + @Test public void testConcordance() { String testFile = validationDataLocation + "NA12878.hg19.example1.vcf"; WalkerTestSpec spec = new WalkerTestSpec( - "-T SelectVariants -R " + hg19Reference + " -sn NA12878 -L 20:1012700-1020000 -conc:VCF " + b37hapmapGenotypes + " --variant " + testFile + " -o %s -NO_HEADER", + "-T SelectVariants -R " + hg19Reference + " -sn NA12878 -L 20:1012700-1020000 -conc " + b37hapmapGenotypes + " --variant " + testFile + " -o %s -NO_HEADER", 1, Arrays.asList("d2ba3ea30a810f6f0fbfb1b643292b6a") ); @@ -90,16 +103,16 @@ public class SelectVariantsIntegrationTest extends 
WalkerTest { executeTest("testVariantTypeSelection--" + testFile, spec); } - @Test(enabled=false) - public void testRemovePLs() { + @Test + public void testUsingDbsnpName() { String testFile = validationDataLocation + "combine.3.vcf"; WalkerTestSpec spec = new WalkerTestSpec( - "-T SelectVariants -R " + b36KGReference + " -sn NA12892 --variant " + testFile + " -o %s -NO_HEADER", + "-T SelectVariants -R " + b36KGReference + " -sn NA12892 --variant:dbsnp " + testFile + " -o %s -NO_HEADER", 1, - Arrays.asList("") + Arrays.asList("167a1265df820978a74c267df44d5c43") ); - executeTest("testWithPLs--" + testFile, spec); + executeTest("testUsingDbsnpName--" + testFile, spec); } } diff --git a/public/java/test/org/broadinstitute/sting/utils/R/RScriptExecutorUnitTest.java b/public/java/test/org/broadinstitute/sting/utils/R/RScriptExecutorUnitTest.java index 836a4473f..f597694bb 100644 --- a/public/java/test/org/broadinstitute/sting/utils/R/RScriptExecutorUnitTest.java +++ b/public/java/test/org/broadinstitute/sting/utils/R/RScriptExecutorUnitTest.java @@ -26,60 +26,84 @@ package org.broadinstitute.sting.utils.R; import org.apache.commons.io.FileUtils; import org.broadinstitute.sting.BaseTest; -import org.broadinstitute.sting.utils.exceptions.UserException; +import org.broadinstitute.sting.utils.io.IOUtils; +import org.testng.Assert; import org.testng.annotations.Test; import java.io.File; -import java.io.IOException; -import java.util.ArrayList; -import java.util.List; /** * Basic unit test for RScriptExecutor in reduced reads */ public class RScriptExecutorUnitTest extends BaseTest { - final static String testrscript = "print(\"hello, world\")\n"; - final static String publicRScript = "plot_Tranches.R"; - // -------------------------------------------------------------------------------- - // - // Difference testing routines - // - // -------------------------------------------------------------------------------- - - private void testOne(String script, String pathToRscript, 
String anotherSearchPath, boolean exceptOnError) { - RScriptExecutor.RScriptArgumentCollection collection = - new RScriptExecutor.RScriptArgumentCollection(); - if ( pathToRscript != null ) - collection.PATH_TO_RSCRIPT = pathToRscript; - if ( anotherSearchPath != null ) { - List x = new ArrayList(collection.PATH_TO_RESOURCES); - x.add(anotherSearchPath); - collection.PATH_TO_RESOURCES = x; - } - RScriptExecutor executor = new RScriptExecutor(collection, exceptOnError); - executor.callRScripts(script); - } + private static final String HELLO_WORLD_SCRIPT = "print('hello, world')"; + private static final String GSALIB_LOADED_SCRIPT = "if (!'package:gsalib' %in% search()) stop('gsalib not loaded')"; @Test - public void testPublic() { testOne(publicRScript, null, null, true); } - - @Test(expectedExceptions = UserException.class) - public void testNonExistantScriptException() { testOne("does_not_exist.R", null, null, true); } - - @Test() - public void testNonExistantScriptNoException() { testOne("does_not_exist.R", null, null, false); } - - @Test(expectedExceptions = UserException.class) - public void testNonExistantRScriptException() { testOne(publicRScript, "badRScriptValue", null, true); } - - @Test() - public void testNonExistantRScriptNoException() { testOne(publicRScript, "badRScriptValue", null, false); } - - @Test() - public void testScriptInNewPath() throws IOException { - File t = createTempFile("myTestScript", ".R"); - FileUtils.writeStringToFile(t, testrscript); - testOne(t.getName(), null, t.getParent(), true); + public void testRscriptExists() { + Assert.assertTrue(RScriptExecutor.RSCRIPT_EXISTS, "Rscript not found in environment ${PATH}"); } -} \ No newline at end of file + + @Test(dependsOnMethods = "testRscriptExists") + public void testExistingScript() { + File script = writeScript(HELLO_WORLD_SCRIPT); + try { + RScriptExecutor executor = new RScriptExecutor(); + executor.addScript(script); + executor.setExceptOnError(true); + 
Assert.assertTrue(executor.exec(), "Exec failed"); + } finally { + FileUtils.deleteQuietly(script); + } + } + + @Test(dependsOnMethods = "testRscriptExists", expectedExceptions = RScriptExecutorException.class) + public void testNonExistantScriptException() { + RScriptExecutor executor = new RScriptExecutor(); + executor.setExceptOnError(true); + executor.addScript(new File("does_not_exists.R")); + executor.exec(); + } + + @Test(dependsOnMethods = "testRscriptExists") + public void testNonExistantScriptNoException() { + logger.warn("Testing that warning is printed an no exception thrown for missing script."); + RScriptExecutor executor = new RScriptExecutor(); + executor.setExceptOnError(false); + executor.addScript(new File("does_not_exists.R")); + Assert.assertFalse(executor.exec(), "Exec should have returned false when the job failed"); + } + + @Test(dependsOnMethods = "testRscriptExists") + public void testLibrary() { + File script = writeScript(GSALIB_LOADED_SCRIPT); + try { + RScriptExecutor executor = new RScriptExecutor(); + executor.addScript(script); + executor.addLibrary(RScriptLibrary.GSALIB); + executor.setExceptOnError(true); + Assert.assertTrue(executor.exec(), "Exec failed"); + } finally { + FileUtils.deleteQuietly(script); + } + } + + @Test(dependsOnMethods = "testRscriptExists", expectedExceptions = RScriptExecutorException.class) + public void testLibraryMissing() { + File script = writeScript(GSALIB_LOADED_SCRIPT); + try { + RScriptExecutor executor = new RScriptExecutor(); + executor.addScript(script); + // GSALIB is not added nor imported in the script + executor.setExceptOnError(true); + executor.exec(); + } finally { + FileUtils.deleteQuietly(script); + } + } + + private File writeScript(String content) { + return IOUtils.writeTempFile(content, "myTestScript", ".R"); + } +} diff --git a/public/java/test/org/broadinstitute/sting/utils/R/RScriptLibraryUnitTest.java b/public/java/test/org/broadinstitute/sting/utils/R/RScriptLibraryUnitTest.java 
new file mode 100644 index 000000000..19fd5b316 --- /dev/null +++ b/public/java/test/org/broadinstitute/sting/utils/R/RScriptLibraryUnitTest.java @@ -0,0 +1,46 @@ +/* + * Copyright (c) 2011, The Broad Institute + * + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The above copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * OTHER DEALINGS IN THE SOFTWARE. 
+ */ + +package org.broadinstitute.sting.utils.R; + +import org.apache.commons.io.FileUtils; +import org.testng.Assert; +import org.testng.annotations.Test; + +import java.io.File; + +public class RScriptLibraryUnitTest { + @Test + public void testProperties() { + Assert.assertEquals(RScriptLibrary.GSALIB.getLibraryName(), "gsalib"); + Assert.assertEquals(RScriptLibrary.GSALIB.getResourcePath(), "gsalib.tar.gz"); + } + + @Test + public void testWriteTemp() { + File file = RScriptLibrary.GSALIB.writeTemp(); + Assert.assertTrue(file.exists(), "R library was not written to temp file: " + file); + FileUtils.deleteQuietly(file); + } +} diff --git a/public/java/test/org/broadinstitute/sting/utils/ReadUtilsUnitTest.java b/public/java/test/org/broadinstitute/sting/utils/ReadUtilsUnitTest.java index 7cb7fec98..bc39d714e 100755 --- a/public/java/test/org/broadinstitute/sting/utils/ReadUtilsUnitTest.java +++ b/public/java/test/org/broadinstitute/sting/utils/ReadUtilsUnitTest.java @@ -3,18 +3,20 @@ package org.broadinstitute.sting.utils; import net.sf.samtools.SAMFileHeader; import net.sf.samtools.SAMRecord; import org.broadinstitute.sting.BaseTest; +import org.broadinstitute.sting.utils.pileup.PileupElement; import org.broadinstitute.sting.utils.sam.ArtificialSAMUtils; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; import org.broadinstitute.sting.utils.sam.ReadUtils; import org.testng.Assert; -import org.testng.annotations.BeforeClass; import org.testng.annotations.BeforeTest; import org.testng.annotations.Test; public class ReadUtilsUnitTest extends BaseTest { - SAMRecord read; + GATKSAMRecord read, reducedRead; final static String BASES = "ACTG"; final static String QUALS = "!+5?"; + final private static byte[] REDUCED_READ_COUNTS = new byte[]{10, 20, 30, 40}; @BeforeTest public void init() { @@ -23,9 +25,14 @@ public class ReadUtilsUnitTest extends BaseTest { read.setReadUnmappedFlag(true); read.setReadBases(new String(BASES).getBytes()); 
read.setBaseQualityString(new String(QUALS)); + + reducedRead = ArtificialSAMUtils.createArtificialRead(header, "reducedRead", 0, 1, BASES.length()); + reducedRead.setReadBases(BASES.getBytes()); + reducedRead.setBaseQualityString(QUALS); + reducedRead.setAttribute(GATKSAMRecord.REDUCED_READ_QUALITY_TAG, REDUCED_READ_COUNTS); } - private void testReadBasesAndQuals(SAMRecord read, int expectedStart, int expectedStop) { + private void testReadBasesAndQuals(GATKSAMRecord read, int expectedStart, int expectedStop) { SAMRecord clipped = ReadUtils.hardClipBases(read, expectedStart, expectedStop - 1, null); String expectedBases = BASES.substring(expectedStart, expectedStop); String expectedQuals = QUALS.substring(expectedStart, expectedStop); @@ -38,4 +45,27 @@ public class ReadUtilsUnitTest extends BaseTest { @Test public void testClip2Front() { testReadBasesAndQuals(read, 2, 4); } @Test public void testClip1Back() { testReadBasesAndQuals(read, 0, 3); } @Test public void testClip2Back() { testReadBasesAndQuals(read, 0, 2); } + + @Test + public void testReducedReads() { + Assert.assertFalse(read.isReducedRead(), "isReducedRead is false for normal read"); + Assert.assertEquals(read.getReducedReadCounts(), null, "No reduced read tag in normal read"); + + Assert.assertTrue(reducedRead.isReducedRead(), "isReducedRead is true for reduced read"); + for ( int i = 0; i < reducedRead.getReadLength(); i++) { + Assert.assertEquals(reducedRead.getReducedCount(i), REDUCED_READ_COUNTS[i], "Reduced read count not set to the expected value at " + i); + } + } + + @Test + public void testReducedReadPileupElement() { + PileupElement readp = new PileupElement(read,0); + PileupElement reducedreadp = new PileupElement(reducedRead,0); + + Assert.assertFalse(readp.isReducedRead()); + + Assert.assertTrue(reducedreadp.isReducedRead()); + Assert.assertEquals(reducedreadp.getRepresentativeCount(), REDUCED_READ_COUNTS[0]); + Assert.assertEquals(reducedreadp.getQual(), readp.getQual()); + } } diff 
--git a/public/java/test/org/broadinstitute/sting/utils/ReservoirDownsamplerUnitTest.java b/public/java/test/org/broadinstitute/sting/utils/ReservoirDownsamplerUnitTest.java index 76dd5d341..0f19e2f90 100644 --- a/public/java/test/org/broadinstitute/sting/utils/ReservoirDownsamplerUnitTest.java +++ b/public/java/test/org/broadinstitute/sting/utils/ReservoirDownsamplerUnitTest.java @@ -1,5 +1,6 @@ package org.broadinstitute.sting.utils; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; import org.testng.Assert; import org.testng.annotations.Test; import org.broadinstitute.sting.utils.sam.ArtificialSAMUtils; @@ -28,7 +29,7 @@ public class ReservoirDownsamplerUnitTest { @Test public void testOneElementWithPoolSizeOne() { - List reads = Collections.singletonList(ArtificialSAMUtils.createArtificialRead(header,"read1",0,1,76)); + List reads = Collections.singletonList(ArtificialSAMUtils.createArtificialRead(header,"read1",0,1,76)); ReservoirDownsampler downsampler = new ReservoirDownsampler(1); downsampler.addAll(reads); @@ -40,7 +41,7 @@ public class ReservoirDownsamplerUnitTest { @Test public void testOneElementWithPoolSizeGreaterThanOne() { - List reads = Collections.singletonList(ArtificialSAMUtils.createArtificialRead(header,"read1",0,1,76)); + List reads = Collections.singletonList(ArtificialSAMUtils.createArtificialRead(header,"read1",0,1,76)); ReservoirDownsampler downsampler = new ReservoirDownsampler(5); downsampler.addAll(reads); diff --git a/public/java/test/org/broadinstitute/sting/utils/bed/BedParserUnitTest.java b/public/java/test/org/broadinstitute/sting/utils/bed/BedParserUnitTest.java deleted file mode 100644 index 56bf66f53..000000000 --- a/public/java/test/org/broadinstitute/sting/utils/bed/BedParserUnitTest.java +++ /dev/null @@ -1,68 +0,0 @@ -package org.broadinstitute.sting.utils.bed; - -import org.broadinstitute.sting.utils.exceptions.UserException; -import org.testng.Assert; -import org.broadinstitute.sting.BaseTest; -import 
org.broadinstitute.sting.utils.GenomeLocParser; -import org.broadinstitute.sting.utils.GenomeLoc; -import org.broadinstitute.sting.utils.fasta.CachingIndexedFastaSequenceFile; -import org.testng.annotations.BeforeClass; -import org.testng.annotations.Test; - - -import java.io.File; -import java.io.FileNotFoundException; -import java.util.List; - -import net.sf.picard.reference.IndexedFastaSequenceFile; - - -public class BedParserUnitTest extends BaseTest { - - private static IndexedFastaSequenceFile seq; - private GenomeLocParser genomeLocParser; - private File bedFile = new File("public/testdata/sampleBedFile.bed"); - - @BeforeClass - public void beforeTests() { - File referenceFile = new File(b36KGReference); - try { - seq = new CachingIndexedFastaSequenceFile(referenceFile); - } - catch(FileNotFoundException ex) { - throw new UserException.CouldNotReadInputFile(referenceFile,ex); - } - - genomeLocParser = new GenomeLocParser(seq); - } - - @Test - public void testLoadBedFile() { - BedParser parser = new BedParser(genomeLocParser,bedFile); - List location = parser.getLocations(); - Assert.assertEquals(location.size(), 4); - } - - @Test - public void testBedParsing() { - BedParser parser = new BedParser(genomeLocParser,bedFile); - List location = parser.getLocations(); - Assert.assertEquals(location.size(), 4); - Assert.assertTrue(location.get(0).getContig().equals("20")); - Assert.assertTrue(location.get(1).getContig().equals("20")); - Assert.assertTrue(location.get(2).getContig().equals("22")); - Assert.assertTrue(location.get(3).getContig().equals("22")); - - // now check the the start positions - Assert.assertEquals(location.get(0).getStart(), 1); - Assert.assertEquals(location.get(1).getStart(), 1002); - Assert.assertEquals(location.get(2).getStart(), 1001); - Assert.assertEquals(location.get(3).getStart(), 2001); - - // now check the the stop positions - Assert.assertEquals(location.get(0).getStop(), 999); - Assert.assertEquals(location.get(1).getStop(), 
2000); - Assert.assertEquals(location.get(2).getStop(), 5000); - Assert.assertEquals(location.get(3).getStop(), 6000); - } -} diff --git a/public/java/test/org/broadinstitute/sting/utils/clipreads/ReadClipperUnitTest.java b/public/java/test/org/broadinstitute/sting/utils/clipreads/ReadClipperUnitTest.java new file mode 100644 index 000000000..f625af23c --- /dev/null +++ b/public/java/test/org/broadinstitute/sting/utils/clipreads/ReadClipperUnitTest.java @@ -0,0 +1,223 @@ +/* + * Copyright (c) 2010 The Broad Institute + * + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The above copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. + * + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR + * THE USE OR OTHER DEALINGS IN THE SOFTWARE. 
+ */ + +package org.broadinstitute.sting.utils.clipreads; + +import net.sf.samtools.SAMFileHeader; +import org.broadinstitute.sting.BaseTest; +import org.broadinstitute.sting.utils.sam.ArtificialSAMUtils; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; +import org.testng.Assert; +import org.testng.annotations.BeforeClass; +import org.testng.annotations.Test; + +/** + * Created by IntelliJ IDEA. + * User: roger + * Date: 9/28/11 + * Time: 9:54 PM + * To change this template use File | Settings | File Templates. + */ +public class ReadClipperUnitTest extends BaseTest { + + // TODO: Add error messages on failed tests + + GATKSAMRecord read, expected; + ReadClipper readClipper; + final static String BASES = "ACTG"; + final static String QUALS = "!+5?"; //ASCII values = 33,43,53,63 + + @BeforeClass + public void init() { + SAMFileHeader header = ArtificialSAMUtils.createArtificialSamHeader(1, 1, 1000); + read = ArtificialSAMUtils.createArtificialRead(header, "read1", 0, 1, BASES.length()); + read.setReadUnmappedFlag(true); + read.setReadBases(new String(BASES).getBytes()); + read.setBaseQualityString(new String(QUALS)); + + readClipper = new ReadClipper(read); + } + + @Test ( enabled = false ) + public void testHardClipBothEndsByReferenceCoordinates() { + logger.warn("Executing testHardClipBothEndsByReferenceCoordinates"); + + //Clip whole read + Assert.assertEquals(readClipper.hardClipBothEndsByReferenceCoordinates(0,0), new GATKSAMRecord(read.getHeader())); + //clip 1 base + expected = readClipper.hardClipBothEndsByReferenceCoordinates(0,3); + Assert.assertEquals(expected.getReadBases(), BASES.substring(1,3).getBytes()); + Assert.assertEquals(expected.getBaseQualityString(), QUALS.substring(1,3)); + Assert.assertEquals(expected.getCigarString(), "1H2M1H"); + + } + + @Test ( enabled = false ) + public void testHardClipByReadCoordinates() { + logger.warn("Executing testHardClipByReadCoordinates"); + + //Clip whole read + 
Assert.assertEquals(readClipper.hardClipByReadCoordinates(0,3), new GATKSAMRecord(read.getHeader())); + + //clip 1 base at start + expected = readClipper.hardClipByReadCoordinates(0,0); + Assert.assertEquals(expected.getReadBases(), BASES.substring(1,4).getBytes()); + Assert.assertEquals(expected.getBaseQualityString(), QUALS.substring(1,4)); + Assert.assertEquals(expected.getCigarString(), "1H3M"); + + //clip 1 base at end + expected = readClipper.hardClipByReadCoordinates(3,3); + Assert.assertEquals(expected.getReadBases(), BASES.substring(0,3).getBytes()); + Assert.assertEquals(expected.getBaseQualityString(), QUALS.substring(0,3)); + Assert.assertEquals(expected.getCigarString(), "3M1H"); + + //clip 2 bases at start + expected = readClipper.hardClipByReadCoordinates(0,1); + Assert.assertEquals(expected.getReadBases(), BASES.substring(2,4).getBytes()); + Assert.assertEquals(expected.getBaseQualityString(), QUALS.substring(2,4)); + Assert.assertEquals(expected.getCigarString(), "2H2M"); + + //clip 2 bases at end + expected = readClipper.hardClipByReadCoordinates(2,3); + Assert.assertEquals(expected.getReadBases(), BASES.substring(0,2).getBytes()); + Assert.assertEquals(expected.getBaseQualityString(), QUALS.substring(0,2)); + Assert.assertEquals(expected.getCigarString(), "2M2H"); + + } + + @Test ( enabled = false ) + public void testHardClipByReferenceCoordinates() { + logger.warn("Executing testHardClipByReferenceCoordinates"); + + //Clip whole read + Assert.assertEquals(readClipper.hardClipByReferenceCoordinates(1,4), new GATKSAMRecord(read.getHeader())); + + //clip 1 base at start + expected = readClipper.hardClipByReferenceCoordinates(-1,1); + Assert.assertEquals(expected.getReadBases(), BASES.substring(1,4).getBytes()); + Assert.assertEquals(expected.getBaseQualityString(), QUALS.substring(1,4)); + Assert.assertEquals(expected.getCigarString(), "1H3M"); + + //clip 1 base at end + expected = readClipper.hardClipByReferenceCoordinates(3,-1); + 
Assert.assertEquals(expected.getReadBases(), BASES.substring(0,3).getBytes()); + Assert.assertEquals(expected.getBaseQualityString(), QUALS.substring(0,3)); + Assert.assertEquals(expected.getCigarString(), "3M1H"); + + //clip 2 bases at start + expected = readClipper.hardClipByReferenceCoordinates(-1,2); + Assert.assertEquals(expected.getReadBases(), BASES.substring(2,4).getBytes()); + Assert.assertEquals(expected.getBaseQualityString(), QUALS.substring(2,4)); + Assert.assertEquals(expected.getCigarString(), "2H2M"); + + //clip 2 bases at end + expected = readClipper.hardClipByReferenceCoordinates(2,-1); + Assert.assertEquals(expected.getReadBases(), BASES.substring(0,2).getBytes()); + Assert.assertEquals(expected.getBaseQualityString(), QUALS.substring(0,2)); + Assert.assertEquals(expected.getCigarString(), "2M2H"); + + } + + @Test ( enabled = false ) + public void testHardClipByReferenceCoordinatesLeftTail() { + logger.warn("Executing testHardClipByReferenceCoordinatesLeftTail"); + + //Clip whole read + Assert.assertEquals(readClipper.hardClipByReferenceCoordinatesLeftTail(4), new GATKSAMRecord(read.getHeader())); + + //clip 1 base at start + expected = readClipper.hardClipByReferenceCoordinatesLeftTail(1); + Assert.assertEquals(expected.getReadBases(), BASES.substring(1,4).getBytes()); + Assert.assertEquals(expected.getBaseQualityString(), QUALS.substring(1,4)); + Assert.assertEquals(expected.getCigarString(), "1H3M"); + + //clip 2 bases at start + expected = readClipper.hardClipByReferenceCoordinatesLeftTail(2); + Assert.assertEquals(expected.getReadBases(), BASES.substring(2,4).getBytes()); + Assert.assertEquals(expected.getBaseQualityString(), QUALS.substring(2,4)); + Assert.assertEquals(expected.getCigarString(), "2H2M"); + + } + + @Test ( enabled = false ) + public void testHardClipByReferenceCoordinatesRightTail() { + logger.warn("Executing testHardClipByReferenceCoordinatesRightTail"); + + //Clip whole read + 
Assert.assertEquals(readClipper.hardClipByReferenceCoordinatesRightTail(1), new GATKSAMRecord(read.getHeader())); + + //clip 1 base at end + expected = readClipper.hardClipByReferenceCoordinatesRightTail(3); + Assert.assertEquals(expected.getReadBases(), BASES.substring(0,3).getBytes()); + Assert.assertEquals(expected.getBaseQualityString(), QUALS.substring(0,3)); + Assert.assertEquals(expected.getCigarString(), "3M1H"); + + //clip 2 bases at end + expected = readClipper.hardClipByReferenceCoordinatesRightTail(2); + Assert.assertEquals(expected.getReadBases(), BASES.substring(0,2).getBytes()); + Assert.assertEquals(expected.getBaseQualityString(), QUALS.substring(0,2)); + Assert.assertEquals(expected.getCigarString(), "2M2H"); + + } + + @Test ( enabled = false ) + public void testHardClipLowQualEnds() { + logger.warn("Executing testHardClipByReferenceCoordinates"); + + + //Clip whole read + Assert.assertEquals(readClipper.hardClipLowQualEnds((byte)64), new GATKSAMRecord(read.getHeader())); + + //clip 1 base at start + expected = readClipper.hardClipLowQualEnds((byte)34); + Assert.assertEquals(expected.getReadBases(), BASES.substring(1,4).getBytes()); + Assert.assertEquals(expected.getBaseQualityString(), QUALS.substring(1,4)); + Assert.assertEquals(expected.getCigarString(), "1H3M"); + + //clip 2 bases at start + expected = readClipper.hardClipLowQualEnds((byte)44); + Assert.assertEquals(expected.getReadBases(), BASES.substring(2,4).getBytes()); + Assert.assertEquals(expected.getBaseQualityString(), QUALS.substring(2,4)); + Assert.assertEquals(expected.getCigarString(), "2H2M"); + + // Reverse Quals sequence + readClipper.getRead().setBaseQualityString("?5+!"); // 63,53,43,33 + + //clip 1 base at end + expected = readClipper.hardClipLowQualEnds((byte)34); + Assert.assertEquals(expected.getReadBases(), BASES.substring(0,3).getBytes()); + Assert.assertEquals(expected.getBaseQualityString(), QUALS.substring(0,3)); + Assert.assertEquals(expected.getCigarString(), 
"3M1H"); + + //clip 2 bases at end + expected = readClipper.hardClipLowQualEnds((byte)44); + Assert.assertEquals(expected.getReadBases(), BASES.substring(0,2).getBytes()); + Assert.assertEquals(expected.getBaseQualityString(), QUALS.substring(0,2)); + Assert.assertEquals(expected.getCigarString(), "2M2H"); + + // revert Qual sequence + readClipper.getRead().setBaseQualityString(QUALS); + } +} diff --git a/public/java/test/org/broadinstitute/sting/utils/codecs/vcf/IndexFactoryUnitTest.java b/public/java/test/org/broadinstitute/sting/utils/codecs/vcf/IndexFactoryUnitTest.java index d08cda949..55bd4783b 100755 --- a/public/java/test/org/broadinstitute/sting/utils/codecs/vcf/IndexFactoryUnitTest.java +++ b/public/java/test/org/broadinstitute/sting/utils/codecs/vcf/IndexFactoryUnitTest.java @@ -1,53 +1,43 @@ package org.broadinstitute.sting.utils.codecs.vcf; +import net.sf.samtools.SAMSequenceDictionary; import org.broad.tribble.Tribble; import org.broad.tribble.index.*; import org.broad.tribble.iterators.CloseableTribbleIterator; import org.broad.tribble.source.BasicFeatureSource; +import org.broadinstitute.sting.BaseTest; import org.broadinstitute.sting.WalkerTest; +import org.broadinstitute.sting.utils.exceptions.UserException; +import org.broadinstitute.sting.utils.fasta.CachingIndexedFastaSequenceFile; import org.broadinstitute.sting.utils.variantcontext.VariantContext; import org.testng.Assert; +import org.testng.annotations.BeforeTest; import org.testng.annotations.Test; import java.io.File; +import java.io.FileNotFoundException; import java.io.IOException; import java.util.*; /** * tests out the various functions in the index factory class */ -public class IndexFactoryUnitTest { +public class IndexFactoryUnitTest extends BaseTest { File inputFile = new File("public/testdata/HiSeq.10000.vcf"); File outputFile = new File("public/testdata/onTheFlyOutputTest.vcf"); File outputFileIndex = Tribble.indexFile(outputFile); - /** - * test out scoring the indexes - */ - 
@Test - public void testScoreIndexes() { - /*// make a list of indexes to score - Map creators = new HashMap(); - // add a linear index with the default bin size - LinearIndexCreator linearNormal = new LinearIndexCreator(); - linearNormal.initialize(inputFile, linearNormal.defaultBinSize()); - creators.add(LInearIndexlinearNormal); + private SAMSequenceDictionary dict; - // create a tree index with a small index size - IntervalIndexCreator treeSmallBin = new IntervalIndexCreator(); - treeSmallBin.initialize(inputFile, Math.max(200,treeSmallBin.defaultBinSize()/10)); - creators.add(treeSmallBin); - - List indexes = new ArrayList(); - for (IndexCreator creator : creators) - indexes.add(creator.finalizeIndex(0)); - - ArrayList scores = IndexFactory.scoreIndexes(0.5,indexes,100, IndexFactory.IndexBalanceApproach.FOR_SEEK_TIME); - System.err.println("scores are : "); - for (Double score : scores) { - System.err.println(score); -*/ + @BeforeTest + public void setup() { + try { + dict = new CachingIndexedFastaSequenceFile(new File(b37KGReference)).getSequenceDictionary(); + } + catch(FileNotFoundException ex) { + throw new UserException.CouldNotReadInputFile(b37KGReference,ex); + } } // @@ -65,7 +55,7 @@ public class IndexFactoryUnitTest { BasicFeatureSource source = new BasicFeatureSource(inputFile.getAbsolutePath(), indexFromInputFile, new VCFCodec()); int counter = 0; - VCFWriter writer = new StandardVCFWriter(outputFile); + VCFWriter writer = new StandardVCFWriter(outputFile, dict); writer.writeHeader((VCFHeader)source.getHeader()); CloseableTribbleIterator it = source.iterator(); while (it.hasNext() && (counter++ < maxRecords || maxRecords == -1) ) { diff --git a/public/java/test/org/broadinstitute/sting/utils/codecs/vcf/VCFIntegrationTest.java b/public/java/test/org/broadinstitute/sting/utils/codecs/vcf/VCFIntegrationTest.java index 2ef116708..c8a0c0ed6 100644 --- a/public/java/test/org/broadinstitute/sting/utils/codecs/vcf/VCFIntegrationTest.java +++ 
b/public/java/test/org/broadinstitute/sting/utils/codecs/vcf/VCFIntegrationTest.java @@ -17,7 +17,7 @@ public class VCFIntegrationTest extends WalkerTest { String baseCommand = "-R " + b37KGReference + " -NO_HEADER -o %s "; - String test1 = baseCommand + "-T VariantAnnotator --variant " + testVCF + " -BTI variant"; + String test1 = baseCommand + "-T VariantAnnotator --variant " + testVCF + " -L " + testVCF; WalkerTestSpec spec1 = new WalkerTestSpec(test1, 1, Arrays.asList(md5ofInputVCF)); List result = executeTest("Test Variant Annotator with no changes", spec1).getFirst(); diff --git a/public/java/test/org/broadinstitute/sting/utils/fragments/FragmentUtilsBenchmark.java b/public/java/test/org/broadinstitute/sting/utils/fragments/FragmentUtilsBenchmark.java new file mode 100644 index 000000000..2771a7e45 --- /dev/null +++ b/public/java/test/org/broadinstitute/sting/utils/fragments/FragmentUtilsBenchmark.java @@ -0,0 +1,80 @@ +/* + * Copyright (c) 2011, The Broad Institute + * + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The above copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. 
IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * OTHER DEALINGS IN THE SOFTWARE. + */ + +package org.broadinstitute.sting.utils.fragments; + +import com.google.caliper.Param; +import com.google.caliper.SimpleBenchmark; +import com.google.caliper.runner.CaliperMain; +import net.sf.samtools.SAMFileHeader; +import org.broadinstitute.sting.utils.GenomeLoc; +import org.broadinstitute.sting.utils.GenomeLocParser; +import org.broadinstitute.sting.utils.pileup.ReadBackedPileup; +import org.broadinstitute.sting.utils.sam.ArtificialSAMUtils; + +import java.util.*; + +/** + * Caliper microbenchmark of fragment pileup + */ +public class FragmentUtilsBenchmark extends SimpleBenchmark { + List pileups; + + @Param({"0", "4", "30", "150", "1000"}) + int pileupSize; // set automatically by framework + + @Param({"200", "400"}) + int insertSize; // set automatically by framework + + @Override protected void setUp() { + final int nPileupsToGenerate = 100; + pileups = new ArrayList(nPileupsToGenerate); + SAMFileHeader header = ArtificialSAMUtils.createArtificialSamHeader(1, 1, 1000); + GenomeLocParser genomeLocParser; + genomeLocParser = new GenomeLocParser(header.getSequenceDictionary()); + GenomeLoc loc = genomeLocParser.createGenomeLoc("chr1", 50); + final int readLen = 100; + + for ( int pileupN = 0; pileupN < nPileupsToGenerate; pileupN++ ) { + ReadBackedPileup rbp = ArtificialSAMUtils.createReadBackedPileup(header, loc, readLen, insertSize, pileupSize); + pileups.add(rbp); + } + } + +// public void timeOriginal(int rep) { +// run(rep, FragmentUtils.FragmentMatchingAlgorithm.ORIGINAL); +// } + + public void timeSkipNonOverlapping(int rep) { + int nFrags = 0; + for ( int i = 0; i < rep; i++ ) { + for ( ReadBackedPileup rbp : pileups ) + nFrags += 
FragmentUtils.create(rbp).getOverlappingPairs().size(); + } + } + + public static void main(String[] args) { + CaliperMain.main(FragmentUtilsBenchmark.class, args); + } +} diff --git a/public/java/test/org/broadinstitute/sting/utils/fragments/FragmentUtilsUnitTest.java b/public/java/test/org/broadinstitute/sting/utils/fragments/FragmentUtilsUnitTest.java new file mode 100644 index 000000000..cbe580809 --- /dev/null +++ b/public/java/test/org/broadinstitute/sting/utils/fragments/FragmentUtilsUnitTest.java @@ -0,0 +1,164 @@ +/* + * Copyright (c) 2011, The Broad Institute + * + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The above copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * OTHER DEALINGS IN THE SOFTWARE. 
+ */ + +package org.broadinstitute.sting.utils.fragments; + +import net.sf.samtools.SAMFileHeader; +import org.broadinstitute.sting.BaseTest; +import org.broadinstitute.sting.utils.pileup.PileupElement; +import org.broadinstitute.sting.utils.pileup.ReadBackedPileup; +import org.broadinstitute.sting.utils.pileup.ReadBackedPileupImpl; +import org.broadinstitute.sting.utils.sam.ArtificialSAMUtils; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; +import org.testng.Assert; +import org.testng.annotations.BeforeTest; +import org.testng.annotations.DataProvider; +import org.testng.annotations.Test; + +import java.util.*; + +/** + * Test routines for read-backed pileup. + */ +public class FragmentUtilsUnitTest extends BaseTest { + private static SAMFileHeader header; + + private class FragmentUtilsTest extends TestDataProvider { + List statesForPileup = new ArrayList(); + List statesForReads = new ArrayList(); + + private FragmentUtilsTest(String name, int readLen, int leftStart, int rightStart, + boolean leftIsFirst, boolean leftIsNegative) { + super(FragmentUtilsTest.class, String.format("%s-leftIsFirst:%b-leftIsNegative:%b", name, leftIsFirst, leftIsNegative)); + + List pair = ArtificialSAMUtils.createPair(header, "readpair", readLen, leftStart, rightStart, leftIsFirst, leftIsNegative); + GATKSAMRecord left = pair.get(0); + GATKSAMRecord right = pair.get(1); + + for ( int pos = leftStart; pos < rightStart + readLen; pos++) { + boolean posCoveredByLeft = pos >= left.getAlignmentStart() && pos <= left.getAlignmentEnd(); + boolean posCoveredByRight = pos >= right.getAlignmentStart() && pos <= right.getAlignmentEnd(); + + if ( posCoveredByLeft || posCoveredByRight ) { + List reads = new ArrayList(); + List offsets = new ArrayList(); + + if ( posCoveredByLeft ) { + reads.add(left); + offsets.add(pos - left.getAlignmentStart()); + } + + if ( posCoveredByRight ) { + reads.add(right); + offsets.add(pos - right.getAlignmentStart()); + } + + boolean shouldBeFragment = 
posCoveredByLeft && posCoveredByRight; + ReadBackedPileup pileup = new ReadBackedPileupImpl(null, reads, offsets); + TestState testState = new TestState(shouldBeFragment ? 0 : 1, shouldBeFragment ? 1 : 0, pileup, null); + statesForPileup.add(testState); + } + + TestState testState = left.getAlignmentEnd() >= right.getAlignmentStart() ? new TestState(0, 1, null, pair) : new TestState(2, 0, null, pair); + statesForReads.add(testState); + } + } + } + + private class TestState { + int expectedSingletons, expectedPairs; + ReadBackedPileup pileup; + List rawReads; + + private TestState(final int expectedSingletons, final int expectedPairs, final ReadBackedPileup pileup, final List rawReads) { + this.expectedSingletons = expectedSingletons; + this.expectedPairs = expectedPairs; + this.pileup = pileup; + this.rawReads = rawReads; + } + } + + @DataProvider(name = "fragmentUtilsTest") + public Object[][] createTests() { + for ( boolean leftIsFirst : Arrays.asList(true, false) ) { + for ( boolean leftIsNegative : Arrays.asList(true, false) ) { + // Overlapping pair + // ----> [first] + // <--- [second] + new FragmentUtilsTest("overlapping-pair", 10, 1, 5, leftIsFirst, leftIsNegative); + + // Non-overlapping pair + // ----> + // <---- + new FragmentUtilsTest("nonoverlapping-pair", 10, 1, 15, leftIsFirst, leftIsNegative); + } + } + + return FragmentUtilsTest.getTests(FragmentUtilsTest.class); + } + + @Test(enabled = true, dataProvider = "fragmentUtilsTest") + public void testAsPileup(FragmentUtilsTest test) { + for ( TestState testState : test.statesForPileup ) { + ReadBackedPileup rbp = testState.pileup; + FragmentCollection fp = FragmentUtils.create(rbp); + Assert.assertEquals(fp.getOverlappingPairs().size(), testState.expectedPairs); + Assert.assertEquals(fp.getSingletonReads().size(), testState.expectedSingletons); + } + } + + @Test(enabled = true, dataProvider = "fragmentUtilsTest") + public void testAsListOfReadsFromPileup(FragmentUtilsTest test) { + for ( TestState 
testState : test.statesForPileup ) { + FragmentCollection fp = FragmentUtils.create(testState.pileup.getReads()); + Assert.assertEquals(fp.getOverlappingPairs().size(), testState.expectedPairs); + Assert.assertEquals(fp.getSingletonReads().size(), testState.expectedSingletons); + } + } + + @Test(enabled = true, dataProvider = "fragmentUtilsTest") + public void testAsListOfReads(FragmentUtilsTest test) { + for ( TestState testState : test.statesForReads ) { + FragmentCollection fp = FragmentUtils.create(testState.rawReads); + Assert.assertEquals(fp.getOverlappingPairs().size(), testState.expectedPairs); + Assert.assertEquals(fp.getSingletonReads().size(), testState.expectedSingletons); + } + } + + @Test(enabled = true, expectedExceptions = IllegalArgumentException.class) + public void testOutOfOrder() { + final List pair = ArtificialSAMUtils.createPair(header, "readpair", 100, 1, 50, true, true); + final GATKSAMRecord left = pair.get(0); + final GATKSAMRecord right = pair.get(1); + final List reads = Arrays.asList(right, left); // OUT OF ORDER! 
+ final List offsets = Arrays.asList(0, 50); + final ReadBackedPileup pileup = new ReadBackedPileupImpl(null, reads, offsets); + FragmentUtils.create(pileup); // should throw exception + } + + @BeforeTest + public void setup() { + header = ArtificialSAMUtils.createArtificialSamHeader(1,1,1000); + } +} diff --git a/public/java/test/org/broadinstitute/sting/utils/genotype/vcf/VCFWriterUnitTest.java b/public/java/test/org/broadinstitute/sting/utils/genotype/vcf/VCFWriterUnitTest.java index e3a926fb9..35c6a4993 100644 --- a/public/java/test/org/broadinstitute/sting/utils/genotype/vcf/VCFWriterUnitTest.java +++ b/public/java/test/org/broadinstitute/sting/utils/genotype/vcf/VCFWriterUnitTest.java @@ -38,12 +38,13 @@ public class VCFWriterUnitTest extends BaseTest { private Set additionalColumns = new HashSet(); private File fakeVCFFile = new File("FAKEVCFFILEFORTESTING.vcf"); private GenomeLocParser genomeLocParser; + private IndexedFastaSequenceFile seq; @BeforeClass public void beforeTests() { File referenceFile = new File(hg18Reference); try { - IndexedFastaSequenceFile seq = new CachingIndexedFastaSequenceFile(referenceFile); + seq = new CachingIndexedFastaSequenceFile(referenceFile); genomeLocParser = new GenomeLocParser(seq); } catch(FileNotFoundException ex) { @@ -55,7 +56,7 @@ public class VCFWriterUnitTest extends BaseTest { @Test public void testBasicWriteAndRead() { VCFHeader header = createFakeHeader(metaData,additionalColumns); - VCFWriter writer = new StandardVCFWriter(fakeVCFFile); + VCFWriter writer = new StandardVCFWriter(fakeVCFFile, seq.getSequenceDictionary()); writer.writeHeader(header); writer.add(createVC(header)); writer.add(createVC(header)); @@ -104,7 +105,6 @@ public class VCFWriterUnitTest extends BaseTest { public static VCFHeader createFakeHeader(Set metaData, Set additionalColumns) { metaData.add(new VCFHeaderLine(VCFHeaderVersion.VCF4_0.getFormatString(), VCFHeaderVersion.VCF4_0.getVersionString())); metaData.add(new VCFHeaderLine("two", 
"2")); - additionalColumns.add("FORMAT"); additionalColumns.add("extra1"); additionalColumns.add("extra2"); return new VCFHeader(metaData, additionalColumns); @@ -158,6 +158,6 @@ public class VCFWriterUnitTest extends BaseTest { Assert.assertTrue(additionalColumns.contains(key)); index++; } - Assert.assertEquals(index+1, additionalColumns.size() /* for the header field we don't see */); + Assert.assertEquals(index, additionalColumns.size()); } } diff --git a/public/java/test/org/broadinstitute/sting/utils/interval/IntervalFileMergingIteratorUnitTest.java b/public/java/test/org/broadinstitute/sting/utils/interval/IntervalFileMergingIteratorUnitTest.java deleted file mode 100644 index 752695052..000000000 --- a/public/java/test/org/broadinstitute/sting/utils/interval/IntervalFileMergingIteratorUnitTest.java +++ /dev/null @@ -1,139 +0,0 @@ -/* - * Copyright (c) 2010 The Broad Institute - * - * Permission is hereby granted, free of charge, to any person - * obtaining a copy of this software and associated documentation - * files (the "Software"), to deal in the Software without - * restriction, including without limitation the rights to use, - * copy, modify, merge, publish, distribute, sublicense, and/or sell - * copies of the Software, and to permit persons to whom the - * Software is furnished to do so, subject to the following - * conditions: - * - * The above copyright notice and this permission notice shall be - * included in all copies or substantial portions of the Software. - * - * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, - * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES - * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND - * NONINFRINGEMENT. 
IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT - * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, - * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING - * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR - * OTHER DEALINGS IN THE SOFTWARE. - */ - -package org.broadinstitute.sting.utils.interval; - -import org.testng.Assert; -import org.broadinstitute.sting.utils.exceptions.ReviewedStingException; -import org.testng.annotations.BeforeClass; -import org.testng.annotations.Test; - -import org.broadinstitute.sting.BaseTest; -import org.broadinstitute.sting.utils.GenomeLocParser; -import org.broadinstitute.sting.utils.GenomeLoc; -import net.sf.picard.reference.ReferenceSequenceFileFactory; - -import java.io.File; -import java.util.Iterator; -import java.util.List; -import java.util.ArrayList; - -/** - * Created by IntelliJ IDEA. - * User: asivache - * Date: Jun 14, 2010 - * Time: 10:15:52 AM - * To change this template use File | Settings | File Templates. - */ -public class IntervalFileMergingIteratorUnitTest extends BaseTest { - - private static File refFile = new File(validationDataLocation + "Homo_sapiens_assembly17.fasta"); - private static String intervalFileNameGATK = validationDataLocation+"test.gatk.intervals"; - private static String intervalFileNameBED = validationDataLocation+"test.bed"; - private static List results1 = null; - private static List results2 = null; - - private GenomeLocParser genomeLocParser; - - @BeforeClass - public void init() { - genomeLocParser = new GenomeLocParser(ReferenceSequenceFileFactory.getReferenceSequenceFile(refFile)); - - results1 = new ArrayList(); - results2 = new ArrayList(); - - results1.add(genomeLocParser.createGenomeLoc("chr1",1554)); - results1.add(genomeLocParser.createGenomeLoc("chr1",2538,2568)); - results1.add(genomeLocParser.createGenomeLoc("chr1",18932,19000)); - results1.add(genomeLocParser.createGenomeLoc("chr1",19001,25000)); - 
results1.add(genomeLocParser.createGenomeLoc("chr5",7415,7600)); - - results2.add(genomeLocParser.createGenomeLoc("chr1",1554)); - results2.add(genomeLocParser.createGenomeLoc("chr1",2538,2568)); - results2.add(genomeLocParser.createGenomeLoc("chr1",18932,25000)); - results2.add(genomeLocParser.createGenomeLoc("chr5",7415,7600)); - - } - - @Test - public void testGATKIntervalFileIterator_Overlap() { - logger.warn("Executing testGATKIntervalFileIterator_Overlap"); - - Iterator it = new IntervalFileMergingIterator(genomeLocParser,new File(intervalFileNameGATK),IntervalMergingRule.OVERLAPPING_ONLY); - Iterator check_it = results1.iterator(); - while(it.hasNext()) { - GenomeLoc l = it.next(); - GenomeLoc l_expected = check_it.next(); - //System.out.println("int: "+l+" expected: "+l_expected) ; - Assert.assertEquals(l_expected, l, "Unexpected location returned by the iterator: "+l); - } - } - - @Test - public void testGATKIntervalFileIterator_OverlapWithException() { - logger.warn("Executing testGATKIntervalFileIterator_OverlapWithException"); - - Iterator it = new IntervalFileMergingIterator(genomeLocParser,new File(intervalFileNameGATK),IntervalMergingRule.OVERLAPPING_ONLY); - Iterator check_it = results1.iterator(); - try { - while(it.hasNext()) { - GenomeLoc l = it.next(); - GenomeLoc l_expected = check_it.next(); -// System.out.println("int: "+l+" expected: "+l_expected) ; - } - } catch ( ReviewedStingException e) { - Assert.assertEquals("Interval chr5:7414 in the interval file is out of order.", e.getMessage()); - } - } - - @Test - public void testGATKIntervalFileIterator_All() { - logger.warn("Executing testGATKIntervalFileIterator_All"); - - Iterator it = new IntervalFileMergingIterator(genomeLocParser,new File(intervalFileNameGATK),IntervalMergingRule.ALL); - Iterator check_it = results2.iterator(); - while(it.hasNext()) { - GenomeLoc l = it.next(); - GenomeLoc l_expected = check_it.next(); -// System.out.println("int: "+l+" expected: "+l_expected) ; - 
Assert.assertEquals(l_expected, l, "Unexpected location returned by the iterator: "+l); - } - } - - @Test - public void testBEDIntervalFileIterator_Overlap() { - logger.warn("Executing testBEDIntervalFileIterator_Overlap"); - - Iterator it = new IntervalFileMergingIterator(genomeLocParser,new File(intervalFileNameBED),IntervalMergingRule.OVERLAPPING_ONLY); - Iterator check_it = results1.iterator(); - while(it.hasNext()) { - GenomeLoc l = it.next(); - GenomeLoc l_expected = check_it.next(); -// System.out.println("int: "+l+" expected: "+l_expected) ; - Assert.assertEquals(l_expected, l, "Unexpected location returned by the iterator: "+l); - } - } - -} diff --git a/public/java/test/org/broadinstitute/sting/utils/interval/IntervalIntegrationTest.java b/public/java/test/org/broadinstitute/sting/utils/interval/IntervalIntegrationTest.java index 379d79c84..75bdc3142 100644 --- a/public/java/test/org/broadinstitute/sting/utils/interval/IntervalIntegrationTest.java +++ b/public/java/test/org/broadinstitute/sting/utils/interval/IntervalIntegrationTest.java @@ -48,19 +48,20 @@ public class IntervalIntegrationTest extends WalkerTest { executeTest("testAllIntervalsImplicit",spec); } - @Test(enabled = true) - public void testAllExplicitIntervalParsing() { - String md5 = "7821db9e14d4f8e07029ff1959cd5a99"; - WalkerTest.WalkerTestSpec spec = new WalkerTest.WalkerTestSpec( - "-T CountLoci" + - " -I " + validationDataLocation + "OV-0930.normal.chunk.bam" + - " -R " + hg18Reference + - " -L all" + - " -o %s", - 1, // just one output file - Arrays.asList(md5)); - executeTest("testAllIntervalsExplicit",spec); - } +// '-L all' is no longer supported +// @Test(enabled = true) +// public void testAllExplicitIntervalParsing() { +// String md5 = "7821db9e14d4f8e07029ff1959cd5a99"; +// WalkerTest.WalkerTestSpec spec = new WalkerTest.WalkerTestSpec( +// "-T CountLoci" + +// " -I " + validationDataLocation + "OV-0930.normal.chunk.bam" + +// " -R " + hg18Reference + +// " -L all" + +// " -o 
%s", +// 1, // just one output file +// Arrays.asList(md5)); +// executeTest("testAllIntervalsExplicit",spec); +// } @Test public void testUnmappedReadInclusion() { @@ -82,7 +83,7 @@ public class IntervalIntegrationTest extends WalkerTest { executeTest("testUnmappedReadInclusion",spec); } - @Test(enabled = true) + @Test(enabled = false) public void testUnmappedReadExclusion() { WalkerTest.WalkerTestSpec spec = new WalkerTest.WalkerTestSpec( "-T PrintReads" + @@ -102,5 +103,122 @@ public class IntervalIntegrationTest extends WalkerTest { executeTest("testUnmappedReadExclusion",spec); } + @Test(enabled = true) + public void testIntervalParsingFromFile() { + String md5 = "48a24b70a0b376535542b996af517398"; + WalkerTest.WalkerTestSpec spec = new WalkerTest.WalkerTestSpec( + "-T CountLoci" + + " -I " + validationDataLocation + "OV-0930.normal.chunk.bam" + + " -R " + hg18Reference + + " -o %s" + + " -L " + validationDataLocation + "intervalTest.1.vcf", + 1, // just one output file + Arrays.asList(md5)); + executeTest("testIntervalParsingFromFile", spec); + } + + @Test(enabled = true) + public void testIntervalMergingFromFiles() { + String md5 = "9ae0ea9e3c9c6e1b9b6252c8395efdc1"; + WalkerTest.WalkerTestSpec spec = new WalkerTest.WalkerTestSpec( + "-T CountLoci" + + " -I " + validationDataLocation + "OV-0930.normal.chunk.bam" + + " -R " + hg18Reference + + " -o %s" + + " -L " + validationDataLocation + "intervalTest.1.vcf" + + " -L " + validationDataLocation + "intervalTest.2.vcf", + 1, // just one output file + Arrays.asList(md5)); + executeTest("testIntervalMergingFromFiles", spec); + } + + @Test(enabled = true) + public void testIntervalExclusionsFromFiles() { + String md5 = "26ab0db90d72e28ad0ba1e22ee510510"; + WalkerTest.WalkerTestSpec spec = new WalkerTest.WalkerTestSpec( + "-T CountLoci" + + " -I " + validationDataLocation + "OV-0930.normal.chunk.bam" + + " -R " + hg18Reference + + " -o %s" + + " -L " + validationDataLocation + "intervalTest.1.vcf" + + " -XL " + 
validationDataLocation + "intervalTest.2.vcf", + 1, // just one output file + Arrays.asList(md5)); + executeTest("testIntervalExclusionsFromFiles", spec); + } + + @Test(enabled = true) + public void testMixedIntervalMerging() { + String md5 = "7c5aba41f53293b712fd86d08ed5b36e"; + WalkerTest.WalkerTestSpec spec = new WalkerTest.WalkerTestSpec( + "-T CountLoci" + + " -I " + validationDataLocation + "OV-0930.normal.chunk.bam" + + " -R " + hg18Reference + + " -o %s" + + " -L " + validationDataLocation + "intervalTest.1.vcf" + + " -L chr1:1677524-1677528", + 1, // just one output file + Arrays.asList(md5)); + executeTest("testMixedIntervalMerging", spec); + } + + @Test(enabled = true) + public void testComplexVCF() { + String md5 = "166d77ac1b46a1ec38aa35ab7e628ab5"; + WalkerTest.WalkerTestSpec spec = new WalkerTest.WalkerTestSpec( + "-T CountLoci" + + " -I " + validationDataLocation + "OV-0930.normal.chunk.bam" + + " -R " + hg18Reference + + " -o %s" + + " -L " + validationDataLocation + "intervalTest.3.vcf", + 1, // just one output file + Arrays.asList(md5)); + executeTest("testComplexVCF", spec); + } + + @Test(enabled = true) + public void testMergingWithComplexVCF() { + String md5 = "6d7fce9fee471194aa8b5b6e47267f03"; + WalkerTest.WalkerTestSpec spec = new WalkerTest.WalkerTestSpec( + "-T CountLoci" + + " -I " + validationDataLocation + "OV-0930.normal.chunk.bam" + + " -R " + hg18Reference + + " -o %s" + + " -L " + validationDataLocation + "intervalTest.1.vcf" + + " -XL " + validationDataLocation + "intervalTest.3.vcf", + 1, // just one output file + Arrays.asList(md5)); + executeTest("testMergingWithComplexVCF", spec); + } + + @Test(enabled = true) + public void testEmptyVCF() { + String md5 = ""; + WalkerTest.WalkerTestSpec spec = new WalkerTest.WalkerTestSpec( + "-T CountLoci" + + " -I " + validationDataLocation + "OV-0930.normal.chunk.bam" + + " -R " + hg18Reference + + " -o %s" + + " -L " + validationDataLocation + "intervalTest.empty.vcf", + 1, // just one 
output file + Arrays.asList(md5)); + executeTest("testEmptyVCFError", spec); + } + + @Test(enabled = true) + public void testIncludeExcludeIsTheSame() { + String md5 = ""; + WalkerTest.WalkerTestSpec spec = new WalkerTest.WalkerTestSpec( + "-T CountLoci" + + " -I " + validationDataLocation + "OV-0930.normal.chunk.bam" + + " -R " + hg18Reference + + " -o %s" + + " -L " + validationDataLocation + "intervalTest.1.vcf" + + " -XL " + validationDataLocation + "intervalTest.1.vcf", + 1, // just one output file + Arrays.asList(md5)); + executeTest("testIncludeExcludeIsTheSame", spec); + } + } diff --git a/public/java/test/org/broadinstitute/sting/utils/interval/IntervalUtilsUnitTest.java b/public/java/test/org/broadinstitute/sting/utils/interval/IntervalUtilsUnitTest.java index bb892eec8..9c3b905c2 100644 --- a/public/java/test/org/broadinstitute/sting/utils/interval/IntervalUtilsUnitTest.java +++ b/public/java/test/org/broadinstitute/sting/utils/interval/IntervalUtilsUnitTest.java @@ -1,6 +1,7 @@ package org.broadinstitute.sting.utils.interval; import net.sf.picard.reference.ReferenceSequenceFile; +import net.sf.picard.util.IntervalUtil; import net.sf.samtools.SAMFileHeader; import org.broadinstitute.sting.BaseTest; import org.broadinstitute.sting.gatk.datasources.reference.ReferenceDataSource; @@ -30,6 +31,20 @@ public class IntervalUtilsUnitTest extends BaseTest { private SAMFileHeader hg19Header; private GenomeLocParser hg19GenomeLocParser; private List hg19ReferenceLocs; + private List hg19exomeIntervals; + + private List getLocs(String... 
intervals) { + return getLocs(Arrays.asList(intervals)); + } + + private List getLocs(List intervals) { + if (intervals.size() == 0) + return hg18ReferenceLocs; + List locs = new ArrayList(); + for (String interval: intervals) + locs.add(hg18GenomeLocParser.parseGenomeLoc(interval)); + return locs; + } @BeforeClass public void init() { @@ -54,12 +69,198 @@ public class IntervalUtilsUnitTest extends BaseTest { ReferenceSequenceFile seq = new CachingIndexedFastaSequenceFile(hg19Ref); hg19GenomeLocParser = new GenomeLocParser(seq); hg19ReferenceLocs = Collections.unmodifiableList(GenomeLocSortedSet.createSetFromSequenceDictionary(referenceDataSource.getReference().getSequenceDictionary()).toList()) ; + + hg19exomeIntervals = Collections.unmodifiableList(IntervalUtils.parseIntervalArguments(hg19GenomeLocParser, Arrays.asList(hg19Intervals))); } catch(FileNotFoundException ex) { throw new UserException.CouldNotReadInputFile(hg19Ref,ex); } } + // ------------------------------------------------------------------------------------- + // + // tests to ensure the quality of the interval cuts of the interval cutting functions + // + // ------------------------------------------------------------------------------------- + + private class IntervalSlicingTest extends TestDataProvider { + public int parts; + public double maxAllowableVariance; + + private IntervalSlicingTest(final int parts, final double maxAllowableVariance) { + super(IntervalSlicingTest.class); + this.parts = parts; + this.maxAllowableVariance = maxAllowableVariance; + } + + public String toString() { + return String.format("IntervalSlicingTest parts=%d maxVar=%.2f", parts, maxAllowableVariance); + } + } + + @DataProvider(name = "intervalslicingdata") + public Object[][] createTrees() { + new IntervalSlicingTest(1, 0); + new IntervalSlicingTest(2, 1); + new IntervalSlicingTest(5, 1); + new IntervalSlicingTest(10, 1); + new IntervalSlicingTest(67, 1); + new IntervalSlicingTest(100, 1); + new 
IntervalSlicingTest(500, 1); + new IntervalSlicingTest(1000, 1); + return IntervalSlicingTest.getTests(IntervalSlicingTest.class); + } + + @Test(enabled = true, dataProvider = "intervalslicingdata") + public void testFixedScatterIntervalsAlgorithm(IntervalSlicingTest test) { + List> splits = IntervalUtils.splitFixedIntervals(hg19exomeIntervals, test.parts); + + long totalSize = IntervalUtils.intervalSize(hg19exomeIntervals); + long idealSplitSize = totalSize / test.parts; + + long sumOfSplitSizes = 0; + int counter = 0; + for ( final List split : splits ) { + long splitSize = IntervalUtils.intervalSize(split); + double sigma = (splitSize - idealSplitSize) / (1.0 * idealSplitSize); + //logger.warn(String.format("Split %d size %d ideal %d sigma %.2f", counter, splitSize, idealSplitSize, sigma)); + counter++; + sumOfSplitSizes += splitSize; + Assert.assertTrue(Math.abs(sigma) <= test.maxAllowableVariance, String.format("Interval %d (size %d ideal %d) has a variance %.2f outside of the tolerated range %.2f", counter, splitSize, idealSplitSize, sigma, test.maxAllowableVariance)); + } + + Assert.assertEquals(totalSize, sumOfSplitSizes, "Split intervals don't contain the exact number of bases in the origianl intervals"); + } + + // ------------------------------------------------------------------------------------- + // + // splitLocusIntervals tests + // + // ------------------------------------------------------------------------------------- + + /** large scale tests for many intervals */ + private class SplitLocusIntervalsTest extends TestDataProvider { + final List originalIntervals; + final public int parts; + + private SplitLocusIntervalsTest(final String name, List originalIntervals, final int parts) { + super(SplitLocusIntervalsTest.class, name); + this.parts = parts; + this.originalIntervals = originalIntervals; + } + + public String toString() { + return String.format("%s parts=%d", super.toString(), parts); + } + } + + @DataProvider(name = 
"IntervalRepartitionTest") + public Object[][] createIntervalRepartitionTest() { + for ( int parts : Arrays.asList(1, 2, 3, 10, 13, 100, 151, 1000, 10000) ) { + //for ( int parts : Arrays.asList(10) ) { + new SplitLocusIntervalsTest("hg19RefLocs", hg19ReferenceLocs, parts); + new SplitLocusIntervalsTest("hg19ExomeLocs", hg19exomeIntervals, parts); + } + + return SplitLocusIntervalsTest.getTests(SplitLocusIntervalsTest.class); + } + + @Test(enabled = true, dataProvider = "IntervalRepartitionTest") + public void testIntervalRepartition(SplitLocusIntervalsTest test) { + List> splitByLocus = IntervalUtils.splitLocusIntervals(test.originalIntervals, test.parts); + Assert.assertEquals(splitByLocus.size(), test.parts, "SplitLocusIntervals failed to generate correct number of intervals"); + List flat = IntervalUtils.flattenSplitIntervals(splitByLocus); + + // test overall size + final long originalSize = IntervalUtils.intervalSize(test.originalIntervals); + final long flatSize = IntervalUtils.intervalSize(flat); + Assert.assertEquals(flatSize, originalSize, "SplitLocusIntervals locs cover an incorrect number of bases"); + + // test size of each split + final long ideal = (long)Math.floor(originalSize / (1.0 * test.parts)); + final long maxSize = ideal + (originalSize % test.parts) * test.parts; // no more than N * rounding error in size + for ( final List split : splitByLocus ) { + final long splitSize = IntervalUtils.intervalSize(split); + Assert.assertTrue(splitSize >= ideal && splitSize <= maxSize, + String.format("SplitLocusIntervals interval (start=%s) has size %d outside of bounds ideal=%d, max=%d", + split.get(0), splitSize, ideal, maxSize)); + } + + // test that every base in original is covered once by a base in split by locus intervals + String diff = IntervalUtils.equateIntervals(test.originalIntervals, flat); + Assert.assertNull(diff, diff); + } + + /** small scale tests where the expected cuts are enumerated upfront for testing */ + private class 
SplitLocusIntervalsSmallTest extends TestDataProvider { + final List original; + final public int parts; + final public int expectedParts; + final List expected; + + private SplitLocusIntervalsSmallTest(final String name, List originalIntervals, final int parts, List expected) { + this(name, originalIntervals, parts, expected, parts); + } + + private SplitLocusIntervalsSmallTest(final String name, List originalIntervals, final int parts, List expected, int expectedParts) { + super(SplitLocusIntervalsSmallTest.class, name); + this.parts = parts; + this.expectedParts = expectedParts; + this.original = originalIntervals; + this.expected = expected; + } + + public String toString() { + return String.format("%s parts=%d", super.toString(), parts); + } + } + + @DataProvider(name = "SplitLocusIntervalsSmallTest") + public Object[][] createSplitLocusIntervalsSmallTest() { + GenomeLoc bp01_10 = hg19GenomeLocParser.createGenomeLoc("1", 1, 10); + + GenomeLoc bp1_5 = hg19GenomeLocParser.createGenomeLoc("1", 1, 5); + GenomeLoc bp6_10 = hg19GenomeLocParser.createGenomeLoc("1", 6, 10); + new SplitLocusIntervalsSmallTest("cut into two", Arrays.asList(bp01_10), 2, Arrays.asList(bp1_5, bp6_10)); + + GenomeLoc bp20_30 = hg19GenomeLocParser.createGenomeLoc("1", 20, 30); + new SplitLocusIntervalsSmallTest("two in two", Arrays.asList(bp01_10, bp20_30), 2, Arrays.asList(bp01_10, bp20_30)); + + GenomeLoc bp1_7 = hg19GenomeLocParser.createGenomeLoc("1", 1, 7); + GenomeLoc bp8_10 = hg19GenomeLocParser.createGenomeLoc("1", 8, 10); + GenomeLoc bp20_23 = hg19GenomeLocParser.createGenomeLoc("1", 20, 23); + GenomeLoc bp24_30 = hg19GenomeLocParser.createGenomeLoc("1", 24, 30); + new SplitLocusIntervalsSmallTest("two in three", Arrays.asList(bp01_10, bp20_30), 3, + Arrays.asList(bp1_7, bp8_10, bp20_23, bp24_30)); + + GenomeLoc bp1_2 = hg19GenomeLocParser.createGenomeLoc("1", 1, 2); + GenomeLoc bp1_1 = hg19GenomeLocParser.createGenomeLoc("1", 1, 1); + GenomeLoc bp2_2 = 
hg19GenomeLocParser.createGenomeLoc("1", 2, 2); + new SplitLocusIntervalsSmallTest("too many pieces", Arrays.asList(bp1_2), 5, Arrays.asList(bp1_1, bp2_2), 2); + + new SplitLocusIntervalsSmallTest("emptyList", Collections.emptyList(), 5, Collections.emptyList(), 0); + + return SplitLocusIntervalsSmallTest.getTests(SplitLocusIntervalsSmallTest.class); + } + + @Test(enabled = true, dataProvider = "SplitLocusIntervalsSmallTest") + public void splitLocusIntervalsSmallTest(SplitLocusIntervalsSmallTest test) { + List> splitByLocus = IntervalUtils.splitLocusIntervals(test.original, test.parts); + Assert.assertEquals(splitByLocus.size(), test.expectedParts, "SplitLocusIntervals failed to generate correct number of intervals"); + List flat = IntervalUtils.flattenSplitIntervals(splitByLocus); + + // test sizes + final long originalSize = IntervalUtils.intervalSize(test.original); + final long splitSize = IntervalUtils.intervalSize(flat); + Assert.assertEquals(splitSize, originalSize, "SplitLocusIntervals locs cover an incorrect number of bases"); + + Assert.assertEquals(flat, test.expected, "SplitLocusIntervals locs not expected intervals"); + } + + // + // Misc. 
tests + // + @Test(expectedExceptions=UserException.class) public void testMergeListsBySetOperatorNoOverlap() { // a couple of lists we'll use for the testing @@ -119,6 +320,22 @@ public class IntervalUtilsUnitTest extends BaseTest { Assert.assertEquals(ret.size(), 20); } + @Test + public void testOverlappingIntervalsFromSameSourceWithIntersection() { + // a couple of lists we'll use for the testing + List source1 = new ArrayList(); + List source2 = new ArrayList(); + + source1.add(hg18GenomeLocParser.createGenomeLoc("chr1", 10, 20)); + source1.add(hg18GenomeLocParser.createGenomeLoc("chr1", 15, 25)); + + source2.add(hg18GenomeLocParser.createGenomeLoc("chr1", 16, 18)); + source2.add(hg18GenomeLocParser.createGenomeLoc("chr1", 22, 24)); + + List ret = IntervalUtils.mergeListsBySetOperator(source1, source2, IntervalSetRule.INTERSECTION); + Assert.assertEquals(ret.size(), 2); + } + @Test public void testGetContigLengths() { Map lengths = IntervalUtils.getContigSizes(new File(BaseTest.hg18Reference)); @@ -129,19 +346,6 @@ public class IntervalUtilsUnitTest extends BaseTest { Assert.assertEquals((long)lengths.get("chrX"), 154913754); } - private List getLocs(String... 
intervals) { - return getLocs(Arrays.asList(intervals)); - } - - private List getLocs(List intervals) { - if (intervals.size() == 0) - return hg18ReferenceLocs; - List locs = new ArrayList(); - for (String interval: intervals) - locs.add(hg18GenomeLocParser.parseGenomeLoc(interval)); - return locs; - } - @Test public void testParseIntervalArguments() { Assert.assertEquals(getLocs().size(), 45); @@ -174,12 +378,12 @@ public class IntervalUtilsUnitTest extends BaseTest { List files = testFiles("basic.", 3, ".intervals"); List locs = getLocs("chr1", "chr2", "chr3"); - List splits = IntervalUtils.splitFixedIntervals(locs, files.size()); - IntervalUtils.scatterFixedIntervals(hg18Header, locs, splits, files); + List> splits = IntervalUtils.splitFixedIntervals(locs, files.size()); + IntervalUtils.scatterFixedIntervals(hg18Header, splits, files); - List locs1 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(0).toString()), false); - List locs2 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(1).toString()), false); - List locs3 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(2).toString()), false); + List locs1 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(0).toString())); + List locs2 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(1).toString())); + List locs3 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(2).toString())); Assert.assertEquals(locs1.size(), 1); Assert.assertEquals(locs2.size(), 1); @@ -200,12 +404,12 @@ public class IntervalUtilsUnitTest extends BaseTest { List files = testFiles("less.", 3, ".intervals"); List locs = getLocs("chr1", "chr2", "chr3", "chr4"); - List splits = IntervalUtils.splitFixedIntervals(locs, files.size()); - IntervalUtils.scatterFixedIntervals(hg18Header, locs, splits, files); + List> splits = 
IntervalUtils.splitFixedIntervals(locs, files.size()); + IntervalUtils.scatterFixedIntervals(hg18Header, splits, files); - List locs1 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(0).toString()), false); - List locs2 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(1).toString()), false); - List locs3 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(2).toString()), false); + List locs1 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(0).toString())); + List locs2 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(1).toString())); + List locs3 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(2).toString())); Assert.assertEquals(locs1.size(), 1); Assert.assertEquals(locs2.size(), 1); @@ -228,8 +432,8 @@ public class IntervalUtilsUnitTest extends BaseTest { public void testScatterFixedIntervalsMoreFiles() { List files = testFiles("more.", 3, ".intervals"); List locs = getLocs("chr1", "chr2"); - List splits = IntervalUtils.splitFixedIntervals(locs, locs.size()); // locs.size() instead of files.size() - IntervalUtils.scatterFixedIntervals(hg18Header, locs, splits, files); + List> splits = IntervalUtils.splitFixedIntervals(locs, locs.size()); // locs.size() instead of files.size() + IntervalUtils.scatterFixedIntervals(hg18Header, splits, files); } @Test public void testScatterFixedIntervalsStart() { @@ -242,12 +446,12 @@ public class IntervalUtilsUnitTest extends BaseTest { List files = testFiles("split.", 3, ".intervals"); List locs = getLocs(intervals); - List splits = IntervalUtils.splitFixedIntervals(locs, files.size()); - IntervalUtils.scatterFixedIntervals(hg18Header, locs, splits, files); + List> splits = IntervalUtils.splitFixedIntervals(locs, files.size()); + IntervalUtils.scatterFixedIntervals(hg18Header, splits, files); - List locs1 = 
IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(0).toString()), false); - List locs2 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(1).toString()), false); - List locs3 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(2).toString()), false); + List locs1 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(0).toString())); + List locs2 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(1).toString())); + List locs3 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(2).toString())); Assert.assertEquals(locs1.size(), 1); Assert.assertEquals(locs2.size(), 1); @@ -270,12 +474,12 @@ public class IntervalUtilsUnitTest extends BaseTest { List files = testFiles("split.", 3, ".intervals"); List locs = getLocs(intervals); - List splits = IntervalUtils.splitFixedIntervals(locs, files.size()); - IntervalUtils.scatterFixedIntervals(hg18Header, locs, splits, files); + List> splits = IntervalUtils.splitFixedIntervals(locs, files.size()); + IntervalUtils.scatterFixedIntervals(hg18Header, splits, files); - List locs1 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(0).toString()), false); - List locs2 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(1).toString()), false); - List locs3 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(2).toString()), false); + List locs1 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(0).toString())); + List locs2 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(1).toString())); + List locs3 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(2).toString())); Assert.assertEquals(locs1.size(), 1); Assert.assertEquals(locs2.size(), 1); @@ -298,12 
+502,12 @@ public class IntervalUtilsUnitTest extends BaseTest { List files = testFiles("split.", 3, ".intervals"); List locs = getLocs(intervals); - List splits = IntervalUtils.splitFixedIntervals(locs, files.size()); - IntervalUtils.scatterFixedIntervals(hg18Header, locs, splits, files); + List> splits = IntervalUtils.splitFixedIntervals(locs, files.size()); + IntervalUtils.scatterFixedIntervals(hg18Header, splits, files); - List locs1 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(0).toString()), false); - List locs2 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(1).toString()), false); - List locs3 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(2).toString()), false); + List locs1 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(0).toString())); + List locs2 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(1).toString())); + List locs3 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(2).toString())); Assert.assertEquals(locs1.size(), 2); Assert.assertEquals(locs2.size(), 1); @@ -318,8 +522,8 @@ public class IntervalUtilsUnitTest extends BaseTest { @Test public void testScatterFixedIntervalsFile() { List files = testFiles("sg.", 20, ".intervals"); - List locs = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(BaseTest.GATKDataLocation + "whole_exome_agilent_designed_120.targets.hg18.chr20.interval_list"), false); - List splits = IntervalUtils.splitFixedIntervals(locs, files.size()); + List locs = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(BaseTest.GATKDataLocation + "whole_exome_agilent_designed_120.targets.hg18.chr20.interval_list")); + List> splits = IntervalUtils.splitFixedIntervals(locs, files.size()); int[] counts = { 125, 138, 287, 291, 312, 105, 155, 324, @@ -332,21 +536,18 @@ public class 
IntervalUtilsUnitTest extends BaseTest { }; //String splitCounts = ""; - for (int lastIndex = 0, i = 0; i < splits.size(); i++) { - int splitIndex = splits.get(i); - int splitCount = (splitIndex - lastIndex); - //splitCounts += ", " + splitCount; - lastIndex = splitIndex; + for (int i = 0; i < splits.size(); i++) { + int splitCount = splits.get(i).size(); Assert.assertEquals(splitCount, counts[i], "Num intervals in split " + i); } //System.out.println(splitCounts.substring(2)); - IntervalUtils.scatterFixedIntervals(hg18Header, locs, splits, files); + IntervalUtils.scatterFixedIntervals(hg18Header, splits, files); int locIndex = 0; for (int i = 0; i < files.size(); i++) { String file = files.get(i).toString(); - List parsedLocs = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(file), false); + List parsedLocs = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(file)); Assert.assertEquals(parsedLocs.size(), counts[i], "Intervals in " + file); for (GenomeLoc parsedLoc: parsedLocs) Assert.assertEquals(parsedLoc, locs.get(locIndex), String.format("Genome loc %d from file %d", locIndex++, i)); @@ -357,12 +558,12 @@ public class IntervalUtilsUnitTest extends BaseTest { @Test public void testScatterFixedIntervalsMax() { List files = testFiles("sg.", 85, ".intervals"); - List splits = IntervalUtils.splitFixedIntervals(hg19ReferenceLocs, files.size()); - IntervalUtils.scatterFixedIntervals(hg19Header, hg19ReferenceLocs, splits, files); + List> splits = IntervalUtils.splitFixedIntervals(hg19ReferenceLocs, files.size()); + IntervalUtils.scatterFixedIntervals(hg19Header, splits, files); for (int i = 0; i < files.size(); i++) { String file = files.get(i).toString(); - List parsedLocs = IntervalUtils.parseIntervalArguments(hg19GenomeLocParser, Arrays.asList(file), false); + List parsedLocs = IntervalUtils.parseIntervalArguments(hg19GenomeLocParser, Arrays.asList(file)); Assert.assertEquals(parsedLocs.size(), 1, "parsedLocs[" + i + 
"].size()"); Assert.assertEquals(parsedLocs.get(0), hg19ReferenceLocs.get(i), "parsedLocs[" + i + "].get()"); } @@ -379,9 +580,9 @@ public class IntervalUtilsUnitTest extends BaseTest { IntervalUtils.scatterContigIntervals(hg18Header, getLocs(intervals), files); - List locs1 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(0).toString()), false); - List locs2 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(1).toString()), false); - List locs3 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(2).toString()), false); + List locs1 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(0).toString())); + List locs2 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(1).toString())); + List locs3 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(2).toString())); Assert.assertEquals(locs1.size(), 1); Assert.assertEquals(locs2.size(), 1); @@ -402,9 +603,9 @@ public class IntervalUtilsUnitTest extends BaseTest { IntervalUtils.scatterContigIntervals(hg18Header, getLocs("chr1", "chr2", "chr3"), files); - List locs1 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(0).toString()), false); - List locs2 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(1).toString()), false); - List locs3 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(2).toString()), false); + List locs1 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(0).toString())); + List locs2 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(1).toString())); + List locs3 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(2).toString())); Assert.assertEquals(locs1.size(), 1); Assert.assertEquals(locs2.size(), 1); @@ -426,9 
+627,9 @@ public class IntervalUtilsUnitTest extends BaseTest { IntervalUtils.scatterContigIntervals(hg18Header, getLocs("chr1", "chr2", "chr3", "chr4"), files); - List locs1 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(0).toString()), false); - List locs2 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(1).toString()), false); - List locs3 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(2).toString()), false); + List locs1 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(0).toString())); + List locs2 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(1).toString())); + List locs3 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(2).toString())); Assert.assertEquals(locs1.size(), 1); Assert.assertEquals(locs2.size(), 1); @@ -458,9 +659,9 @@ public class IntervalUtilsUnitTest extends BaseTest { IntervalUtils.scatterContigIntervals(hg18Header, getLocs(intervals), files); - List locs1 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(0).toString()), false); - List locs2 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(1).toString()), false); - List locs3 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(2).toString()), false); + List locs1 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(0).toString())); + List locs2 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(1).toString())); + List locs3 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(2).toString())); Assert.assertEquals(locs1.size(), 2); Assert.assertEquals(locs2.size(), 1); @@ -484,9 +685,9 @@ public class IntervalUtilsUnitTest extends BaseTest { IntervalUtils.scatterContigIntervals(hg18Header, 
getLocs(intervals), files); - List locs1 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(0).toString()), false); - List locs2 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(1).toString()), false); - List locs3 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(2).toString()), false); + List locs1 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(0).toString())); + List locs2 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(1).toString())); + List locs3 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(2).toString())); Assert.assertEquals(locs1.size(), 1); Assert.assertEquals(locs2.size(), 2); @@ -510,9 +711,9 @@ public class IntervalUtilsUnitTest extends BaseTest { IntervalUtils.scatterContigIntervals(hg18Header, getLocs(intervals), files); - List locs1 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(0).toString()), false); - List locs2 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(1).toString()), false); - List locs3 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(2).toString()), false); + List locs1 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(0).toString())); + List locs2 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(1).toString())); + List locs3 = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Arrays.asList(files.get(2).toString())); Assert.assertEquals(locs1.size(), 1); Assert.assertEquals(locs2.size(), 1); @@ -531,7 +732,7 @@ public class IntervalUtilsUnitTest extends BaseTest { for (int i = 0; i < files.size(); i++) { String file = files.get(i).toString(); - List parsedLocs = IntervalUtils.parseIntervalArguments(hg19GenomeLocParser, Arrays.asList(file), 
false); + List parsedLocs = IntervalUtils.parseIntervalArguments(hg19GenomeLocParser, Arrays.asList(file)); Assert.assertEquals(parsedLocs.size(), 1, "parsedLocs[" + i + "].size()"); Assert.assertEquals(parsedLocs.get(0), hg19ReferenceLocs.get(i), "parsedLocs[" + i + "].get()"); } @@ -555,7 +756,7 @@ public class IntervalUtilsUnitTest extends BaseTest { @Test(dataProvider="unmergedIntervals") public void testUnmergedIntervals(String unmergedIntervals) { - List locs = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Collections.singletonList(validationDataLocation + unmergedIntervals), false); + List locs = IntervalUtils.parseIntervalArguments(hg18GenomeLocParser, Collections.singletonList(validationDataLocation + unmergedIntervals)); Assert.assertEquals(locs.size(), 2); List merged = IntervalUtils.mergeIntervalLocations(locs, IntervalMergingRule.ALL); diff --git a/public/java/test/org/broadinstitute/sting/utils/interval/NwayIntervalMergingIteratorUnitTest.java b/public/java/test/org/broadinstitute/sting/utils/interval/NwayIntervalMergingIteratorUnitTest.java deleted file mode 100644 index 0b4e52a3d..000000000 --- a/public/java/test/org/broadinstitute/sting/utils/interval/NwayIntervalMergingIteratorUnitTest.java +++ /dev/null @@ -1,112 +0,0 @@ -/* - * Copyright (c) 2010, The Broad Institute - * - * Permission is hereby granted, free of charge, to any person - * obtaining a copy of this software and associated documentation - * files (the "Software"), to deal in the Software without - * restriction, including without limitation the rights to use, - * copy, modify, merge, publish, distribute, sublicense, and/or sell - * copies of the Software, and to permit persons to whom the - * Software is furnished to do so, subject to the following - * conditions: - * - * The above copyright notice and this permission notice shall be - * included in all copies or substantial portions of the Software. 
- * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, - * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES - * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND - * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT - * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, - * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING - * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR - * OTHER DEALINGS IN THE SOFTWARE. - */ - -package org.broadinstitute.sting.utils.interval; - -import org.broadinstitute.sting.BaseTest; -import org.broadinstitute.sting.utils.GenomeLocParser; -import org.broadinstitute.sting.utils.GenomeLoc; -import net.sf.picard.reference.ReferenceSequenceFileFactory; -import org.testng.Assert; -import org.testng.annotations.BeforeClass; -import org.testng.annotations.Test; - -import java.util.ArrayList; -import java.util.List; -import java.util.Iterator; -import java.io.File; - -/** - * Created by IntelliJ IDEA. - * User: asivache - * Date: Oct 28, 2010 - * Time: 2:46:03 PM - * To change this template use File | Settings | File Templates. 
- */ -public class NwayIntervalMergingIteratorUnitTest extends BaseTest { - - private static File refFile = new File(validationDataLocation + "Homo_sapiens_assembly17.fasta"); - private GenomeLocParser genomeLocParser; - - private static List stream1 = null; - private static List stream2 = null; - private static List expected = null; - - @BeforeClass - public static void init() { - GenomeLocParser genomeLocParser = new GenomeLocParser(ReferenceSequenceFileFactory.getReferenceSequenceFile(refFile)); - - stream1 = new ArrayList(); - stream2 = new ArrayList(); - expected = new ArrayList(); - - stream1.add(genomeLocParser.createGenomeLoc("chr1",1554,1560)); // 1 - stream1.add(genomeLocParser.createGenomeLoc("chr1",2538,2568)); // 3 - stream1.add(genomeLocParser.createGenomeLoc("chr1",2600,2610)); // 4 - stream1.add(genomeLocParser.createGenomeLoc("chr1",2609,2625)); // 4 - stream1.add(genomeLocParser.createGenomeLoc("chr1",18932,19000)); // 6 - stream1.add(genomeLocParser.createGenomeLoc("chr1",19001,25000)); //6 - - stream2.add(genomeLocParser.createGenomeLoc("chr1",1565,1570)); //2 - stream2.add(genomeLocParser.createGenomeLoc("chr1",2598,2604)); // 4 - stream2.add(genomeLocParser.createGenomeLoc("chr1",7415,7600)); // 5 - stream2.add(genomeLocParser.createGenomeLoc("chr1",18932,25000)); // 6 - stream2.add(genomeLocParser.createGenomeLoc("chr1",30000,35000)); // 7 - - expected.add(genomeLocParser.createGenomeLoc("chr1",1554,1560)); // 1 - expected.add(genomeLocParser.createGenomeLoc("chr1",1565,1570)); //2 - expected.add(genomeLocParser.createGenomeLoc("chr1",2538,2568)); // 3 - expected.add(genomeLocParser.createGenomeLoc("chr1",2598,2625)); // 4 - expected.add(genomeLocParser.createGenomeLoc("chr1",7415,7600)); // 5 - expected.add(genomeLocParser.createGenomeLoc("chr1",18932,25000)); // 6 - expected.add(genomeLocParser.createGenomeLoc("chr1",30000,35000)); // 7 - - - } - - @Test - public void testNwayIntervalMergingIterator() { - 
logger.warn("testNwayIntervalMergingIterator"); - - Iterator it1 = stream1.iterator(); - Iterator it2 = stream2.iterator(); - - Iterator e_it = expected.iterator(); - - - - NwayIntervalMergingIterator it = new NwayIntervalMergingIterator(IntervalMergingRule.OVERLAPPING_ONLY); - it.add(it1); - it.add(it2); - - while(it.hasNext()) { - GenomeLoc l = it.next(); - GenomeLoc l_expected = e_it.next(); - //System.out.println("int: "+l+" expected: "+l_expected) ; - Assert.assertEquals(l,l_expected,"Unexpected location returned by the iterator: "+l); - } - } - - -} diff --git a/public/java/test/org/broadinstitute/sting/utils/io/IOUtilsUnitTest.java b/public/java/test/org/broadinstitute/sting/utils/io/IOUtilsUnitTest.java new file mode 100644 index 000000000..4caf7f485 --- /dev/null +++ b/public/java/test/org/broadinstitute/sting/utils/io/IOUtilsUnitTest.java @@ -0,0 +1,197 @@ +package org.broadinstitute.sting.utils.io; + +import org.apache.commons.io.FileUtils; +import org.broadinstitute.sting.BaseTest; +import java.io.File; +import java.io.IOException; +import java.util.Arrays; +import java.util.List; + +import org.broadinstitute.sting.utils.exceptions.UserException; +import org.testng.Assert; +import org.testng.annotations.Test; + +public class IOUtilsUnitTest extends BaseTest { + @Test + public void testGoodTempDir() { + IOUtils.checkTempDir(new File("/tmp/queue")); + } + + @Test(expectedExceptions=UserException.BadTmpDir.class) + public void testBadTempDir() { + IOUtils.checkTempDir(new File("/tmp")); + } + + @Test + public void testAbsoluteSubDir() { + File subDir = IOUtils.absolute(new File("."), new File("/path/to/file")); + Assert.assertEquals(subDir, new File("/path/to/file")); + + subDir = IOUtils.absolute(new File("/different/path"), new File("/path/to/file")); + Assert.assertEquals(subDir, new File("/path/to/file")); + + subDir = IOUtils.absolute(new File("/different/path"), new File(".")); + Assert.assertEquals(subDir, new File("/different/path")); + } + + @Test 
+ public void testRelativeSubDir() throws IOException { + File subDir = IOUtils.absolute(new File("."), new File("path/to/file")); + Assert.assertEquals(subDir.getCanonicalFile(), new File("path/to/file").getCanonicalFile()); + + subDir = IOUtils.absolute(new File("/different/path"), new File("path/to/file")); + Assert.assertEquals(subDir, new File("/different/path/path/to/file")); + } + + @Test + public void testDottedSubDir() throws IOException { + File subDir = IOUtils.absolute(new File("."), new File("path/../to/file")); + Assert.assertEquals(subDir.getCanonicalFile(), new File("path/../to/./file").getCanonicalFile()); + + subDir = IOUtils.absolute(new File("."), new File("/path/../to/file")); + Assert.assertEquals(subDir, new File("/path/../to/file")); + + subDir = IOUtils.absolute(new File("/different/../path"), new File("path/to/file")); + Assert.assertEquals(subDir, new File("/different/../path/path/to/file")); + + subDir = IOUtils.absolute(new File("/different/./path"), new File("/path/../to/file")); + Assert.assertEquals(subDir, new File("/path/../to/file")); + } + + @Test + public void testTempDir() { + File tempDir = IOUtils.tempDir("Q-Unit-Test", "", new File("queueTempDirToDelete")); + Assert.assertTrue(tempDir.exists()); + Assert.assertFalse(tempDir.isFile()); + Assert.assertTrue(tempDir.isDirectory()); + boolean deleted = IOUtils.tryDelete(tempDir); + Assert.assertTrue(deleted); + Assert.assertFalse(tempDir.exists()); + } + + @Test + public void testDirLevel() { + File dir = IOUtils.dirLevel(new File("/path/to/directory"), 1); + Assert.assertEquals(dir, new File("/path")); + + dir = IOUtils.dirLevel(new File("/path/to/directory"), 2); + Assert.assertEquals(dir, new File("/path/to")); + + dir = IOUtils.dirLevel(new File("/path/to/directory"), 3); + Assert.assertEquals(dir, new File("/path/to/directory")); + + dir = IOUtils.dirLevel(new File("/path/to/directory"), 4); + Assert.assertEquals(dir, new File("/path/to/directory")); + } + + @Test + public 
void testAbsolute() { + File dir = IOUtils.absolute(new File("/path/./to/./directory/.")); + Assert.assertEquals(dir, new File("/path/to/directory")); + + dir = IOUtils.absolute(new File("/")); + Assert.assertEquals(dir, new File("/")); + + dir = IOUtils.absolute(new File("/.")); + Assert.assertEquals(dir, new File("/")); + + dir = IOUtils.absolute(new File("/././.")); + Assert.assertEquals(dir, new File("/")); + + dir = IOUtils.absolute(new File("/./directory/.")); + Assert.assertEquals(dir, new File("/directory")); + + dir = IOUtils.absolute(new File("/./directory/./")); + Assert.assertEquals(dir, new File("/directory")); + + dir = IOUtils.absolute(new File("/./directory./")); + Assert.assertEquals(dir, new File("/directory.")); + + dir = IOUtils.absolute(new File("/./.directory/")); + Assert.assertEquals(dir, new File("/.directory")); + } + + @Test + public void testTail() throws IOException { + List lines = Arrays.asList( + "chr18_random 4262 3154410390 50 51", + "chr19_random 301858 3154414752 50 51", + "chr21_random 1679693 3154722662 50 51", + "chr22_random 257318 3156435963 50 51", + "chrX_random 1719168 3156698441 50 51"); + List tail = IOUtils.tail(new File(BaseTest.hg18Reference + ".fai"), 5); + Assert.assertEquals(tail.size(), 5); + for (int i = 0; i < 5; i++) + Assert.assertEquals(tail.get(i), lines.get(i)); + } + + @Test + public void testWriteSystemFile() throws IOException { + File temp = createTempFile("temp.", ".properties"); + try { + IOUtils.writeResource(new Resource("StingText.properties", null), temp); + } finally { + FileUtils.deleteQuietly(temp); + } + } + + @Test + public void testWriteSystemTempFile() throws IOException { + File temp = IOUtils.writeTempResource(new Resource("StingText.properties", null)); + try { + Assert.assertTrue(temp.getName().startsWith("StingText"), "File does not start with 'StingText.': " + temp); + Assert.assertTrue(temp.getName().endsWith(".properties"), "File does not end with '.properties': " + temp); + } 
finally { + FileUtils.deleteQuietly(temp); + } + } + + @Test(expectedExceptions = IllegalArgumentException.class) + public void testMissingSystemFile() throws IOException { + File temp = createTempFile("temp.", ".properties"); + try { + IOUtils.writeResource(new Resource("MissingStingText.properties", null), temp); + } finally { + FileUtils.deleteQuietly(temp); + } + } + + @Test + public void testWriteRelativeFile() throws IOException { + File temp = createTempFile("temp.", ".properties"); + try { + IOUtils.writeResource(new Resource("/StingText.properties", IOUtils.class), temp); + } finally { + FileUtils.deleteQuietly(temp); + } + } + + @Test + public void testWriteRelativeTempFile() throws IOException { + File temp = IOUtils.writeTempResource(new Resource("/StingText.properties", IOUtils.class)); + try { + Assert.assertTrue(temp.getName().startsWith("StingText"), "File does not start with 'StingText.': " + temp); + Assert.assertTrue(temp.getName().endsWith(".properties"), "File does not end with '.properties': " + temp); + } finally { + FileUtils.deleteQuietly(temp); + } + } + + @Test(expectedExceptions = IllegalArgumentException.class) + public void testMissingRelativeFile() throws IOException { + File temp = createTempFile("temp.", ".properties"); + try { + // Looking for /org/broadinstitute/sting/utils/file/StingText.properties + IOUtils.writeResource(new Resource("StingText.properties", IOUtils.class), temp); + } finally { + FileUtils.deleteQuietly(temp); + } + } + + @Test + public void testResourceProperties() { + Resource resource = new Resource("foo", Resource.class); + Assert.assertEquals(resource.getPath(), "foo"); + Assert.assertEquals(resource.getRelativeClass(), Resource.class); + } +} diff --git a/public/java/test/org/broadinstitute/sting/utils/pileup/ReadBackedPileupUnitTest.java b/public/java/test/org/broadinstitute/sting/utils/pileup/ReadBackedPileupUnitTest.java index fb479ab47..6e955289c 100644 --- 
a/public/java/test/org/broadinstitute/sting/utils/pileup/ReadBackedPileupUnitTest.java +++ b/public/java/test/org/broadinstitute/sting/utils/pileup/ReadBackedPileupUnitTest.java @@ -26,9 +26,8 @@ package org.broadinstitute.sting.utils.pileup; import net.sf.samtools.SAMFileHeader; import net.sf.samtools.SAMReadGroupRecord; -import net.sf.samtools.SAMRecord; +import org.broadinstitute.sting.utils.sam.GATKSAMRecord; import org.testng.Assert; -import org.broadinstitute.sting.gatk.datasources.sample.Sample; import org.broadinstitute.sting.utils.sam.ArtificialSAMUtils; import org.testng.annotations.Test; @@ -51,27 +50,25 @@ public class ReadBackedPileupUnitTest { header.addReadGroup(readGroupOne); header.addReadGroup(readGroupTwo); - SAMRecord read1 = ArtificialSAMUtils.createArtificialRead(header,"read1",0,1,10); + GATKSAMRecord read1 = ArtificialSAMUtils.createArtificialRead(header,"read1",0,1,10); read1.setAttribute("RG",readGroupOne.getId()); - SAMRecord read2 = ArtificialSAMUtils.createArtificialRead(header,"read2",0,1,10); + GATKSAMRecord read2 = ArtificialSAMUtils.createArtificialRead(header,"read2",0,1,10); read2.setAttribute("RG",readGroupTwo.getId()); - SAMRecord read3 = ArtificialSAMUtils.createArtificialRead(header,"read3",0,1,10); + GATKSAMRecord read3 = ArtificialSAMUtils.createArtificialRead(header,"read3",0,1,10); read3.setAttribute("RG",readGroupOne.getId()); - SAMRecord read4 = ArtificialSAMUtils.createArtificialRead(header,"read4",0,1,10); + GATKSAMRecord read4 = ArtificialSAMUtils.createArtificialRead(header,"read4",0,1,10); read4.setAttribute("RG",readGroupTwo.getId()); - SAMRecord read5 = ArtificialSAMUtils.createArtificialRead(header,"read5",0,1,10); + GATKSAMRecord read5 = ArtificialSAMUtils.createArtificialRead(header,"read5",0,1,10); read5.setAttribute("RG",readGroupTwo.getId()); - SAMRecord read6 = ArtificialSAMUtils.createArtificialRead(header,"read6",0,1,10); + GATKSAMRecord read6 = 
ArtificialSAMUtils.createArtificialRead(header,"read6",0,1,10); read6.setAttribute("RG",readGroupOne.getId()); - SAMRecord read7 = ArtificialSAMUtils.createArtificialRead(header,"read7",0,1,10); + GATKSAMRecord read7 = ArtificialSAMUtils.createArtificialRead(header,"read7",0,1,10); read7.setAttribute("RG",readGroupOne.getId()); - ReadBackedPileup pileup = new ReadBackedPileupImpl(null, - Arrays.asList(read1,read2,read3,read4,read5,read6,read7), - Arrays.asList(1,1,1,1,1,1,1)); + ReadBackedPileup pileup = new ReadBackedPileupImpl(null, Arrays.asList(read1,read2,read3,read4,read5,read6,read7), Arrays.asList(1,1,1,1,1,1,1)); ReadBackedPileup rg1Pileup = pileup.getPileupForReadGroup("rg1"); - List rg1Reads = rg1Pileup.getReads(); + List rg1Reads = rg1Pileup.getReads(); Assert.assertEquals(rg1Reads.size(), 4, "Wrong number of reads in read group rg1"); Assert.assertEquals(rg1Reads.get(0), read1, "Read " + read1.getReadName() + " should be in rg1 but isn't"); Assert.assertEquals(rg1Reads.get(1), read3, "Read " + read3.getReadName() + " should be in rg1 but isn't"); @@ -79,7 +76,7 @@ public class ReadBackedPileupUnitTest { Assert.assertEquals(rg1Reads.get(3), read7, "Read " + read7.getReadName() + " should be in rg1 but isn't"); ReadBackedPileup rg2Pileup = pileup.getPileupForReadGroup("rg2"); - List rg2Reads = rg2Pileup.getReads(); + List rg2Reads = rg2Pileup.getReads(); Assert.assertEquals(rg2Reads.size(), 3, "Wrong number of reads in read group rg2"); Assert.assertEquals(rg2Reads.get(0), read2, "Read " + read2.getReadName() + " should be in rg2 but isn't"); Assert.assertEquals(rg2Reads.get(1), read4, "Read " + read4.getReadName() + " should be in rg2 but isn't"); @@ -93,17 +90,17 @@ public class ReadBackedPileupUnitTest { public void testSplitByNullReadGroups() { SAMFileHeader header = ArtificialSAMUtils.createArtificialSamHeader(1,1,1000); - SAMRecord read1 = ArtificialSAMUtils.createArtificialRead(header,"read1",0,1,10); - SAMRecord read2 = 
ArtificialSAMUtils.createArtificialRead(header,"read2",0,1,10); - SAMRecord read3 = ArtificialSAMUtils.createArtificialRead(header,"read3",0,1,10); + GATKSAMRecord read1 = ArtificialSAMUtils.createArtificialRead(header,"read1",0,1,10); + GATKSAMRecord read2 = ArtificialSAMUtils.createArtificialRead(header,"read2",0,1,10); + GATKSAMRecord read3 = ArtificialSAMUtils.createArtificialRead(header,"read3",0,1,10); ReadBackedPileup pileup = new ReadBackedPileupImpl(null, Arrays.asList(read1,read2,read3), Arrays.asList(1,1,1)); ReadBackedPileup nullRgPileup = pileup.getPileupForReadGroup(null); - List nullRgReads = nullRgPileup.getReads(); - Assert.assertEquals(nullRgPileup.size(), 3, "Wrong number of reads in null read group"); + List nullRgReads = nullRgPileup.getReads(); + Assert.assertEquals(nullRgPileup.getNumberOfElements(), 3, "Wrong number of reads in null read group"); Assert.assertEquals(nullRgReads.get(0), read1, "Read " + read1.getReadName() + " should be in null rg but isn't"); Assert.assertEquals(nullRgReads.get(1), read2, "Read " + read2.getReadName() + " should be in null rg but isn't"); Assert.assertEquals(nullRgReads.get(2), read3, "Read " + read3.getReadName() + " should be in null rg but isn't"); @@ -126,13 +123,13 @@ public class ReadBackedPileupUnitTest { header.addReadGroup(readGroupOne); header.addReadGroup(readGroupTwo); - SAMRecord read1 = ArtificialSAMUtils.createArtificialRead(header,"read1",0,1,10); + GATKSAMRecord read1 = ArtificialSAMUtils.createArtificialRead(header,"read1",0,1,10); read1.setAttribute("RG",readGroupOne.getId()); - SAMRecord read2 = ArtificialSAMUtils.createArtificialRead(header,"read2",0,1,10); + GATKSAMRecord read2 = ArtificialSAMUtils.createArtificialRead(header,"read2",0,1,10); read2.setAttribute("RG",readGroupTwo.getId()); - SAMRecord read3 = ArtificialSAMUtils.createArtificialRead(header,"read3",0,1,10); + GATKSAMRecord read3 = ArtificialSAMUtils.createArtificialRead(header,"read3",0,1,10); 
read3.setAttribute("RG",readGroupOne.getId()); - SAMRecord read4 = ArtificialSAMUtils.createArtificialRead(header,"read4",0,1,10); + GATKSAMRecord read4 = ArtificialSAMUtils.createArtificialRead(header,"read4",0,1,10); read4.setAttribute("RG",readGroupTwo.getId()); ReadBackedPileupImpl sample1Pileup = new ReadBackedPileupImpl(null, @@ -141,21 +138,21 @@ public class ReadBackedPileupUnitTest { ReadBackedPileupImpl sample2Pileup = new ReadBackedPileupImpl(null, Arrays.asList(read2,read4), Arrays.asList(1,1)); - Map sampleToPileupMap = new HashMap(); - sampleToPileupMap.put(new Sample(readGroupOne.getSample()),sample1Pileup); - sampleToPileupMap.put(new Sample(readGroupTwo.getSample()),sample2Pileup); + Map sampleToPileupMap = new HashMap(); + sampleToPileupMap.put(readGroupOne.getSample(),sample1Pileup); + sampleToPileupMap.put(readGroupTwo.getSample(),sample2Pileup); ReadBackedPileup compositePileup = new ReadBackedPileupImpl(null,sampleToPileupMap); ReadBackedPileup rg1Pileup = compositePileup.getPileupForReadGroup("rg1"); - List rg1Reads = rg1Pileup.getReads(); + List rg1Reads = rg1Pileup.getReads(); Assert.assertEquals(rg1Reads.size(), 2, "Wrong number of reads in read group rg1"); Assert.assertEquals(rg1Reads.get(0), read1, "Read " + read1.getReadName() + " should be in rg1 but isn't"); Assert.assertEquals(rg1Reads.get(1), read3, "Read " + read3.getReadName() + " should be in rg1 but isn't"); ReadBackedPileup rg2Pileup = compositePileup.getPileupForReadGroup("rg2"); - List rg2Reads = rg2Pileup.getReads(); + List rg2Reads = rg2Pileup.getReads(); Assert.assertEquals(rg1Reads.size(), 2, "Wrong number of reads in read group rg2"); Assert.assertEquals(rg2Reads.get(0), read2, "Read " + read2.getReadName() + " should be in rg2 but isn't"); @@ -164,41 +161,37 @@ public class ReadBackedPileupUnitTest { @Test public void testGetPileupForSample() { - Sample sample1 = new Sample("sample1"); - Sample sample2 = new Sample("sample2"); + String sample1 = "sample1"; + String 
sample2 = "sample2"; SAMReadGroupRecord readGroupOne = new SAMReadGroupRecord("rg1"); - readGroupOne.setSample(sample1.getId()); + readGroupOne.setSample(sample1); SAMReadGroupRecord readGroupTwo = new SAMReadGroupRecord("rg2"); - readGroupTwo.setSample(sample2.getId()); + readGroupTwo.setSample(sample2); SAMFileHeader header = ArtificialSAMUtils.createArtificialSamHeader(1,1,1000); header.addReadGroup(readGroupOne); header.addReadGroup(readGroupTwo); - SAMRecord read1 = ArtificialSAMUtils.createArtificialRead(header,"read1",0,1,10); + GATKSAMRecord read1 = ArtificialSAMUtils.createArtificialRead(header,"read1",0,1,10); read1.setAttribute("RG",readGroupOne.getId()); - SAMRecord read2 = ArtificialSAMUtils.createArtificialRead(header,"read2",0,1,10); + GATKSAMRecord read2 = ArtificialSAMUtils.createArtificialRead(header,"read2",0,1,10); read2.setAttribute("RG",readGroupTwo.getId()); - Map sampleToPileupMap = new HashMap(); + Map sampleToPileupMap = new HashMap(); sampleToPileupMap.put(sample1,new ReadBackedPileupImpl(null,Collections.singletonList(read1),0)); sampleToPileupMap.put(sample2,new ReadBackedPileupImpl(null,Collections.singletonList(read2),0)); ReadBackedPileup pileup = new ReadBackedPileupImpl(null,sampleToPileupMap); - ReadBackedPileup sample1Pileup = pileup.getPileupForSample(sample1); - Assert.assertEquals(sample1Pileup.size(),1,"Sample 1 pileup has wrong number of elements"); - Assert.assertEquals(sample1Pileup.getReads().get(0),read1,"Sample 1 pileup has incorrect read"); - - ReadBackedPileup sample2Pileup = pileup.getPileupForSampleName(sample2.getId()); - Assert.assertEquals(sample2Pileup.size(),1,"Sample 2 pileup has wrong number of elements"); + ReadBackedPileup sample2Pileup = pileup.getPileupForSample(sample2); + Assert.assertEquals(sample2Pileup.getNumberOfElements(),1,"Sample 2 pileup has wrong number of elements"); Assert.assertEquals(sample2Pileup.getReads().get(0),read2,"Sample 2 pileup has incorrect read"); - ReadBackedPileup 
missingSamplePileup = pileup.getPileupForSample(new Sample("missing")); + ReadBackedPileup missingSamplePileup = pileup.getPileupForSample("missing"); Assert.assertNull(missingSamplePileup,"Pileup for sample 'missing' should be null but isn't"); - missingSamplePileup = pileup.getPileupForSampleName("not here"); + missingSamplePileup = pileup.getPileupForSample("not here"); Assert.assertNull(missingSamplePileup,"Pileup for sample 'not here' should be null but isn't"); } } diff --git a/public/java/test/org/broadinstitute/sting/utils/runtime/ProcessControllerUnitTest.java b/public/java/test/org/broadinstitute/sting/utils/runtime/ProcessControllerUnitTest.java new file mode 100644 index 000000000..6db9d77ef --- /dev/null +++ b/public/java/test/org/broadinstitute/sting/utils/runtime/ProcessControllerUnitTest.java @@ -0,0 +1,517 @@ +/* + * Copyright (c) 2011, The Broad Institute + * + * Permission is hereby granted, free of charge, to any person + * obtaining a copy of this software and associated documentation + * files (the "Software"), to deal in the Software without + * restriction, including without limitation the rights to use, + * copy, modify, merge, publish, distribute, sublicense, and/or sell + * copies of the Software, and to permit persons to whom the + * Software is furnished to do so, subject to the following + * conditions: + * + * The above copyright notice and this permission notice shall be + * included in all copies or substantial portions of the Software. + * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, + * EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES + * OF MERCHANTABILITY, FITNESS FOR A PARTICULAR PURPOSE AND + * NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT + * HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY, + * WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING + * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR + * OTHER DEALINGS IN THE SOFTWARE. 
+ */ + +package org.broadinstitute.sting.utils.runtime; + +import org.apache.commons.io.FileUtils; +import org.apache.commons.lang.StringUtils; +import org.broadinstitute.sting.BaseTest; +import org.broadinstitute.sting.utils.exceptions.ReviewedStingException; +import org.broadinstitute.sting.utils.exceptions.UserException; +import org.broadinstitute.sting.utils.io.IOUtils; +import org.testng.Assert; +import org.testng.annotations.DataProvider; +import org.testng.annotations.Test; + +import java.io.File; +import java.io.IOException; +import java.util.Arrays; +import java.util.HashMap; +import java.util.Map; + +public class ProcessControllerUnitTest extends BaseTest { + private static final String NL = String.format("%n"); + + @Test(timeOut = 60 * 1000) + public void testDestroyThreadLocal() throws InterruptedException { + for (int i = 0; i < 3; i++) { + final ProcessController controller = ProcessController.getThreadLocal(); + final ProcessSettings job = new ProcessSettings( + new String[] {"sh", "-c", "echo Hello World && sleep 600 && echo Goodbye"}); + job.getStdoutSettings().setBufferSize(-1); + + Thread t = new Thread(new Runnable() { + @Override + public void run() { + System.out.println("BACK: Starting on background thread"); + ProcessOutput result = controller.exec(job); + // Assert in background thread doesn't make it to main thread but does print a trace. + Assert.assertTrue(result.getExitValue() != 0, "Destroy-attempted job returned zero exit status"); + System.out.println("BACK: Background thread exiting"); + } + }); + + System.out.println("MAIN: Starting background thread"); + t.start(); + System.out.println("MAIN: Sleeping main thread 3s"); + Thread.sleep(3000); + System.out.println("MAIN: Destroying job"); + controller.tryDestroy(); + System.out.println("MAIN: Not waiting on background thread to exit"); + // Using standard java.io this was blocking on linux. + // TODO: try again with NIO. 
+ //t.join(); + //System.out.println("MAIN: Background thread exited"); + } + } + + @Test + public void testReuseAfterError() { + ProcessController controller = new ProcessController(); + + ProcessSettings job; + + for (int i = 0; i < 3; i++) { + // Test bad command + job = new ProcessSettings(new String[] {"no_such_command"}); + try { + controller.exec(job); + } catch (ReviewedStingException e) { + /* Was supposed to throw an exception */ + } + + // Test exit != 0 + job = new ProcessSettings(new String[] {"cat", "non_existent_file"}); + int exitValue = controller.exec(job).getExitValue(); + Assert.assertTrue(exitValue != 0, "'cat' non existent file returned 0"); + + // Text success + job = new ProcessSettings(new String[] {"echo", "Hello World"}); + exitValue = controller.exec(job).getExitValue(); + Assert.assertEquals(exitValue, 0, "Echo failed"); + } + } + + @Test + public void testEnvironment() { + String key = "MY_NEW_VAR"; + String value = "value is here"; + + ProcessSettings job = new ProcessSettings(new String[] {"sh", "-c", "echo $"+key}); + job.getStdoutSettings().setBufferSize(-1); + job.setRedirectErrorStream(true); + + Map env = new HashMap(System.getenv()); + env.put(key, value); + job.setEnvironment(env); + + ProcessController controller = new ProcessController(); + ProcessOutput result = controller.exec(job); + int exitValue = result.getExitValue(); + + Assert.assertEquals(exitValue, 0, "Echo environment variable failed"); + Assert.assertEquals(result.getStdout().getBufferString(), value + NL, "Echo environment returned unexpected output"); + } + + @Test + public void testDirectory() throws IOException { + File dir = null; + try { + dir = IOUtils.tempDir("temp.", "").getCanonicalFile(); + + ProcessSettings job = new ProcessSettings(new String[] {"pwd"}); + job.getStdoutSettings().setBufferSize(-1); + job.setRedirectErrorStream(true); + job.setDirectory(dir); + + ProcessController controller = new ProcessController(); + ProcessOutput result = 
controller.exec(job); + int exitValue = result.getExitValue(); + + Assert.assertEquals(exitValue, 0, "Getting working directory failed"); + + Assert.assertEquals(result.getStdout().getBufferString(), dir.getAbsolutePath() + NL, + "Setting/getting working directory returned unexpected output"); + } finally { + FileUtils.deleteQuietly(dir); + } + } + + @Test + public void testReadStdInBuffer() { + String bufferText = "Hello from buffer"; + ProcessSettings job = new ProcessSettings(new String[] {"cat"}); + job.getStdoutSettings().setBufferSize(-1); + job.setRedirectErrorStream(true); + job.getStdinSettings().setInputBuffer(bufferText); + + ProcessController controller = new ProcessController(); + ProcessOutput output = controller.exec(job); + + Assert.assertEquals(output.getStdout().getBufferString(), bufferText, + "Unexpected output from cat stdin buffer"); + } + + @Test + public void testReadStdInFile() { + File input = null; + try { + String fileText = "Hello from file"; + input = IOUtils.writeTempFile(fileText, "stdin.", ".txt"); + + ProcessSettings job = new ProcessSettings(new String[] {"cat"}); + job.getStdoutSettings().setBufferSize(-1); + job.setRedirectErrorStream(true); + job.getStdinSettings().setInputFile(input); + + ProcessController controller = new ProcessController(); + ProcessOutput output = controller.exec(job); + + Assert.assertEquals(output.getStdout().getBufferString(), fileText, + "Unexpected output from cat stdin file"); + } finally { + FileUtils.deleteQuietly(input); + } + } + + @Test + public void testWriteStdOut() { + ProcessSettings job = new ProcessSettings(new String[] {"echo", "Testing to stdout"}); + // Not going to call the System.setOut() for now. Just running a basic visual test. 
+ job.getStdoutSettings().printStandard(true); + job.setRedirectErrorStream(true); + + System.out.println("testWriteStdOut: Writing two lines to std out..."); + ProcessController controller = new ProcessController(); + controller.exec(job); + job.setCommand(new String[]{"cat", "non_existent_file"}); + controller.exec(job); + System.out.println("testWriteStdOut: ...two lines should have been printed to std out"); + } + + @Test + public void testErrorToOut() throws IOException { + File outFile = null; + File errFile = null; + try { + outFile = BaseTest.createTempFile("temp", ""); + errFile = BaseTest.createTempFile("temp", ""); + + ProcessSettings job = new ProcessSettings(new String[]{"cat", "non_existent_file"}); + job.getStdoutSettings().setOutputFile(outFile); + job.getStdoutSettings().setBufferSize(-1); + job.getStderrSettings().setOutputFile(errFile); + job.getStderrSettings().setBufferSize(-1); + job.setRedirectErrorStream(true); + + ProcessOutput result = new ProcessController().exec(job); + int exitValue = result.getExitValue(); + + Assert.assertTrue(exitValue != 0, "'cat' non existent file returned 0"); + + String fileString, bufferString; + + fileString = FileUtils.readFileToString(outFile); + Assert.assertTrue(fileString.length() > 0, "Out file was length 0"); + + bufferString = result.getStdout().getBufferString(); + Assert.assertTrue(bufferString.length() > 0, "Out buffer was length 0"); + + Assert.assertFalse(result.getStdout().isBufferTruncated(), "Out buffer was truncated"); + Assert.assertEquals(bufferString.length(), fileString.length(), "Out buffer length did not match file length"); + + fileString = FileUtils.readFileToString(errFile); + Assert.assertEquals(fileString, "", "Unexpected output to err file"); + + bufferString = result.getStderr().getBufferString(); + Assert.assertEquals(bufferString, "", "Unexepected output to err buffer"); + } finally { + FileUtils.deleteQuietly(outFile); + FileUtils.deleteQuietly(errFile); + } + } + + @Test + 
public void testErrorToErr() throws IOException { + File outFile = null; + File errFile = null; + try { + outFile = BaseTest.createTempFile("temp", ""); + errFile = BaseTest.createTempFile("temp", ""); + + ProcessSettings job = new ProcessSettings(new String[]{"cat", "non_existent_file"}); + job.getStdoutSettings().setOutputFile(outFile); + job.getStdoutSettings().setBufferSize(-1); + job.getStderrSettings().setOutputFile(errFile); + job.getStderrSettings().setBufferSize(-1); + job.setRedirectErrorStream(false); + + ProcessOutput result = new ProcessController().exec(job); + int exitValue = result.getExitValue(); + + Assert.assertTrue(exitValue != 0, "'cat' non existent file returned 0"); + + String fileString, bufferString; + + fileString = FileUtils.readFileToString(errFile); + Assert.assertTrue(fileString.length() > 0, "Err file was length 0"); + + bufferString = result.getStderr().getBufferString(); + Assert.assertTrue(bufferString.length() > 0, "Err buffer was length 0"); + + Assert.assertFalse(result.getStderr().isBufferTruncated(), "Err buffer was truncated"); + Assert.assertEquals(bufferString.length(), fileString.length(), "Err buffer length did not match file length"); + + fileString = FileUtils.readFileToString(outFile); + Assert.assertEquals(fileString, "", "Unexpected output to out file"); + + bufferString = result.getStdout().getBufferString(); + Assert.assertEquals(bufferString, "", "Unexepected output to out buffer"); + } finally { + FileUtils.deleteQuietly(outFile); + FileUtils.deleteQuietly(errFile); + } + } + + private static final String TRUNCATE_TEXT = "Hello World"; + private static final byte[] TRUNCATE_OUTPUT_BYTES = (TRUNCATE_TEXT + NL).getBytes(); + + /** + * @return Test truncating content vs. 
not truncating (run at -1/+1 size) + */ + @DataProvider(name = "truncateSizes") + public Object[][] getTruncateBufferSizes() { + int l = TRUNCATE_OUTPUT_BYTES.length; + return new Object[][]{ + new Object[]{0, 0}, + new Object[]{l, l}, + new Object[]{l + 1, l}, + new Object[]{l - 1, l - 1} + }; + } + + @Test(dataProvider = "truncateSizes") + public void testTruncateBuffer(int truncateLen, int expectedLen) { + byte[] expected = Arrays.copyOf(TRUNCATE_OUTPUT_BYTES, expectedLen); + + String[] command = {"echo", TRUNCATE_TEXT}; + ProcessController controller = new ProcessController(); + + ProcessSettings job = new ProcessSettings(command); + job.getStdoutSettings().setBufferSize(truncateLen); + ProcessOutput result = controller.exec(job); + + int exitValue = result.getExitValue(); + + Assert.assertEquals(exitValue, 0, + String.format("Echo returned %d: %s", exitValue, TRUNCATE_TEXT)); + + byte[] bufferBytes = result.getStdout().getBufferBytes(); + + Assert.assertEquals(bufferBytes, expected, + String.format("Output buffer didn't match (%d vs %d)", expected.length, bufferBytes.length)); + + boolean truncated = result.getStdout().isBufferTruncated(); + + Assert.assertEquals(truncated, TRUNCATE_OUTPUT_BYTES.length > truncateLen, + "Unexpected buffer truncation result"); + } + + private static final String[] LONG_COMMAND = getLongCommand(); + private static final String LONG_COMMAND_STRING = StringUtils.join(LONG_COMMAND, " "); + private static final String LONG_COMMAND_DESCRIPTION = ""; + + @DataProvider(name = "echoCommands") + public Object[][] getEchoCommands() { + + new EchoCommand(new String[]{"echo", "Hello", "World"}, "Hello World" + NL); + new EchoCommand(new String[]{"echo", "'Hello", "World"}, "'Hello World" + NL); + new EchoCommand(new String[]{"echo", "Hello", "World'"}, "Hello World'" + NL); + new EchoCommand(new String[]{"echo", "'Hello", "World'"}, "'Hello World'" + NL); + + String[] longCommand = new String[LONG_COMMAND.length + 1]; + longCommand[0] = 
"echo"; + System.arraycopy(LONG_COMMAND, 0, longCommand, 1, LONG_COMMAND.length); + new EchoCommand(longCommand, LONG_COMMAND_STRING + NL) { + @Override + public String toString() { + return LONG_COMMAND_DESCRIPTION; + } + }; + + return TestDataProvider.getTests(EchoCommand.class); + } + + @Test(dataProvider = "echoCommands") + public void testEcho(EchoCommand script) throws IOException { + File outputFile = null; + try { + outputFile = BaseTest.createTempFile("temp", ""); + + ProcessSettings job = new ProcessSettings(script.command); + if (script.output != null) { + job.getStdoutSettings().setOutputFile(outputFile); + job.getStdoutSettings().setBufferSize(script.output.getBytes().length); + } + + ProcessOutput result = new ProcessController().exec(job); + int exitValue = result.getExitValue(); + + Assert.assertEquals(exitValue, 0, + String.format("Echo returned %d: %s", exitValue, script)); + + if (script.output != null) { + + String fileString = FileUtils.readFileToString(outputFile); + Assert.assertEquals(fileString, script.output, + String.format("Output file didn't match (%d vs %d): %s", + fileString.length(), script.output.length(), script)); + + String bufferString = result.getStdout().getBufferString(); + Assert.assertEquals(bufferString, script.output, + String.format("Output content didn't match (%d vs %d): %s", + bufferString.length(), script.output.length(), script)); + + Assert.assertFalse(result.getStdout().isBufferTruncated(), + "Output content was truncated: " + script); + } + } finally { + FileUtils.deleteQuietly(outputFile); + } + } + + @Test(expectedExceptions = ReviewedStingException.class) + public void testUnableToStart() { + ProcessSettings job = new ProcessSettings(new String[]{"no_such_command"}); + new ProcessController().exec(job); + } + + @DataProvider(name = "scriptCommands") + public Object[][] getScriptCommands() { + new ScriptCommand(true, "echo Hello World", "Hello World" + NL); + new ScriptCommand(false, "echo 'Hello World", null); 
+ new ScriptCommand(false, "echo Hello World'", null); + new ScriptCommand(true, "echo 'Hello World'", "Hello World" + NL); + new ScriptCommand(true, "echo \"Hello World\"", "Hello World" + NL); + new ScriptCommand(false, "no_such_echo Hello World", null); + new ScriptCommand(true, "echo #", NL); + new ScriptCommand(true, "echo \\#", "#" + NL); + new ScriptCommand(true, "echo \\\\#", "\\#" + NL); + + new ScriptCommand(true, "echo " + LONG_COMMAND_STRING, LONG_COMMAND_STRING + NL) { + @Override + public String toString() { + return LONG_COMMAND_DESCRIPTION; + } + }; + + return TestDataProvider.getTests(ScriptCommand.class); + } + + @Test(dataProvider = "scriptCommands") + public void testScript(ScriptCommand script) throws IOException { + File scriptFile = null; + File outputFile = null; + try { + scriptFile = writeScript(script.content); + outputFile = BaseTest.createTempFile("temp", ""); + + ProcessSettings job = new ProcessSettings(new String[]{"sh", scriptFile.getAbsolutePath()}); + if (script.output != null) { + job.getStdoutSettings().setOutputFile(outputFile); + job.getStdoutSettings().setBufferSize(script.output.getBytes().length); + } + + ProcessOutput result = new ProcessController().exec(job); + int exitValue = result.getExitValue(); + + Assert.assertEquals(exitValue == 0, script.succeed, + String.format("Script returned %d: %s", exitValue, script)); + + if (script.output != null) { + + String fileString = FileUtils.readFileToString(outputFile); + Assert.assertEquals(fileString, script.output, + String.format("Output file didn't match (%d vs %d): %s", + fileString.length(), script.output.length(), script)); + + String bufferString = result.getStdout().getBufferString(); + Assert.assertEquals(bufferString, script.output, + String.format("Output content didn't match (%d vs %d): %s", + bufferString.length(), script.output.length(), script)); + + Assert.assertFalse(result.getStdout().isBufferTruncated(), + "Output content was truncated: " + script); + } + } 
finally { + FileUtils.deleteQuietly(scriptFile); + FileUtils.deleteQuietly(outputFile); + } + } + + private static String[] getLongCommand() { + // This command fails on some systems with a 4096 character limit when run via the old sh -c "echo ...", + // but works on the same systems when run via sh