From 422e16c62e7b99c1928de1655dfa359dc9945428 Mon Sep 17 00:00:00 2001
From: David Roazen <droazen@broadinstitute.org>
Date: Thu, 25 Oct 2012 16:16:00 -0400
Subject: [PATCH 1/3] BaseRecalibration: don't cache instances of
 ReadCovariates across reads

Caching and reusing ReadCovariates instances across reads sounds good in theory, but:

-it doesn't work unless you zero out the internal arrays before each read
-the internal arrays must be sized proportionally to the maximum POSSIBLE
recalibrated read length (5000!!!), instead of the ACTUAL read lengths

By contrast, creating a new instance per read is basically equivalent to doing an
efficient low-level memset-style clear on a much smaller array (since we use the actual
rather than the maximum read length to create it). So this should be faster than caching
instances and calling clear() but slower than caching instances and not calling clear().

Credit to Ryan to proposing this approach.
---
 .../recalibration/BaseRecalibration.java      | 22 +------------------
 1 file changed, 1 insertion(+), 21 deletions(-)
diff --git a/public/java/src/org/broadinstitute/sting/utils/recalibration/BaseRecalibration.java b/public/java/src/org/broadinstitute/sting/utils/recalibration/BaseRecalibration.java
index 2f9387acb..5d4020a07 100644
--- a/public/java/src/org/broadinstitute/sting/utils/recalibration/BaseRecalibration.java
+++ b/public/java/src/org/broadinstitute/sting/utils/recalibration/BaseRecalibration.java
@@ -61,17 +61,6 @@ public class BaseRecalibration {
 //            qualityScoreByFullCovariateKey[i] = new NestedHashMap();
 //    }
 
-    /**
-     * Thread local cache to allow multi-threaded use of this class
-     */
-    private ThreadLocal<ReadCovariates> readCovariatesCache;
-    {
-        readCovariatesCache = new ThreadLocal<ReadCovariates> () {
-            @Override protected ReadCovariates initialValue() {
-                return new ReadCovariates(MAXIMUM_RECALIBRATED_READ_LENGTH, requestedCovariates.length);
-            }
-        };
-    }
 
     /**
      * Constructor using a GATK Report file
@@ -113,16 +102,7 @@ public class BaseRecalibration {
             }
         }
 
-        // Compute all covariates for the read
-        // TODO -- the need to clear here suggests there's an error in the indexing / assumption code
-        // TODO -- for BI and DI. Perhaps due to the indel buffer size on the ends of the reads?
-        // TODO -- the output varies depending on whether we clear or not
-        //final ReadCovariates readCovariates = readCovariatesCache.get().clear();
-
-        // the original code -- doesn't do any clearing
-        final ReadCovariates readCovariates = readCovariatesCache.get();
-
-        RecalUtils.computeCovariates(read, requestedCovariates, readCovariates);
+        final ReadCovariates readCovariates = RecalUtils.computeCovariates(read, requestedCovariates);
 
         for (final EventType errorModel : EventType.values()) { // recalibrate all three quality strings
             if (disableIndelQuals && errorModel != EventType.BASE_SUBSTITUTION) {

From 6b8b7df6517647d05bedf3acc9411c599e5a95cd Mon Sep 17 00:00:00 2001
From: Mark DePristo <depristo@broadinstitute.org>
Date: Thu, 25 Oct 2012 17:26:29 -0400
Subject: [PATCH 2/3] Queue now understands -nct and requests the appropriate
 number of cores from LSF, SGE, etc

-- NCT wasn't previously recognized by Queue as needing more processors per machine.  This commit fixes this.  Also a potential cause of poor GATKPerformanceOverTime, in that runs with -nct could flood a node and cause it to have hundreds of cores in contention.
---
 .../sting/queue/extensions/gatk/ArgumentDefinitionField.java    | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/public/java/src/org/broadinstitute/sting/queue/extensions/gatk/ArgumentDefinitionField.java b/public/java/src/org/broadinstitute/sting/queue/extensions/gatk/ArgumentDefinitionField.java
index 368cb3d11..2226c6458 100644
--- a/public/java/src/org/broadinstitute/sting/queue/extensions/gatk/ArgumentDefinitionField.java
+++ b/public/java/src/org/broadinstitute/sting/queue/extensions/gatk/ArgumentDefinitionField.java
@@ -346,7 +346,7 @@ public abstract class ArgumentDefinitionField extends ArgumentField {
 
         @Override
         protected String getFreezeFields() {
-            return String.format("if (num_threads.isDefined) nCoresRequest = num_threads%n");
+            return String.format("if (num_threads.isDefined) nCoresRequest = num_threads%nif (num_cpu_threads_per_data_thread.isDefined) nCoresRequest = Some(nCoresRequest.getOrElse(1) * num_cpu_threads_per_data_thread.getOrElse(1))%n");
         }
     }