From 813a4e838f0794519ca66d3c4be6341faaf7c93b Mon Sep 17 00:00:00 2001
From: depristo <depristo@348d0f76-0448-11de-a6fe-93d51630548a>
Date: Sun, 30 Aug 2009 19:27:11 +0000
Subject: [PATCH] Removing old code

git-svn-id: file:///humgen/gsa-scr1/gsa-engineering/svn_contents/trunk@1482 348d0f76-0448-11de-a6fe-93d51630548a
---
 .../NewHotnessGenotypeLikelihoods.java        | 483 ------------------
 1 file changed, 483 deletions(-)
 delete mode 100755 java/src/org/broadinstitute/sting/gatk/walkers/genotyper/NewHotnessGenotypeLikelihoods.java

diff --git a/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/NewHotnessGenotypeLikelihoods.java b/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/NewHotnessGenotypeLikelihoods.java
deleted file mode 100755
index 93864d39f..000000000
--- a/java/src/org/broadinstitute/sting/gatk/walkers/genotyper/NewHotnessGenotypeLikelihoods.java
+++ /dev/null
@@ -1,483 +0,0 @@
-package org.broadinstitute.sting.gatk.walkers.genotyper;
-
-import net.sf.samtools.SAMRecord;
-import org.broadinstitute.sting.utils.*;
-import edu.mit.broad.picard.util.MathUtil;
-
-import java.util.Arrays;
-import static java.lang.Math.log10;
-import static java.lang.Math.pow;
-
-/**
- * Stable, error checking version of the Bayesian genotyper.  Useful for calculating the likelihoods, priors,
- * and posteriors given a pile of bases and quality scores
- *
- * Suppose we have bases b1, b2, ..., bN with qualities scores q1, q2, ..., qN.  This object
- * calculates:
- *
- * P(G | D) = P(G) * P(D | G)
- *
- * where
- *
- * P(D | G) = sum_i log10 P(bi | G)
- *
- * and
- *
- * P(bi | G) = 1 - P(error | q1) if bi is in G
- *           = P(error | q1) / 3 if bi is not in G
- *
- * for homozygous genotypes and for heterozygous genotypes:
- *
- * P(bi | G) = 1 - P(error | q1) / 2 + P(error | q1) / 6 if bi is in G
- *           = P(error | q1) / 3 if bi is not in G
- *
- * for each of the 10 unique diploid genotypes AA, AC, AG, .., TT
- *
- * Everything is stored as arrays indexed by DiploidGenotype.ordinal() values in log10 space.
- *
- * The priors contain the relative probabilities of each genotype, and must be provided at object creation.
- * From then on, you can call any of the add() routines to update the likelihoods and posteriors in the above
- * model.
- */
-public class NewHotnessGenotypeLikelihoods extends GenotypeLikelihoods implements Cloneable {
-    private final static int FIXED_PLOIDY = 2;
-    private final static int MAX_PLOIDY = FIXED_PLOIDY + 1;
-
-    //
-    // The three fundamental data arrays associated with a Genotype Likelhoods object
-    //
-    protected double[] likelihoods = null;
-    protected double[] posteriors = null;
-
-    private DiploidGenotypePriors priors = null;
-
-    private boolean verbose = false;
-    private int minQScoreToInclude = 0;
-
-    /**
-     * Create a new GenotypeLikelhoods object with flat priors for each diploid genotype
-     */
-    public NewHotnessGenotypeLikelihoods() {
-        this.priors = new DiploidGenotypePriors();
-        initialize();
-    }
-
-    /**
-     * Create a new GenotypeLikelhoods object with flat priors for each diploid genotype
-     */
-    public NewHotnessGenotypeLikelihoods(DiploidGenotypePriors priors) {
-        this.priors = priors;
-        initialize();
-    }
-
-    /**
-     * Cloning of the object
-     * @return
-     * @throws CloneNotSupportedException
-     */
-    protected Object clone() throws CloneNotSupportedException {
-        NewHotnessGenotypeLikelihoods c = (NewHotnessGenotypeLikelihoods)super.clone();
-        c.priors = priors;
-        c.likelihoods = likelihoods.clone();
-        c.posteriors = posteriors.clone();
-        return c;
-    }
-
-    private void initialize() {
-        likelihoods = zeros.clone();            // likelihoods are all zeros
-        posteriors = priors.getPriors().clone();            // posteriors are all the priors
-    }
-
-
-    public void setVerbose(boolean v) {
-        verbose = v;
-    }
-
-    public boolean isVerbose() {
-        return verbose;
-    }
-
-    public int getMinQScoreToInclude() {
-        return minQScoreToInclude;
-    }
-
-    public void setMinQScoreToInclude(int minQScoreToInclude) {
-        this.minQScoreToInclude = minQScoreToInclude;
-    }
-
-    /**
-     * Returns an array of log10 likelihoods for each genotype, indexed by DiploidGenotype.ordinal values()
-     * @return
-     */
-    public double[] getLikelihoods() {
-        return likelihoods;
-    }
-
-    /**
-     * Returns the likelihood associated with DiploidGenotype g
-     * @param g
-     * @return log10 likelihood as a double
-     */
-    public double getLikelihood(DiploidGenotype g) {
-        return getLikelihoods()[g.ordinal()];
-    }
-
-    /**
-     * Returns an array of posteriors for each genotype, indexed by DiploidGenotype.ordinal values().
-     *
-     * @return raw log10 (not-normalized posteriors) as a double array
-     */
-    public double[] getPosteriors() {
-        return posteriors;
-    }
-
-    /**
-     * Returns the posterior associated with DiploidGenotype g
-     * @param g
-     * @return raw log10 (not-normalized posteror) as a double
-     */
-    public double getPosterior(DiploidGenotype g) {
-        return getPosteriors()[g.ordinal()];
-    }
-
-    public DiploidGenotypePriors getPriorObject() {
-        return priors;
-    }
-
-    /**
-     * Returns an array of priors for each genotype, indexed by DiploidGenotype.ordinal values().
-     *
-     * @return log10 prior as a double array
-     */
-    public double[] getPriors() {
-        return priors.getPriors();
-    }
-
-    /**
-     * Returns the prior associated with DiploidGenotype g
-     * @param g
-     * @return log10 prior as a double
-     */
-    public double getPrior(DiploidGenotype g) {
-        return getPriors()[g.ordinal()];
-    }
-
-    // -----------------------------------------------------------------------------------------------------------------
-    //
-    //
-    // add() -- the heart of 
-    //
-    //
-    // -----------------------------------------------------------------------------------------------------------------
-
-    /**
-     * Updates likelihoods and posteriors to reflect an additional observation of observedBase with
-     * qualityScore.
-     *
-     * @param observedBase
-     * @param qualityScore
-     * @return 1 if the base was considered good enough to add to the likelihoods (not Q0 or 'N', for example)
-     */
-    public int add(char observedBase, byte qualityScore, SAMRecord read, int offset) {
-        return reallyAdd(observedBase, qualityScore, read, offset, true);
-    }
-
-    /**
-     * Updates likelihoods and posteriors to reflect the additional observations contained within the
-     * read-based pileup up by calling add(observedBase, qualityScore) for each base / qual in the
-     * pileup
-     *
-     * @param pileup
-     * @return the number of good bases found in the pileup
-     */
-    public int add(ReadBackedPileup pileup, boolean ignoreBadBases) {
-        int n = 0;
-
-        for (int i = 0; i < pileup.getReads().size(); i++) {
-            SAMRecord read = pileup.getReads().get(i);
-            int offset = pileup.getOffsets().get(i);
-            char base = read.getReadString().charAt(offset);
-            byte qual = read.getBaseQualities()[offset];
-            if ( ! ignoreBadBases || ! badBase(base) ) {
-                n += add(base, qual, read, offset);
-            }
-        }
-
-        return n;
-    }
-
-    public int add(ReadBackedPileup pileup) {
-        return add(pileup, false);
-    }
-
-
-    private int reallyAdd(char observedBase, byte qualityScore, SAMRecord read, int offset, boolean enableCache) {
-        if ( badBase(observedBase) ) {
-            throw new RuntimeException(String.format("BUG: unexpected base %c with Q%d passed to GenotypeLikelihoods", observedBase, qualityScore));
-        }
-
-        int nBasesAdded = 0; // the result -- how many bases did we add?
-
-        if ( qualityScore > getMinQScoreToInclude() ) {
-            // Handle caching if requested.  Just look up the cached result if its available, or compute and store it
-            NewHotnessGenotypeLikelihoods cached = null;
-            if ( enableCache ) {
-                if ( ! inCache( observedBase, qualityScore, FIXED_PLOIDY, read, offset ) ) {
-                    cached = calculateCachedGenotypeLikelihoods(observedBase, qualityScore, FIXED_PLOIDY, read, offset );
-                } else {
-                    cached = getCachedGenotypeLikelihoods(observedBase, qualityScore, FIXED_PLOIDY, read, offset );
-                }
-            }
-
-            for ( DiploidGenotype g : DiploidGenotype.values() ) {
-                double likelihoodCalc = ! enableCache ? log10PofObservingBaseGivenGenotype(observedBase, g, qualityScore, read, offset) : 0.0;
-                double likelihoodCached = enableCache ? cached.likelihoods[g.ordinal()] : 0.0;
-                double likelihood = enableCache ? likelihoodCached : likelihoodCalc;
-
-                //if ( enableCache && likelihoodCalc != 0.0 && MathUtils.compareDoubles(likelihoodCached, likelihoodCalc) != 0 ) {
-                //    System.out.printf("ERROR: Likelihoods not equal is cache=%f != calc=%f for %c %d %s%n",
-                //            likelihoodCached, likelihoodCalc, observedBase, qualityScore, g.toString());
-                //}
-
-                if ( isVerbose() ) {
-                    boolean fwdStrand = ! read.getReadNegativeStrandFlag();
-                    System.out.printf("  L(%c | G=%s, Q=%d, S=%s) = %f / %f%n",
-                            observedBase, g, qualityScore, fwdStrand ? "+" : "-", pow(10,likelihood) * 100, likelihood);
-                }
-
-                likelihoods[g.ordinal()] += likelihood;
-                posteriors[g.ordinal()] += likelihood;
-            }
-
-            if ( isVerbose() ) {
-                for ( DiploidGenotype g : DiploidGenotype.values() ) { System.out.printf("%s\t", g); }
-                System.out.println();
-                for ( DiploidGenotype g : DiploidGenotype.values() ) { System.out.printf("%.2f\t", likelihoods[g.ordinal()]); }
-                System.out.println();
-            }
-
-            nBasesAdded = 1;
-        }
-
-        return nBasesAdded;
-    }
-
-    // -----------------------------------------------------------------------------------------------------------------
-    //
-    //
-    // caching routines
-    //
-    //
-    // -----------------------------------------------------------------------------------------------------------------
-    final static NewHotnessGenotypeLikelihoods[][][][][] cache =
-            new NewHotnessGenotypeLikelihoods[EmpiricalSubstitutionGenotypeLikelihoods.SequencerPlatform.values().length][BaseUtils.BASES.length][QualityUtils.MAX_QUAL_SCORE][MAX_PLOIDY][2];
-    static int cacheSize = 0;
-
-    private NewHotnessGenotypeLikelihoods getSetCache( char observedBase, byte qualityScore, int ploidy,
-                                                       SAMRecord read, int offset, NewHotnessGenotypeLikelihoods val ) {
-
-        int a = EmpiricalSubstitutionGenotypeLikelihoods.getReadSequencerPlatform(read).ordinal();
-        int i = BaseUtils.simpleBaseToBaseIndex(observedBase);
-        int j = qualityScore;
-        int k = ploidy;
-        int x = strandIndex(! read.getReadNegativeStrandFlag());
-
-        if ( val != null )
-            cache[a][i][j][k][x] = val;
-
-        return cache[a][i][j][k][x];
-    }
-
-    private NewHotnessGenotypeLikelihoods getCache( char observedBase, byte qualityScore, int ploidy, SAMRecord read, int offset ) {
-        return getSetCache( observedBase, qualityScore, ploidy, read, offset, null );
-    }
-
-    private void setCache( char observedBase, byte qualityScore, int ploidy, SAMRecord read, int offset, NewHotnessGenotypeLikelihoods val ) {
-        getSetCache( observedBase, qualityScore, ploidy, read, offset, val );
-    }
-
-    private int strandIndex(boolean fwdStrand) {
-        return fwdStrand ? 0 : 1;
-    }
-
-    private boolean inCache( char observedBase, byte qualityScore, int ploidy, SAMRecord read, int offset ) {
-        return getCache(observedBase, qualityScore, ploidy, read, offset) != null;
-    }
-
-    private NewHotnessGenotypeLikelihoods getCachedGenotypeLikelihoods( char observedBase, byte qualityScore, int ploidy, SAMRecord read, int offset ) {
-        if ( ! inCache(observedBase, qualityScore, ploidy, read, offset ) )
-            throw new RuntimeException(String.format("BUG: trying to fetch an unset cached genotype likelihood at base=%c, qual=%d, ploidy=%d, read=%s",
-                    observedBase, qualityScore, ploidy, read));
-
-        return getCache(observedBase, qualityScore, ploidy, read, offset);
-    }
-
-    private NewHotnessGenotypeLikelihoods calculateCachedGenotypeLikelihoods( char observedBase, byte qualityScore, int ploidy, SAMRecord read, int offset ) {
-        if ( inCache(observedBase, qualityScore, ploidy, read, offset ) )
-            throw new RuntimeException(String.format("BUG: trying to set an already set cached genotype likelihood at base=%c, qual=%d, ploidy=%d, read=%s",
-                    observedBase, qualityScore, ploidy, read));
-
-        // create a new genotype likelihoods object and add this single base to it -- now we have a cached result
-        try {
-            NewHotnessGenotypeLikelihoods g = (NewHotnessGenotypeLikelihoods)this.clone();
-            g.initialize();
-            g.reallyAdd(observedBase, qualityScore, read, offset, false);
-
-            setCache(observedBase, qualityScore, ploidy, read, offset, g);
-            cacheSize++;
-
-            //System.out.printf("Caching %c %d %d %s %s (%d total entries)%n", observedBase, qualityScore, ploidy, read.getReadName(), EmpiricalSubstitutionGenotypeLikelihoods.getReadSequencerPlatform(read), cacheSize);
-            return g;
-        } catch ( CloneNotSupportedException e ) {
-            throw new RuntimeException(e);
-        }
-    }
-
-    // -----------------------------------------------------------------------------------------------------------------
-    //
-    //
-    // helper routines
-    //
-    //
-    // -----------------------------------------------------------------------------------------------------------------
-
-    /**
-     * Returns true when the observedBase is considered bad and shouldn't be processed by this object.  A base
-     * is considered bad if:
-     *
-     *   Criterion 1: observed base isn't a A,C,T,G or lower case equivalent
-     *
-     * @param observedBase
-     * @return true if the base is a bad base
-     */
-    private boolean badBase(char observedBase) {
-        return BaseUtils.simpleBaseToBaseIndex(observedBase) == -1;
-    }
-
-    /**
-     * Return a string representation of this object in a moderately usable form
-     *
-     * @return
-     */
-    public String toString() {
-        double sum = 0;
-        StringBuilder s = new StringBuilder();
-        for (DiploidGenotype g : DiploidGenotype.values()) {
-            s.append(String.format("%s %.10f ", g, likelihoods[g.ordinal()]));
-			sum += Math.pow(10,likelihoods[g.ordinal()]);
-        }
-		s.append(String.format(" %f", sum));
-        return s.toString();
-    }
-
-    // -----------------------------------------------------------------------------------------------------------------
-    //
-    //
-    // Validation routines
-    //
-    //
-    // -----------------------------------------------------------------------------------------------------------------
-
-    public boolean validate() {
-        return validate(true);
-    }
-
-    public boolean validate(boolean throwException) {
-        try {
-            priors.validate(throwException);
-
-            for ( DiploidGenotype g : DiploidGenotype.values() ) {
-                String bad = null;
-
-                int i = g.ordinal();
-                if ( ! MathUtils.wellFormedDouble(likelihoods[i]) || ! MathUtils.isNegativeOrZero(likelihoods[i]) ) {
-                    bad = String.format("Likelihood %f is badly formed", likelihoods[i]);
-                } else if ( ! MathUtils.wellFormedDouble(posteriors[i]) || ! MathUtils.isNegativeOrZero(posteriors[i]) ) {
-                    bad = String.format("Posterior %f is badly formed", posteriors[i]);
-                }
-
-                if ( bad != null ) {
-                    throw new IllegalStateException(String.format("At %s: %s", g.toString(), bad));
-                }
-            }
-        } catch ( IllegalStateException e ) {
-            if ( throwException )
-                throw new RuntimeException(e);
-            else
-                return false;
-        }
-
-        return true;
-    }
-
-    // -----------------------------------------------------------------------------------------------------------------
-    //
-    //
-    // Hearty math calculations follow
-    //
-    //    -- these should not be messed with unless you know what you are doing
-    //
-    // -----------------------------------------------------------------------------------------------------------------
-
-    /**
-     * Works for any ploidy (in organization).
-     *
-     * @param observedBase
-     * @param g
-     * @param qual
-     * @return
-     */
-    protected double log10PofObservingBaseGivenGenotype(char observedBase, DiploidGenotype g, byte qual, SAMRecord read, int offset ) {
-        if (qual == 0) { // zero quals are wrong
-            throw new RuntimeException(String.format("Unexpected Q0 base discovered in calculateAlleleLikelihood: %c %s %d at %d in %s",
-                    observedBase, g, qual, offset, read));
-        }
-
-        // todo assumes ploidy is 2 -- should be generalized.  Obviously the below code can be turned into a loop
-        double p_base = 0.0;
-        p_base += pow(10, log10PofObservingBaseGivenChromosome(observedBase, g.base1, qual, FIXED_PLOIDY, read, offset ));
-        p_base += pow(10, log10PofObservingBaseGivenChromosome(observedBase, g.base2, qual, FIXED_PLOIDY, read, offset ));
-        return log10(p_base);
-    }
-
-    protected double log10PofObservingBaseGivenChromosome(char observedBase, char chromBase, byte qual, int ploidy, SAMRecord read, int offset) {
-        double logP = 0.0;
-
-        if ( observedBase == chromBase ) {
-            // the base is consistent with the chromosome -- it's 1 - e
-            //logP = oneMinusData[qual];
-            double e = pow(10, (qual / -10.0));
-            logP = log10(1.0 - e);
-        } else {
-            // the base is inconsistent with the chromosome -- it's e * P(chromBase | observedBase is an error)
-            logP = qual / -10.0 + log10PofTrueBaseGivenMiscall(observedBase, chromBase, read, offset);
-        }
-
-        // adjust for ploidy.  We take the raw p(obs | chrom) / ploidy, which is -log10(ploidy) in log space
-        //logP -= log10N[ploidy];
-        logP -= log10(ploidy);
-
-        //System.out.printf("%c %c %d %d => %f%n", observedBase, chromBase, qual, ploidy, logP);
-        return logP;
-    }
-
-    /**
-     * Simple log10(3) cached value
-     */
-    protected static final double log103 = log10(3.0);
-
-    protected double log10PofTrueBaseGivenMiscall(char observedBase, char chromBase, SAMRecord read, int offset) {
-        return -log103; // currently equivalent to e/3 model
-    }
-
-    //
-    // Constant static data
-    //
-    private final static double[] zeros = new double[DiploidGenotype.values().length];
-
-    static {
-        for ( DiploidGenotype g : DiploidGenotype.values() ) {
-            zeros[g.ordinal()] = 0.0;
-        }
-    }
-}
\ No newline at end of file