2009-06-22 22:39:41 +08:00
|
|
|
package org.broadinstitute.sting.utils;
|
|
|
|
|
|
2009-12-24 05:59:14 +08:00
|
|
|
|
2009-06-22 22:39:41 +08:00
|
|
|
import net.sf.samtools.SAMFileHeader;
|
|
|
|
|
import org.broadinstitute.sting.BaseTest;
|
2010-01-15 08:14:35 +08:00
|
|
|
import org.broadinstitute.sting.gatk.arguments.IntervalMergingRule;
|
2009-06-22 22:39:41 +08:00
|
|
|
import org.broadinstitute.sting.utils.sam.ArtificialSAMUtils;
|
2009-12-24 05:59:14 +08:00
|
|
|
|
2009-06-22 22:39:41 +08:00
|
|
|
import static org.junit.Assert.assertEquals;
|
2010-02-17 04:35:35 +08:00
|
|
|
import static org.junit.Assert.assertTrue;
|
2009-12-24 05:59:14 +08:00
|
|
|
|
2009-09-22 07:32:24 +08:00
|
|
|
import org.junit.BeforeClass;
|
2009-06-22 22:39:41 +08:00
|
|
|
import org.junit.Test;
|
2009-12-24 05:59:14 +08:00
|
|
|
|
|
|
|
|
import java.util.List;
|
2009-06-22 22:39:41 +08:00
|
|
|
|
|
|
|
|
/**
|
|
|
|
|
* @author aaron
|
|
|
|
|
* <p/>
|
|
|
|
|
* Class GenomeLocParserTest
|
|
|
|
|
* <p/>
|
|
|
|
|
* Test out the functionality of the new genome loc parser
|
|
|
|
|
*/
|
|
|
|
|
public class GenomeLocParserTest extends BaseTest {
|
|
|
|
|
@Test(expected = StingException.class)
|
|
|
|
|
public void testUnsetupException() {
|
2009-09-22 07:32:24 +08:00
|
|
|
GenomeLocParser.contigInfo = null;
|
2009-06-22 22:39:41 +08:00
|
|
|
GenomeLocParser.createGenomeLoc(0, 0, 0);
|
|
|
|
|
}
|
|
|
|
|
|
2009-09-22 07:32:24 +08:00
|
|
|
@BeforeClass
|
|
|
|
|
public static void init() {
|
|
|
|
|
SAMFileHeader header = ArtificialSAMUtils.createArtificialSamHeader(1, 1, 10);
|
|
|
|
|
GenomeLocParser.setupRefContigOrdering(header.getSequenceDictionary());
|
|
|
|
|
}
|
|
|
|
|
|
2009-06-22 22:39:41 +08:00
|
|
|
@Test
|
|
|
|
|
public void testKnownContigOrder() {
|
|
|
|
|
SAMFileHeader header = ArtificialSAMUtils.createArtificialSamHeader(1, 1, 10);
|
2009-09-22 07:32:24 +08:00
|
|
|
GenomeLocParser.contigInfo = null;
|
2009-06-22 22:39:41 +08:00
|
|
|
// assert that it's false when the contig ordering is not setup
|
|
|
|
|
assertTrue(!GenomeLocParser.hasKnownContigOrdering());
|
|
|
|
|
GenomeLocParser.setupRefContigOrdering(header.getSequenceDictionary());
|
|
|
|
|
// assert that it's true when it is setup
|
|
|
|
|
assertTrue(GenomeLocParser.hasKnownContigOrdering());
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
@Test(expected = RuntimeException.class)
|
|
|
|
|
public void testGetContigIndex() {
|
2010-02-17 04:35:35 +08:00
|
|
|
assertEquals(-1, GenomeLocParser.getContigIndex("blah",true)); // should not be in the reference
|
2009-06-22 22:39:41 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
@Test
|
|
|
|
|
public void testGetContigIndexValid() {
|
|
|
|
|
SAMFileHeader header = ArtificialSAMUtils.createArtificialSamHeader(1, 1, 10);
|
2010-02-17 04:35:35 +08:00
|
|
|
assertEquals(0, GenomeLocParser.getContigIndex("chr1",true)); // should be in the reference
|
2009-06-22 22:39:41 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
@Test
|
|
|
|
|
public void testGetContigInfoUnknownContig() {
|
|
|
|
|
assertEquals(null, GenomeLocParser.getContigInfo("blah")); // should be in the reference
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
@Test
|
|
|
|
|
public void testGetContigInfoKnownContig() {
|
|
|
|
|
SAMFileHeader header = ArtificialSAMUtils.createArtificialSamHeader(1, 1, 10);
|
|
|
|
|
assertEquals("chr1".compareTo(GenomeLocParser.getContigInfo("chr1").getSequenceName()), 0); // should be in the reference
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
@Test(expected = StingException.class)
|
|
|
|
|
public void testParseBadString() {
|
|
|
|
|
GenomeLocParser.parseGenomeLoc("Bad:0-1");
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
@Test
|
|
|
|
|
public void testParseGoodString() {
|
|
|
|
|
GenomeLoc loc = GenomeLocParser.parseGenomeLoc("chr1:1-100");
|
|
|
|
|
assertEquals(loc.getContigIndex(), 0);
|
|
|
|
|
assertEquals(100, loc.getStop());
|
|
|
|
|
assertEquals(1, loc.getStart());
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
@Test(expected = RuntimeException.class)
|
|
|
|
|
public void testParseBadLocations() {
|
2010-01-15 08:14:35 +08:00
|
|
|
GenomeLocParser.parseGenomeLocs("chr1:1-1;badChr:1-0", IntervalMergingRule.ALL);
|
2009-06-22 22:39:41 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
@Test
|
|
|
|
|
public void testParseGoodLocations() {
|
2010-01-15 08:14:35 +08:00
|
|
|
GenomeLocParser.parseGenomeLocs("chr1:1-1;chr1:5-9", IntervalMergingRule.ALL);
|
2009-06-22 22:39:41 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
@Test(expected = RuntimeException.class)
|
|
|
|
|
public void testParseGoodLocationsTooManySemiColons() {
|
2010-01-15 08:14:35 +08:00
|
|
|
GenomeLocParser.parseGenomeLocs("chr1:1-1;;chr1:5-9;", IntervalMergingRule.ALL);
|
2009-12-24 05:59:14 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
@Test
|
|
|
|
|
public void testOverlappingGoodLocationsWithAbuttingFlag() {
|
2010-01-15 08:14:35 +08:00
|
|
|
List<GenomeLoc> locs = GenomeLocParser.parseGenomeLocs("chr1:1-8;chr1:5-9", IntervalMergingRule.OVERLAPPING_ONLY);
|
2009-12-24 05:59:14 +08:00
|
|
|
assertEquals(1, locs.size());
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
@Test
|
|
|
|
|
public void testAbuttingGoodLocationsWithAbuttingOffFlag() {
|
2010-01-15 08:14:35 +08:00
|
|
|
List<GenomeLoc> locs = GenomeLocParser.parseGenomeLocs("chr1:1-4;chr1:5-9", IntervalMergingRule.OVERLAPPING_ONLY);
|
2009-12-24 05:59:14 +08:00
|
|
|
assertEquals(2, locs.size());
|
|
|
|
|
}
|
|
|
|
|
@Test
|
|
|
|
|
public void testAbuttingGoodLocationsWithNoneFlag() {
|
2010-01-15 08:14:35 +08:00
|
|
|
List<GenomeLoc> locs = GenomeLocParser.parseGenomeLocs("chr1:1-8;chr1:5-9", IntervalMergingRule.NONE);
|
2009-12-24 05:59:14 +08:00
|
|
|
assertEquals(2, locs.size());
|
2009-06-22 22:39:41 +08:00
|
|
|
}
|
|
|
|
|
|
|
|
|
|
@Test
|
|
|
|
|
public void testCreateGenomeLoc1() {
|
|
|
|
|
GenomeLoc loc = GenomeLocParser.createGenomeLoc("chr1", 1, 100);
|
|
|
|
|
assertEquals(loc.getContigIndex(), 0);
|
|
|
|
|
assertEquals(100, loc.getStop());
|
|
|
|
|
assertEquals(1, loc.getStart());
|
|
|
|
|
}
|
|
|
|
|
|
2009-09-22 07:32:24 +08:00
|
|
|
@Test
|
|
|
|
|
public void testCreateGenomeLoc1point5() { // in honor of VAAL!
|
|
|
|
|
GenomeLoc loc = GenomeLocParser.parseGenomeLoc("chr1:1");
|
|
|
|
|
assertEquals(loc.getContigIndex(), 0);
|
|
|
|
|
assertEquals(1, loc.getStop());
|
|
|
|
|
assertEquals(1, loc.getStart());
|
|
|
|
|
}
|
|
|
|
|
|
2009-06-22 22:39:41 +08:00
|
|
|
@Test
|
|
|
|
|
public void testCreateGenomeLoc2() {
|
|
|
|
|
GenomeLoc loc = GenomeLocParser.createGenomeLoc(0, 1, 100);
|
|
|
|
|
assertEquals(loc.getContigIndex(), 0);
|
|
|
|
|
assertEquals(100, loc.getStop());
|
|
|
|
|
assertEquals(1, loc.getStart());
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
@Test
|
|
|
|
|
public void testCreateGenomeLoc3() {
|
|
|
|
|
GenomeLoc loc = GenomeLocParser.createGenomeLoc(0, 1);
|
|
|
|
|
assertEquals(loc.getContigIndex(), 0);
|
|
|
|
|
assertEquals(1, loc.getStop());
|
|
|
|
|
assertEquals(1, loc.getStart());
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
@Test
|
|
|
|
|
public void testCreateGenomeLoc4() {
|
|
|
|
|
GenomeLoc loc = GenomeLocParser.createGenomeLoc("chr1", 1);
|
|
|
|
|
assertEquals(loc.getContigIndex(), 0);
|
|
|
|
|
assertEquals(1, loc.getStop());
|
|
|
|
|
assertEquals(1, loc.getStart());
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
@Test
|
|
|
|
|
public void testCreateGenomeLoc5() {
|
2009-09-22 06:37:47 +08:00
|
|
|
GenomeLoc loc = GenomeLocParser.createGenomeLoc(0, 1, 100);
|
2009-06-22 22:39:41 +08:00
|
|
|
GenomeLoc copy = GenomeLocParser.createGenomeLoc(loc);
|
|
|
|
|
assertEquals(copy.getContigIndex(), 0);
|
|
|
|
|
assertEquals(100, copy.getStop());
|
2009-09-22 06:37:47 +08:00
|
|
|
assertEquals(1, copy.getStart());
|
|
|
|
|
}
|
|
|
|
|
|
2009-09-22 07:32:24 +08:00
|
|
|
/*@Test // - uncomment if you want to test speed
|
2009-09-22 06:37:47 +08:00
|
|
|
public void testGenomeLocParserList() {
|
|
|
|
|
long start = System.currentTimeMillis();
|
|
|
|
|
List<GenomeLoc> parsedIntervals = GenomeAnalysisEngine.parseIntervalRegion(Arrays.asList(new String[]{"/humgen/gsa-scr1/GATK_Data/Validation_Data/bigChr1IntervalList.list"}));
|
|
|
|
|
Collections.sort(parsedIntervals);
|
2009-12-24 05:59:14 +08:00
|
|
|
LinkedList<GenomeLoc> loc = new LinkedList<GenomeLoc>(GenomeLocParser.mergeIntervalLocations(parsedIntervals));
|
2009-09-22 06:37:47 +08:00
|
|
|
long stop = System.currentTimeMillis();
|
|
|
|
|
logger.warn("Elapsed time = " + (stop - start));
|
2009-09-22 07:32:24 +08:00
|
|
|
}*/
|
|
|
|
|
|
|
|
|
|
@Test
|
|
|
|
|
public void testGenomeLocPlusSign() {
|
|
|
|
|
GenomeLoc loc = GenomeLocParser.parseGenomeLoc("chr1:1+");
|
|
|
|
|
assertEquals(0, loc.getContigIndex());
|
|
|
|
|
assertEquals(10, loc.getStop()); // the size
|
|
|
|
|
assertEquals(1, loc.getStart());
|
|
|
|
|
}
|
|
|
|
|
|
2009-12-24 05:59:14 +08:00
|
|
|
@Test
|
2009-09-22 12:34:18 +08:00
|
|
|
public void testGenomeLocParseOnlyChrome() {
|
2009-12-24 05:59:14 +08:00
|
|
|
GenomeLoc loc = GenomeLocParser.parseGenomeLoc("chr1");
|
2009-09-22 12:34:18 +08:00
|
|
|
assertEquals(0, loc.getContigIndex());
|
|
|
|
|
assertEquals(10, loc.getStop()); // the size
|
|
|
|
|
assertEquals(1, loc.getStart());
|
|
|
|
|
}
|
2009-12-24 05:59:14 +08:00
|
|
|
|
|
|
|
|
@Test(expected = StingException.class)
|
2009-09-22 12:34:18 +08:00
|
|
|
public void testGenomeLocParseOnlyBadChrome() {
|
2009-12-24 05:59:14 +08:00
|
|
|
GenomeLoc loc = GenomeLocParser.parseGenomeLoc("chr12");
|
2009-09-22 12:34:18 +08:00
|
|
|
assertEquals(0, loc.getContigIndex());
|
|
|
|
|
assertEquals(10, loc.getStop()); // the size
|
|
|
|
|
assertEquals(1, loc.getStart());
|
|
|
|
|
}
|
2009-12-24 05:59:14 +08:00
|
|
|
|
2009-09-22 12:34:18 +08:00
|
|
|
@Test(expected = StingException.class)
|
2009-09-22 07:32:24 +08:00
|
|
|
public void testGenomeLocBad() {
|
|
|
|
|
GenomeLoc loc = GenomeLocParser.parseGenomeLoc("chr1:1-");
|
|
|
|
|
assertEquals(0, loc.getContigIndex());
|
|
|
|
|
assertEquals(10, loc.getStop()); // the size
|
|
|
|
|
assertEquals(1, loc.getStart());
|
2009-06-22 22:39:41 +08:00
|
|
|
}
|
2009-12-24 05:59:14 +08:00
|
|
|
|
|
|
|
|
@Test(expected = StingException.class)
|
2009-09-22 12:34:18 +08:00
|
|
|
public void testGenomeLocBad2() {
|
|
|
|
|
GenomeLoc loc = GenomeLocParser.parseGenomeLoc("chr1:1-500-0");
|
|
|
|
|
assertEquals(0, loc.getContigIndex());
|
|
|
|
|
assertEquals(10, loc.getStop()); // the size
|
|
|
|
|
assertEquals(1, loc.getStart());
|
|
|
|
|
}
|
2009-12-24 05:59:14 +08:00
|
|
|
|
|
|
|
|
@Test(expected = StingException.class)
|
2009-09-22 12:34:18 +08:00
|
|
|
public void testGenomeLocBad3() {
|
|
|
|
|
GenomeLoc loc = GenomeLocParser.parseGenomeLoc("chr1:1--0");
|
|
|
|
|
assertEquals(0, loc.getContigIndex());
|
|
|
|
|
assertEquals(10, loc.getStop()); // the size
|
|
|
|
|
assertEquals(1, loc.getStart());
|
|
|
|
|
}
|
2010-02-17 04:35:35 +08:00
|
|
|
|
|
|
|
|
// test out the validating methods
|
|
|
|
|
@Test
|
|
|
|
|
public void testValidationOfGenomeLocs() {
|
|
|
|
|
assertTrue(GenomeLocParser.validGenomeLoc("chr1",1,1));
|
|
|
|
|
assertTrue(!GenomeLocParser.validGenomeLoc("chr2",1,1)); // shouldn't have an entry
|
|
|
|
|
assertTrue(!GenomeLocParser.validGenomeLoc("chr1",1,11)); // past the end of the contig
|
|
|
|
|
assertTrue(!GenomeLocParser.validGenomeLoc("chr1",-1,10)); // bad start
|
|
|
|
|
assertTrue(!GenomeLocParser.validGenomeLoc("chr1",1,-2)); // bad stop
|
|
|
|
|
assertTrue(!GenomeLocParser.validGenomeLoc("chr1",10,11)); // bad start, past end
|
|
|
|
|
|
|
|
|
|
assertTrue(GenomeLocParser.validGenomeLoc(0,1,1));
|
|
|
|
|
assertTrue(!GenomeLocParser.validGenomeLoc(1,1,1)); // shouldn't have an entry
|
|
|
|
|
assertTrue(!GenomeLocParser.validGenomeLoc(0,1,11)); // past the end of the contig
|
|
|
|
|
assertTrue(!GenomeLocParser.validGenomeLoc(-1,0,10)); // bad start
|
|
|
|
|
assertTrue(!GenomeLocParser.validGenomeLoc(0,1,-2)); // bad stop
|
|
|
|
|
assertTrue(!GenomeLocParser.validGenomeLoc(0,10,11)); // bad start, past end
|
|
|
|
|
|
|
|
|
|
}
|
2009-06-22 22:39:41 +08:00
|
|
|
}
|