Added the capability of running count covariates only on a given interval.

git-svn-id: file:///humgen/gsa-scr1/gsa-engineering/svn_contents/trunk@5717 348d0f76-0448-11de-a6fe-93d51630548a
This commit is contained in:
carneiro 2011-04-29 21:30:14 +00:00
parent 34092fd32f
commit 2384e23274
2 changed files with 10 additions and 7 deletions

View File

@ -9,6 +9,7 @@ import net.sf.samtools.{SAMFileReader,SAMReadGroupRecord}
import scala.io.Source._
import collection.JavaConversions._
import org.broadinstitute.sting.queue.function.scattergather.ScatterFunction
class dataProcessingV2 extends QScript {
@ -192,6 +193,8 @@ class dataProcessingV2 extends QScript {
// keep a record of the number of contigs in the first bam file in the list
nContigs = getNumberOfContigs(perLaneAlignedBamFiles(0))
println("nContigs: " + nContigs)
// Final output list of processed bam files
var cohortList: List[File] = List()
@ -279,9 +282,9 @@ class dataProcessingV2 extends QScript {
this.rodBind :+= RodBind("dbsnp", "VCF", dbSNP)
this.rodBind :+= RodBind("indels", "VCF", qscript.indels)
this.useOnlyKnownIndels = knownsOnly
this.doNotUseSW = useSW
this.doNotUseSW = !useSW
this.compress = 0
this.U = org.broadinstitute.sting.gatk.arguments.ValidationExclusion.TYPE.NO_READ_ORDER_VERIFICATION // todo -- update this with the last consensus between Tim, Matt and Eric. This is ugly!
// this.U = org.broadinstitute.sting.gatk.arguments.ValidationExclusion.TYPE.NO_READ_ORDER_VERIFICATION // todo -- update this with the last consensus between Tim, Matt and Eric. This is ugly!
this.scatterCount = nContigs
this.analysisName = queueLogDir + outBam + ".clean"
this.jobName = queueLogDir + outBam + ".clean"
@ -292,6 +295,8 @@ class dataProcessingV2 extends QScript {
this.covariate ++= List("ReadGroupCovariate", "QualityScoreCovariate", "CycleCovariate", "DinucCovariate")
this.input_file :+= inBam
this.recal_file = outRecalFile
if (!qscript.intervalString.isEmpty()) this.intervalsString ++= List(qscript.intervalString)
else if (qscript.intervals != null) this.intervals :+= qscript.intervals
this.scatterCount = nContigs
this.analysisName = queueLogDir + outRecalFile + ".covariates"
this.jobName = queueLogDir + outRecalFile + ".covariates"
@ -304,7 +309,7 @@ class dataProcessingV2 extends QScript {
this.out = outBam
if (!qscript.intervalString.isEmpty()) this.intervalsString ++= List(qscript.intervalString)
else if (qscript.intervals != null) this.intervals :+= qscript.intervals
this.U = org.broadinstitute.sting.gatk.arguments.ValidationExclusion.TYPE.NO_READ_ORDER_VERIFICATION // todo -- update this with the last consensus between Tim, Matt and Eric. This is ugly!
// this.U = org.broadinstitute.sting.gatk.arguments.ValidationExclusion.TYPE.NO_READ_ORDER_VERIFICATION // todo -- update this with the last consensus between Tim, Matt and Eric. This is ugly!
// this.index_output_bam_on_the_fly = true
this.scatterCount = nContigs
this.isIntermediate = false

View File

@ -35,7 +35,7 @@ class justClean extends QScript {
println(GATKjar)
val outBam = swapExt(input, ".bam", ".Qclean.bam")
val outBam = swapExt(input, ".bam", ".clean.bam")
val tIntervals = swapExt(input, ".bam", ".all_indels.intervals")
val target = new RealignerTargetCreator()
@ -60,11 +60,9 @@ class justClean extends QScript {
clean.rodBind :+= RodBind("dbsnp", "VCF", dbSNP)
clean.rodBind :+= RodBind("indels", "VCF", indels)
clean.doNotUseSW = false
clean.compress = 0
// clean.U = org.broadinstitute.sting.gatk.arguments.ValidationExclusion.TYPE.NO_READ_ORDER_VERIFICATION // todo -- update clean with the last consensus between Tim, Matt and Eric. This is ugly!
clean.jobName = queueLogDir + outBam + ".clean"
clean.jarFile = GATKjar
clean.memoryLimit = 6
clean.memoryLimit = 24
clean.scatterCount = 84
add(target, clean);