Added the capability of running count covariates only on a given interval.
git-svn-id: file:///humgen/gsa-scr1/gsa-engineering/svn_contents/trunk@5717 348d0f76-0448-11de-a6fe-93d51630548a
This commit is contained in:
parent
34092fd32f
commit
2384e23274
|
|
@ -9,6 +9,7 @@ import net.sf.samtools.{SAMFileReader,SAMReadGroupRecord}
|
||||||
|
|
||||||
import scala.io.Source._
|
import scala.io.Source._
|
||||||
import collection.JavaConversions._
|
import collection.JavaConversions._
|
||||||
|
import org.broadinstitute.sting.queue.function.scattergather.ScatterFunction
|
||||||
|
|
||||||
|
|
||||||
class dataProcessingV2 extends QScript {
|
class dataProcessingV2 extends QScript {
|
||||||
|
|
@ -192,6 +193,8 @@ class dataProcessingV2 extends QScript {
|
||||||
// keep a record of the number of contigs in the first bam file in the list
|
// keep a record of the number of contigs in the first bam file in the list
|
||||||
nContigs = getNumberOfContigs(perLaneAlignedBamFiles(0))
|
nContigs = getNumberOfContigs(perLaneAlignedBamFiles(0))
|
||||||
|
|
||||||
|
println("nContigs: " + nContigs)
|
||||||
|
|
||||||
// Final output list of processed bam files
|
// Final output list of processed bam files
|
||||||
var cohortList: List[File] = List()
|
var cohortList: List[File] = List()
|
||||||
|
|
||||||
|
|
@ -279,9 +282,9 @@ class dataProcessingV2 extends QScript {
|
||||||
this.rodBind :+= RodBind("dbsnp", "VCF", dbSNP)
|
this.rodBind :+= RodBind("dbsnp", "VCF", dbSNP)
|
||||||
this.rodBind :+= RodBind("indels", "VCF", qscript.indels)
|
this.rodBind :+= RodBind("indels", "VCF", qscript.indels)
|
||||||
this.useOnlyKnownIndels = knownsOnly
|
this.useOnlyKnownIndels = knownsOnly
|
||||||
this.doNotUseSW = useSW
|
this.doNotUseSW = !useSW
|
||||||
this.compress = 0
|
this.compress = 0
|
||||||
this.U = org.broadinstitute.sting.gatk.arguments.ValidationExclusion.TYPE.NO_READ_ORDER_VERIFICATION // todo -- update this with the last consensus between Tim, Matt and Eric. This is ugly!
|
// this.U = org.broadinstitute.sting.gatk.arguments.ValidationExclusion.TYPE.NO_READ_ORDER_VERIFICATION // todo -- update this with the last consensus between Tim, Matt and Eric. This is ugly!
|
||||||
this.scatterCount = nContigs
|
this.scatterCount = nContigs
|
||||||
this.analysisName = queueLogDir + outBam + ".clean"
|
this.analysisName = queueLogDir + outBam + ".clean"
|
||||||
this.jobName = queueLogDir + outBam + ".clean"
|
this.jobName = queueLogDir + outBam + ".clean"
|
||||||
|
|
@ -292,6 +295,8 @@ class dataProcessingV2 extends QScript {
|
||||||
this.covariate ++= List("ReadGroupCovariate", "QualityScoreCovariate", "CycleCovariate", "DinucCovariate")
|
this.covariate ++= List("ReadGroupCovariate", "QualityScoreCovariate", "CycleCovariate", "DinucCovariate")
|
||||||
this.input_file :+= inBam
|
this.input_file :+= inBam
|
||||||
this.recal_file = outRecalFile
|
this.recal_file = outRecalFile
|
||||||
|
if (!qscript.intervalString.isEmpty()) this.intervalsString ++= List(qscript.intervalString)
|
||||||
|
else if (qscript.intervals != null) this.intervals :+= qscript.intervals
|
||||||
this.scatterCount = nContigs
|
this.scatterCount = nContigs
|
||||||
this.analysisName = queueLogDir + outRecalFile + ".covariates"
|
this.analysisName = queueLogDir + outRecalFile + ".covariates"
|
||||||
this.jobName = queueLogDir + outRecalFile + ".covariates"
|
this.jobName = queueLogDir + outRecalFile + ".covariates"
|
||||||
|
|
@ -304,7 +309,7 @@ class dataProcessingV2 extends QScript {
|
||||||
this.out = outBam
|
this.out = outBam
|
||||||
if (!qscript.intervalString.isEmpty()) this.intervalsString ++= List(qscript.intervalString)
|
if (!qscript.intervalString.isEmpty()) this.intervalsString ++= List(qscript.intervalString)
|
||||||
else if (qscript.intervals != null) this.intervals :+= qscript.intervals
|
else if (qscript.intervals != null) this.intervals :+= qscript.intervals
|
||||||
this.U = org.broadinstitute.sting.gatk.arguments.ValidationExclusion.TYPE.NO_READ_ORDER_VERIFICATION // todo -- update this with the last consensus between Tim, Matt and Eric. This is ugly!
|
// this.U = org.broadinstitute.sting.gatk.arguments.ValidationExclusion.TYPE.NO_READ_ORDER_VERIFICATION // todo -- update this with the last consensus between Tim, Matt and Eric. This is ugly!
|
||||||
// this.index_output_bam_on_the_fly = true
|
// this.index_output_bam_on_the_fly = true
|
||||||
this.scatterCount = nContigs
|
this.scatterCount = nContigs
|
||||||
this.isIntermediate = false
|
this.isIntermediate = false
|
||||||
|
|
|
||||||
|
|
@ -35,7 +35,7 @@ class justClean extends QScript {
|
||||||
|
|
||||||
println(GATKjar)
|
println(GATKjar)
|
||||||
|
|
||||||
val outBam = swapExt(input, ".bam", ".Qclean.bam")
|
val outBam = swapExt(input, ".bam", ".clean.bam")
|
||||||
val tIntervals = swapExt(input, ".bam", ".all_indels.intervals")
|
val tIntervals = swapExt(input, ".bam", ".all_indels.intervals")
|
||||||
|
|
||||||
val target = new RealignerTargetCreator()
|
val target = new RealignerTargetCreator()
|
||||||
|
|
@ -60,11 +60,9 @@ class justClean extends QScript {
|
||||||
clean.rodBind :+= RodBind("dbsnp", "VCF", dbSNP)
|
clean.rodBind :+= RodBind("dbsnp", "VCF", dbSNP)
|
||||||
clean.rodBind :+= RodBind("indels", "VCF", indels)
|
clean.rodBind :+= RodBind("indels", "VCF", indels)
|
||||||
clean.doNotUseSW = false
|
clean.doNotUseSW = false
|
||||||
clean.compress = 0
|
|
||||||
// clean.U = org.broadinstitute.sting.gatk.arguments.ValidationExclusion.TYPE.NO_READ_ORDER_VERIFICATION // todo -- update clean with the last consensus between Tim, Matt and Eric. This is ugly!
|
|
||||||
clean.jobName = queueLogDir + outBam + ".clean"
|
clean.jobName = queueLogDir + outBam + ".clean"
|
||||||
clean.jarFile = GATKjar
|
clean.jarFile = GATKjar
|
||||||
clean.memoryLimit = 6
|
clean.memoryLimit = 24
|
||||||
clean.scatterCount = 84
|
clean.scatterCount = 84
|
||||||
|
|
||||||
add(target, clean);
|
add(target, clean);
|
||||||
|
|
|
||||||
Loading…
Reference in New Issue