While generating YAML now warning and skipping TSV rows that don't have all values.
Fixed log message typo in PipelineTest. git-svn-id: file:///humgen/gsa-scr1/gsa-engineering/svn_contents/trunk@5320 348d0f76-0448-11de-a6fe-93d51630548a
This commit is contained in:
parent
81414a21dd
commit
15ce375787
|
|
@ -257,7 +257,7 @@ object PipelineTest extends BaseTest with Logging {
|
||||||
Assert.fail("Test %s expected exception %s but none was thrown".format(name, expectedException.toString))
|
Assert.fail("Test %s expected exception %s but none was thrown".format(name, expectedException.toString))
|
||||||
} else {
|
} else {
|
||||||
if (CommandLineProgram.result != 0)
|
if (CommandLineProgram.result != 0)
|
||||||
throw new RuntimeException("Error running the GATK with arguments: " + args)
|
throw new RuntimeException("Error running Queue with arguments: " + args)
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
|
||||||
|
|
@ -82,32 +82,32 @@ awk '
|
||||||
bamFile = columnFields[key]
|
bamFile = columnFields[key]
|
||||||
|
|
||||||
if (referenceFile == "") {
|
if (referenceFile == "") {
|
||||||
print "Column header reference_file missing from " tsvFile > "/dev/stderr"
|
print "ERROR: Column header reference_file missing from " tsvFile > "/dev/stderr"
|
||||||
exitWithError = 1
|
exitWithError = 1
|
||||||
}
|
}
|
||||||
|
|
||||||
if (intervalList == "") {
|
if (intervalList == "") {
|
||||||
print "Column header interval_list missing from " tsvFile > "/dev/stderr"
|
print "ERROR: Column header interval_list missing from " tsvFile > "/dev/stderr"
|
||||||
exitWithError = 1
|
exitWithError = 1
|
||||||
}
|
}
|
||||||
|
|
||||||
if (sampleId == "") {
|
if (sampleId == "") {
|
||||||
print "Column header sample_id missing from " tsvFile > "/dev/stderr"
|
print "ERROR: Column header sample_id missing from " tsvFile > "/dev/stderr"
|
||||||
exitWithError = 1
|
exitWithError = 1
|
||||||
}
|
}
|
||||||
|
|
||||||
if (squidProject == "") {
|
if (squidProject == "") {
|
||||||
print "Column header squid_project missing from " tsvFile > "/dev/stderr"
|
print "ERROR: Column header squid_project missing from " tsvFile > "/dev/stderr"
|
||||||
exitWithError = 1
|
exitWithError = 1
|
||||||
}
|
}
|
||||||
|
|
||||||
if (collaboratorId == "") {
|
if (collaboratorId == "") {
|
||||||
print "Column header collaborator_id missing from " tsvFile > "/dev/stderr"
|
print "ERROR: Column header collaborator_id missing from " tsvFile > "/dev/stderr"
|
||||||
exitWithError = 1
|
exitWithError = 1
|
||||||
}
|
}
|
||||||
|
|
||||||
if (bamFile == "") {
|
if (bamFile == "") {
|
||||||
print "Column header *bam_file* missing from " tsvFile > "/dev/stderr"
|
print "ERROR: Column header *bam_file* missing from " tsvFile > "/dev/stderr"
|
||||||
exitWithError = 1
|
exitWithError = 1
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
@ -115,7 +115,6 @@ awk '
|
||||||
exit 1
|
exit 1
|
||||||
}
|
}
|
||||||
|
|
||||||
|
|
||||||
refseqDir = "/humgen/gsa-hpprojects/GATK/data/Annotations/refseq/"
|
refseqDir = "/humgen/gsa-hpprojects/GATK/data/Annotations/refseq/"
|
||||||
dbsnpDir = "/humgen/gsa-hpprojects/GATK/data/"
|
dbsnpDir = "/humgen/gsa-hpprojects/GATK/data/"
|
||||||
|
|
||||||
|
|
@ -131,22 +130,34 @@ awk '
|
||||||
|
|
||||||
printf "{"
|
printf "{"
|
||||||
} else {
|
} else {
|
||||||
if (NR == 2) {
|
missingValue = 0
|
||||||
# Based on the reference of the first sample, specify the dbsnps and refseq tables.
|
if ($referenceFile == "") missingValue = 1
|
||||||
|
if ($intervalList == "") missingValue = 1
|
||||||
|
if ($sampleId == "") missingValue = 1
|
||||||
|
if ($squidProject == "") missingValue = 1
|
||||||
|
if ($collaboratorId == "") missingValue = 1
|
||||||
|
if ($bamFile == "") missingValue = 1
|
||||||
|
|
||||||
referencePartCount = split($referenceFile, referenceParts, "/")
|
if (missingValue) {
|
||||||
referenceName = referenceParts[referencePartCount]
|
print "WARNING: Skipping row which does not have all values: " $0 > "/dev/stderr"
|
||||||
|
|
||||||
genotypeDbsnp = genotypeDbsnps[referenceName]
|
|
||||||
evalDbsnp = evalDbsnps[referenceName]
|
|
||||||
refseq = refseqs[referenceName]
|
|
||||||
|
|
||||||
printf '"$PROJECT_YAML_TEMPLATE"'
|
|
||||||
printf "\n samples: ["
|
|
||||||
} else {
|
} else {
|
||||||
printf ","
|
if (NR == 2) {
|
||||||
|
# Based on the reference of the first sample, specify the dbsnps and refseq tables.
|
||||||
|
|
||||||
|
referencePartCount = split($referenceFile, referenceParts, "/")
|
||||||
|
referenceName = referenceParts[referencePartCount]
|
||||||
|
|
||||||
|
genotypeDbsnp = genotypeDbsnps[referenceName]
|
||||||
|
evalDbsnp = evalDbsnps[referenceName]
|
||||||
|
refseq = refseqs[referenceName]
|
||||||
|
|
||||||
|
printf '"$PROJECT_YAML_TEMPLATE"'
|
||||||
|
printf "\n samples: ["
|
||||||
|
} else {
|
||||||
|
printf ","
|
||||||
|
}
|
||||||
|
printf '"$SAMPLE_YAML_TEMPLATE"'
|
||||||
}
|
}
|
||||||
printf '"$SAMPLE_YAML_TEMPLATE"'
|
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
END {
|
END {
|
||||||
|
|
|
||||||
Loading…
Reference in New Issue