A standalone companion to BamToFastqWalker: does the same thing but without calling in gatk's heavy artillery (does not "require" a reference either). Extracts seqs and quals and places them into fastq; along the way it also reverse complements reads that align to the negative strand (so that fastq contains reads as they come from the machine).
git-svn-id: file:///humgen/gsa-scr1/gsa-engineering/svn_contents/trunk@1419 348d0f76-0448-11de-a6fe-93d51630548a
This commit is contained in:
parent
112a283f54
commit
ebec0ec171
|
|
@ -0,0 +1,81 @@
|
||||||
|
package org.broadinstitute.sting.playground.tools;
|
||||||
|
|
||||||
|
import net.sf.picard.cmdline.CommandLineProgram;
|
||||||
|
import net.sf.picard.cmdline.Usage;
|
||||||
|
import net.sf.picard.cmdline.Option;
|
||||||
|
import net.sf.samtools.SAMFileReader;
|
||||||
|
import net.sf.samtools.SAMRecord;
|
||||||
|
|
||||||
|
import java.io.*;
|
||||||
|
|
||||||
|
import org.broadinstitute.sting.utils.BaseUtils;
|
||||||
|
|
||||||
|
/**
|
||||||
|
* Created by IntelliJ IDEA.
|
||||||
|
* User: asivache
|
||||||
|
* Date: Aug 12, 2009
|
||||||
|
* Time: 3:24:46 PM
|
||||||
|
* To change this template use File | Settings | File Templates.
|
||||||
|
*/
|
||||||
|
public class BamToFastq extends CommandLineProgram {
|
||||||
|
@Usage(programVersion="1.0") public String USAGE = "Extracts read sequences and qualities from the input sam/bam file and wirtes them into "+
|
||||||
|
"the output file in fastq format. In the RC mode (default is True), if the read is aligned and the alignment is to the reverse strand on the genome, "+
|
||||||
|
"the read's sequence from input sam file will be reverse-complemented prior to writing it to fastq in order restore correctly "+
|
||||||
|
"the original read sequence as it was generated by the sequencer.";
|
||||||
|
@Option(shortName="I", doc="Input file (bam or sam) to extract reads from. If not specified, reads from stdin.",
|
||||||
|
optional=true) public File IN = null;
|
||||||
|
@Option(shortName="O",doc="Output file (fastq). If not specified, output is printed to stdout.",
|
||||||
|
optional=true) public File OUT = null;
|
||||||
|
@Option(shortName="RC", doc="re-reverse bases and quals of reads aligned to the negative strand before writing them to fastq", optional=true)
|
||||||
|
public Boolean RE_REVERSE = true;
|
||||||
|
|
||||||
|
public static void main(final String[] argv) {
|
||||||
|
System.exit(new BamToFastq().instanceMain(argv));
|
||||||
|
}
|
||||||
|
|
||||||
|
protected int doWork() {
|
||||||
|
|
||||||
|
|
||||||
|
InputStream ins = null;
|
||||||
|
if ( IN == null ) ins = System.in;
|
||||||
|
else {
|
||||||
|
try {
|
||||||
|
ins = new FileInputStream(IN);
|
||||||
|
} catch ( FileNotFoundException ie ) {
|
||||||
|
System.out.println("Failed to open input file "+IN+": "+ie.getCause());
|
||||||
|
return 1;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
SAMFileReader inReader = new SAMFileReader(ins);
|
||||||
|
PrintStream out = null;
|
||||||
|
if ( OUT == null ) out = System.out;
|
||||||
|
else {
|
||||||
|
try {
|
||||||
|
out = new PrintStream(OUT);
|
||||||
|
} catch ( FileNotFoundException ie ) {
|
||||||
|
System.out.println("Failed to open output file "+OUT+": "+ie.getCause());
|
||||||
|
return 1;
|
||||||
|
}
|
||||||
|
}
|
||||||
|
|
||||||
|
for (SAMRecord read : inReader ) {
|
||||||
|
out.println("@" + read.getReadName());
|
||||||
|
if ( read.getReadUnmappedFlag() || !RE_REVERSE || !read.getReadNegativeStrandFlag() ) {
|
||||||
|
out.println(read.getReadString());
|
||||||
|
out.println('+');
|
||||||
|
out.println(read.getBaseQualityString());
|
||||||
|
} else {
|
||||||
|
out.println(BaseUtils.simpleReverseComplement(read.getReadString()));
|
||||||
|
out.println('+');
|
||||||
|
out.println(BaseUtils.reverse(read.getBaseQualityString()));
|
||||||
|
}
|
||||||
|
}
|
||||||
|
inReader.close();
|
||||||
|
out.close();
|
||||||
|
|
||||||
|
return 0;
|
||||||
|
}
|
||||||
|
|
||||||
|
|
||||||
|
}
|
||||||
Loading…
Reference in New Issue