diff --git a/biopet-framework/src/main/scala/nl/lumc/sasc/biopet/tools/ExtractAlignedFastq.scala b/biopet-framework/src/main/scala/nl/lumc/sasc/biopet/tools/ExtractAlignedFastq.scala index 7f7fe2239ba176f7b1ed9104c5f9e7a507f44760..8ceb27793639a8d687eca799aa84deb3913b62ad 100644 --- a/biopet-framework/src/main/scala/nl/lumc/sasc/biopet/tools/ExtractAlignedFastq.scala +++ b/biopet-framework/src/main/scala/nl/lumc/sasc/biopet/tools/ExtractAlignedFastq.scala @@ -21,6 +21,9 @@ object ExtractAlignedFastq extends ToolCommand { type FastqInput = (FastqRecord, Option[FastqRecord]) + /** function to get FastqRecord ID */ + def fastqId(rec: FastqRecord) = rec.getReadHeader.split(" ")(0) + /** * Function to create iterator over Interval given input interval string * @@ -113,11 +116,12 @@ object ExtractAlignedFastq extends ToolCommand { ) (pair: FastqInput) => pair._2 match { - case None => selected.contains(pair._1.getReadHeader) + case None => selected.contains(fastqId(pair._1)) case Some(x) => - require(commonSuffixLength < pair._1.getReadHeader.length) - require(commonSuffixLength < x.getReadHeader.length) - selected.contains(pair._1.getReadHeader.dropRight(commonSuffixLength)) + val rec1Id = fastqId(pair._1) + require(commonSuffixLength < rec1Id.length) + require(commonSuffixLength < fastqId(x).length) + selected.contains(rec1Id.dropRight(commonSuffixLength)) } } @@ -224,6 +228,7 @@ object ExtractAlignedFastq extends ToolCommand { minMapQ = commandArgs.minMapQ, commonSuffixLength = commandArgs.commonSuffixLength) + logger.info("Writing to output file(s) ...") (commandArgs.inputFastq2, commandArgs.outputFastq2) match { case (None, None) => extractReads(memFunc, diff --git a/biopet-framework/src/test/resources/paired01a.fq b/biopet-framework/src/test/resources/paired01a.fq index 530a1bb9bada4865a047a8c8fe73dd5700d0b84d..d1fcedf3780772a936e94a929595f13d4dcc9e65 100644 --- a/biopet-framework/src/test/resources/paired01a.fq +++ b/biopet-framework/src/test/resources/paired01a.fq @@ -1,4 +1,4 @@ -@r01/1 +@r01/1 hello A + H diff --git a/biopet-framework/src/test/resources/paired01b.fq b/biopet-framework/src/test/resources/paired01b.fq index 72cf9246dcce5c29a2500ced269dc3c17fd18847..b93021532b61081eb371c6f784dd2f6f53eb29f3 100644 --- a/biopet-framework/src/test/resources/paired01b.fq +++ b/biopet-framework/src/test/resources/paired01b.fq @@ -1,4 +1,4 @@ -@r01/2 +@r01/2 hello T + I diff --git a/biopet-framework/src/test/scala/nl/lumc/sasc/biopet/tools/ExtractAlignedFastqUnitTest.scala b/biopet-framework/src/test/scala/nl/lumc/sasc/biopet/tools/ExtractAlignedFastqUnitTest.scala index 4cd7205c0ac6e22c4f93c384600c9f570bc88c06..e60af846646321501a5902a2eb4d81ddf3392a6d 100644 --- a/biopet-framework/src/test/scala/nl/lumc/sasc/biopet/tools/ExtractAlignedFastqUnitTest.scala +++ b/biopet-framework/src/test/scala/nl/lumc/sasc/biopet/tools/ExtractAlignedFastqUnitTest.scala @@ -189,7 +189,7 @@ class ExtractAlignedFastqUnitTest extends TestNGSuite with MockitoSugar with Mat } @Test def testWriteSingleFastqDefault() = { - val memFunc = (recs: FastqInput) => Set("r01", "r03").contains(recs._1.getReadHeader) + val memFunc = (recs: FastqInput) => Set("r01", "r03").contains(fastqId(recs._1)) val in1 = new FastqReader(resourceFile("/single01.fq")) val mo1 = mock[BasicFastqWriter] val obs = inOrd(mo1) @@ -201,15 +201,15 @@ class ExtractAlignedFastqUnitTest extends TestNGSuite with MockitoSugar with Mat @Test def testWritePairFastqDefault() = { val mockSet = Set("r01/1", "r01/2", "r03/1", "r03/2") - val memFunc = (recs: FastqInput) => mockSet.contains(recs._1.getReadHeader) || mockSet.contains(recs._2.get.getReadHeader) + val memFunc = (recs: FastqInput) => mockSet.contains(fastqId(recs._1)) || mockSet.contains(fastqId(recs._2.get)) val in1 = new FastqReader(resourceFile("/paired01a.fq")) val in2 = new FastqReader(resourceFile("/paired01b.fq")) val mo1 = mock[BasicFastqWriter] val mo2 = mock[BasicFastqWriter] val obs = inOrd(mo1, mo2) extractReads(memFunc, in1, mo1, in2, mo2) - obs.verify(mo1).write(new FastqRecord("r01/1", "A", "", "H")) - obs.verify(mo2).write(new FastqRecord("r01/2", "T", "", "I")) + obs.verify(mo1).write(new FastqRecord("r01/1 hello", "A", "", "H")) + obs.verify(mo2).write(new FastqRecord("r01/2 hello", "T", "", "I")) obs.verify(mo1).write(new FastqRecord("r03/1", "G", "", "H")) obs.verify(mo2).write(new FastqRecord("r03/2", "C", "", "I")) verify(mo1, times(2)).write(anyObject.asInstanceOf[FastqRecord])