diff --git a/external-example/.gitignore b/external-example/.gitignore new file mode 100644 index 0000000000000000000000000000000000000000..77146859b6e12b32e90cc6f6d388ebc878d548d6 --- /dev/null +++ b/external-example/.gitignore @@ -0,0 +1,14 @@ +# Project-related +dependency-reduced-pom.xml +git.properties + +# gedit +*~ +# Vim +*.swp +# IntelliJ +.idea/* +*.iml +target/ +public/target/ +protected/target/ diff --git a/external-example/README.md b/external-example/README.md new file mode 100644 index 0000000000000000000000000000000000000000..956c6ccf2746212b45f3650ef917147bdd9ed800 --- /dev/null +++ b/external-example/README.md @@ -0,0 +1 @@ +Test implementation of Magpie 2.0 \ No newline at end of file diff --git a/external-example/pom.xml b/external-example/pom.xml new file mode 100644 index 0000000000000000000000000000000000000000..da0d2258fc90fe3cc9a49b76504be5388c683fa1 --- /dev/null +++ b/external-example/pom.xml @@ -0,0 +1,294 @@ +<?xml version="1.0" encoding="UTF-8"?> +<project xmlns="http://maven.apache.org/POM/4.0.0" + xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" + xsi:schemaLocation="http://maven.apache.org/POM/4.0.0 http://maven.apache.org/xsd/maven-4.0.0.xsd"> + <modelVersion>4.0.0</modelVersion> + + <!--TODO: replace groupId --> + <groupId>org.example.group</groupId> + + <!--TODO: replace artifactId --> + <artifactId>ExternalExample</artifactId> + + <!--TODO: replace version, for a new pipeline it's advised to start with '0.1.0-SNAPSHOT' --> + <version>0.1.0-SNAPSHOT</version> + + <properties> + <project.build.sourceEncoding>UTF-8</project.build.sourceEncoding> + <scoverage.plugin.version>1.0.4</scoverage.plugin.version> + <sting.shade.phase>package</sting.shade.phase> + + <!-- + TODO: replace app.main.class, this is the class that get executed when running the jar file + This can be any executable that have a main method. In Biopet any pipeline can be used as direct executable. + Value for direct pipeline: 'org.example.group.pipelines.SimplePipeline' + In the given example is an extension of the biopet executable. In this example there are multiple pipelines in 1 executable. + + It's also possible to make your own main function and call the main function with it's argument of the pipeline from there. + --> + <app.main.class>org.example.group.ExecutableExample</app.main.class> + </properties> + + <dependencies> + <!-- + In here maven dependencies can be placed, when importing a biopet pipeline 'Biopet-Framework' is not required. + When only using the framework without pipeline you need to import BiopetFramework. + It's advised to not use different versions of the pipeline and the framework. + --> + <dependency> + <groupId>nl.lumc.sasc</groupId> + <artifactId>BiopetCore</artifactId> + + <!--TODO: replace version of pipeline to a fixed version --> + <version>0.5.0-SNAPSHOT</version> + </dependency> + <dependency> + <groupId>nl.lumc.sasc</groupId> + <artifactId>BiopetExtensions</artifactId> + <version>0.5.0-SNAPSHOT</version> + </dependency> + <dependency> + <groupId>nl.lumc.sasc</groupId> + <artifactId>Shiva</artifactId> + + <!--TODO: replace version of pipeline to a fixed version --> + <version>0.5.0-SNAPSHOT</version> + </dependency> + </dependencies> + + <build> + <sourceDirectory>${basedir}/src/main/scala</sourceDirectory> + <testSourceDirectory>${basedir}/src/test/scala</testSourceDirectory> + <testResources> + <testResource> + <directory>${basedir}/src/test/resources</directory> + <includes> + <include>**/*</include> + </includes> + </testResource> + </testResources> + <resources> + <resource> + <directory>${basedir}/src/main/resources</directory> + <includes> + <include>**/*</include> + </includes> + </resource> + </resources> + <plugins> + <plugin> + <groupId>org.apache.maven.plugins</groupId> + <artifactId>maven-shade-plugin</artifactId> + <version>2.4.1</version> + <configuration> + <!--suppress MavenModelInspection --> + <finalName>${project.artifactId}-${project.version}-${git.commit.id.abbrev}</finalName> + <transformers> + <transformer implementation="org.apache.maven.plugins.shade.resource.ManifestResourceTransformer"> + <manifestEntries> + <Main-Class>${app.main.class}</Main-Class> + <!--suppress MavenModelInspection --> + <X-Compile-Source-JDK>${maven.compile.source}</X-Compile-Source-JDK> + <!--suppress MavenModelInspection --> + <X-Compile-Target-JDK>${maven.compile.target}</X-Compile-Target-JDK> + </manifestEntries> + </transformer> + </transformers> + <filters> + </filters> + </configuration> + <executions> + <execution> + <phase>package</phase> + <goals> + <goal>shade</goal> + </goals> + </execution> + </executions> + </plugin> + <plugin> + <groupId>org.apache.maven.plugins</groupId> + <artifactId>maven-surefire-plugin</artifactId> + <version>2.18.1</version> + <configuration> + <forkCount>1C</forkCount> + <workingDirectory>${project.build.directory}</workingDirectory> + </configuration> + </plugin> + <plugin> + <artifactId>maven-dependency-plugin</artifactId> + <version>2.10</version> + <executions> + <execution> + <id>copy-installed</id> + <phase>prepare-package</phase> + <goals> + <goal>list</goal> + </goals> + <configuration> + <outputFile>${project.build.outputDirectory}/dependency_list.txt</outputFile> + </configuration> + </execution> + </executions> + </plugin> + <plugin> + <groupId>net.alchim31.maven</groupId> + <artifactId>scala-maven-plugin</artifactId> + <version>3.2.0</version> + <executions> + <execution> + <id>scala-compile</id> + <goals> + <goal>compile</goal> + <goal>testCompile</goal> + </goals> + <configuration> + <args> + <arg>-dependencyfile</arg> + <arg>${project.build.directory}/.scala_dependencies</arg> + <arg>-deprecation</arg> + <arg>-feature</arg> + </args> + </configuration> + </execution> + </executions> + <!-- ... (see other usage or goals for details) ... --> + </plugin> + <plugin> + <groupId>org.apache.maven.plugins</groupId> + <artifactId>maven-jar-plugin</artifactId> + <version>2.5</version> + <executions> + <execution> + <goals> + <goal>test-jar</goal> + </goals> + </execution> + </executions> + <configuration> + <archive> + <manifest> + <addDefaultImplementationEntries>true</addDefaultImplementationEntries> + <addDefaultSpecificationEntries>true</addDefaultSpecificationEntries> + </manifest> + </archive> + </configuration> + </plugin> + <plugin> + <groupId>org.apache.maven.plugins</groupId> + <artifactId>maven-compiler-plugin</artifactId> + <version>2.3.2</version> + <configuration> + <showDeprecation>true</showDeprecation> + </configuration> + </plugin> + <plugin> + <groupId>org.scalariform</groupId> + <artifactId>scalariform-maven-plugin</artifactId> + <version>0.1.4</version> + <executions> + <execution> + <phase>process-sources</phase> + <goals> + <goal>format</goal> + </goals> + <configuration> + <rewriteArrowSymbols>false</rewriteArrowSymbols> + <alignParameters>true</alignParameters> + <alignSingleLineCaseStatements_maxArrowIndent>40 + </alignSingleLineCaseStatements_maxArrowIndent> + <alignSingleLineCaseStatements>true</alignSingleLineCaseStatements> + <compactStringConcatenation>false</compactStringConcatenation> + <compactControlReadability>false</compactControlReadability> + <doubleIndentClassDeclaration>false</doubleIndentClassDeclaration> + <formatXml>true</formatXml> + <indentLocalDefs>false</indentLocalDefs> + <indentPackageBlocks>true</indentPackageBlocks> + <indentSpaces>2</indentSpaces> + <placeScaladocAsterisksBeneathSecondAsterisk>false + </placeScaladocAsterisksBeneathSecondAsterisk> + <preserveDanglingCloseParenthesis>true</preserveDanglingCloseParenthesis> + <preserveSpaceBeforeArguments>false</preserveSpaceBeforeArguments> + <rewriteArrowSymbols>false</rewriteArrowSymbols> + <spaceBeforeColon>false</spaceBeforeColon> + <spaceInsideBrackets>false</spaceInsideBrackets> + <spaceInsideParentheses>false</spaceInsideParentheses> + <spacesWithinPatternBinders>true</spacesWithinPatternBinders> + </configuration> + </execution> + </executions> + </plugin> + <plugin> + <groupId>pl.project13.maven</groupId> + <artifactId>git-commit-id-plugin</artifactId> + <version>2.1.10</version> + <executions> + <execution> + <goals> + <goal>revision</goal> + </goals> + </execution> + </executions> + <configuration> + <prefix>git</prefix> + <dateFormat>dd.MM.yyyy '@' HH:mm:ss z</dateFormat> + <verbose>false</verbose> + <!-- TODO: This directory need to be changed depening where your .git folder is relative from this pom.xml --> + <dotGitDirectory>${basedir}/../.git</dotGitDirectory> + <useNativeGit>true</useNativeGit> + <skipPoms>false</skipPoms> + <generateGitPropertiesFile>true</generateGitPropertiesFile> + <generateGitPropertiesFilename>src/main/resources/git.properties</generateGitPropertiesFilename> + <failOnNoGitDirectory>false</failOnNoGitDirectory> + <abbrevLength>8</abbrevLength> + <skip>false</skip> + <gitDescribe> + <skip>false</skip> + <always>false</always> + <abbrev>8</abbrev> + <dirty>-dirty</dirty> + <forceLongFormat>false</forceLongFormat> + </gitDescribe> + </configuration> + </plugin> + <plugin> + <groupId>com.mycila</groupId> + <artifactId>license-maven-plugin</artifactId> + <version>2.6</version> + <configuration> + <excludes> + <exclude>**/*git*</exclude> + <exclude>**/License*</exclude> + <exclude>**/*.bam</exclude> + <exclude>**/*.bai</exclude> + <exclude>**/*.gtf</exclude> + <exclude>**/*.fq</exclude> + <exclude>**/*.sam</exclude> + <exclude>**/*.bed</exclude> + <exclude>**/*.refFlat</exclude> + <exclude>**/*.R</exclude> + <exclude>**/*.rscript</exclude> + </excludes> + </configuration> + </plugin> + <plugin> + <groupId>org.scoverage</groupId> + <artifactId>scoverage-maven-plugin</artifactId> + <version>${scoverage.plugin.version}</version> + <configuration> + <scalaVersion>2.10.2</scalaVersion> + <!-- other parameters --> + </configuration> + </plugin> + </plugins> + </build> + <reporting> + <plugins> + <plugin> + <groupId>org.scoverage</groupId> + <artifactId>scoverage-maven-plugin</artifactId> + <version>${scoverage.plugin.version}</version> + </plugin> + </plugins> + </reporting> +</project> \ No newline at end of file diff --git a/external-example/src/main/scala/org/example/group/ExecutableExample.scala b/external-example/src/main/scala/org/example/group/ExecutableExample.scala new file mode 100644 index 0000000000000000000000000000000000000000..fe0aaa13d57d5380f8eb14bf984145992ce297e8 --- /dev/null +++ b/external-example/src/main/scala/org/example/group/ExecutableExample.scala @@ -0,0 +1,19 @@ +package org.example.group + +import nl.lumc.sasc.biopet.utils.{ BiopetExecutable, MainCommand } + +/** + * Created by pjvanthof on 30/08/15. + */ +object ExecutableExample extends BiopetExecutable { + + /** This list defines the pipeline that are usable from the executable */ + def pipelines: List[MainCommand] = List( + org.example.group.pipelines.MultisamplePipeline, + org.example.group.pipelines.BiopetPipeline, + org.example.group.pipelines.SimplePipeline + ) + + /** This list defines the (biopet)tools that are usable from the executable */ + def tools: List[MainCommand] = Nil +} diff --git a/external-example/src/main/scala/org/example/group/pipelines/BiopetPipeline.scala b/external-example/src/main/scala/org/example/group/pipelines/BiopetPipeline.scala new file mode 100644 index 0000000000000000000000000000000000000000..6099047a6e5153c15df565d3e70179006ef4ceac --- /dev/null +++ b/external-example/src/main/scala/org/example/group/pipelines/BiopetPipeline.scala @@ -0,0 +1,47 @@ +package org.example.group.pipelines + +import nl.lumc.sasc.biopet.core.PipelineCommand +import nl.lumc.sasc.biopet.utils.config.Configurable +import nl.lumc.sasc.biopet.core.summary.SummaryQScript +import nl.lumc.sasc.biopet.pipelines.shiva.Shiva +import nl.lumc.sasc.biopet.utils.config.Configurable +import org.broadinstitute.gatk.queue.QScript + +/** + * Created by pjvan_thof on 8/28/15. + */ +//TODO: Replace class Name +class BiopetPipeline(val root: Configurable) extends QScript with SummaryQScript { + def this() = this(null) + + /** Only required when using [[SummaryQScript]] */ + def summaryFile = new File(outputDir, "magpie.summary.json") + + /** Only required when using [[SummaryQScript]] */ + def summaryFiles: Map[String, File] = Map() + + /** Only required when using [[SummaryQScript]] */ + def summarySettings = Map() + + // This method can be used to initialize some classes where needed + def init(): Unit = { + } + + // This method is the actual pipeline + def biopetScript: Unit = { + + // Executing a biopet pipeline inside + val shiva = new Shiva(this) + shiva.init() + shiva.biopetScript() + addAll(shiva.functions) + + /* Only required when using [[SummaryQScript]] */ + addSummaryQScript(shiva) + + // From here you can use the output files of shiva as input file of other jobs + } +} + +//TODO: Replace object Name, must be the same as the class of the pipeline +object BiopetPipeline extends PipelineCommand diff --git a/external-example/src/main/scala/org/example/group/pipelines/MultisamplePipeline.scala b/external-example/src/main/scala/org/example/group/pipelines/MultisamplePipeline.scala new file mode 100644 index 0000000000000000000000000000000000000000..ee66d89663c22868958720615a83c5d72f85e8f7 --- /dev/null +++ b/external-example/src/main/scala/org/example/group/pipelines/MultisamplePipeline.scala @@ -0,0 +1,64 @@ +package org.example.group.pipelines + +import nl.lumc.sasc.biopet.core.{ PipelineCommand, MultiSampleQScript } +import nl.lumc.sasc.biopet.utils.config.Configurable +import nl.lumc.sasc.biopet.utils.config.Configurable +import org.broadinstitute.gatk.queue.QScript + +/** + * Created by pjvanthof on 30/08/15. + */ +class MultisamplePipeline(val root: Configurable) extends QScript with MultiSampleQScript { + qscript => + def this() = this(null) + + def init: Unit = { + } + + def biopetScript: Unit = { + addSamplesJobs() // This executes jobs for all samples + } + + def addMultiSampleJobs: Unit = { + // this code will be executed after all code of all samples is executed + } + + def summaryFile: File = new File(outputDir, "MultisamplePipeline.summary.json") + + //TODO: Add summary + def summaryFiles: Map[String, File] = Map() + + //TODO: Add summary + def summarySettings: Map[String, Any] = Map() + + def makeSample(id: String) = new Sample(id) + class Sample(sampleId: String) extends AbstractSample(sampleId) { + + def makeLibrary(id: String) = new Library(id) + class Library(libId: String) extends AbstractLibrary(libId) { + //TODO: Add summary + def summaryFiles: Map[String, File] = Map() + + //TODO: Add summary + def summaryStats: Map[String, Any] = Map() + + def addJobs: Unit = { + //TODO: add library specific jobs + } + } + + //TODO: Add summary + def summaryFiles: Map[String, File] = Map() + + //TODO: Add summary + def summaryStats: Map[String, Any] = Map() + + def addJobs: Unit = { + addPerLibJobs() // This add jobs for each library + //TODO: add sample specific jobs + } + } + +} + +object MultisamplePipeline extends PipelineCommand \ No newline at end of file diff --git a/external-example/src/main/scala/org/example/group/pipelines/SimplePipeline.scala b/external-example/src/main/scala/org/example/group/pipelines/SimplePipeline.scala new file mode 100644 index 0000000000000000000000000000000000000000..f24b0f6152a03979d74c2f7337760cdc06c9e3be --- /dev/null +++ b/external-example/src/main/scala/org/example/group/pipelines/SimplePipeline.scala @@ -0,0 +1,38 @@ +package org.example.group.pipelines + +import nl.lumc.sasc.biopet.core.{ BiopetQScript, PipelineCommand } +import nl.lumc.sasc.biopet.utils.config.Configurable +import nl.lumc.sasc.biopet.extensions.{ Gzip, Cat } +import org.broadinstitute.gatk.queue.QScript + +/** + * Created by pjvanthof on 30/08/15. + */ +//TODO: Replace class name, must be the same as the class of the pipeline +class SimplePipeline(val root: Configurable) extends QScript with BiopetQScript { + // A constructor without arguments is needed if this pipeline is a root pipeline + def this() = this(null) + + @Input(required = true) + var inputFile: File = null + + /** This method can be used to initialize some classes where needed */ + def init(): Unit = { + } + + /** This method is the actual pipeline */ + def biopetScript: Unit = { + val cat = new Cat(this) + cat.input :+= inputFile + cat.output = new File(outputDir, "file.out") + add(cat) + + val gzip = new Gzip(this) + gzip.input :+= cat.output + gzip.output = new File(outputDir, "file.out.gz") + add(gzip) + } +} + +//TODO: Replace object name, must be the same as the class of the pipeline +object SimplePipeline extends PipelineCommand diff --git a/pom.xml b/pom.xml index 9390bf9a13c0362d75f158b08d2e99d3ad8d181f..143a9095a763bbdcc323dc6e4299e534e5f0bc33 100644 --- a/pom.xml +++ b/pom.xml @@ -16,5 +16,6 @@ <modules> <module>public</module> <module>protected</module> + <module>external-example</module> </modules> </project> diff --git a/protected/biopet-gatk-extensions/src/main/scala/nl/lumc/sasc/biopet/extensions/gatk/broad/GatkGeneral.scala b/protected/biopet-gatk-extensions/src/main/scala/nl/lumc/sasc/biopet/extensions/gatk/broad/GatkGeneral.scala index 1d8de140b277d349095ae459f700ed5437888b16..91dd00ed5ed7f4d331d04207b283c5e40bf30bbd 100644 --- a/protected/biopet-gatk-extensions/src/main/scala/nl/lumc/sasc/biopet/extensions/gatk/broad/GatkGeneral.scala +++ b/protected/biopet-gatk-extensions/src/main/scala/nl/lumc/sasc/biopet/extensions/gatk/broad/GatkGeneral.scala @@ -5,7 +5,8 @@ */ package nl.lumc.sasc.biopet.extensions.gatk.broad -import nl.lumc.sasc.biopet.core.{ BiopetJavaCommandLineFunction, Reference } +import nl.lumc.sasc.biopet.core.{ Reference, BiopetJavaCommandLineFunction } +import org.broadinstitute.gatk.engine.phonehome.GATKRunReport import org.broadinstitute.gatk.queue.extensions.gatk.CommandLineGATK trait GatkGeneral extends CommandLineGATK with BiopetJavaCommandLineFunction with Reference { @@ -20,6 +21,15 @@ trait GatkGeneral extends CommandLineGATK with BiopetJavaCommandLineFunction wit if (config.contains("intervals")) intervals = config("intervals").asFileList if (config.contains("exclude_intervals")) excludeIntervals = config("exclude_intervals").asFileList + + Option(config("et").value) match { + case Some("NO_ET") => et = GATKRunReport.PhoneHomeOption.NO_ET + case Some("AWS") => et = GATKRunReport.PhoneHomeOption.AWS + case Some("STDOUT") => et = GATKRunReport.PhoneHomeOption.STDOUT + case Some(x) => throw new IllegalArgumentException(s"Unknown et option for gatk: $x") + case _ => + } + if (config.contains("gatk_key")) gatk_key = config("gatk_key") if (config.contains("pedigree")) pedigree = config("pedigree") diff --git a/protected/biopet-gatk-pipelines/src/test/scala/nl/lumc/sasc/biopet/pipelines/gatk/ShivaTest.scala b/protected/biopet-gatk-pipelines/src/test/scala/nl/lumc/sasc/biopet/pipelines/gatk/ShivaTest.scala index 9395daa1da479d97d5b5bd822379be5085b67c6c..e47797cc7482900cd9084774320ef174eb79e6e2 100644 --- a/protected/biopet-gatk-pipelines/src/test/scala/nl/lumc/sasc/biopet/pipelines/gatk/ShivaTest.scala +++ b/protected/biopet-gatk-pipelines/src/test/scala/nl/lumc/sasc/biopet/pipelines/gatk/ShivaTest.scala @@ -93,6 +93,12 @@ class ShivaTest extends TestNGSuite with Matchers { object ShivaTest { val outputDir = Files.createTempDir() + new File(outputDir, "input").mkdirs() + def inputTouch(name: String): String = { + val file = new File(outputDir, "input" + File.separator + name) + Files.touch(file) + file.getAbsolutePath + } private def copyFile(name: String): Unit = { val is = getClass.getResourceAsStream("/" + name) @@ -136,8 +142,8 @@ object ShivaTest { val sample1 = Map( "samples" -> Map("sample1" -> Map("libraries" -> Map( "lib1" -> Map( - "R1" -> "1_1_R1.fq", - "R2" -> "1_1_R2.fq" + "R1" -> inputTouch("1_1_R1.fq"), + "R2" -> inputTouch("1_1_R2.fq") ) ) ))) @@ -145,8 +151,8 @@ object ShivaTest { val sample2 = Map( "samples" -> Map("sample2" -> Map("libraries" -> Map( "lib1" -> Map( - "R1" -> "2_1_R1.fq", - "R2" -> "2_1_R2.fq" + "R1" -> inputTouch("2_1_R1.fq"), + "R2" -> inputTouch("2_1_R2.fq") ) ) ))) @@ -154,12 +160,12 @@ object ShivaTest { val sample3 = Map( "samples" -> Map("sample3" -> Map("libraries" -> Map( "lib1" -> Map( - "R1" -> "3_1_R1.fq", - "R2" -> "3_1_R2.fq" + "R1" -> inputTouch("3_1_R1.fq"), + "R2" -> inputTouch("3_1_R2.fq") ), "lib2" -> Map( - "R1" -> "3_2_R1.fq", - "R2" -> "3_2_R2.fq" + "R1" -> inputTouch("3_2_R1.fq"), + "R2" -> inputTouch("3_2_R2.fq") ) ) ))) diff --git a/protected/biopet-gatk-pipelines/src/test/scala/nl/lumc/sasc/biopet/pipelines/gatk/ShivaVariantcallingTest.scala b/protected/biopet-gatk-pipelines/src/test/scala/nl/lumc/sasc/biopet/pipelines/gatk/ShivaVariantcallingTest.scala index 2c60207a82fae9da823eb02d7a860b5dd8be1834..8e8a1eddf9e5d6b5aab36c4c6fea7d35ea2da82e 100644 --- a/protected/biopet-gatk-pipelines/src/test/scala/nl/lumc/sasc/biopet/pipelines/gatk/ShivaVariantcallingTest.scala +++ b/protected/biopet-gatk-pipelines/src/test/scala/nl/lumc/sasc/biopet/pipelines/gatk/ShivaVariantcallingTest.scala @@ -73,7 +73,7 @@ class ShivaVariantcallingTest extends TestNGSuite with Matchers { val map = Map("variantcallers" -> callers.toList) val pipeline = initPipeline(map) - pipeline.inputBams = (for (n <- 1 to bams) yield new File("bam_" + n + ".bam")).toList + pipeline.inputBams = (for (n <- 1 to bams) yield ShivaVariantcallingTest.inputTouch("bam_" + n + ".bam")).toList val illegalArgumentException = pipeline.inputBams.isEmpty || (!raw && !bcftools && @@ -107,6 +107,12 @@ class ShivaVariantcallingTest extends TestNGSuite with Matchers { object ShivaVariantcallingTest { val outputDir = Files.createTempDir() + new File(outputDir, "input").mkdirs() + def inputTouch(name: String): File = { + val file = new File(outputDir, "input" + File.separator + name).getAbsoluteFile + Files.touch(file) + file + } private def copyFile(name: String): Unit = { val is = getClass.getResourceAsStream("/" + name) diff --git a/protected/biopet-protected-package/src/main/scala/nl/lumc/sasc/biopet/BiopetExecutableProtected.scala b/protected/biopet-protected-package/src/main/scala/nl/lumc/sasc/biopet/BiopetExecutableProtected.scala index 4e725bb0b1e2002a323cc22f38c86b53ca4f14af..9155e7dbacf4fd624694ac06a1ddf24c69071afe 100644 --- a/protected/biopet-protected-package/src/main/scala/nl/lumc/sasc/biopet/BiopetExecutableProtected.scala +++ b/protected/biopet-protected-package/src/main/scala/nl/lumc/sasc/biopet/BiopetExecutableProtected.scala @@ -8,7 +8,7 @@ package nl.lumc.sasc.biopet import nl.lumc.sasc.biopet.utils.{ BiopetExecutable, MainCommand } object BiopetExecutableProtected extends BiopetExecutable { - def pipelines: List[MainCommand] = BiopetExecutablePublic.pipelines ::: List( + def pipelines: List[MainCommand] = BiopetExecutablePublic.publicPipelines ::: List( nl.lumc.sasc.biopet.pipelines.gatk.Shiva, nl.lumc.sasc.biopet.pipelines.gatk.ShivaVariantcalling, nl.lumc.sasc.biopet.pipelines.gatk.Basty) diff --git a/public/bam2wig/src/main/scala/nl/lumc/sasc/biopet/pipelines/bamtobigwig/Bam2Wig.scala b/public/bam2wig/src/main/scala/nl/lumc/sasc/biopet/pipelines/bamtobigwig/Bam2Wig.scala index 451350227e5620ae612212eb341e0acae49ad958..fb9e39611fd861f9158503581f17d4bd12e6cb30 100644 --- a/public/bam2wig/src/main/scala/nl/lumc/sasc/biopet/pipelines/bamtobigwig/Bam2Wig.scala +++ b/public/bam2wig/src/main/scala/nl/lumc/sasc/biopet/pipelines/bamtobigwig/Bam2Wig.scala @@ -35,6 +35,7 @@ class Bam2Wig(val root: Configurable) extends QScript with BiopetQScript { var bamFile: File = null def init(): Unit = { + inputFiles :+= new InputFile(bamFile) } def biopetScript(): Unit = { diff --git a/public/bammetrics/src/main/resources/nl/lumc/sasc/biopet/pipelines/bammetrics/insertSize.ssp b/public/bammetrics/src/main/resources/nl/lumc/sasc/biopet/pipelines/bammetrics/insertSize.ssp index 45f8da529dbab9bcd5c9a7dd6d93fd730b87715b..ba6692dd7af137c57e51d023438995f136d2e477 100644 --- a/public/bammetrics/src/main/resources/nl/lumc/sasc/biopet/pipelines/bammetrics/insertSize.ssp +++ b/public/bammetrics/src/main/resources/nl/lumc/sasc/biopet/pipelines/bammetrics/insertSize.ssp @@ -42,7 +42,7 @@ #end #if (showPlot) - #{ BammetricsReport.insertSizePlot(outputDir, "insertsize", summary, !sampleLevel, sampleId = sampleId) }# + #{ BammetricsReport.insertSizePlot(outputDir, "insertsize", summary, !sampleLevel, sampleId = sampleId, libId = libId) }# <div class="panel-body"> <img src="insertsize.png" class="img-responsive" /> diff --git a/public/bammetrics/src/main/resources/nl/lumc/sasc/biopet/pipelines/bammetrics/wgsHistogram.ssp b/public/bammetrics/src/main/resources/nl/lumc/sasc/biopet/pipelines/bammetrics/wgsHistogram.ssp index 9905a23cfdcb9ac10ba96b1bb2ed43b3686604b8..e900774e0788d03fc5180444fbbb6bd875ad253e 100644 --- a/public/bammetrics/src/main/resources/nl/lumc/sasc/biopet/pipelines/bammetrics/wgsHistogram.ssp +++ b/public/bammetrics/src/main/resources/nl/lumc/sasc/biopet/pipelines/bammetrics/wgsHistogram.ssp @@ -36,7 +36,7 @@ #end #if (showPlot) - #{ BammetricsReport.wgsHistogramPlot(outputDir, "wgs", summary, !sampleLevel, sampleId = sampleId) }# + #{ BammetricsReport.wgsHistogramPlot(outputDir, "wgs", summary, !sampleLevel, sampleId = sampleId, libId = libId) }# <div class="panel-body"> <img src="wgs.png" class="img-responsive" /> diff --git a/public/bammetrics/src/main/scala/nl/lumc/sasc/biopet/pipelines/bammetrics/BamMetrics.scala b/public/bammetrics/src/main/scala/nl/lumc/sasc/biopet/pipelines/bammetrics/BamMetrics.scala index 24b0a29b1a7ce265ea145f404203f614da550884..f6a6dc090defdb238f76b68f21189faf38fd207c 100644 --- a/public/bammetrics/src/main/scala/nl/lumc/sasc/biopet/pipelines/bammetrics/BamMetrics.scala +++ b/public/bammetrics/src/main/scala/nl/lumc/sasc/biopet/pipelines/bammetrics/BamMetrics.scala @@ -71,7 +71,8 @@ class BamMetrics(val root: Configurable) extends QScript with SummaryQScript wit } /** executed before script */ - def init() { + def init(): Unit = { + inputFiles :+= new InputFile(inputBam) } /** Script to add jobs */ @@ -186,8 +187,13 @@ class BamMetrics(val root: Configurable) extends QScript with SummaryQScript wit object BamMetrics extends PipelineCommand { /** Make default implementation of BamMetrics and runs script already */ - def apply(root: Configurable, bamFile: File, outputDir: File): BamMetrics = { + def apply(root: Configurable, + bamFile: File, outputDir: File, + sampleId: Option[String] = None, + libId: Option[String] = None): BamMetrics = { val bamMetrics = new BamMetrics(root) + bamMetrics.sampleId = sampleId + bamMetrics.libId = libId bamMetrics.inputBam = bamFile bamMetrics.outputDir = outputDir diff --git a/public/bammetrics/src/main/scala/nl/lumc/sasc/biopet/pipelines/bammetrics/BammetricsReport.scala b/public/bammetrics/src/main/scala/nl/lumc/sasc/biopet/pipelines/bammetrics/BammetricsReport.scala index f4138e12ec607ecfdcc9538347c83fbe6c9d4d16..babc43f721b9a1bd4d03f6930a97e4cb454f4187 100644 --- a/public/bammetrics/src/main/scala/nl/lumc/sasc/biopet/pipelines/bammetrics/BammetricsReport.scala +++ b/public/bammetrics/src/main/scala/nl/lumc/sasc/biopet/pipelines/bammetrics/BammetricsReport.scala @@ -156,14 +156,15 @@ object BammetricsReport extends ReportBuilder { prefix: String, summary: Summary, libraryLevel: Boolean = false, - sampleId: Option[String] = None): Unit = { + sampleId: Option[String] = None, + libId: Option[String] = None): Unit = { val tsvFile = new File(outputDir, prefix + ".tsv") val pngFile = new File(outputDir, prefix + ".png") val tsvWriter = new PrintWriter(tsvFile) if (libraryLevel) { tsvWriter.println((for ( sample <- summary.samples if sampleId.isEmpty || sampleId.get == sample; - lib <- summary.libraries(sample) + lib <- summary.libraries(sample) if libId.isEmpty || libId.get == lib ) yield s"$sample-$lib") .mkString("library\t", "\t", "")) } else { @@ -198,7 +199,7 @@ object BammetricsReport extends ReportBuilder { if (libraryLevel) { for ( sample <- summary.samples if sampleId.isEmpty || sampleId.get == sample; - lib <- summary.libraries(sample) + lib <- summary.libraries(sample) if libId.isEmpty || libId.get == lib ) fill(sample, Some(lib)) } else if (sampleId.isDefined) fill(sampleId.get, None) else summary.samples.foreach(fill(_, None)) @@ -208,7 +209,7 @@ object BammetricsReport extends ReportBuilder { if (libraryLevel) { for ( sample <- summary.samples if sampleId.isEmpty || sampleId.get == sample; - lib <- summary.libraries(sample) + lib <- summary.libraries(sample) if libId.isEmpty || libId.get == lib ) tsvWriter.print("\t" + counts.getOrElse(s"$sample-$lib", "0")) } else { for (sample <- summary.samples if sampleId.isEmpty || sampleId.get == sample) { @@ -243,14 +244,15 @@ object BammetricsReport extends ReportBuilder { prefix: String, summary: Summary, libraryLevel: Boolean = false, - sampleId: Option[String] = None): Unit = { + sampleId: Option[String] = None, + libId: Option[String] = None): Unit = { val tsvFile = new File(outputDir, prefix + ".tsv") val pngFile = new File(outputDir, prefix + ".png") val tsvWriter = new PrintWriter(tsvFile) if (libraryLevel) { tsvWriter.println((for ( sample <- summary.samples if sampleId.isEmpty || sampleId.get == sample; - lib <- summary.libraries(sample) + lib <- summary.libraries(sample) if libId.isEmpty || libId.get == lib ) yield s"$sample-$lib") .mkString("library\t", "\t", "")) } else { @@ -285,7 +287,7 @@ object BammetricsReport extends ReportBuilder { if (libraryLevel) { for ( sample <- summary.samples if sampleId.isEmpty || sampleId.get == sample; - lib <- summary.libraries(sample) + lib <- summary.libraries(sample) if libId.isEmpty || libId.get == lib ) fill(sample, Some(lib)) } else if (sampleId.isDefined) fill(sampleId.get, None) else summary.samples.foreach(fill(_, None)) @@ -295,8 +297,10 @@ object BammetricsReport extends ReportBuilder { if (libraryLevel) { for ( sample <- summary.samples if sampleId.isEmpty || sampleId.get == sample; - lib <- summary.libraries(sample) - ) tsvWriter.print("\t" + counts.getOrElse(s"$sample-$lib", "0")) + lib <- summary.libraries(sample) if libId.isEmpty || libId.get == lib + ) { + tsvWriter.print("\t" + counts.getOrElse(s"$sample-$lib", "0")) + } } else { for (sample <- summary.samples if sampleId.isEmpty || sampleId.get == sample) { tsvWriter.print("\t" + counts.getOrElse(sample, "0")) diff --git a/public/bammetrics/src/test/scala/nl/lumc/sasc/biopet/pipelines/bammetrics/BamMetricsTest.scala b/public/bammetrics/src/test/scala/nl/lumc/sasc/biopet/pipelines/bammetrics/BamMetricsTest.scala index 7e97b4a78e1176b1603a7ae5aec10057c4bd0175..33304cb198807f46d3801ddfc9b05eaa7d555fe4 100644 --- a/public/bammetrics/src/test/scala/nl/lumc/sasc/biopet/pipelines/bammetrics/BamMetricsTest.scala +++ b/public/bammetrics/src/test/scala/nl/lumc/sasc/biopet/pipelines/bammetrics/BamMetricsTest.scala @@ -69,7 +69,7 @@ class BamMetricsTest extends TestNGSuite with Matchers { Map("regions_of_interest" -> (1 to rois).map("roi_" + _ + ".bed").toList) val bammetrics: BamMetrics = initPipeline(map) - bammetrics.inputBam = new File("input.bam") + bammetrics.inputBam = BamMetricsTest.bam bammetrics.sampleId = Some("1") bammetrics.libId = Some("1") bammetrics.script() @@ -98,6 +98,10 @@ class BamMetricsTest extends TestNGSuite with Matchers { object BamMetricsTest { val outputDir = Files.createTempDir() + new File(outputDir, "input").mkdirs() + + val bam = new File(outputDir, "input" + File.separator + "bla.bam") + Files.touch(bam) private def copyFile(name: String): Unit = { val is = getClass.getResourceAsStream("/" + name) diff --git a/public/basty/src/main/scala/nl/lumc/sasc/biopet/pipelines/basty/BastyTrait.scala b/public/basty/src/main/scala/nl/lumc/sasc/biopet/pipelines/basty/BastyTrait.scala index 1990085cef63fc60c637e04bb17811a20b837f85..a2a1f832843072d5abc9d46fb0280ba3b2c19ea4 100644 --- a/public/basty/src/main/scala/nl/lumc/sasc/biopet/pipelines/basty/BastyTrait.scala +++ b/public/basty/src/main/scala/nl/lumc/sasc/biopet/pipelines/basty/BastyTrait.scala @@ -89,6 +89,8 @@ trait BastyTrait extends MultiSampleQScript { addAll(shiva.functions) addSummaryQScript(shiva) + inputFiles :::= shiva.inputFiles + addSamplesJobs() } diff --git a/public/biopet-core/src/main/scala/nl/lumc/sasc/biopet/core/BiopetQScript.scala b/public/biopet-core/src/main/scala/nl/lumc/sasc/biopet/core/BiopetQScript.scala index 49f4e3893b7fe63ff03fca94f030363c54d1217f..fbc60aef43e754cd2e845bbf5864259236b71de4 100644 --- a/public/biopet-core/src/main/scala/nl/lumc/sasc/biopet/core/BiopetQScript.scala +++ b/public/biopet-core/src/main/scala/nl/lumc/sasc/biopet/core/BiopetQScript.scala @@ -48,6 +48,10 @@ trait BiopetQScript extends Configurable with GatkLogging { var outputFiles: Map[String, File] = Map() + type InputFile = BiopetQScript.InputFile + + var inputFiles: List[InputFile] = Nil + /** Get implemented from org.broadinstitute.gatk.queue.QScript */ var qSettings: QSettings @@ -86,7 +90,16 @@ trait BiopetQScript extends Configurable with GatkLogging { globalConfig.writeReport(qSettings.runName, new File(outputDir, ".log/" + qSettings.runName)) else Logging.addError("Parent of output dir: '" + outputDir.getParent + "' is not writeable, outputdir can not be created") - reportClass.foreach(add(_)) + inputFiles.foreach { i => + if (!i.file.exists()) Logging.addError(s"Input file does not exist: ${i.file}") + else if (!i.file.canRead()) Logging.addError(s"Input file can not be read: ${i.file}") + } + + this match { + case q: MultiSampleQScript if q.onlySamples.nonEmpty && !q.samples.forall(x => q.onlySamples.contains(x._1)) => + logger.info("Write report is skipped because sample flag is used") + case _ => reportClass.foreach(add(_)) + } Logging.checkErrors() } @@ -103,3 +116,7 @@ trait BiopetQScript extends Configurable with GatkLogging { add(function) } } + +object BiopetQScript { + protected case class InputFile(file: File, md5: Option[String] = None) +} diff --git a/public/biopet-core/src/main/scala/nl/lumc/sasc/biopet/core/MultiSampleQScript.scala b/public/biopet-core/src/main/scala/nl/lumc/sasc/biopet/core/MultiSampleQScript.scala index d8756c7b91cd27b330b4697aab0d94c9f436c98a..17631709f12db8a3e3b25253afc49fadd3820e32 100644 --- a/public/biopet-core/src/main/scala/nl/lumc/sasc/biopet/core/MultiSampleQScript.scala +++ b/public/biopet-core/src/main/scala/nl/lumc/sasc/biopet/core/MultiSampleQScript.scala @@ -26,7 +26,7 @@ trait MultiSampleQScript extends SummaryQScript { qscript => @Argument(doc = "Only Sample", shortName = "s", required = false, fullName = "sample") - private val onlySamples: List[String] = Nil + private[core] val onlySamples: List[String] = Nil require(globalConfig.map.contains("samples"), "No Samples found in config") @@ -131,7 +131,7 @@ trait MultiSampleQScript extends SummaryQScript { /** Runs addAndTrackJobs method for each sample */ final def addSamplesJobs() { - if (onlySamples.isEmpty) { + if (onlySamples.isEmpty || samples.forall(x => onlySamples.contains(x._1))) { samples.foreach { case (sampleId, sample) => sample.addAndTrackJobs() } addMultiSampleJobs() } else onlySamples.foreach(sampleId => samples.get(sampleId) match { diff --git a/public/biopet-core/src/main/scala/nl/lumc/sasc/biopet/core/extensions/CheckChecksum.scala b/public/biopet-core/src/main/scala/nl/lumc/sasc/biopet/core/extensions/CheckChecksum.scala new file mode 100644 index 0000000000000000000000000000000000000000..0ae2587f7928bb8d8cfe3e157f79fec7afff031a --- /dev/null +++ b/public/biopet-core/src/main/scala/nl/lumc/sasc/biopet/core/extensions/CheckChecksum.scala @@ -0,0 +1,40 @@ +package nl.lumc.sasc.biopet.core.extensions + +import java.io.File + +import nl.lumc.sasc.biopet.core.summary.WriteSummary +import org.broadinstitute.gatk.queue.function.InProcessFunction +import org.broadinstitute.gatk.utils.commandline.{ Argument, Input } + +/** + * This class checks md5sums and give an exit code 1 when md5sum is not the same + * + * Created by pjvanthof on 16/08/15. + */ +class CheckChecksum extends InProcessFunction { + @Input(required = true) + var inputFile: File = _ + + @Input(required = true) + var checksumFile: File = _ + + @Argument(required = true) + var checksum: String = _ + + override def freezeFieldValues(): Unit = { + super.freezeFieldValues() + jobOutputFile = new File(checksumFile.getParentFile, checksumFile.getName + ".check.out") + } + + /** Exits whenever the input md5sum is not the same as the output md5sum */ + def run: Unit = { + val outputChecksum = WriteSummary.parseChecksum(checksumFile).toLowerCase + + if (outputChecksum != checksum.toLowerCase) { + logger.error(s"Input file: '$inputFile' md5sum is not as expected, aborting pipeline") + + // 130 Simulates a ctr-C + Runtime.getRuntime.halt(130) + } + } +} \ No newline at end of file diff --git a/public/biopet-core/src/main/scala/nl/lumc/sasc/biopet/core/report/ReportBuilder.scala b/public/biopet-core/src/main/scala/nl/lumc/sasc/biopet/core/report/ReportBuilder.scala index 4c5217f1f3911ce3d6af8aec5d80ec1374df534b..ae7c08e8eb1d20e68d238a5fe4bb3a1f48306626 100644 --- a/public/biopet-core/src/main/scala/nl/lumc/sasc/biopet/core/report/ReportBuilder.scala +++ b/public/biopet-core/src/main/scala/nl/lumc/sasc/biopet/core/report/ReportBuilder.scala @@ -231,6 +231,7 @@ object ReportBuilder { case Some(template) => template case _ => val tempFile = File.createTempFile("ssp-template", new File(location).getName) + tempFile.deleteOnExit() IoUtils.copyStreamToFile(getClass.getResourceAsStream(location), tempFile) templateCache += location -> tempFile tempFile diff --git a/public/biopet-core/src/main/scala/nl/lumc/sasc/biopet/core/summary/SummaryQScript.scala b/public/biopet-core/src/main/scala/nl/lumc/sasc/biopet/core/summary/SummaryQScript.scala index 13fdc2139bfab807bd61d042433bc13b893c8a84..ab2f64546a7f79e8432ec1ac7ff0ab19427cccfc 100644 --- a/public/biopet-core/src/main/scala/nl/lumc/sasc/biopet/core/summary/SummaryQScript.scala +++ b/public/biopet-core/src/main/scala/nl/lumc/sasc/biopet/core/summary/SummaryQScript.scala @@ -18,7 +18,7 @@ package nl.lumc.sasc.biopet.core.summary import java.io.File import nl.lumc.sasc.biopet.core._ -import nl.lumc.sasc.biopet.core.extensions.Md5sum +import nl.lumc.sasc.biopet.core.extensions.{ CheckChecksum, Md5sum } import scala.collection.mutable @@ -27,7 +27,7 @@ import scala.collection.mutable * * Created by pjvan_thof on 2/14/15. */ -trait SummaryQScript extends BiopetQScript { +trait SummaryQScript extends BiopetQScript { qscript => /** Key is sample/library, None is sample or library is not applicable */ private[summary] var summarizables: Map[(String, Option[String], Option[String]), List[Summarizable]] = Map() @@ -116,6 +116,20 @@ trait SummaryQScript extends BiopetQScript { //TODO: add more checksums types } + for (inputFile <- inputFiles) { + inputFile.md5 match { + case Some(checksum) => { + val checkMd5 = new CheckChecksum + checkMd5.inputFile = inputFile.file + require(SummaryQScript.md5sumCache.contains(inputFile.file), "Md5 job is not executed, checksum file can't be found") + checkMd5.checksumFile = SummaryQScript.md5sumCache(inputFile.file) + checkMd5.checksum = checksum + add(checkMd5) + } + case _ => + } + } + for ((_, summarizableList) <- summarizables; summarizable <- summarizableList) { summarizable match { case f: BiopetCommandLineFunction => f.beforeGraph() @@ -135,7 +149,11 @@ trait SummaryQScript extends BiopetQScript { for ((_, file) <- this.summaryFiles) addChecksum(file) - add(writeSummary) + this match { + case q: MultiSampleQScript if q.onlySamples.nonEmpty && !q.samples.forall(x => q.onlySamples.contains(x._1)) => + logger.info("Write summary is skipped because sample flag is used") + case _ => add(writeSummary) + } } } diff --git a/public/biopet-core/src/main/scala/nl/lumc/sasc/biopet/core/summary/WriteSummary.scala b/public/biopet-core/src/main/scala/nl/lumc/sasc/biopet/core/summary/WriteSummary.scala index 3edb7a77e71a136d0dcb70185f19f25b0d193eb0..6e7f8248c0693ed0df4c3a372b8885e1908187a7 100644 --- a/public/biopet-core/src/main/scala/nl/lumc/sasc/biopet/core/summary/WriteSummary.scala +++ b/public/biopet-core/src/main/scala/nl/lumc/sasc/biopet/core/summary/WriteSummary.scala @@ -153,10 +153,11 @@ class WriteSummary(val root: Configurable) extends InProcessFunction with Config def parseFile(file: File): Map[String, Any] = { val map: mutable.Map[String, Any] = mutable.Map() map += "path" -> file.getAbsolutePath - if (md5sum) map += "md5" -> parseChecksum(SummaryQScript.md5sumCache(file)) + if (md5sum) map += "md5" -> WriteSummary.parseChecksum(SummaryQScript.md5sumCache(file)) map.toMap } - +} +object WriteSummary { /** Retrive checksum from file */ def parseChecksum(checksumFile: File): String = { Source.fromFile(checksumFile).getLines().toList.head.split(" ")(0) diff --git a/public/biopet-extentsions/src/main/scala/nl/lumc/sasc/biopet/extensions/gatk/Gatk.scala b/public/biopet-extentsions/src/main/scala/nl/lumc/sasc/biopet/extensions/gatk/Gatk.scala index 3134cf131610b1cb776a48bbd9cb3d66ed6ccd48..108253762bab534ab7740512da5ec692158dd0d4 100644 --- a/public/biopet-extentsions/src/main/scala/nl/lumc/sasc/biopet/extensions/gatk/Gatk.scala +++ b/public/biopet-extentsions/src/main/scala/nl/lumc/sasc/biopet/extensions/gatk/Gatk.scala @@ -49,6 +49,8 @@ abstract class Gatk extends BiopetJavaCommandLineFunction with Reference { @Input(required = false) var pedigree: List[File] = config("pedigree", default = Nil) + var et: Option[String] = config("et") + override def versionRegex = """(.*)""".r override def versionExitcode = List(0, 1) override def versionCommand = executable + " -jar " + jarFile + " -version" @@ -65,6 +67,7 @@ abstract class Gatk extends BiopetJavaCommandLineFunction with Reference { required("-T", analysisType) + required("-R", reference) + optional("-K", gatkKey) + + optional("-et", et) + repeat("-I", intervals) + repeat("-XL", excludeIntervals) + repeat("-ped", pedigree) diff --git a/public/biopet-tools-extensions/src/main/scala/nl/lumc/sasc/biopet/extensions/tools/MpileupToVcf.scala b/public/biopet-tools-extensions/src/main/scala/nl/lumc/sasc/biopet/extensions/tools/MpileupToVcf.scala index 212641116f93c61ea9ef1412c7228297cdbb4ff6..60797ce9ca7f491a9dff0cf3a2379570cc6d91f5 100644 --- a/public/biopet-tools-extensions/src/main/scala/nl/lumc/sasc/biopet/extensions/tools/MpileupToVcf.scala +++ b/public/biopet-tools-extensions/src/main/scala/nl/lumc/sasc/biopet/extensions/tools/MpileupToVcf.scala @@ -57,7 +57,7 @@ class MpileupToVcf(val root: Configurable) extends ToolCommandFuntion with Refer } override def beforeCmd(): Unit = { - if (sample == null && inputBam.exists()) { + if (sample == null && inputBam.exists() && inputBam.length() > 0) { val inputSam = SamReaderFactory.makeDefault.open(inputBam) val readGroups = inputSam.getFileHeader.getReadGroups val samples = readGroups.map(readGroup => readGroup.getSample).distinct diff --git a/public/biopet-tools/src/main/scala/nl/lumc/sasc/biopet/tools/VcfStats.scala b/public/biopet-tools/src/main/scala/nl/lumc/sasc/biopet/tools/VcfStats.scala index 960c4921debd6e58f45fa00bbb9dc0864dd11c60..62b04375f630ab59fea18d9c1d974bdf038cb767 100644 --- a/public/biopet-tools/src/main/scala/nl/lumc/sasc/biopet/tools/VcfStats.scala +++ b/public/biopet-tools/src/main/scala/nl/lumc/sasc/biopet/tools/VcfStats.scala @@ -625,6 +625,7 @@ object VcfStats extends ToolCommand { def executeRscript(resource: String, args: Array[String]): Unit = { val is = getClass.getResourceAsStream(resource) val file = File.createTempFile("script.", "." + resource) + file.deleteOnExit() val os = new FileOutputStream(file) org.apache.commons.io.IOUtils.copy(is, os) os.close() diff --git a/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/BastyGenerateFastaTest.scala b/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/BastyGenerateFastaTest.scala index ebe393bfab7bdb8fedec024319e99a5b0ec29a07..d9d8c1bee6bf96bcc98a372585b5a89454775e08 100644 --- a/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/BastyGenerateFastaTest.scala +++ b/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/BastyGenerateFastaTest.scala @@ -31,6 +31,7 @@ class BastyGenerateFastaTest extends TestNGSuite with MockitoSugar with Matchers @Test def testMainVcf = { val tmp = File.createTempFile("basty_out", ".fa") + tmp.deleteOnExit() val tmppath = tmp.getAbsolutePath tmp.deleteOnExit() @@ -40,6 +41,7 @@ class BastyGenerateFastaTest extends TestNGSuite with MockitoSugar with Matchers @Test def testMainVcfAndBam = { val tmp = File.createTempFile("basty_out", ".fa") + tmp.deleteOnExit() val tmppath = tmp.getAbsolutePath tmp.deleteOnExit() @@ -49,6 +51,7 @@ class BastyGenerateFastaTest extends TestNGSuite with MockitoSugar with Matchers @Test def testMainVcfAndBamMore = { val tmp = File.createTempFile("basty_out", ".fa") + tmp.deleteOnExit() val tmppath = tmp.getAbsolutePath tmp.deleteOnExit() diff --git a/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/BiopetFlagstatTest.scala b/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/BiopetFlagstatTest.scala index 758cb6be6d6aa0a75c2ec1830e0fa3334beb7626..d919fe400154683f5fef7a061ce76c60aab5f5e7 100644 --- a/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/BiopetFlagstatTest.scala +++ b/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/BiopetFlagstatTest.scala @@ -56,6 +56,7 @@ class BiopetFlagstatTest extends TestNGSuite with MockitoSugar with Matchers { def testMain() = { //TODO: Test output file val output = File.createTempFile("testMain", ".biopetflagstat") + output.deleteOnExit() main(Array("-I", bam.getAbsolutePath, "-o", output.toString)) } diff --git a/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/FastqSplitterTest.scala b/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/FastqSplitterTest.scala index ffa8be0bcb6c2cf15bf0ad00efeeb54e903eb3df..dd66b204fab38a4fd26fb011ffe6739faf304009 100644 --- a/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/FastqSplitterTest.scala +++ b/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/FastqSplitterTest.scala @@ -23,7 +23,7 @@ class FastqSplitterTest extends TestNGSuite with MockitoSugar with Matchers { @Test def testMain() = { val temp = File.createTempFile("out", ".fastq") - + temp.deleteOnExit() val args = Array("-I", fq, "-o", temp.getAbsolutePath) main(args) } @@ -31,6 +31,7 @@ class FastqSplitterTest extends TestNGSuite with MockitoSugar with Matchers { @Test def testManyOutMain() = { val files = (0 until 10).map(_ => File.createTempFile("out", ".fastq")) + files.foreach(_.deleteOnExit()) var args = Array("-I", fq) files.foreach(x => args ++= Array("-o", x.getAbsolutePath)) main(args) diff --git a/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/FindRepeatsPacBioTest.scala b/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/FindRepeatsPacBioTest.scala index b6de2f8bcca896e8979c2e21fc5bb8651524610a..907270b8c31f3eb152766f03a612101f754ba6c9 100644 --- a/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/FindRepeatsPacBioTest.scala +++ b/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/FindRepeatsPacBioTest.scala @@ -29,6 +29,7 @@ class FindRepeatsPacBioTest extends TestNGSuite with MockitoSugar with Matchers def testMain() = { val outputFile = File.createTempFile("repeats", ".tsv") + outputFile.deleteOnExit() val args = Array("-I", bam, "-b", bed, "-o", outputFile.toString) main(args) } diff --git a/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/MpileupToVcfTest.scala b/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/MpileupToVcfTest.scala index 032f9a913373c0f3be617e45cc26a928ca69821d..e708bc654b3c81699dcab85bfc07a7e21cd3ea94 100644 --- a/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/MpileupToVcfTest.scala +++ b/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/MpileupToVcfTest.scala @@ -28,6 +28,7 @@ class MpileupToVcfTest extends TestNGSuite with MockitoSugar with Matchers { @Test def testMain() = { val tmp = File.createTempFile("mpileup", ".vcf") + tmp.deleteOnExit() val args = Array("-I", pileup, "--sample", "test", "-o", tmp.getAbsolutePath) main(args) @@ -36,6 +37,7 @@ class MpileupToVcfTest extends TestNGSuite with MockitoSugar with Matchers { @Test def validateOutVcf() = { val tmp = File.createTempFile("mpileup", ".vcf") + tmp.deleteOnExit() val args = Array("-I", pileup, "--sample", "test", "-o", tmp.getAbsolutePath, "--minDP", "1", "--minAP", "1") main(args) @@ -51,6 +53,7 @@ class MpileupToVcfTest extends TestNGSuite with MockitoSugar with Matchers { @Test def extraValidateOutVcf() = { val tmp = File.createTempFile("mpileup", ".vcf") + tmp.deleteOnExit() val args = Array("-I", pileup, "--sample", "test", "-o", tmp.getAbsolutePath, "--minDP", "1", "--minAP", "1") main(args) diff --git a/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/PrefixFastqTest.scala b/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/PrefixFastqTest.scala index 41db9e3ae268a62860fd3fbe9a27e4430165429e..611557d836636aebc71f90e70707035033df6b97 100644 --- a/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/PrefixFastqTest.scala +++ b/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/PrefixFastqTest.scala @@ -26,6 +26,7 @@ class PrefixFastqTest extends TestNGSuite with MockitoSugar with Matchers { @Test def testMain() = { val temp = File.createTempFile("out", ".fastq") + temp.deleteOnExit() val args = Array("-i", fq, "-o", temp.getAbsolutePath, "-s", "AAA") main(args) @@ -34,6 +35,7 @@ class PrefixFastqTest extends TestNGSuite with MockitoSugar with Matchers { @Test def testOutput() = { val temp = File.createTempFile("out", ".fastq") + temp.deleteOnExit() val args = Array("-i", fq, "-o", temp.getAbsolutePath, "-s", "AAA") main(args) diff --git a/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/SageCountFastqTest.scala b/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/SageCountFastqTest.scala index 15d3074c95313c6f2a084c41b4d0a4787bdedddb..5c7731c6dd2ec60b7c8cd01f84c6929026d7e007 100644 --- a/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/SageCountFastqTest.scala +++ b/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/SageCountFastqTest.scala @@ -22,6 +22,7 @@ class SageCountFastqTest extends TestNGSuite with MockitoSugar with Matchers { @Test def testMain() = { val temp = File.createTempFile("out", ".fastq") + temp.deleteOnExit() val args = Array("-I", fq, "-o", temp.getAbsolutePath) main(args) diff --git a/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/SageCreateLibaryTest.scala b/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/SageCreateLibaryTest.scala index 48038ea6f476fd89a945f53cf3d3608661fbcc9c..c86c1ba5a9787c0cdcce00293309500d6f6e4b86 100644 --- a/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/SageCreateLibaryTest.scala +++ b/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/SageCreateLibaryTest.scala @@ -29,9 +29,13 @@ class SageCreateLibaryTest extends TestNGSuite with MockitoSugar with Matchers { val input = resourcePath("/mini.transcriptome.fa") val output = File.createTempFile("sageCreateLibrary", ".tsv") + output.deleteOnExit() val noTagsOutput = File.createTempFile("sageCreateLibrary", ".tsv") + noTagsOutput.deleteOnExit() val antiTagsOutput = File.createTempFile("sageCreateLibrary", ".tsv") + antiTagsOutput.deleteOnExit() val allGenesOutput = File.createTempFile("sageCreateLibrary", ".tsv") + allGenesOutput.deleteOnExit() val args = Array("-I", input, "-o", output.getAbsolutePath, "--tag", "CATG", "--length", "17", "--noTagsOutput", noTagsOutput.getAbsolutePath, "--noAntiTagsOutput", @@ -52,9 +56,13 @@ class SageCreateLibaryTest extends TestNGSuite with MockitoSugar with Matchers { def testOutPut = { val input = resourcePath("/mini.transcriptome.fa") val output = File.createTempFile("sageCreateLibrary", ".tsv") + output.deleteOnExit() val noTagsOutput = File.createTempFile("sageCreateLibrary", ".tsv") + noTagsOutput.deleteOnExit() val antiTagsOutput = File.createTempFile("sageCreateLibrary", ".tsv") + antiTagsOutput.deleteOnExit() val allGenesOutput = File.createTempFile("sageCreateLibrary", ".tsv") + allGenesOutput.deleteOnExit() val args = Array("-I", input, "-o", output.getAbsolutePath, "--tag", "CATG", "--length", "17", "--noTagsOutput", noTagsOutput.getAbsolutePath, "--noAntiTagsOutput", diff --git a/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/SageCreateTagCountsTest.scala b/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/SageCreateTagCountsTest.scala index b47c507856ec251878057a3823d47d57160045e9..ecd1dae87d5c43a88e722cbb12f7eb18ece3a9b8 100644 --- a/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/SageCreateTagCountsTest.scala +++ b/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/SageCreateTagCountsTest.scala @@ -26,9 +26,13 @@ class SageCreateTagCountsTest extends TestNGSuite with MockitoSugar with Matcher val tagLib = resourcePath("/sageTest.tsv") val sense = File.createTempFile("SageCreateTagCountsTEst", ".tsv") + sense.deleteOnExit() val allSense = File.createTempFile("SageCreateTagCountsTEst", ".tsv") + allSense.deleteOnExit() val antiSense = File.createTempFile("SageCreateTagCountsTEst", ".tsv") + antiSense.deleteOnExit() val allAntiSense = File.createTempFile("SageCreateTagCountsTEst", ".tsv") + allAntiSense.deleteOnExit() noException should be thrownBy main(Array("-I", input, "--tagLib", tagLib, "--countSense", sense.getAbsolutePath, "--countAllSense", allSense.getAbsolutePath, @@ -50,9 +54,13 @@ class SageCreateTagCountsTest extends TestNGSuite with MockitoSugar with Matcher val tagLib = resourcePath("/sageTest.tsv") val sense = File.createTempFile("SageCreateTagCountsTEst", ".tsv") + sense.deleteOnExit() val allSense = File.createTempFile("SageCreateTagCountsTEst", ".tsv") + allSense.deleteOnExit() val antiSense = File.createTempFile("SageCreateTagCountsTEst", ".tsv") + antiSense.deleteOnExit() val allAntiSense = File.createTempFile("SageCreateTagCountsTEst", ".tsv") + allAntiSense.deleteOnExit() main(Array("-I", input, "--tagLib", tagLib, "--countSense", sense.getAbsolutePath, "--countAllSense", allSense.getAbsolutePath, "--countAntiSense", antiSense.getAbsolutePath, diff --git a/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/SamplesTsvToJsonTest.scala b/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/SamplesTsvToJsonTest.scala index 9866ad47a8efbfad5f34868b82fe415f6e6b8c28..e8a09a9d7cb9af569f2084c95a1b6c2e7f1e1aad 100644 --- a/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/SamplesTsvToJsonTest.scala +++ b/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/SamplesTsvToJsonTest.scala @@ -21,6 +21,7 @@ class SamplesTsvToJsonTest extends TestNGSuite with MockitoSugar with Matchers { def testCorrectSampleTsv = { val tsv = resourcePath("/sample.tsv") val output = File.createTempFile("testCorrectSampleTsv", ".json") + output.deleteOnExit() noException should be thrownBy main(Array("-i", tsv, "-o", output.toString)) } @@ -29,6 +30,7 @@ class SamplesTsvToJsonTest extends TestNGSuite with MockitoSugar with Matchers { def testNoSampleColumn() = { val tsv = resourcePath("/no_sample.tsv") val output = File.createTempFile("testNoSampleColumn", ".json") + output.deleteOnExit() val thrown = the[IllegalStateException] thrownBy main(Array("-i", tsv, "-o", output.toString)) thrown.getMessage should equal("Sample column does not exist in: " + tsv) } @@ -37,6 +39,7 @@ class SamplesTsvToJsonTest extends TestNGSuite with MockitoSugar with Matchers { def testNumberInLibs = { val tsv = resourcePath("/number.tsv") val output = File.createTempFile("testNumberInLibs", ".json") + output.deleteOnExit() val thrown = the[IllegalStateException] thrownBy main(Array("-i", tsv, "-o", output.toString)) thrown.getMessage should equal("Sample or library may not start with a number") } @@ -45,6 +48,7 @@ class SamplesTsvToJsonTest extends TestNGSuite with MockitoSugar with Matchers { def testSampleIDs = { val tsv = resourcePath("/same.tsv") val output = File.createTempFile("testSampleIDs", ".json") + output.deleteOnExit() val thrown = the[IllegalStateException] thrownBy main(Array("-i", tsv, "-o", output.toString)) thrown.getMessage should equal("Combination of Sample_ID_1 and Lib_ID_1 is found multiple times") diff --git a/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/SummaryToTsvTest.scala b/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/SummaryToTsvTest.scala index 6071fceaaed85a943a4f973ac713d24e8b708952..4f921affbc090031b83c0ee5fea3c64b9c9bdf4c 100644 --- a/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/SummaryToTsvTest.scala +++ b/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/SummaryToTsvTest.scala @@ -24,6 +24,7 @@ class SummaryToTsvTest extends TestNGSuite with MockitoSugar with Matchers { def testMain = { val tsv = resourcePath("/test.summary.json") val output = File.createTempFile("main", "tsv") + output.deleteOnExit() noException should be thrownBy main(Array("-s", tsv, "-p", "something=flexiprep:settings:skip_trim", "-m", "root", "-o", output.toString)) diff --git a/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/VcfWithVcfTest.scala b/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/VcfWithVcfTest.scala index af8ff6267d5c73dad9eaa10762b1d356a2641626..a6a70881012480a8e92b9aac1c689e4456f9f8c7 100644 --- a/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/VcfWithVcfTest.scala +++ b/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/VcfWithVcfTest.scala @@ -47,50 +47,57 @@ class VcfWithVcfTest extends TestNGSuite with MockitoSugar with Matchers { val rand = new Random() @Test def testOutputTypeVcf() = { - val tmpPath = File.createTempFile("VcfWithVcf_", ".vcf").getAbsolutePath - val arguments = Array("-I", unveppedPath, "-s", veppedPath, "-o", tmpPath, "-f", "CSQ") + val tmpFile = File.createTempFile("VcfWithVcf_", ".vcf") + tmpFile.deleteOnExit() + val arguments = Array("-I", unveppedPath, "-s", veppedPath, "-o", tmpFile.getAbsolutePath, "-f", "CSQ") main(arguments) } @Test def testOutputTypeVcfGz() = { - val tmpPath = File.createTempFile("VcfWithVcf_", ".vcf.gz").getAbsolutePath - val arguments = Array("-I", unveppedPath, "-s", veppedPath, "-o", tmpPath, "-f", "CSQ") + val tmpFile = File.createTempFile("VcfWithVcf_", ".vcf.gz") + tmpFile.deleteOnExit() + val arguments = Array("-I", unveppedPath, "-s", veppedPath, "-o", tmpFile.getAbsolutePath, "-f", "CSQ") main(arguments) } @Test def testOutputTypeBcf() = { - val tmpPath = File.createTempFile("VcfWithVcf_", ".bcf").getAbsolutePath - val arguments = Array("-I", unveppedPath, "-s", veppedPath, "-o", tmpPath, "-f", "CSQ") + val tmpFile = File.createTempFile("VcfWithVcf_", ".bcf") + tmpFile.deleteOnExit() + val arguments = Array("-I", unveppedPath, "-s", veppedPath, "-o", tmpFile.getAbsolutePath, "-f", "CSQ") main(arguments) } @Test def testOutputFieldException = { - val tmpPath = File.createTempFile("VCFWithVCf", ".vcf").getAbsolutePath - val args = Array("-I", unveppedPath, "-s", veppedPath, "-o", tmpPath, "-f", "CSQ:AC") + val tmpFile = File.createTempFile("VCFWithVCf", ".vcf") + tmpFile.deleteOnExit() + val args = Array("-I", unveppedPath, "-s", veppedPath, "-o", tmpFile.getAbsolutePath, "-f", "CSQ:AC") an[IllegalArgumentException] should be thrownBy main(args) val thrown = the[IllegalArgumentException] thrownBy main(args) thrown.getMessage should equal("Field 'AC' already exists in input vcf") } @Test def testInputFieldException = { - val tmpPath = File.createTempFile("VCFWithVCf", ".vcf").getAbsolutePath - val args = Array("-I", unveppedPath, "-s", unveppedPath, "-o", tmpPath, "-f", "CSQ:NEW_CSQ") + val tmpFile = File.createTempFile("VCFWithVCf", ".vcf") + tmpFile.deleteOnExit() + val args = Array("-I", unveppedPath, "-s", unveppedPath, "-o", tmpFile.getAbsolutePath, "-f", "CSQ:NEW_CSQ") an[IllegalArgumentException] should be thrownBy main(args) val thrown = the[IllegalArgumentException] thrownBy main(args) thrown.getMessage should equal("Field 'CSQ' does not exist in secondary vcf") } @Test def testMinMethodException = { - val tmpPath = File.createTempFile("VcfWithVcf_", ".vcf").getAbsolutePath - val args = Array("-I", unveppedPath, "-s", veppedPath, "-o", tmpPath, "-f", "CSQ:CSQ:min") + val tmpFile = File.createTempFile("VcfWithVcf_", ".vcf") + tmpFile.deleteOnExit() + val args = Array("-I", unveppedPath, "-s", veppedPath, "-o", tmpFile.getAbsolutePath, "-f", "CSQ:CSQ:min") an[IllegalArgumentException] should be thrownBy main(args) val thrown = the[IllegalArgumentException] thrownBy main(args) thrown.getMessage should equal("Type of field CSQ is not numeric") } @Test def testMaxMethodException = { - val tmpPath = File.createTempFile("VcfWithVcf_", ".vcf").getAbsolutePath - val args = Array("-I", unveppedPath, "-s", veppedPath, "-o", tmpPath, "-f", "CSQ:CSQ:max") + val tmpFile = File.createTempFile("VcfWithVcf_", ".vcf") + tmpFile.deleteOnExit() + val args = Array("-I", unveppedPath, "-s", veppedPath, "-o", tmpFile.getAbsolutePath, "-f", "CSQ:CSQ:max") an[IllegalArgumentException] should be thrownBy main(args) val thrown = the[IllegalArgumentException] thrownBy main(args) thrown.getMessage should equal("Type of field CSQ is not numeric") diff --git a/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/VepNormalizerTest.scala b/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/VepNormalizerTest.scala index 5a12e9b579296b58a2764fdaa0b5b916717e384f..53aeddfaf1d6ba87f9e89ac29b31edff8fc5e01b 100644 --- a/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/VepNormalizerTest.scala +++ b/public/biopet-tools/src/test/scala/nl/lumc/sasc/biopet/tools/VepNormalizerTest.scala @@ -47,38 +47,44 @@ class VepNormalizerTest extends TestNGSuite with MockitoSugar with Matchers { val rand = new Random() @Test def testGzOutputExplode(): Unit = { - val tmpPath = File.createTempFile("VepNormalizer_", ".vcf.gz").getAbsolutePath - val arguments: Array[String] = Array("-I", vepped_path, "-O", tmpPath, "-m", "explode") + val tmpFile = File.createTempFile("VepNormalizer_", ".vcf.gz") + tmpFile.deleteOnExit() + val arguments: Array[String] = Array("-I", vepped_path, "-O", tmpFile.getAbsolutePath, "-m", "explode") main(arguments) } @Test def testVcfOutputExplode(): Unit = { - val tmpPath = File.createTempFile("VepNormalizer_", ".vcf").getAbsolutePath - val arguments: Array[String] = Array("-I", vepped_path, "-O", tmpPath, "-m", "explode") + val tmpFile = File.createTempFile("VepNormalizer_", ".vcf") + tmpFile.deleteOnExit() + val arguments: Array[String] = Array("-I", vepped_path, "-O", tmpFile.getAbsolutePath, "-m", "explode") main(arguments) } @Test def testBcfOutputExplode(): Unit = { - val tmp_path = File.createTempFile("VepNormalizer_", ".bcf").getAbsolutePath - val arguments: Array[String] = Array("-I", vepped_path, "-O", tmp_path, "-m", "explode") + val tmpFile = File.createTempFile("VepNormalizer_", ".bcf") + tmpFile.deleteOnExit() + val arguments: Array[String] = Array("-I", vepped_path, "-O", tmpFile.getAbsolutePath, "-m", "explode") main(arguments) } @Test def testGzOutputStandard(): Unit = { - val tmp_path = File.createTempFile("VepNormalizer_", ".vcf.gz").getAbsolutePath - val arguments: Array[String] = Array("-I", vepped_path, "-O", tmp_path, "-m", "standard") + val tmpFile = File.createTempFile("VepNormalizer_", ".vcf.gz") + tmpFile.deleteOnExit() + val arguments: Array[String] = Array("-I", vepped_path, "-O", tmpFile.getAbsolutePath, "-m", "standard") main(arguments) } @Test def testVcfOutputStandard(): Unit = { - val tmp_path = File.createTempFile("VepNormalizer_", ".vcf").getAbsolutePath - val arguments: Array[String] = Array("-I", vepped_path, "-O", tmp_path, "-m", "standard") + val tmpFile = File.createTempFile("VepNormalizer_", ".vcf") + tmpFile.deleteOnExit() + val arguments: Array[String] = Array("-I", vepped_path, "-O", tmpFile.getAbsolutePath, "-m", "standard") main(arguments) } @Test def testBcfOutputStandard(): Unit = { - val tmp_path = File.createTempFile("VepNormalizer_", ".bcf").getAbsolutePath - val arguments: Array[String] = Array("-I", vepped_path, "-O", tmp_path, "-m", "standard") + val tmpFile = File.createTempFile("VepNormalizer_", ".bcf") + tmpFile.deleteOnExit() + val arguments: Array[String] = Array("-I", vepped_path, "-O", tmpFile.getAbsolutePath, "-m", "standard") main(arguments) } diff --git a/public/biopet-utils/src/main/scala/nl/lumc/sasc/biopet/utils/rscript/LinePlot.scala b/public/biopet-utils/src/main/scala/nl/lumc/sasc/biopet/utils/rscript/LinePlot.scala index fb0e2f0a0706a56c6063c2a2fa2dc199bfee573c..1954609198b33dcaa380eaafa3534f463ef43d4c 100644 --- a/public/biopet-utils/src/main/scala/nl/lumc/sasc/biopet/utils/rscript/LinePlot.scala +++ b/public/biopet-utils/src/main/scala/nl/lumc/sasc/biopet/utils/rscript/LinePlot.scala @@ -48,5 +48,5 @@ class LinePlot(val root: Configurable) extends Rscript { ylabel.map(Seq("--ylabel", _)).getOrElse(Seq()) ++ llabel.map(Seq("--llabel", _)).getOrElse(Seq()) ++ title.map(Seq("--title", _)).getOrElse(Seq()) ++ - (if (removeZero) Seq("--removeZero") else Seq()) + (if (removeZero) Seq("--removeZero", "true") else Seq()) } diff --git a/public/biopet-utils/src/main/scala/nl/lumc/sasc/biopet/utils/rscript/Rscript.scala b/public/biopet-utils/src/main/scala/nl/lumc/sasc/biopet/utils/rscript/Rscript.scala index 685108d0cb7f31cebfcc4b998017ae0a4c91726f..3dfac894eeb591a84a31b3fd5bcfa88c34619192 100644 --- a/public/biopet-utils/src/main/scala/nl/lumc/sasc/biopet/utils/rscript/Rscript.scala +++ b/public/biopet-utils/src/main/scala/nl/lumc/sasc/biopet/utils/rscript/Rscript.scala @@ -28,7 +28,11 @@ trait Rscript extends Configurable { } else { val rScript: File = dir match { case Some(dir) => new File(dir, script.getName) - case _ => File.createTempFile(script.getName, ".R") + case _ => { + val file = File.createTempFile(script.getName, ".R") + file.deleteOnExit() + file + } } if (!rScript.getParentFile.exists) rScript.getParentFile.mkdirs diff --git a/public/biopet-utils/src/test/scala/nl/lumc/sasc/biopet/utils/ConfigUtilsTest.scala b/public/biopet-utils/src/test/scala/nl/lumc/sasc/biopet/utils/ConfigUtilsTest.scala index ad8ff00ee2e8a09026168efbf99f5926b4583c50..6bac74cdf9f3bf6148a78b05271593242d9b2d07 100644 --- a/public/biopet-utils/src/test/scala/nl/lumc/sasc/biopet/utils/ConfigUtilsTest.scala +++ b/public/biopet-utils/src/test/scala/nl/lumc/sasc/biopet/utils/ConfigUtilsTest.scala @@ -228,6 +228,7 @@ class ConfigUtilsTest extends TestNGSuite with Matchers { object ConfigUtilsTest { def writeTemp(text: String, extension: String): File = { val file = File.createTempFile("TestConfigUtils.", extension) + file.deleteOnExit() val w = new PrintWriter(file) w.write(text) w.close() diff --git a/public/biopet-utils/src/test/scala/nl/lumc/sasc/biopet/utils/intervals/BedRecordListTest.scala b/public/biopet-utils/src/test/scala/nl/lumc/sasc/biopet/utils/intervals/BedRecordListTest.scala index b748006c2800d5e86aad9e5f918a3d4bf5894c2c..0490b28db7dbf199a9b01c1b48c6783f11720f7d 100644 --- a/public/biopet-utils/src/test/scala/nl/lumc/sasc/biopet/utils/intervals/BedRecordListTest.scala +++ b/public/biopet-utils/src/test/scala/nl/lumc/sasc/biopet/utils/intervals/BedRecordListTest.scala @@ -39,6 +39,7 @@ class BedRecordListTest extends TestNGSuite with Matchers { records.header shouldBe Nil val tempFile = File.createTempFile("region", ".bed") + tempFile.deleteOnExit() records.writeToFile(tempFile) BedRecordList.fromFile(tempFile) shouldBe records tempFile.delete() @@ -50,6 +51,7 @@ class BedRecordListTest extends TestNGSuite with Matchers { records.header shouldBe BedRecordListTest.ucscHeader.split("\n").toList val tempFile = File.createTempFile("region", ".bed") + tempFile.deleteOnExit() records.writeToFile(tempFile) BedRecordList.fromFile(tempFile) shouldBe records tempFile.delete() @@ -129,13 +131,6 @@ class BedRecordListTest extends TestNGSuite with Matchers { list.scatter(100).allRecords.size shouldBe 15 list.scatter(100).length shouldBe 1500 } - - @AfterClass - def end: Unit = { - BedRecordListTest.bedFile.delete() - BedRecordListTest.corruptBedFile.delete() - BedRecordListTest.bedFileUcscHeader.delete() - } } object BedRecordListTest { @@ -149,6 +144,9 @@ object BedRecordListTest { |chr22 2000 6000 cloneB 900 - 2000 6000 0 2 433,399 0,3601""".stripMargin val bedFile = File.createTempFile("regions", ".bed") + bedFile.deleteOnExit() val corruptBedFile = File.createTempFile("regions", ".bed") + corruptBedFile.deleteOnExit() val bedFileUcscHeader = File.createTempFile("regions", ".bed") + bedFileUcscHeader.deleteOnExit() } \ No newline at end of file diff --git a/public/carp/src/main/scala/nl/lumc/sasc/biopet/pipelines/carp/Carp.scala b/public/carp/src/main/scala/nl/lumc/sasc/biopet/pipelines/carp/Carp.scala index fcb9aa3e6c5572858609d7c34d6d7a220c739f5e..f8b4dc6db0ff771d046ffe320a24a7c0d294b832 100644 --- a/public/carp/src/main/scala/nl/lumc/sasc/biopet/pipelines/carp/Carp.scala +++ b/public/carp/src/main/scala/nl/lumc/sasc/biopet/pipelines/carp/Carp.scala @@ -78,6 +78,10 @@ class Carp(val root: Configurable) extends QScript with MultiSampleQScript with if (config.contains("R1")) { mapping.input_R1 = config("R1") if (config.contains("R2")) mapping.input_R2 = config("R2") + + inputFiles :+= new InputFile(mapping.input_R1, config("R1_md5")) + mapping.input_R2.foreach(inputFiles :+= new InputFile(_, config("R2_md5"))) + mapping.init() mapping.biopetScript() addAll(mapping.functions) @@ -107,7 +111,7 @@ class Carp(val root: Configurable) extends QScript with MultiSampleQScript with add(merge) } - val bamMetrics = BamMetrics(qscript, bamFile, new File(sampleDir, "metrics")) + val bamMetrics = BamMetrics(qscript, bamFile, new File(sampleDir, "metrics"), sampleId = Some(sampleId)) addAll(bamMetrics.functions) addSummaryQScript(bamMetrics) addAll(Bam2Wig(qscript, bamFile).functions) diff --git a/public/carp/src/main/scala/nl/lumc/sasc/biopet/pipelines/carp/CarpReport.scala b/public/carp/src/main/scala/nl/lumc/sasc/biopet/pipelines/carp/CarpReport.scala index c5f2256b0c4cf7c4815c305bab8907573449c5a4..59a07dca040ff07f81438b59697953563b97d972 100644 --- a/public/carp/src/main/scala/nl/lumc/sasc/biopet/pipelines/carp/CarpReport.scala +++ b/public/carp/src/main/scala/nl/lumc/sasc/biopet/pipelines/carp/CarpReport.scala @@ -76,7 +76,7 @@ object CarpReport extends MultisampleReportBuilder { ), List( "Alignment" -> ReportSection("/nl/lumc/sasc/biopet/pipelines/bammetrics/alignmentSummary.ssp", if (summary.libraries(sampleId).size > 1) Map("showPlot" -> true) else Map()), - "Preprocessing" -> ReportSection("/nl/lumc/sasc/biopet/pipelines/bammetrics/alignmentSummary.ssp", Map("sampleLevel" -> true)), + "Merged" -> ReportSection("/nl/lumc/sasc/biopet/pipelines/bammetrics/alignmentSummary.ssp", Map("sampleLevel" -> true)), "QC reads" -> ReportSection("/nl/lumc/sasc/biopet/pipelines/flexiprep/flexiprepReadSummary.ssp"), "QC bases" -> ReportSection("/nl/lumc/sasc/biopet/pipelines/flexiprep/flexiprepBaseSummary.ssp") ), args) diff --git a/public/carp/src/test/scala/nl/lumc/sasc/biopet/pipelines/carp/CarpTest.scala b/public/carp/src/test/scala/nl/lumc/sasc/biopet/pipelines/carp/CarpTest.scala index c361908fa1110ef7133639e91912acab5cce0da9..407b6fb415a4dbce63a80228241b7a81df29cf36 100644 --- a/public/carp/src/test/scala/nl/lumc/sasc/biopet/pipelines/carp/CarpTest.scala +++ b/public/carp/src/test/scala/nl/lumc/sasc/biopet/pipelines/carp/CarpTest.scala @@ -97,6 +97,12 @@ class CarpTest extends TestNGSuite with Matchers { object CarpTest { val outputDir = Files.createTempDir() + new File(outputDir, "input").mkdirs() + def inputTouch(name: String): String = { + val file = new File(outputDir, "input" + File.separator + name) + Files.touch(file) + file.getAbsolutePath + } private def copyFile(name: String): Unit = { val is = getClass.getResourceAsStream("/" + name) @@ -127,8 +133,8 @@ object CarpTest { val sample1 = Map( "samples" -> Map("sample1" -> Map("libraries" -> Map( "lib1" -> Map( - "R1" -> "1_1_R1.fq", - "R2" -> "1_1_R2.fq" + "R1" -> inputTouch("1_1_R1.fq"), + "R2" -> inputTouch("1_1_R2.fq") ) ) ))) @@ -136,8 +142,8 @@ object CarpTest { val sample2 = Map( "samples" -> Map("sample2" -> Map("libraries" -> Map( "lib1" -> Map( - "R1" -> "2_1_R1.fq", - "R2" -> "2_1_R2.fq" + "R1" -> inputTouch("2_1_R1.fq"), + "R2" -> inputTouch("2_1_R2.fq") ) ) ))) @@ -145,12 +151,12 @@ object CarpTest { val sample3 = Map( "samples" -> Map("sample3" -> Map("libraries" -> Map( "lib1" -> Map( - "R1" -> "3_1_R1.fq", - "R2" -> "3_1_R2.fq" + "R1" -> inputTouch("3_1_R1.fq"), + "R2" -> inputTouch("3_1_R2.fq") ), "lib2" -> Map( - "R1" -> "3_2_R1.fq", - "R2" -> "3_2_R2.fq" + "R1" -> inputTouch("3_2_R1.fq"), + "R2" -> inputTouch("3_2_R2.fq") ) ) ))) @@ -158,8 +164,8 @@ object CarpTest { val threatment1 = Map( "samples" -> Map("threatment" -> Map("control" -> "control1", "libraries" -> Map( "lib1" -> Map( - "R1" -> "threatment_1_R1.fq", - "R2" -> "threatment_1_R2.fq" + "R1" -> inputTouch("threatment_1_R1.fq"), + "R2" -> inputTouch("threatment_1_R2.fq") ) ) ))) @@ -167,8 +173,8 @@ object CarpTest { val control1 = Map( "samples" -> Map("control1" -> Map("libraries" -> Map( "lib1" -> Map( - "R1" -> "control_1_R1.fq", - "R2" -> "control_1_R2.fq" + "R1" -> inputTouch("control_1_R1.fq"), + "R2" -> inputTouch("control_1_R2.fq") ) ) ))) diff --git a/public/flexiprep/src/main/resources/nl/lumc/sasc/biopet/pipelines/flexiprep/flexiprepBaseSummary.ssp b/public/flexiprep/src/main/resources/nl/lumc/sasc/biopet/pipelines/flexiprep/flexiprepBaseSummary.ssp index c327a7cef9b16719f1ec4be35ee556005c9bee2e..b2f0057b3dc437c496c4a161af515c11f9a3d80e 100644 --- a/public/flexiprep/src/main/resources/nl/lumc/sasc/biopet/pipelines/flexiprep/flexiprepBaseSummary.ssp +++ b/public/flexiprep/src/main/resources/nl/lumc/sasc/biopet/pipelines/flexiprep/flexiprepBaseSummary.ssp @@ -129,7 +129,7 @@ #if (read == "R2") </tr><tr> #end #{ val beforeTotal = summary.getLibraryValue(sample, libId, "flexiprep", "stats", "seqstat_" + read, "bases", "num_total").getOrElse(0).toString.toLong - val afterTotal = summary.getLibraryValue(sample, libId, "flexiprep", "stats", "seqstat_" + read + "_after", "bases", "num_total").getOrElse(0).toString.toLong + val afterTotal = summary.getLibraryValue(sample, libId, "flexiprep", "stats", "seqstat_" + read + "_qc", "bases", "num_total").getOrElse(0).toString.toLong }# <td>${read}</td> <td>${beforeTotal}</td> diff --git a/public/flexiprep/src/main/resources/nl/lumc/sasc/biopet/pipelines/flexiprep/flexiprepReadSummary.ssp b/public/flexiprep/src/main/resources/nl/lumc/sasc/biopet/pipelines/flexiprep/flexiprepReadSummary.ssp index 17065bb987d62f147e76a3c096f3db0847bcd265..4a0a60659f5276f7230fef7fabd4cc12f23ae4a4 100644 --- a/public/flexiprep/src/main/resources/nl/lumc/sasc/biopet/pipelines/flexiprep/flexiprepReadSummary.ssp +++ b/public/flexiprep/src/main/resources/nl/lumc/sasc/biopet/pipelines/flexiprep/flexiprepReadSummary.ssp @@ -133,7 +133,7 @@ #if (read == "R2") </tr><tr> #end #{ val beforeTotal = summary.getLibraryValue(sample, libId, "flexiprep", "stats", "seqstat_" + read, "reads", "num_total") - val afterTotal = summary.getLibraryValue(sample, libId, "flexiprep", "stats", "seqstat_" + read + "_after", "reads", "num_total") + val afterTotal = summary.getLibraryValue(sample, libId, "flexiprep", "stats", "seqstat_" + read + "_qc", "reads", "num_total") val clippingDiscardedToShort = summary.getLibraryValue(sample, libId, "flexiprep", "stats", "clipping_" + read, "num_reads_discarded_too_short").getOrElse(0).toString.toLong val clippingDiscardedToLong = summary.getLibraryValue(sample, libId, "flexiprep", "stats", "clipping_" + read, "num_reads_discarded_too_long").getOrElse(0).toString.toLong val trimmingDiscarded = summary.getLibraryValue(sample, libId, "flexiprep", "stats", "trimming", "num_reads_discarded_" + read).getOrElse(0).toString.toLong diff --git a/public/flexiprep/src/main/scala/nl/lumc/sasc/biopet/pipelines/flexiprep/Flexiprep.scala b/public/flexiprep/src/main/scala/nl/lumc/sasc/biopet/pipelines/flexiprep/Flexiprep.scala index 5bd686c7e20a6ba37f407f44a0a9c83144aabb8d..771c562cf6f38855280aaa7de6d512eaef6fd973 100644 --- a/public/flexiprep/src/main/scala/nl/lumc/sasc/biopet/pipelines/flexiprep/Flexiprep.scala +++ b/public/flexiprep/src/main/scala/nl/lumc/sasc/biopet/pipelines/flexiprep/Flexiprep.scala @@ -85,6 +85,9 @@ class Flexiprep(val root: Configurable) extends QScript with SummaryQScript with paired = input_R2.isDefined + inputFiles :+= new InputFile(input_R1) + input_R2.foreach(inputFiles :+= new InputFile(_)) + if (input_R1.endsWith(".gz")) R1_name = input_R1.getName.substring(0, input_R1.getName.lastIndexOf(".gz")) else if (input_R1.endsWith(".gzip")) R1_name = input_R1.getName.substring(0, input_R1.getName.lastIndexOf(".gzip")) else R1_name = input_R1.getName @@ -214,6 +217,7 @@ class Flexiprep(val root: Configurable) extends QScript with SummaryQScript with fqSync.outputFastq1 = swapExt(outDir, R1, R1_ext, ".sync" + R1_ext) fqSync.outputFastq2 = swapExt(outDir, R2.get, R2_ext, ".sync" + R2_ext) fqSync.outputStats = swapExt(outDir, R1, R1_ext, ".sync.stats") + fqSync.isIntermediate = true fqSync.deps :::= deps add(fqSync) addSummarizable(fqSync, "fastq_sync") diff --git a/public/flexiprep/src/main/scala/nl/lumc/sasc/biopet/pipelines/flexiprep/FlexiprepReport.scala b/public/flexiprep/src/main/scala/nl/lumc/sasc/biopet/pipelines/flexiprep/FlexiprepReport.scala index c4988cd1e1b131a98d2d4dc52086fef58085e1bc..075077872a314c2a510478ff8a151a4ed7f5ba9c 100644 --- a/public/flexiprep/src/main/scala/nl/lumc/sasc/biopet/pipelines/flexiprep/FlexiprepReport.scala +++ b/public/flexiprep/src/main/scala/nl/lumc/sasc/biopet/pipelines/flexiprep/FlexiprepReport.scala @@ -95,7 +95,7 @@ object FlexiprepReport extends ReportBuilder { def getLine(summary: Summary, sample: String, lib: String): String = { val beforeTotal = new SummaryValue(List("flexiprep", "stats", "seqstat_" + read, "reads", "num_total"), summary, Some(sample), Some(lib)).value.getOrElse(0).toString.toLong - val afterTotal = new SummaryValue(List("flexiprep", "stats", "seqstat_" + read + "_after", "reads", "num_total"), + val afterTotal = new SummaryValue(List("flexiprep", "stats", "seqstat_" + read + "_qc", "reads", "num_total"), summary, Some(sample), Some(lib)).value.getOrElse(0).toString.toLong val clippingDiscardedToShort = new SummaryValue(List("flexiprep", "stats", "clipping_" + read, "num_reads_discarded_too_short"), summary, Some(sample), Some(lib)).value.getOrElse(0).toString.toLong @@ -152,7 +152,7 @@ object FlexiprepReport extends ReportBuilder { def getLine(summary: Summary, sample: String, lib: String): String = { val beforeTotal = new SummaryValue(List("flexiprep", "stats", "seqstat_" + read, "bases", "num_total"), summary, Some(sample), Some(lib)).value.getOrElse(0).toString.toLong - val afterTotal = new SummaryValue(List("flexiprep", "stats", "seqstat_" + read + "_after", "bases", "num_total"), + val afterTotal = new SummaryValue(List("flexiprep", "stats", "seqstat_" + read + "_qc", "bases", "num_total"), summary, Some(sample), Some(lib)).value.getOrElse(0).toString.toLong val sb = new StringBuffer() diff --git a/public/flexiprep/src/test/scala/nl/lumc/sasc/biopet/pipelines/flexiprep/FlexiprepTest.scala b/public/flexiprep/src/test/scala/nl/lumc/sasc/biopet/pipelines/flexiprep/FlexiprepTest.scala index 2cb3f0e7b36175d9bf7633d7d639e6b03612976f..7b6716024963be03f256eb31bfad2bf5bcdf769e 100644 --- a/public/flexiprep/src/test/scala/nl/lumc/sasc/biopet/pipelines/flexiprep/FlexiprepTest.scala +++ b/public/flexiprep/src/test/scala/nl/lumc/sasc/biopet/pipelines/flexiprep/FlexiprepTest.scala @@ -67,8 +67,8 @@ class FlexiprepTest extends TestNGSuite with Matchers { ), Map(FlexiprepTest.executables.toSeq: _*)) val flexiprep: Flexiprep = initPipeline(map) - flexiprep.input_R1 = new File(flexiprep.outputDir, "bla_R1.fq" + (if (zipped) ".gz" else "")) - if (paired) flexiprep.input_R2 = Some(new File(flexiprep.outputDir, "bla_R2.fq" + (if (zipped) ".gz" else ""))) + flexiprep.input_R1 = (if (zipped) FlexiprepTest.r1Zipped else FlexiprepTest.r1) + if (paired) flexiprep.input_R2 = Some((if (zipped) FlexiprepTest.r2Zipped else FlexiprepTest.r2)) flexiprep.sampleId = Some("1") flexiprep.libId = Some("1") flexiprep.script() @@ -95,6 +95,16 @@ class FlexiprepTest extends TestNGSuite with Matchers { object FlexiprepTest { val outputDir = Files.createTempDir() + new File(outputDir, "input").mkdirs() + + val r1 = new File(outputDir, "input" + File.separator + "R1.fq") + Files.touch(r1) + val r2 = new File(outputDir, "input" + File.separator + "R2.fq") + Files.touch(r2) + val r1Zipped = new File(outputDir, "input" + File.separator + "R1.fq.gz") + Files.touch(r1Zipped) + val r2Zipped = new File(outputDir, "input" + File.separator + "R2.fq.gz") + Files.touch(r2Zipped) val executables = Map( "seqstat" -> Map("exe" -> "test"), diff --git a/public/gentrap/src/main/scala/nl/lumc/sasc/biopet/pipelines/gentrap/Gentrap.scala b/public/gentrap/src/main/scala/nl/lumc/sasc/biopet/pipelines/gentrap/Gentrap.scala index c500757088d3c313190cb4a9b0eca65bfc48f9a4..d033594c6e42663427108baf12038b7eed6fb3f6 100644 --- a/public/gentrap/src/main/scala/nl/lumc/sasc/biopet/pipelines/gentrap/Gentrap.scala +++ b/public/gentrap/src/main/scala/nl/lumc/sasc/biopet/pipelines/gentrap/Gentrap.scala @@ -844,6 +844,8 @@ class Gentrap(val root: Configurable) extends QScript def addJobs(): Unit = { // create per-library alignment file addAll(mappingJob.functions) + // Input file checking + inputFiles :::= mappingJob.inputFiles // add bigwig track addAll(bam2wigModule.functions) qscript.addSummaryQScript(mappingJob) diff --git a/public/gentrap/src/test/scala/nl/lumc/sasc/biopet/pipelines/gentrap/GentrapTest.scala b/public/gentrap/src/test/scala/nl/lumc/sasc/biopet/pipelines/gentrap/GentrapTest.scala index 140db66fd62dd850365b27137cc3df0891bd38a7..2b2ddaf259e8fa5ad382ef1aca1337826ecf0ad8 100644 --- a/public/gentrap/src/test/scala/nl/lumc/sasc/biopet/pipelines/gentrap/GentrapTest.scala +++ b/public/gentrap/src/test/scala/nl/lumc/sasc/biopet/pipelines/gentrap/GentrapTest.scala @@ -43,8 +43,8 @@ class GentrapTest extends TestNGSuite with Matchers { /** Convenience method for making library config */ private def makeLibConfig(idx: Int, paired: Boolean = true) = { - val files = Map("R1" -> "test_R1.fq") - if (paired) (s"lib_$idx", files ++ Map("R2" -> "test_R2.fq")) + val files = Map("R1" -> GentrapTest.inputTouch("test_R1.fq")) + if (paired) (s"lib_$idx", files ++ Map("R2" -> GentrapTest.inputTouch("test_R2.fq"))) else (s"lib_$idx", files) } @@ -179,6 +179,12 @@ class GentrapTest extends TestNGSuite with Matchers { object GentrapTest { val outputDir = Files.createTempDir() + new File(outputDir, "input").mkdirs() + def inputTouch(name: String): String = { + val file = new File(outputDir, "input" + File.separator + name) + Files.touch(file) + file.getAbsolutePath + } private def copyFile(name: String): Unit = { val is = getClass.getResourceAsStream("/" + name) diff --git a/public/mapping/src/main/scala/nl/lumc/sasc/biopet/pipelines/mapping/Mapping.scala b/public/mapping/src/main/scala/nl/lumc/sasc/biopet/pipelines/mapping/Mapping.scala index 24ec2a2bb7a7aded19350951cf8aa67308d4418e..39a07e955b469678fc3feb2c4870ad6a5fa72aa9 100644 --- a/public/mapping/src/main/scala/nl/lumc/sasc/biopet/pipelines/mapping/Mapping.scala +++ b/public/mapping/src/main/scala/nl/lumc/sasc/biopet/pipelines/mapping/Mapping.scala @@ -138,6 +138,9 @@ class Mapping(val root: Configurable) extends QScript with SummaryQScript with S require(sampleId.isDefined, "Missing sample ID on mapping module") require(libId.isDefined, "Missing library ID on mapping module") + inputFiles :+= new InputFile(input_R1) + input_R2.foreach(inputFiles :+= new InputFile(_)) + paired = input_R2.isDefined if (readgroupId == null) readgroupId = sampleId.get + "-" + libId.get diff --git a/public/mapping/src/test/scala/nl/lumc/sasc/biopet/pipelines/mapping/MappingTest.scala b/public/mapping/src/test/scala/nl/lumc/sasc/biopet/pipelines/mapping/MappingTest.scala index 2270f6ef8752298662f1b513414e657c529278c0..7588e4a84502d5bef276de3fd0d64237b0e63938 100644 --- a/public/mapping/src/test/scala/nl/lumc/sasc/biopet/pipelines/mapping/MappingTest.scala +++ b/public/mapping/src/test/scala/nl/lumc/sasc/biopet/pipelines/mapping/MappingTest.scala @@ -79,11 +79,11 @@ class MappingTest extends TestNGSuite with Matchers { val mapping: Mapping = initPipeline(map) if (zipped) { - mapping.input_R1 = new File(mapping.outputDir, "bla_R1.fq.gz") - if (paired) mapping.input_R2 = Some(new File(mapping.outputDir, "bla_R2.fq.gz")) + mapping.input_R1 = MappingTest.r1Zipped + if (paired) mapping.input_R2 = Some(MappingTest.r2Zipped) } else { - mapping.input_R1 = new File(mapping.outputDir, "bla_R1.fq") - if (paired) mapping.input_R2 = Some(new File(mapping.outputDir, "bla_R2.fq")) + mapping.input_R1 = MappingTest.r1 + if (paired) mapping.input_R2 = Some(MappingTest.r2) } mapping.sampleId = Some("1") mapping.libId = Some("1") @@ -131,6 +131,16 @@ class MappingTest extends TestNGSuite with Matchers { object MappingTest { val outputDir = Files.createTempDir() + new File(outputDir, "input").mkdirs() + + val r1 = new File(outputDir, "input" + File.separator + "R1.fq") + Files.touch(r1) + val r2 = new File(outputDir, "input" + File.separator + "R2.fq") + Files.touch(r2) + val r1Zipped = new File(outputDir, "input" + File.separator + "R1.fq.gz") + Files.touch(r1Zipped) + val r2Zipped = new File(outputDir, "input" + File.separator + "R2.fq.gz") + Files.touch(r2Zipped) private def copyFile(name: String): Unit = { val is = getClass.getResourceAsStream("/" + name) diff --git a/public/sage/src/main/scala/nl/lumc/sasc/biopet/pipelines/sage/Sage.scala b/public/sage/src/main/scala/nl/lumc/sasc/biopet/pipelines/sage/Sage.scala index 4aaee19c295de32dbc306a94cf6fecf63d1ba754..2ee8c3b1930aff553234f6f3860d7c13e0818783 100644 --- a/public/sage/src/main/scala/nl/lumc/sasc/biopet/pipelines/sage/Sage.scala +++ b/public/sage/src/main/scala/nl/lumc/sasc/biopet/pipelines/sage/Sage.scala @@ -88,6 +88,8 @@ class Sage(val root: Configurable) extends QScript with MultiSampleQScript { mapping.sampleId = Some(sampleId) protected def addJobs(): Unit = { + inputFiles :+= new InputFile(inputFastq, config("R1_md5")) + flexiprep.outputDir = new File(libDir, "flexiprep/") flexiprep.input_R1 = inputFastq flexiprep.init() diff --git a/public/shiva/src/main/scala/nl/lumc/sasc/biopet/pipelines/shiva/ShivaTrait.scala b/public/shiva/src/main/scala/nl/lumc/sasc/biopet/pipelines/shiva/ShivaTrait.scala index 3f65bf2a20864e2017f512981daa0d37aca52772..dafb2e1ccc5a72807aa37cc6858711afbfe78c23 100644 --- a/public/shiva/src/main/scala/nl/lumc/sasc/biopet/pipelines/shiva/ShivaTrait.scala +++ b/public/shiva/src/main/scala/nl/lumc/sasc/biopet/pipelines/shiva/ShivaTrait.scala @@ -136,51 +136,56 @@ trait ShivaTrait extends MultiSampleQScript with SummaryQScript with Reference { case (true, _) => mapping.foreach(mapping => { mapping.input_R1 = config("R1") mapping.input_R2 = config("R2") + inputFiles :+= new InputFile(mapping.input_R1, config("R1_md5")) + mapping.input_R2.foreach(inputFiles :+= new InputFile(_, config("R2_md5"))) }) - case (false, true) => config("bam_to_fastq", default = false).asBoolean match { - case true => - val samToFastq = SamToFastq(qscript, config("bam"), - new File(libDir, sampleId + "-" + libId + ".R1.fastq"), - new File(libDir, sampleId + "-" + libId + ".R2.fastq")) - samToFastq.isIntermediate = true - qscript.add(samToFastq) - mapping.foreach(mapping => { - mapping.input_R1 = samToFastq.fastqR1 - mapping.input_R2 = Some(samToFastq.fastqR2) - }) - case false => - val inputSam = SamReaderFactory.makeDefault.open(config("bam")) - val readGroups = inputSam.getFileHeader.getReadGroups - - val readGroupOke = readGroups.forall(readGroup => { - if (readGroup.getSample != sampleId) logger.warn("Sample ID readgroup in bam file is not the same") - if (readGroup.getLibrary != libId) logger.warn("Library ID readgroup in bam file is not the same") - readGroup.getSample == sampleId && readGroup.getLibrary == libId - }) - inputSam.close() - - if (!readGroupOke) { - if (config("correct_readgroups", default = false).asBoolean) { - logger.info("Correcting readgroups, file:" + config("bam")) - val aorrg = AddOrReplaceReadGroups(qscript, config("bam"), bamFile.get) - aorrg.RGID = sampleId + "-" + libId - aorrg.RGLB = libId - aorrg.RGSM = sampleId - aorrg.isIntermediate = true - qscript.add(aorrg) - } else throw new IllegalStateException("Sample readgroup and/or library of input bamfile is not correct, file: " + bamFile + - "\nPlease note that it is possible to set 'correct_readgroups' to true in the config to automatic fix this") - } else { - val oldBamFile: File = config("bam") - val oldIndex: File = new File(oldBamFile.getAbsolutePath.stripSuffix(".bam") + ".bai") - val newIndex: File = new File(libDir, oldBamFile.getName.stripSuffix(".bam") + ".bai") - val baiLn = Ln(qscript, oldIndex, newIndex) - add(baiLn) - - val bamLn = Ln(qscript, oldBamFile, bamFile.get) - bamLn.deps :+= baiLn.output - add(bamLn) - } + case (false, true) => { + inputFiles :+= new InputFile(config("bam"), config("bam_md5")) + config("bam_to_fastq", default = false).asBoolean match { + case true => + val samToFastq = SamToFastq(qscript, config("bam"), + new File(libDir, sampleId + "-" + libId + ".R1.fastq"), + new File(libDir, sampleId + "-" + libId + ".R2.fastq")) + samToFastq.isIntermediate = true + qscript.add(samToFastq) + mapping.foreach(mapping => { + mapping.input_R1 = samToFastq.fastqR1 + mapping.input_R2 = Some(samToFastq.fastqR2) + }) + case false => + val inputSam = SamReaderFactory.makeDefault.open(config("bam")) + val readGroups = inputSam.getFileHeader.getReadGroups + + val readGroupOke = readGroups.forall(readGroup => { + if (readGroup.getSample != sampleId) logger.warn("Sample ID readgroup in bam file is not the same") + if (readGroup.getLibrary != libId) logger.warn("Library ID readgroup in bam file is not the same") + readGroup.getSample == sampleId && readGroup.getLibrary == libId + }) + inputSam.close() + + if (!readGroupOke) { + if (config("correct_readgroups", default = false).asBoolean) { + logger.info("Correcting readgroups, file:" + config("bam")) + val aorrg = AddOrReplaceReadGroups(qscript, config("bam"), bamFile.get) + aorrg.RGID = sampleId + "-" + libId + aorrg.RGLB = libId + aorrg.RGSM = sampleId + aorrg.isIntermediate = true + qscript.add(aorrg) + } else throw new IllegalStateException("Sample readgroup and/or library of input bamfile is not correct, file: " + bamFile + + "\nPlease note that it is possible to set 'correct_readgroups' to true in the config to automatic fix this") + } else { + val oldBamFile: File = config("bam") + val oldIndex: File = new File(oldBamFile.getAbsolutePath.stripSuffix(".bam") + ".bai") + val newIndex: File = new File(libDir, oldBamFile.getName.stripSuffix(".bam") + ".bai") + val baiLn = Ln(qscript, oldIndex, newIndex) + add(baiLn) + + val bamLn = Ln(qscript, oldBamFile, bamFile.get) + bamLn.deps :+= baiLn.output + add(bamLn) + } + } } case _ => logger.warn("Sample: " + sampleId + " Library: " + libId + ", no reads found") } @@ -294,7 +299,7 @@ trait ShivaTrait extends MultiSampleQScript with SummaryQScript with Reference { addAll(vc.functions) addSummaryQScript(vc) - if (config("annotation", default = true).asBoolean) { + if (config("annotation", default = false).asBoolean) { val toucan = new Toucan(this) toucan.outputDir = new File(outputDir, "annotation") toucan.inputVCF = vc.finalFile diff --git a/public/shiva/src/test/scala/nl/lumc/sasc/biopet/pipelines/shiva/ShivaTest.scala b/public/shiva/src/test/scala/nl/lumc/sasc/biopet/pipelines/shiva/ShivaTest.scala index 56b6bf172b2d122b2ccd70818d3f9f92161e270d..cff186c29e8776f4457ceb6787ea75efc61a8885 100644 --- a/public/shiva/src/test/scala/nl/lumc/sasc/biopet/pipelines/shiva/ShivaTest.scala +++ b/public/shiva/src/test/scala/nl/lumc/sasc/biopet/pipelines/shiva/ShivaTest.scala @@ -88,6 +88,12 @@ class ShivaTest extends TestNGSuite with Matchers { object ShivaTest { val outputDir = Files.createTempDir() + new File(outputDir, "input").mkdirs() + def inputTouch(name: String): String = { + val file = new File(outputDir, "input" + File.separator + name) + Files.touch(file) + file.getAbsolutePath + } private def copyFile(name: String): Unit = { val is = getClass.getResourceAsStream("/" + name) @@ -131,8 +137,8 @@ object ShivaTest { val sample1 = Map( "samples" -> Map("sample1" -> Map("libraries" -> Map( "lib1" -> Map( - "R1" -> "1_1_R1.fq", - "R2" -> "1_1_R2.fq" + "R1" -> inputTouch("1_1_R1.fq"), + "R2" -> inputTouch("1_1_R2.fq") ) ) ))) @@ -140,8 +146,8 @@ object ShivaTest { val sample2 = Map( "samples" -> Map("sample2" -> Map("libraries" -> Map( "lib1" -> Map( - "R1" -> "2_1_R1.fq", - "R2" -> "2_1_R2.fq" + "R1" -> inputTouch("2_1_R1.fq"), + "R2" -> inputTouch("2_1_R2.fq") ) ) ))) @@ -149,12 +155,12 @@ object ShivaTest { val sample3 = Map( "samples" -> Map("sample3" -> Map("libraries" -> Map( "lib1" -> Map( - "R1" -> "3_1_R1.fq", - "R2" -> "3_1_R2.fq" + "R1" -> inputTouch("3_1_R1.fq"), + "R2" -> inputTouch("3_1_R2.fq") ), "lib2" -> Map( - "R1" -> "3_2_R1.fq", - "R2" -> "3_2_R2.fq" + "R1" -> inputTouch("3_2_R1.fq"), + "R2" -> inputTouch("3_2_R2.fq") ) ) ))) diff --git a/public/shiva/src/test/scala/nl/lumc/sasc/biopet/pipelines/shiva/ShivaVariantcallingTest.scala b/public/shiva/src/test/scala/nl/lumc/sasc/biopet/pipelines/shiva/ShivaVariantcallingTest.scala index 0281d33f678804d7edd1620d204a0830d4f3201f..caeea0326d46e4b7673dae4a3d07f27c3cbd5f4e 100644 --- a/public/shiva/src/test/scala/nl/lumc/sasc/biopet/pipelines/shiva/ShivaVariantcallingTest.scala +++ b/public/shiva/src/test/scala/nl/lumc/sasc/biopet/pipelines/shiva/ShivaVariantcallingTest.scala @@ -61,7 +61,7 @@ class ShivaVariantcallingTest extends TestNGSuite with Matchers { val map = Map("variantcallers" -> callers.toList) val pipeline = initPipeline(map) - pipeline.inputBams = (for (n <- 1 to bams) yield new File("bam_" + n + ".bam")).toList + pipeline.inputBams = (for (n <- 1 to bams) yield ShivaVariantcallingTest.inputTouch("bam_" + n + ".bam")).toList val illegalArgumentException = pipeline.inputBams.isEmpty || (!raw && !bcftools && !freebayes) @@ -88,6 +88,12 @@ class ShivaVariantcallingTest extends TestNGSuite with Matchers { object ShivaVariantcallingTest { val outputDir = Files.createTempDir() + new File(outputDir, "input").mkdirs() + def inputTouch(name: String): File = { + val file = new File(outputDir, "input" + File.separator + name).getAbsoluteFile + Files.touch(file) + file + } private def copyFile(name: String): Unit = { val is = getClass.getResourceAsStream("/" + name) diff --git a/public/toucan/src/main/scala/nl/lumc/sasc/biopet/pipelines/toucan/Toucan.scala b/public/toucan/src/main/scala/nl/lumc/sasc/biopet/pipelines/toucan/Toucan.scala index 606853f933f6cd1263a0f44193e5ae0e615812df..7c3cc327858be60bb3d299e550c0f4244b656560 100644 --- a/public/toucan/src/main/scala/nl/lumc/sasc/biopet/pipelines/toucan/Toucan.scala +++ b/public/toucan/src/main/scala/nl/lumc/sasc/biopet/pipelines/toucan/Toucan.scala @@ -35,6 +35,7 @@ class Toucan(val root: Configurable) extends QScript with BiopetQScript with Sum var inputVCF: File = _ def init(): Unit = { + inputFiles :+= new InputFile(inputVCF) } override def defaults = ConfigUtils.mergeMaps(Map(