From 18a4466259d89cfe835ae32f20a72e8b66ad7b2a Mon Sep 17 00:00:00 2001
From: Peter van 't Hof <p.j.van_t_hof@lumc.nl>
Date: Wed, 19 Aug 2015 15:52:16 +0200
Subject: [PATCH] Added a scatter plot

---
 .../biopet/extensions/rscript/plotScatter.R   | 40 +++++++++++++
 .../extensions/rscript/ScatterPlot.scala      | 56 +++++++++++++++++++
 2 files changed, 96 insertions(+)
 create mode 100644 public/biopet-framework/src/main/resources/nl/lumc/sasc/biopet/extensions/rscript/plotScatter.R
 create mode 100644 public/biopet-framework/src/main/scala/nl/lumc/sasc/biopet/extensions/rscript/ScatterPlot.scala

diff --git a/public/biopet-framework/src/main/resources/nl/lumc/sasc/biopet/extensions/rscript/plotScatter.R b/public/biopet-framework/src/main/resources/nl/lumc/sasc/biopet/extensions/rscript/plotScatter.R
new file mode 100644
index 000000000..a1959a262
--- /dev/null
+++ b/public/biopet-framework/src/main/resources/nl/lumc/sasc/biopet/extensions/rscript/plotScatter.R
@@ -0,0 +1,40 @@
+library(reshape2)
+library(ggplot2)
+library(argparse)
+
+parser <- ArgumentParser(description='Process some integers')
+parser$add_argument('--input', dest='input', type='character', help='Input tsv file', required=TRUE)
+parser$add_argument('--output', dest='output', type='character', help='Output png file', required=TRUE)
+parser$add_argument('--width', dest='width', type='integer', default = 500)
+parser$add_argument('--height', dest='height', type='integer', default = 500)
+parser$add_argument('--xlabel', dest='xlabel', type='character')
+parser$add_argument('--ylabel', dest='ylabel', type='character', required=TRUE)
+parser$add_argument('--llabel', dest='llabel', type='character')
+parser$add_argument('--title', dest='title', type='character')
+parser$add_argument('--removeZero', dest='removeZero', type='character', default="false")
+
+arguments <- parser$parse_args()
+
+png(filename = arguments$output, width = arguments$width, height = arguments$height)
+
+DF <- read.table(arguments$input, header=TRUE)
+
+if (is.null(arguments$xlabel)) xlab <- colnames(DF)[1] else xlab <- arguments$xlabel
+
+colnames(DF)[1] <- "Rank"
+
+DF1 <- melt(DF, id.var="Rank")
+
+if (arguments$removeZero == "true") DF1 <- DF1[DF1$value > 0, ]
+if (arguments$removeZero == "true") print("Removed 0 values")
+
+ggplot(DF1, aes(x = Rank, y = value, group = variable, color = variable)) +
+  xlab(xlab) +
+  ylab(arguments$ylabel) +
+  guides(fill=guide_legend(title=arguments$llabel)) +
+  theme(axis.text.x = element_text(angle = 90, hjust = 1, size = 8)) +
+  ggtitle(arguments$title) +
+  theme_bw() +
+  geom_point()
+
+dev.off()
diff --git a/public/biopet-framework/src/main/scala/nl/lumc/sasc/biopet/extensions/rscript/ScatterPlot.scala b/public/biopet-framework/src/main/scala/nl/lumc/sasc/biopet/extensions/rscript/ScatterPlot.scala
new file mode 100644
index 000000000..e03ce0b4b
--- /dev/null
+++ b/public/biopet-framework/src/main/scala/nl/lumc/sasc/biopet/extensions/rscript/ScatterPlot.scala
@@ -0,0 +1,56 @@
+/**
+ * Biopet is built on top of GATK Queue for building bioinformatic
+ * pipelines. It is mainly intended to support LUMC SHARK cluster which is running
+ * SGE. But other types of HPC that are supported by GATK Queue (such as PBS)
+ * should also be able to execute Biopet tools and pipelines.
+ *
+ * Copyright 2014 Sequencing Analysis Support Core - Leiden University Medical Center
+ *
+ * Contact us at: sasc@lumc.nl
+ *
+ * A dual licensing mode is applied. The source code within this project that are
+ * not part of GATK Queue is freely available for non-commercial use under an AGPL
+ * license; For commercial users or users who do not want to follow the AGPL
+ * license, please contact us to obtain a separate license.
+ */
+package nl.lumc.sasc.biopet.extensions.rscript
+
+import java.io.File
+
+import nl.lumc.sasc.biopet.core.config.Configurable
+import nl.lumc.sasc.biopet.extensions.RscriptCommandLineFunction
+import org.broadinstitute.gatk.utils.commandline.{Input, Output}
+
+/**
+ * Extension for en general line plot with R
+ *
+ * Created by pjvan_thof on 4/29/15.
+ */
+class ScatterPlot(val root: Configurable) extends RscriptCommandLineFunction {
+  protected var script: File = config("script", default = "plotScatter.R")
+
+  @Input
+  var input: File = _
+
+  @Output
+  var output: File = _
+
+  var width: Option[Int] = config("width")
+  var height: Option[Int] = config("height")
+  var xlabel: Option[String] = config("xlabel")
+  var ylabel: Option[String] = config("ylabel")
+  var llabel: Option[String] = config("llabel")
+  var title: Option[String] = config("title")
+  var removeZero: Boolean = config("removeZero", default = false)
+
+  override def cmdLine: String = super.cmdLine +
+    required("--input", input) +
+    required("--output", output) +
+    optional("--width", width) +
+    optional("--height", height) +
+    optional("--xlabel", xlabel) +
+    required("--ylabel", ylabel) +
+    optional("--llabel", llabel) +
+    optional("--title", title) +
+    optional("--removeZero", removeZero)
+}
-- 
GitLab