ShivaReport.scala 7.34 KB
Newer Older
Peter van 't Hof's avatar
Peter van 't Hof committed
1
2
3
4
5
6
7
8
9
10
/**
 * Biopet is built on top of GATK Queue for building bioinformatic
 * pipelines. It is mainly intended to support LUMC SHARK cluster which is running
 * SGE. But other types of HPC that are supported by GATK Queue (such as PBS)
 * should also be able to execute Biopet tools and pipelines.
 *
 * Copyright 2014 Sequencing Analysis Support Core - Leiden University Medical Center
 *
 * Contact us at: sasc@lumc.nl
 *
 * A dual licensing mode is applied. The source code within this project is freely available for non-commercial use under an AGPL
 * license; For commercial users or users who do not want to follow the AGPL
 * license, please contact us to obtain a separate license.
 */
15
16
package nl.lumc.sasc.biopet.pipelines.shiva

Peter van 't Hof's avatar
Peter van 't Hof committed
17
import java.io.{ File, PrintWriter }
18

19
import nl.lumc.sasc.biopet.core.report._
20
import nl.lumc.sasc.biopet.pipelines.mapping.MultisampleMappingReportTrait
Peter van 't Hof's avatar
Peter van 't Hof committed
21
import nl.lumc.sasc.biopet.utils.config.Configurable
22
import nl.lumc.sasc.biopet.utils.rscript.StackedBarPlot
Peter van 't Hof's avatar
Peter van 't Hof committed
23
import nl.lumc.sasc.biopet.utils.summary.{ Summary, SummaryValue }
24
25

/**
 * Pipeline extension that runs the Shiva report as part of a pipeline.
 *
 * The actual report generation is delegated to the [[ShivaReport]] object.
 *
 * Created by pjvan_thof on 3/30/15.
 */
class ShivaReport(val root: Configurable) extends ReportBuilderExtension {

  /** Report builder used by this extension */
  def builder = ShivaReport

}

34
/** Object for report generation for Shiva pipeline */
35
object ShivaReport extends MultisampleMappingReportTrait {
36

37
  /** True only when the shiva setting "multisample_variantcalling" in the summary holds the value true */
  def variantcallingExecuted = {
    val setting = summary.getValue("shiva", "settings", "multisample_variantcalling")
    // A missing setting or any value other than true counts as "not executed"
    setting.exists(_ == true)
  }

42
43
  /** Front section of the report, rendered from the Shiva front template */
  override def frontSection = {
    val template = "/nl/lumc/sasc/biopet/pipelines/shiva/shivaFront.ssp"
    ReportSection(template)
  }

Peter van 't Hof's avatar
Peter van 't Hof committed
44
45
  /** Name of the pipeline this report belongs to */
  override def pipelineName = "shiva"

46
47
48
49
  /** Sections of the parent report, followed by a variantcalling plot section when variantcalling was executed */
  override def additionalSections = {
    val variantSections =
      if (variantcallingExecuted) {
        val plotOnly = Map("showPlot" -> true, "showTable" -> false)
        List("Variantcalling" -> ReportSection("/nl/lumc/sasc/biopet/pipelines/shiva/sampleVariants.ssp", plotOnly))
      } else Nil

    super.additionalSections ++ variantSections
  }

50
  /**
   * Root page for the shiva report.
   *
   * Takes the index page of the parent report and appends the "Regions" page
   * when [[regionsPage]] is defined.
   */
  override def indexPage = {
    // Build the regions page once; it reads the summary, so it should not be evaluated twice
    val regions = regionsPage
    val oldPage = super.indexPage

    // `regions` is an Option: `++` adds its content only when it is defined
    oldPage.copy(subPages = oldPage.subPages ++ regions)
  }
57

58
59
  /**
   * Generate a page with all target coverage stats.
   *
   * Targets are read from the shiva settings "amplicon_bed" and "regions_of_interest" in the summary.
   * Each target gets a sub page with a "Variants" and a "Coverage" section; the amplicon target is
   * titled with the suffix " (Amplicon)". Sub pages are sorted by title.
   *
   * @return The "Regions" page, or None when no targets are found in the summary
   */
  def regionsPage: Option[(String, ReportPage)] = {
    val roi = summary.getValue("shiva", "settings", "regions_of_interest")
    val amplicon = summary.getValue("shiva", "settings", "amplicon_bed")

    // Page title -> target name. The target is kept next to the title so it does not have to be
    // recovered from the title afterwards (which would mangle a region name ending on " (Amplicon)").
    val ampliconTargets: Map[String, String] = amplicon match {
      case Some(x: String) => Map((x + " (Amplicon)") -> x)
      case _               => Map()
    }

    val roiTargets: Map[String, String] = roi match {
      case Some(x: String)   => Map(x -> x)
      case Some(xs: List[_]) => xs.map(x => x.toString -> x.toString).toMap
      case _                 => Map()
    }

    // Regions of interest are added last, same precedence as before when titles collide
    val targets = ampliconTargets ++ roiTargets

    if (targets.isEmpty) None
    else {
      val subPages = targets.toList.sortBy(_._1).map {
        case (title, target) => title -> ReportPage(Nil,
          List(
            "Variants" -> ReportSection("/nl/lumc/sasc/biopet/pipelines/shiva/sampleVariants.ssp", Map("showPlot" -> true)),
            "Coverage" -> ReportSection("/nl/lumc/sasc/biopet/pipelines/bammetrics/covstatsMultiTable.ssp")
          ),
          Map("target" -> Some(target))
        )
      }
      Some("Regions" -> ReportPage(subPages, List(), Map()))
    }
  }

98
  /** Files page of the parent report, extended with a "VCF files" section when variantcalling was executed */
  override def filesPage: ReportPage = {
    val vcfSections =
      if (variantcallingExecuted) {
        // No sample is selected here: the section is created with "sampleId" set to None
        val vcfFiles = ReportSection("/nl/lumc/sasc/biopet/pipelines/shiva/outputVcfFiles.ssp",
          Map("sampleId" -> None))
        List("VCF files" -> vcfFiles)
      } else Nil

    val basePage = super.filesPage
    basePage.copy(sections = basePage.sections ++ vcfSections)
  }

107
108
109
110
111
  /** Single sample page: the parent page with a "Variantcalling" section in front when variantcalling was executed */
  override def samplePage(sampleId: String, args: Map[String, Any]): ReportPage = {
    val variantSections =
      if (variantcallingExecuted) {
        val variants = ReportSection("/nl/lumc/sasc/biopet/pipelines/shiva/sampleVariants.ssp")
        List("Variantcalling" -> variants)
      } else Nil

    val basePage = super.samplePage(sampleId, args)
    // The variantcalling section goes before the sections of the parent page
    basePage.copy(sections = variantSections ++ basePage.sections)
  }

114
  /** Title of the generated report */
  def reportName = "Shiva Report"
116

117
118
  /**
   * Generate a stacked bar plot for found variants
   *
   * First writes a tsv file with one row per sample (or per library) holding the HomVar, Het,
   * HomRef and NoCall genotype counts from the summary, then runs a StackedBarPlot on that
   * file to create the png file.
   *
   * @param outputDir OutputDir for the tsv and png file
   * @param prefix Prefix of the tsv and png file
   * @param summary Summary class
   * @param libraryLevel Default false, when set true plot will be based on library stats instead of sample stats
   * @param sampleId By default all samples are selected, when a sample is given only that sample is used
   * @param caller Caller part of the stats name "multisample-vcfstats-[caller]", default "final"
   * @param target When given, stats are read from "multisample-vcfstats-[caller]-[target]" instead
   */
  def variantSummaryPlot(outputDir: File,
                         prefix: String,
                         summary: Summary,
                         libraryLevel: Boolean = false,
                         sampleId: Option[String] = None,
                         caller: String = "final",
                         target: Option[String] = None): Unit = {
    val tsvFile = new File(outputDir, prefix + ".tsv")
    val pngFile = new File(outputDir, prefix + ".png")

    // Location of the genotype counts in the summary, this is the same for every row
    val statsName = target match {
      case Some(t) => s"multisample-vcfstats-$caller-$t"
      case _       => s"multisample-vcfstats-$caller"
    }
    val path = List("shivavariantcalling", "stats", statsName, "genotype")

    /** True when no sample is selected or when the given sample is the selected one */
    def isSelected(sample: String): Boolean = sampleId.forall(_ == sample)

    /** Creates a single tsv row for a sample, or for a library of a sample when lib is given */
    def getLine(summary: Summary, sample: String, lib: Option[String] = None): String = {
      // A count that is missing in the summary is reported as 0
      def count(genotype: String): Long =
        new SummaryValue(path :+ genotype, summary, Some(sample), lib).value.getOrElse(0).toString.toLong

      val label = lib.map(l => sample + "-" + l).getOrElse(sample)
      List(label, count("HomVar"), count("Het"), count("HomRef"), count("NoCall")).mkString("\t")
    }

    val tsvWriter = new PrintWriter(tsvFile)
    // Close the writer also when reading the summary fails, otherwise the file handle leaks
    try {
      tsvWriter.print(if (libraryLevel) "Library" else "Sample")
      tsvWriter.println("\tHomVar\tHet\tHomRef\tNoCall")

      if (libraryLevel) {
        for (
          sample <- summary.samples if isSelected(sample);
          lib <- summary.libraries(sample)
        ) {
          tsvWriter.println(getLine(summary, sample, Some(lib)))
        }
      } else {
        for (sample <- summary.samples if isSelected(sample)) {
          tsvWriter.println(getLine(summary, sample))
        }
      }
    } finally {
      tsvWriter.close()
    }

    val plot = new StackedBarPlot(null)
    plot.input = tsvFile
    plot.output = pngFile
    plot.ylabel = Some("VCF records")

    // Width grows with the number of bars: 200 plus 10 for each plotted library or sample
    val bars =
      if (libraryLevel) summary.libraries.filter(s => isSelected(s._1)).foldLeft(0)(_ + _._2.size)
      else summary.samples.count(s => isSelected(s))
    plot.width = Some(200 + (bars * 10))

    plot.runLocal()
  }
181
}