ShivaReport.scala 10.8 KB
Newer Older
Peter van 't Hof's avatar
Peter van 't Hof committed
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
/**
 * Biopet is built on top of GATK Queue for building bioinformatic
 * pipelines. It is mainly intended to support LUMC SHARK cluster which is running
 * SGE. But other types of HPC that are supported by GATK Queue (such as PBS)
 * should also be able to execute Biopet tools and pipelines.
 *
 * Copyright 2014 Sequencing Analysis Support Core - Leiden University Medical Center
 *
 * Contact us at: sasc@lumc.nl
 *
 * A dual licensing mode is applied. The source code within this project that are
 * not part of GATK Queue is freely available for non-commercial use under an AGPL
 * license; For commercial users or users who do not want to follow the AGPL
 * license, please contact us to obtain a separate license.
 */
16
17
package nl.lumc.sasc.biopet.pipelines.shiva

Peter van 't Hof's avatar
Peter van 't Hof committed
18
import java.io.{ File, PrintWriter }
19

Peter van 't Hof's avatar
Peter van 't Hof committed
20
import nl.lumc.sasc.biopet.utils.config.Configurable
Peter van 't Hof's avatar
Peter van 't Hof committed
21
import nl.lumc.sasc.biopet.core.report._
22
import nl.lumc.sasc.biopet.utils.summary.{ Summary, SummaryValue }
23
import nl.lumc.sasc.biopet.utils.rscript.StackedBarPlot
24
import nl.lumc.sasc.biopet.pipelines.bammetrics.BammetricsReport
25
26
27
import nl.lumc.sasc.biopet.pipelines.flexiprep.FlexiprepReport

/**
28
29
 * With this extension the report is executed within a pipeline
 *
30
31
 * Created by pjvan_thof on 3/30/15.
 */
32
33
34
35
class ShivaReport(val root: Configurable) extends ReportBuilderExtension {
  val builder = ShivaReport
}

36
/** Object for report generation for Shiva pipeline */
37
object ShivaReport extends MultisampleReportBuilder {
38

39
  def variantcallingExecuted = summary.getValue("shiva", "settings", "multisample_variantcalling") match {
Peter van 't Hof's avatar
Peter van 't Hof committed
40
    case Some(true) => true
Peter van 't Hof's avatar
Peter van 't Hof committed
41
    case _          => false
42
43
  }

44
45
46
  override def extFiles = super.extFiles ++ List("js/gears.js")
    .map(x => ExtFile("/nl/lumc/sasc/biopet/pipelines/gears/report/ext/" + x, x))

47
  /** Root page for the shiva report */
48
  def indexPage = {
49
    val regions = regionsPage
50
    ReportPage(
51
      List("Samples" -> generateSamplesPage(pageArgs)) ++
52
        (if (regions.isDefined) Map(regions.get) else Map()) ++
Peter van 't Hof's avatar
Peter van 't Hof committed
53
54
55
56
        Map("Reference" -> ReportPage(List(), List(
          "Reference" -> ReportSection("/nl/lumc/sasc/biopet/core/report/reference.ssp", Map("pipeline" -> "shiva"))
        ), Map()),
          "Files" -> filesPage,
Peter van 't Hof's avatar
Peter van 't Hof committed
57
58
59
          "Versions" -> ReportPage(List(), List(
            "Executables" -> ReportSection("/nl/lumc/sasc/biopet/core/report/executables.ssp")
          ), Map())
60
        ),
61
      List(
62
63
        "Report" -> ReportSection("/nl/lumc/sasc/biopet/pipelines/shiva/shivaFront.ssp")) ++
        (if (variantcallingExecuted) List("Variantcalling" -> ReportSection("/nl/lumc/sasc/biopet/pipelines/shiva/sampleVariants.ssp",
Peter van 't Hof's avatar
Peter van 't Hof committed
64
65
          Map("showPlot" -> true, "showTable" -> false)))
        else Nil) ++
66
        List("Alignment" -> ReportSection("/nl/lumc/sasc/biopet/pipelines/bammetrics/alignmentSummary.ssp",
Peter van 't Hof's avatar
Peter van 't Hof committed
67
          Map("sampleLevel" -> true, "showPlot" -> true, "showTable" -> false)
68
        ),
Peter van 't Hof's avatar
Peter van 't Hof committed
69
70
71
72
73
74
75
76
77
          "Insert Size" -> ReportSection("/nl/lumc/sasc/biopet/pipelines/bammetrics/insertSize.ssp",
            Map("sampleLevel" -> true, "showPlot" -> true, "showTable" -> false)),
          "Whole genome coverage" -> ReportSection("/nl/lumc/sasc/biopet/pipelines/bammetrics/wgsHistogram.ssp",
            Map("sampleLevel" -> true, "showPlot" -> true, "showTable" -> false)),
          "QC reads" -> ReportSection("/nl/lumc/sasc/biopet/pipelines/flexiprep/flexiprepReadSummary.ssp",
            Map("showPlot" -> true, "showTable" -> false)),
          "QC bases" -> ReportSection("/nl/lumc/sasc/biopet/pipelines/flexiprep/flexiprepBaseSummary.ssp",
            Map("showPlot" -> true, "showTable" -> false))
        ),
78
79
80
      pageArgs
    )
  }
81

82
83
84
  //TODO: Add variants per target
  /** Generate a page with all target coverage stats */
  def regionsPage: Option[(String, ReportPage)] = {
85
86
87
88
89
90
    val roi = summary.getValue("shiva", "settings", "regions_of_interest")
    val amplicon = summary.getValue("shiva", "settings", "amplicon_bed")

    var regionPages: Map[String, ReportPage] = Map()

    def createPage(name: String, amplicon: Boolean = false): ReportPage = {
Peter van 't Hof's avatar
Peter van 't Hof committed
91
      ReportPage(
92
        List(),
Peter van 't Hof's avatar
Peter van 't Hof committed
93
94
95
        List("Coverage" -> ReportSection("/nl/lumc/sasc/biopet/pipelines/bammetrics/covstatsMultiTable.ssp")),
        Map("target" -> name)
      )
96
97
98
    }

    amplicon match {
99
      case Some(x: String) => regionPages += (x + " (Amplicon)") -> createPage(x, amplicon = true)
100
101
102
103
      case _               =>
    }

    roi match {
104
105
      case Some(x: String)  => regionPages += x -> createPage(x, amplicon = false)
      case Some(x: List[_]) => x.foreach(x => regionPages += x.toString -> createPage(x.toString, amplicon = false))
106
107
108
      case _                =>
    }

Peter van 't Hof's avatar
Peter van 't Hof committed
109
    if (regionPages.nonEmpty) Some("Regions" -> ReportPage(
110
      List(),
111
      regionPages.map(p => p._1 -> ReportSection(
Peter van 't Hof's avatar
Peter van 't Hof committed
112
113
        "/nl/lumc/sasc/biopet/pipelines/bammetrics/covstatsMultiTable.ssp",
        Map("target" -> p._1.stripSuffix(" (Amplicon)"))
114
      )).toList.sortBy(_._1),
Peter van 't Hof's avatar
Peter van 't Hof committed
115
      Map())
116
117
    )
    else None
118
119
  }

120
121
  /** Files page, can be used general or at sample level */
  def filesPage: ReportPage = ReportPage(List(), List(
122
123
    "Input fastq files" -> ReportSection("/nl/lumc/sasc/biopet/pipelines/flexiprep/flexiprepInputfiles.ssp"),
    "After QC fastq files" -> ReportSection("/nl/lumc/sasc/biopet/pipelines/flexiprep/flexiprepOutputfiles.ssp"),
124
125
    "Bam files per lib" -> ReportSection("/nl/lumc/sasc/biopet/pipelines/mapping/outputBamfiles.ssp", Map("sampleLevel" -> false)),
    "Preprocessed bam files" -> ReportSection("/nl/lumc/sasc/biopet/pipelines/mapping/outputBamfiles.ssp",
Peter van 't Hof's avatar
Peter van 't Hof committed
126
127
      Map("pipelineName" -> "shiva", "fileTag" -> "preProcessBam"))) ++
    (if (variantcallingExecuted) List("VCF files" -> ReportSection("/nl/lumc/sasc/biopet/pipelines/shiva/outputVcfFiles.ssp",
Peter van 't Hof's avatar
Peter van 't Hof committed
128
129
      Map("sampleId" -> None)))
    else Nil), Map())
130

131
132
  /** Single sample page */
  def samplePage(sampleId: String, args: Map[String, Any]): ReportPage = {
133
    ReportPage(List(
134
      "Libraries" -> generateLibraryPage(args),
135
      "Alignment" -> BammetricsReport.bamMetricsPage(summary, Some(sampleId), None),
136
      "Files" -> filesPage
137
    ), List(
138
139
      "Alignment" -> ReportSection("/nl/lumc/sasc/biopet/pipelines/bammetrics/alignmentSummary.ssp",
        if (summary.libraries(sampleId).size > 1) Map("showPlot" -> true) else Map()),
140
141
142
      "Preprocessing" -> ReportSection("/nl/lumc/sasc/biopet/pipelines/bammetrics/alignmentSummary.ssp", Map("sampleLevel" -> true))) ++
      (if (variantcallingExecuted) List("Variantcalling" -> ReportSection("/nl/lumc/sasc/biopet/pipelines/shiva/sampleVariants.ssp")) else Nil) ++
      List("QC reads" -> ReportSection("/nl/lumc/sasc/biopet/pipelines/flexiprep/flexiprepReadSummary.ssp"),
Peter van 't Hof's avatar
Peter van 't Hof committed
143
144
        "QC bases" -> ReportSection("/nl/lumc/sasc/biopet/pipelines/flexiprep/flexiprepBaseSummary.ssp")
      ), args)
145
146
  }

147
148
  /** Library page */
  def libraryPage(sampleId: String, libId: String, args: Map[String, Any]): ReportPage = {
149
    val flexiprepExecuted = summary.getLibraryValue(sampleId, libId, "flexiprep").isDefined
150
    val krakenExecuted = summary.getValue(Some(sampleId), Some(libId), "gears", "stats", "krakenreport").isDefined
151

152
153
154
    ReportPage(
      "Alignment" -> BammetricsReport.bamMetricsPage(summary, Some(sampleId), Some(libId)) ::
        (if (flexiprepExecuted) List("QC" -> FlexiprepReport.flexiprepPage) else Nil
155
        ) ::: (if (krakenExecuted) List("Gears - Metagenomics" -> ReportPage(List(), List(
Peter van 't Hof's avatar
Peter van 't Hof committed
156
157
158
          "Sunburst analysis" -> ReportSection("/nl/lumc/sasc/biopet/pipelines/gears/gearsSunburst.ssp"
          )), Map()))
        else Nil), "Alignment" -> ReportSection("/nl/lumc/sasc/biopet/pipelines/bammetrics/alignmentSummary.ssp") ::
159
160
161
162
163
        (if (flexiprepExecuted) List(
          "QC reads" -> ReportSection("/nl/lumc/sasc/biopet/pipelines/flexiprep/flexiprepReadSummary.ssp"),
          "QC bases" -> ReportSection("/nl/lumc/sasc/biopet/pipelines/flexiprep/flexiprepBaseSummary.ssp")
        )
        else Nil), args)
164
165
  }

166
  /** Name of the report */
167
  def reportName = "Shiva Report"
168

169
170
171
172
173
174
175
176
  /**
   * Generate a stackbar plot for found variants
   * @param outputDir OutputDir for the tsv and png file
   * @param prefix Prefix of the tsv and png file
   * @param summary Summary class
   * @param libraryLevel Default false, when set true plot will be based on library stats instead of sample stats
   * @param sampleId Default it selects all sampples, when sample is giving it limits to selected sample
   */
177
  def variantSummaryPlot(outputDir: File,
178
179
180
181
                         prefix: String,
                         summary: Summary,
                         libraryLevel: Boolean = false,
                         sampleId: Option[String] = None): Unit = {
182
183
184
185
186
187
188
189
190
191
192
193
194
195
196
197
198
199
200
201
202
203
204
205
206
    val tsvFile = new File(outputDir, prefix + ".tsv")
    val pngFile = new File(outputDir, prefix + ".png")
    val tsvWriter = new PrintWriter(tsvFile)
    if (libraryLevel) tsvWriter.print("Library") else tsvWriter.print("Sample")
    tsvWriter.println("\tHomVar\tHet\tHomRef\tNoCall")

    def getLine(summary: Summary, sample: String, lib: Option[String] = None): String = {
      val homVar = new SummaryValue(List("shivavariantcalling", "stats", "multisample-vcfstats-final", "genotype", "HomVar"),
        summary, Some(sample), lib).value.getOrElse(0).toString.toLong
      val homRef = new SummaryValue(List("shivavariantcalling", "stats", "multisample-vcfstats-final", "genotype", "HomRef"),
        summary, Some(sample), lib).value.getOrElse(0).toString.toLong
      val noCall = new SummaryValue(List("shivavariantcalling", "stats", "multisample-vcfstats-final", "genotype", "NoCall"),
        summary, Some(sample), lib).value.getOrElse(0).toString.toLong
      val het = new SummaryValue(List("shivavariantcalling", "stats", "multisample-vcfstats-final", "genotype", "Het"),
        summary, Some(sample), lib).value.getOrElse(0).toString.toLong
      val sb = new StringBuffer()
      if (lib.isDefined) sb.append(sample + "-" + lib.get + "\t") else sb.append(sample + "\t")
      sb.append(homVar + "\t")
      sb.append(het + "\t")
      sb.append(homRef + "\t")
      sb.append(noCall)
      sb.toString
    }

    if (libraryLevel) {
207
      for (
208
        sample <- summary.samples if sampleId.isEmpty || sample == sampleId.get;
209
210
        lib <- summary.libraries(sample)
      ) {
211
212
213
        tsvWriter.println(getLine(summary, sample, Some(lib)))
      }
    } else {
214
      for (sample <- summary.samples if sampleId.isEmpty || sample == sampleId.get) {
215
216
217
218
219
220
221
222
223
224
        tsvWriter.println(getLine(summary, sample))
      }
    }

    tsvWriter.close()

    val plot = new StackedBarPlot(null)
    plot.input = tsvFile
    plot.output = pngFile
    plot.ylabel = Some("VCF records")
225
226
    if (libraryLevel) {
      plot.width = Some(200 + (summary.libraries.filter(s => sampleId.getOrElse(s._1) == s._1).foldLeft(0)(_ + _._2.size) * 10))
227
    } else plot.width = Some(200 + (summary.samples.count(s => sampleId.getOrElse(s) == s) * 10))
228
229
    plot.runLocal()
  }
230
}