Skip to content
Snippets Groups Projects
Unverified Commit 82cc7609 authored by Ruben Vorderman's avatar Ruben Vorderman Committed by GitHub
Browse files

Merge branch 'develop' into BIOWDL-199

parents 6be49bda e55fc372
No related branches found
No related tags found
1 merge request!92Dockerize GATK. Scattering now works with containers. Tabix another docker image.
version 1.0
task Hisat2 {
input {
File indexDirectory
String indexBasename
File inputR1
File? inputR2
String outputBam
String sample
String library
String readgroup
String platform = "illumina"
Boolean downstreamTranscriptomeAssembly = true
Int threads = 1
Int memory = 48
String dockerTag = "2388ff67fc407dad75774291ca5038f40cac4be0-0"
}
command {
set -e -o pipefail
mkdir -p $(dirname ~{outputBam})
hisat2 \
-p ~{threads} \
-x ~{indexDirectory}/~{indexBasename} \
~{true="-1" false="-U" defined(inputR2)} ~{inputR1} \
~{"-2" + inputR2} \
--rg-id ~{readgroup} \
--rg 'SM:~{sample}' \
--rg 'LB:~{library}' \
--rg 'PL:~{platform}' \
~{true="--dta" false="" downstreamTranscriptomeAssembly} \
| samtools sort > ~{outputBam}
}
output {
File bamFile = outputBam
}
runtime {
memory: (memory / threads) + 1
cpu: threads + 1
docker: "quay.io/biocontainers/mulled-v2-a97e90b3b802d1da3d6958e0867610c718cb5eb1:" + dockerTag
}
}
\ No newline at end of file
......@@ -14,6 +14,7 @@ task HTSeqCount {
String stranded = "no"
Int memory = 12
String dockerTag = "0.9.1--py36h7eb728f_2"
}
command {
......@@ -35,5 +36,6 @@ task HTSeqCount {
runtime {
memory: memory
docker: "quay.io/biocontainers/htseq:" + dockerTag
}
}
\ No newline at end of file
......@@ -9,6 +9,9 @@ task MergeCounts {
Int featureColumn
Int valueColumn
Boolean inputHasHeader
String featureAttribute = "gene_id"
File referenceGtf
Array[String]+? additionalAttributes
}
# Based on a script by Szymon Kielbasa/Ioannis Moustakas
......@@ -19,26 +22,43 @@ task MergeCounts {
R --no-save <<CODE
library(dplyr)
library(reshape2)
library(refGenome)
listOfFiles <- c("~{sep='", "' inputFiles}")
list.of.files <- c("~{sep='", "' inputFiles}")
valueI <- ~{valueColumn}
featureI <- ~{featureColumn}
value.i <- ~{valueColumn}
feature.i <- ~{featureColumn}
header <- ~{true="TRUE" false="FALSE" inputHasHeader}
feature.attribute <- "~{featureAttribute}"
additional.attributes <- c(~{true='"' false="" defined(additionalAttributes)}~{sep='", "' additionalAttributes}~{true='"' false="" defined(additionalAttributes)})
reference.gtf <- "~{referenceGtf}"
output.path <- "~{outputFile}"
d <- do.call(rbind, lapply(listOfFiles, function(file){
d <- do.call(rbind, lapply(list.of.files, function(file){
d <- read.table(file, sep="\t", header=header, comment.char="#")
splitPath <- strsplit(file, "/")[[1]]
colnames(d)[valueI] <- sub("\\\.[^\\\.]*$", "",
splitPath[length(splitPath)])
colnames(d)[featureI] <- "feature"
filename <- basename(file)
colnames(d)[value.i] <- sub("\\\.[^\\\.]*\$", "", filename)
colnames(d)[feature.i] <- "feature"
d <- d %>% melt(id.vars=featureI, variable.name="sample", value.name="count")
d <- d %>% melt(id.vars=feature.i, variable.name="sample",
value.name="count")
}))
d <- d %>% dcast(feature ~ sample, value.var="count")
write.table(d, file="~{outputFile}", sep="\t", quote=FALSE, row.names=FALSE)
gtf <- ensemblGenome(dirname(reference.gtf))
read.gtf(gtf, basename(reference.gtf))
gtf.table <- gtf@ev\$gtf
gtf.table <- gtf.table[order(gtf.table[,feature.attribute]),]
gtf.table <- gtf.table[!duplicated(gtf.table[,feature.attribute]),]
id.table <- gtf.table[, c(feature.attribute, additional.attributes), drop=F]
output.table <- merge(id.table, d, all.y = T, by.y="feature",
by.x=feature.attribute)
write.table(output.table, file=output.path, sep="\t", quote=FALSE,
row.names=FALSE, na="")
CODE
>>>
......@@ -48,5 +68,6 @@ task MergeCounts {
runtime {
memory: 4 + (2*length(inputFiles))
docker: "biowdl/mergecounts:1.0"
}
}
\ No newline at end of file
......@@ -13,6 +13,8 @@ task Stringtie {
Boolean? firstStranded
Boolean? secondStranded
String? geneAbundanceFile
String dockerTag = "1.3.3--py36_3"
}
command {
......@@ -37,6 +39,7 @@ task Stringtie {
runtime {
cpu: threads
docker: "quay.io/biocontainers/stringtie:" + dockerTag
}
}
......@@ -55,6 +58,8 @@ task Merge {
Float? minimumIsoformFraction
Boolean keepMergedTranscriptsWithRetainedIntrons = false
String? label
String dockerTag = "1.3.3--py36_3"
}
command {
......@@ -77,4 +82,8 @@ task Merge {
output {
File mergedGtfFile = outputGtfPath
}
runtime {
docker: "quay.io/biocontainers/stringtie:" + dockerTag
}
}
0% Loading or .
You are about to add 0 people to the discussion. Proceed with caution.
Finish editing this message first!
Please register or to comment