这是indexloc提供的服务,不要输入任何密码
Skip to content
Merged
Show file tree
Hide file tree
Changes from all commits
Commits
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
3 changes: 3 additions & 0 deletions CHANGELOG.md
Original file line number Diff line number Diff line change
Expand Up @@ -54,6 +54,9 @@ version 6.0.0-dev
+ Add support for filterThreshold/filterPercent for `modkit.Pileup`.
+ Add `modkit.Summary` task.
+ Disable the one-click GDPR dataleak button in MultiQC `--no-ai` by default.
+ Update clair3 version from 1.0.11 to 1.1.0
+ Improve whatshap runtime/memory usage for our cluster.
+ Add `Modkit.SampleProbs`

version 5.2.0
---------------------------
Expand Down
6 changes: 3 additions & 3 deletions clair3.wdl
Original file line number Diff line number Diff line change
Expand Up @@ -34,8 +34,8 @@ task Clair3 {
Int threads = 8
Boolean includeAllCtgs = false
String memory = "~{threads + 16}GiB"
Int timeMinutes = 10 + ceil(size(bam, "G") * 400 / threads)
String dockerImage = "quay.io/biocontainers/clair3:1.0.11--py39hd649744_0"
Int timeMinutes = 10 + ceil(size(bam, "G") * 200 / threads)
String dockerImage = "quay.io/biocontainers/clair3:1.1.0--py39hd649744_0"
}

String modelArg = "~{if defined(modelTar) then basename(select_first([modelTar]), '.tar.gz') else builtinModel}"
Expand Down Expand Up @@ -91,4 +91,4 @@ task Clair3 {
vcfIndex: {description: "Output VCF index."}

}
}
}
73 changes: 72 additions & 1 deletion modkit.wdl
Original file line number Diff line number Diff line change
Expand Up @@ -130,7 +130,7 @@ task Summary {

Int threads = 4
String memory = ceil(size(bam, "GiB") * 0.1) + 5 # Based on a linear model with some fudge (memory = 0.07540 * file_size - 0.6).
Int timeMinutes = 2880 / threads # 2 Days / threads
Int timeMinutes = 60 # originally this was set at "2 Days / threads" but with 4 threads and that much ram, it's pretty fast.
String dockerImage = "quay.io/biocontainers/ont-modkit:0.4.3--hcdda2d0_0"
}

Expand Down Expand Up @@ -177,3 +177,74 @@ task Summary {
summaryReport: {description: "The output modkit summary."}
}
}

task SampleProbs {
input {
File bam
File bamIndex

String summary = "modkit-sample-probs"

Boolean sample = true
Int? numReads # = 10042
Float? samplingFrac # = 0.1
Int? seed

Int threads = 4
String memory = "32G"
Int timeMinutes = 60
String dockerImage = "quay.io/biocontainers/ont-modkit:0.4.3--hcdda2d0_0"
}

command <<<
set -e
mkdir -p ~{summary}

modkit sample-probs \
--threads ~{threads} \
--out-dir ~{summary} \
~{true="" false="--no-sampling" sample} \
~{"--num-reads " + numReads} \
~{"--sampling-frac " + samplingFrac} \
~{"--seed " + seed} \
--hist \
~{bam}
>>>

output {
File reportCounts = "~{summary}/counts.html"
File reportProportion = "~{summary}/proportion.html"
File reportProbabilitiesTsv = "~{summary}/probabilities.tsv"
File reportThresholdsTsv = "~{summary}/thresholds.tsv"
}

runtime {
docker: dockerImage
cpu: threads
memory: memory
time_minutes: timeMinutes
}

parameter_meta {
# input
bam: {description: "The input alignment file", category: "required"}
bamIndex: {description: "The index for the input alignment file", category: "required"}
summary: {description: "A folder for the outputs", category: "required"}

sample: {description: "Allows you to disable sampling and report stats for the whole file.", category: "advanced"}
numReads: {description: "By default a fixed amount of reads are read, you can set this to change the number of reads to sample.", category: "advanced"}
samplingFrac: {description: "Use a fixed percentage of reads, rather than a fixed number of reads, for sampling.", category: "advanced"}
seed: {description: "A seed can be provided for reproducibility in the sampling fraction case.", category: "advanced"}

threads: {description: "The number of threads to use.", category: "advanced"}
memory: {description: "The amount of memory this job will use.", category: "advanced"}
timeMinutes: {description: "The maximum amount of time the job will run in minutes.", category: "advanced"}
dockerImage: {description: "The docker image used for this task. Changing this may result in errors which the developers may choose not to address.", category: "advanced"}

# output
reportCounts: {description: "The output html report of counts"}
reportProportion: {description: "The output html report of proportions"}
reportProbabilitiesTsv: {description: "The output TSV of Probabilities"}
reportThresholdsTsv: {description: "The output TSV of thresholds"}
}
}
22 changes: 17 additions & 5 deletions whatshap.wdl
Original file line number Diff line number Diff line change
Expand Up @@ -38,14 +38,18 @@ task Phase {
String? threshold
String? ped

String memory = "4GiB"
Int timeMinutes = 120
String memory = 2 + ceil(size(phaseInput, "G") / 20 )
Int timeMinutes = 400 + ceil(size(phaseInput, "G") * 0.9 )

# Whatshap 1.0, tabix 0.2.5.
String dockerImage = "quay.io/biocontainers/mulled-v2-5c61fe1d8c284dd05d26238ce877aa323205bf82:89b4005d04552bdd268e8af323df83357e968d83-0"
}

command {
set -e

mkdir -p $(dirname ~{outputVCF})

whatshap phase \
~{vcf} \
~{phaseInput} \
Expand Down Expand Up @@ -110,12 +114,16 @@ task Stats {
String? chromosome

String memory = "4GiB"
Int timeMinutes = 120
Int timeMinutes = 30
# Whatshap 1.0, tabix 0.2.5.
String dockerImage = "quay.io/biocontainers/mulled-v2-5c61fe1d8c284dd05d26238ce877aa323205bf82:89b4005d04552bdd268e8af323df83357e968d83-0"
}

command {
set -e

mkdir -p $(dirname ~{tsv})

whatshap stats \
~{vcf} \
~{if defined(gtf) then ("--gtf " + '"' + gtf + '"') else ""} \
Expand Down Expand Up @@ -169,14 +177,18 @@ task Haplotag {
String? regions
String? sample

String memory = "4GiB"
Int timeMinutes = 120
String memory = 2 + ceil(size(alignments, "G") / 50 )
Int timeMinutes = 50 + ceil(size(alignments, "G") * 2 )

# Whatshap 1.0, tabix 0.2.5.
String dockerImage = "quay.io/biocontainers/mulled-v2-5c61fe1d8c284dd05d26238ce877aa323205bf82:89b4005d04552bdd268e8af323df83357e968d83-0"
}

command {
set -e

mkdir -p $(dirname ~{outputFile})

whatshap haplotag \
~{vcf} \
~{alignments} \
Expand Down
Loading