nf-core_modules/modules/rmarkdownnotebook/main.nf

98 lines
3.7 KiB
Text
Raw Normal View History

Notebook modules (#617) * Draft rmarkdown module * stub jupyter notebook module * Create yaml file with params * Update meta.yml for rmarkdown module * Add comment on YAML * Update notebooks module, clean up parametrize.nf * Two separate channels for parameters and input files * Fix Rmd render script * Add tests for rmarkdown * Fix tests for rmarkdown module * Update checksums * Fix tests for jupyter * Test without Grab() * Update software versions * update rmarkdown dependencies * Draft for multiple versions * Fix indent of script * Fix indent in rmarkdown script * Emit version.syml * Update modules/rmarkdown/main.nf Co-authored-by: James A. Fellows Yates <jfy133@gmail.com> * Update modules/rmarkdown/meta.yml Co-authored-by: James A. Fellows Yates <jfy133@gmail.com> * Update modules/rmarkdown/meta.yml Co-authored-by: James A. Fellows Yates <jfy133@gmail.com> * Rename rmarkdown to rmarkdownnotebook * Add rmarkdown mulled biocontainer * Write sessionInfo to separate log file * Update rmarkdownnotebook * Sessioninfo does not have a stable md5sum * Update jupyternotebook * Update meta * Add jupyternotebook biocontainers * Handle Groovy Gstrings in parameterize * Update to versions.yml * Update functions.nf * Fix versions yaml * Fix EC lint * Update modules/rmarkdownnotebook/main.nf Co-authored-by: James A. Fellows Yates <jfy133@gmail.com> * Update modules/jupyternotebook/main.nf Co-authored-by: James A. Fellows Yates <jfy133@gmail.com> * Use official test data * Harshilify * Make parameters channel clearer * Apply suggestions from code review Co-authored-by: Harshil Patel <drpatelh@users.noreply.github.com> * Apply suggestions from code review * Update main.nf Co-authored-by: James A. Fellows Yates <jfy133@gmail.com> Co-authored-by: Harshil Patel <drpatelh@users.noreply.github.com>
2021-10-24 20:51:56 +02:00
// Import generic module functions
include { initOptions; saveFiles; getProcessName; getSoftwareName } from './functions'
include { dump_params_yml; indent_code_block } from "./parametrize"
params.options = [:]
options = initOptions(params.options)
params.parametrize = true
params.implicit_params = true
params.meta_params = true
process RMARKDOWNNOTEBOOK {
tag "$meta.id"
label 'process_low'
publishDir "${params.outdir}",
mode: params.publish_dir_mode,
saveAs: { filename -> saveFiles(filename:filename, options:params.options, publish_dir:getSoftwareName(task.process), meta:meta, publish_by_meta:['id']) }
//NB: You likely want to override this with a container containing all required
//dependencies for your analysis. The container at least needs to contain the
//yaml and rmarkdown R packages.
conda (params.enable_conda ? "r-base=4.1.0 r-rmarkdown=2.9 r-yaml=2.2.1" : null)
if (workflow.containerEngine == 'singularity' && !params.singularity_pull_docker_container) {
container "https://depot.galaxyproject.org/singularity/mulled-v2-31ad840d814d356e5f98030a4ee308a16db64ec5%3A0e852a1e4063fdcbe3f254ac2c7469747a60e361-0"
} else {
container "quay.io/biocontainers/mulled-v2-31ad840d814d356e5f98030a4ee308a16db64ec5:0e852a1e4063fdcbe3f254ac2c7469747a60e361-0"
}
input:
tuple val(meta), path(notebook)
val parameters
path input_files
output:
tuple val(meta), path("*.html") , emit: report
tuple val(meta), path ("artifacts/*") , emit: artifacts, optional: true
tuple val(meta), path ("session_info.log"), emit: session_info
path "versions.yml" , emit: versions
script:
def prefix = options.suffix ? "${meta.id}${options.suffix}" : "${meta.id}"
// Dump parameters to yaml file.
// Using a yaml file over using the CLI params because
// * no issue with escaping
// * allows to pass nested maps instead of just single values
def params_cmd = ""
def render_cmd = ""
if (params.parametrize) {
nb_params = [:]
if (params.implicit_params) {
nb_params["cpus"] = task.cpus
nb_params["artifact_dir"] = "artifacts"
nb_params["input_dir"] = "./"
}
if (params.meta_params) {
nb_params["meta"] = meta
}
nb_params += parameters
params_cmd = dump_params_yml(nb_params)
render_cmd = """\
params = yaml::read_yaml('.params.yml')
rmarkdown::render('${prefix}.Rmd', params=params, envir=new.env())
"""
} else {
render_cmd = "rmarkdown::render('${prefix}.Rmd')"
}
"""
# Dump .params.yml heredoc (section will be empty if parametrization is disabled)
${indent_code_block(params_cmd, 4)}
# Create output directory
mkdir artifacts
# Set parallelism for BLAS/MKL etc. to avoid over-booking of resources
export MKL_NUM_THREADS="${task.cpus}"
export OPENBLAS_NUM_THREADS="${task.cpus}"
export OMP_NUM_THREADS="${task.cpus}"
# Work around https://github.com/rstudio/rmarkdown/issues/1508
# If the symbolic link is not replaced by a physical file
# output- and temporary files will be written to the original directory.
mv "${notebook}" "${notebook}.orig"
cp -L "${notebook}.orig" "${prefix}.Rmd"
# Render notebook
Rscript - <<EOF
${indent_code_block(render_cmd, 8)}
writeLines(capture.output(sessionInfo()), "session_info.log")
EOF
cat <<-END_VERSIONS > versions.yml
${getProcessName(task.process)}:
rmarkdown: \$(Rscript -e "cat(paste(packageVersion('rmarkdown'), collapse='.'))")
END_VERSIONS
"""
}