nf-core_modules/modules/rmarkdownnotebook/main.nf
Gregor Sturm 2ad98162f3
Notebook modules (#617)
* Draft rmarkdown module

* stub jupyter notebook module

* Create yaml file with params

* Update meta.yml for rmarkdown module

* Add comment on YAML

* Update notebooks module, clean up parametrize.nf

* Two separate channels for parameters and input files

* Fix Rmd render script

* Add tests for rmarkdown

* Fix tests for rmarkdown module

* Update checksums

* Fix tests for jupyter

* Test without Grab()

* Update software versions

* update rmarkdown dependencies

* Draft for multiple versions

* Fix indent of script

* Fix indent in rmarkdown script

* Emit version.syml

* Update modules/rmarkdown/main.nf

Co-authored-by: James A. Fellows Yates <jfy133@gmail.com>

* Update modules/rmarkdown/meta.yml

Co-authored-by: James A. Fellows Yates <jfy133@gmail.com>

* Update modules/rmarkdown/meta.yml

Co-authored-by: James A. Fellows Yates <jfy133@gmail.com>

* Rename rmarkdown to rmarkdownnotebook

* Add rmarkdown mulled biocontainer

* Write sessionInfo to separate log file

* Update rmarkdownnotebook

* Sessioninfo does not have a stable md5sum

* Update jupyternotebook

* Update meta

* Add jupyternotebook biocontainers

* Handle Groovy Gstrings in parameterize

* Update to versions.yml

* Update functions.nf

* Fix versions yaml

* Fix EC lint

* Update modules/rmarkdownnotebook/main.nf

Co-authored-by: James A. Fellows Yates <jfy133@gmail.com>

* Update modules/jupyternotebook/main.nf

Co-authored-by: James A. Fellows Yates <jfy133@gmail.com>

* Use official test data

* Harshilify

* Make parameters channel clearer

* Apply suggestions from code review

Co-authored-by: Harshil Patel <drpatelh@users.noreply.github.com>

* Apply suggestions from code review

* Update main.nf

Co-authored-by: James A. Fellows Yates <jfy133@gmail.com>
Co-authored-by: Harshil Patel <drpatelh@users.noreply.github.com>
2021-10-24 20:51:56 +02:00

97 lines
3.7 KiB
Text

// Import generic module functions
include { initOptions; saveFiles; getProcessName; getSoftwareName } from './functions'
include { dump_params_yml; indent_code_block } from "./parametrize"
params.options = [:]
options = initOptions(params.options)
params.parametrize = true
params.implicit_params = true
params.meta_params = true
process RMARKDOWNNOTEBOOK {
tag "$meta.id"
label 'process_low'
publishDir "${params.outdir}",
mode: params.publish_dir_mode,
saveAs: { filename -> saveFiles(filename:filename, options:params.options, publish_dir:getSoftwareName(task.process), meta:meta, publish_by_meta:['id']) }
//NB: You likely want to override this with a container containing all required
//dependencies for your analysis. The container at least needs to contain the
//yaml and rmarkdown R packages.
conda (params.enable_conda ? "r-base=4.1.0 r-rmarkdown=2.9 r-yaml=2.2.1" : null)
if (workflow.containerEngine == 'singularity' && !params.singularity_pull_docker_container) {
container "https://depot.galaxyproject.org/singularity/mulled-v2-31ad840d814d356e5f98030a4ee308a16db64ec5%3A0e852a1e4063fdcbe3f254ac2c7469747a60e361-0"
} else {
container "quay.io/biocontainers/mulled-v2-31ad840d814d356e5f98030a4ee308a16db64ec5:0e852a1e4063fdcbe3f254ac2c7469747a60e361-0"
}
input:
tuple val(meta), path(notebook)
val parameters
path input_files
output:
tuple val(meta), path("*.html") , emit: report
tuple val(meta), path ("artifacts/*") , emit: artifacts, optional: true
tuple val(meta), path ("session_info.log"), emit: session_info
path "versions.yml" , emit: versions
script:
def prefix = options.suffix ? "${meta.id}${options.suffix}" : "${meta.id}"
// Dump parameters to yaml file.
// Using a yaml file over using the CLI params because
// * no issue with escaping
// * allows to pass nested maps instead of just single values
def params_cmd = ""
def render_cmd = ""
if (params.parametrize) {
nb_params = [:]
if (params.implicit_params) {
nb_params["cpus"] = task.cpus
nb_params["artifact_dir"] = "artifacts"
nb_params["input_dir"] = "./"
}
if (params.meta_params) {
nb_params["meta"] = meta
}
nb_params += parameters
params_cmd = dump_params_yml(nb_params)
render_cmd = """\
params = yaml::read_yaml('.params.yml')
rmarkdown::render('${prefix}.Rmd', params=params, envir=new.env())
"""
} else {
render_cmd = "rmarkdown::render('${prefix}.Rmd')"
}
"""
# Dump .params.yml heredoc (section will be empty if parametrization is disabled)
${indent_code_block(params_cmd, 4)}
# Create output directory
mkdir artifacts
# Set parallelism for BLAS/MKL etc. to avoid over-booking of resources
export MKL_NUM_THREADS="${task.cpus}"
export OPENBLAS_NUM_THREADS="${task.cpus}"
export OMP_NUM_THREADS="${task.cpus}"
# Work around https://github.com/rstudio/rmarkdown/issues/1508
# If the symbolic link is not replaced by a physical file
# output- and temporary files will be written to the original directory.
mv "${notebook}" "${notebook}.orig"
cp -L "${notebook}.orig" "${prefix}.Rmd"
# Render notebook
Rscript - <<EOF
${indent_code_block(render_cmd, 8)}
writeLines(capture.output(sessionInfo()), "session_info.log")
EOF
cat <<-END_VERSIONS > versions.yml
${getProcessName(task.process)}:
rmarkdown: \$(Rscript -e "cat(paste(packageVersion('rmarkdown'), collapse='.'))")
END_VERSIONS
"""
}