view nf/subworkflows/ncbi/gnomon/gnomon_training/main.nf @ 6:a7304162d737 draft

planemo upload for repository https://github.com/ncbi/egapx commit 9e59da535540cb4d5c1c412bb2b0969744dfb0b0-dirty
author fubar
date Sun, 04 Aug 2024 02:30:36 +0000
parents d9c5c5b87fec
children
line wrap: on
line source

#!/usr/bin/env nextflow
nextflow.enable.dsl=2

include { merge_params } from '../../utilities'

workflow gnomon_training {
    take:
        genome_asn
        models_file
        max_intron1 // max intron length, name modified from max_intron to pacify stupid Nextflow compiler
        parameters  // Map : extra parameter and parameter update
    main:
        default_params = "-b -asn -maxintron 1200000"
        effective_params = merge_params(default_params, parameters, 'gnomon_training')
        run_gnomon_training(genome_asn, models_file, max_intron1, effective_params)
    emit:
        hmm_params_file = run_gnomon_training.out.hmm_params_file
}


process run_gnomon_training {
    input:
        path genome_asn, stageAs: 'indexed/*'
        path models_file
        val max_intron1
        val parameters
    output:
        path ('output/hmm_params.asn'), emit: 'hmm_params_file'

    script:
    // Substitute -maxintron with correct value coming from max_intron
    def dummy = ["dummy" : "-maxintron ${max_intron1}"]
    parameters = merge_params(parameters, dummy, "dummy")
    """
    mkdir -p output
    lds2_indexer -source indexed -db ./indexed_lds
    gnomon_training ${parameters} -nogenbank -lds2 ./indexed_lds  -input ${models_file} -out output/hmm_params.asn 
    """
    stub:
    def dummy = ["dummy" : "-maxintron ${max_intron1}"]
    parameters = merge_params(parameters, dummy, "dummy")
    println("Gnomon training parameters: ${parameters}")
    """
    mkdir -p output
    touch  output/hmm_params.asn
    """
}