nf-core
diff --git a/modules/nf-core/gcta/makegrmpart/main.nf b/modules/nf-core/gcta/makegrmpart/main.nf
Lines changed: 15 additions & 15 deletions
diff --git a/modules/nf-core/gcta/makegrmpart/meta.yml b/modules/nf-core/gcta/makegrmpart/meta.yml
Lines changed: 48 additions & 30 deletions
diff --git a/modules/nf-core/gcta/makegrmpart/tests/main.nf.test b/modules/nf-core/gcta/makegrmpart/tests/main.nf.test
Lines changed: 76 additions & 12 deletions
@@ -1,25 +1,25 @@
 process GCTA_MAKEGRMPART {
-    tag "part ${meta.part_gcta_job} of ${meta.nparts_gcta} (${meta.id})"
+    tag "${meta.id}: part ${part_gcta_job} of ${nparts_gcta}"
     label 'process_medium'
     conda "${moduleDir}/environment.yml"
-    container "${ workflow.containerEngine == 'singularity' && !task.ext.singularity_pull_docker_container ?
-        'docker://community.wave.seqera.io/library/gcta:1.94.1--9bc35dc424fcf6e9' :
-        'community.wave.seqera.io/library/gcta:1.94.1--9bc35dc424fcf6e9' }"
+    container "${workflow.containerEngine == 'singularity' && !task.ext.singularity_pull_docker_container
+        ? 'https://community-cr-prod.seqera.io/docker/registry/v2/blobs/sha256/46/46b0d05f0daa47561d87d2a9cac5e51edc2c78e26f1bbab439c688386241a274/data'
+        : 'community.wave.seqera.io/library/gcta:1.94.1--9bc35dc424fcf6e9'}"
 
     input:
-    tuple val(meta), path(mfile), path(bed_pgen), path(bim_pvar), path(fam_psam)
+    tuple val(meta), val(nparts_gcta), val(part_gcta_job), path(mfile), path(bed_pgen), path(bim_pvar), path(fam_psam)
     tuple val(meta2), path(snp_group_file)
 
     output:
-    tuple val(meta), path("*.part_${meta.nparts_gcta}_${meta.part_gcta_job}.grm.id"), path("*.part_${meta.nparts_gcta}_${meta.part_gcta_job}.grm.bin"), path("*.part_${meta.nparts_gcta}_${meta.part_gcta_job}.grm.N.bin"), emit: grm_files
-    tuple val("${task.process}"), val("gcta"), eval("gcta --version 2>&1 | grep 'version v' | tr -s ' ' | cut -d' ' -f3 | sed 's/^v//'"), emit: versions_gcta, topic: versions
+    tuple val(meta), path("*.part_${nparts}_${part}.grm.*"), val(nparts_gcta), val(part_gcta_job), emit: grm_files
+    tuple val("${task.process}"), val("gcta"), eval("gcta --version | sed -En 's/^[*] version v([0-9.]*).*/\\1/p'"), emit: versions_gcta, topic: versions
 
     when:
     task.ext.when == null || task.ext.when
 
     script:
-    def part_gcta_job = meta.part_gcta_job
-    def nparts_gcta = meta.nparts_gcta
+    nparts = nparts_gcta ?: 1
+    part = part_gcta_job ?: 1
     def extract_cmd = snp_group_file ? "--extract ${snp_group_file}" : ''
     def extra_args = task.ext.args ?: ''
     def prefix = task.ext.prefix ?: "${meta.id}"
@@ -28,21 +28,21 @@ process GCTA_MAKEGRMPART {
     def multi_file_flag = genotype_extension == 'pgen' ? '--mpfile' : '--mbfile'
 
     """
-
     gcta \\
         ${multi_file_flag} ${mfile} \\
-        --make-grm-part ${nparts_gcta} ${part_gcta_job} \\
+        --make-grm-part ${nparts} ${part} \\
         ${extract_cmd} \\
-        --maf 0.01 \\
         --thread-num ${task.cpus} \\
         --out ${prefix} ${extra_args}
     """
 
     stub:
+    nparts = nparts_gcta ?: 1
+    part = part_gcta_job ?: 1
     def prefix = task.ext.prefix ?: "${meta.id}"
     """
-    touch ${prefix}.part_${meta.nparts_gcta}_${meta.part_gcta_job}.grm.id
-    touch ${prefix}.part_${meta.nparts_gcta}_${meta.part_gcta_job}.grm.bin
-    touch ${prefix}.part_${meta.nparts_gcta}_${meta.part_gcta_job}.grm.N.bin
+    touch ${prefix}.part_${nparts}_${part}.grm.id
+    touch ${prefix}.part_${nparts}_${part}.grm.bin
+    touch ${prefix}.part_${nparts}_${part}.grm.N.bin
     """
 }
@@ -3,51 +3,70 @@ name: "gcta_makegrmpart"
 description: Compute one partition of a GCTA genetic relationship matrix
 keywords:
   - gcta
+  - genome-wide complex trait analysis
   - grm
+  - genetic relationship matrix
   - genetics
 tools:
   - "gcta":
       description: "GCTA is a tool for genome-wide complex trait analysis."
       homepage: "https://yanglab.westlake.edu.cn/software/gcta/"
       documentation: "https://yanglab.westlake.edu.cn/software/gcta/static/gcta_doc_latest.pdf"
       tool_dev_url: "https://github.com/jianyangqt/gcta"
-      licence: ["GPL-3.0-only"]
+      licence:
+        - "GPL-3.0-only"
+      identifier: biotools:gcta
 input:
   - - meta:
         type: map
         description: |
-          Groovy Map containing GRM-partition job metadata
-          e.g. `[ id:'gcta_grm', part_gcta_job:1, nparts_gcta:2 ]`
+          Groovy Map containing GRM-partition sample metadata
+          e.g. `[ id:'gcta_grm' ]`
+    - nparts_gcta:
+        type: integer
+        description: Total number of GRM partitions requested via
+          `--make-grm-part`; defaults to `1` when `null`
+        default: 1
+    - part_gcta_job:
+        type: integer
+        description: One-based index of the GRM partition to compute via
+          `--make-grm-part`; defaults to `1` when `null`
+        default: 1
     - mfile:
         type: file
-        description: GCTA multi-input manifest consumed by `--mbfile` or `--mpfile`
+        description: GCTA multi-input manifest consumed by `--mbfile` or
+          `--mpfile`
         pattern: "*.{mbfile,mpfile,txt}"
         ontologies:
           - edam: "http://edamontology.org/format_2330"
     - bed_pgen:
         type: file
-        description: Collection of PLINK primary genotype files referenced by the multi-input manifest
+        description: Collection of PLINK primary genotype files referenced by the
+          multi-input manifest
         pattern: "*.{bed,pgen}"
         ontologies:
           - edam: "http://edamontology.org/format_3003"
     - bim_pvar:
         type: file
-        description: Collection of PLINK variant metadata files referenced by the multi-input manifest
+        description: Collection of PLINK variant metadata files referenced by the
+          multi-input manifest
         pattern: "*.{bim,pvar}"
         ontologies: []
     - fam_psam:
         type: file
-        description: Collection of PLINK sample metadata files referenced by the multi-input manifest
+        description: Collection of PLINK sample metadata files referenced by the
+          multi-input manifest
         pattern: "*.{fam,psam}"
         ontologies: []
   - - meta2:
         type: map
         description: |
           Groovy Map containing SNP-selection metadata
-          e.g. `[ id:'snp_group1', snp_group:1 ]`
+          e.g. `[ id:'snp_group1' ]`
     - snp_group_file:
         type: file
-        description: Optional SNP extraction file passed to `--extract`; provide `[]` when absent
+        description: Optional SNP extraction file passed to `--extract`; provide
+          `[]` when absent
         pattern: "*.{txt,list}"
         ontologies:
           - edam: "http://edamontology.org/format_2330"
@@ -56,31 +75,30 @@ output:
     - - meta:
           type: map
           description: |
-            Groovy Map containing GRM-partition job metadata
-            e.g. `[ id:'gcta_grm', part_gcta_job:1, nparts_gcta:2 ]`
-      - "*.part_${meta.nparts_gcta}_${meta.part_gcta_job}.grm.id":
+            Groovy Map containing GRM-partition sample metadata
+            e.g. `[ id:'gcta_grm' ]`
+      - "*.part_${nparts}_${part}.grm.*":
           type: file
-          description: Partitioned GRM ID file
-          pattern: "*.part_${meta.nparts_gcta}_${meta.part_gcta_job}.grm.id"
-          ontologies: []
-      - "*.part_${meta.nparts_gcta}_${meta.part_gcta_job}.grm.bin":
-          type: file
-          description: Partitioned GRM binary matrix file
-          pattern: "*.part_${meta.nparts_gcta}_${meta.part_gcta_job}.grm.bin"
-          ontologies: []
-      - "*.part_${meta.nparts_gcta}_${meta.part_gcta_job}.grm.N.bin":
-          type: file
-          description: Partitioned GRM sample-count matrix file
-          pattern: "*.part_${meta.nparts_gcta}_${meta.part_gcta_job}.grm.N.bin"
+          description: Partitioned GRM output files, including ID, binary matrix,
+            and sample-count matrix files
+          pattern: "*.part_${nparts}_${part}.grm.*"
           ontologies: []
+      - nparts_gcta:
+          type: integer
+          description: Total number of GRM partitions requested via
+            `--make-grm-part`
+      - part_gcta_job:
+          type: integer
+          description: One-based index of the GRM partition computed via
+            `--make-grm-part`
   versions_gcta:
-    - - "${task.process}":
+    - - ${task.process}:
           type: string
           description: The process the versions were collected from
-      - "gcta":
+      - gcta:
           type: string
           description: The tool name
-      - "gcta --version 2>&1 | grep 'version v' | tr -s ' ' | cut -d' ' -f3 | sed 's/^v//'":
+      - "gcta --version | sed -En 's/^[*] version v([0-9.]*).*/\\1/p'":
           type: eval
           description: The command used to generate the version of the tool
 topics:
@@ -91,10 +109,10 @@ topics:
       - gcta:
           type: string
           description: The tool name
-      - gcta --version 2>&1 | grep 'version v' | tr -s ' ' | cut -d' ' -f3 | sed 's/^v//':
+      - "gcta --version | sed -En 's/^[*] version v([0-9.]*).*/\\1/p'":
           type: eval
           description: The command used to generate the version of the tool
 authors:
-  - "@andongni"
+  - "@lyh970817"
 maintainers:
-  - "@andongni"
+  - "@lyh970817"
@@ -10,15 +10,15 @@ nextflow_process {
     tag "gcta/makegrmpart"
 
     test("homo_sapiens popgen - plink2") {
-        config "./nextflow.config"
-
         when {
             process {
                 """
                 file('gcta_grm.mpfile').text = 'plink_simulated plink_simulated.pgen plink_simulated.psam plink_simulated.pvar\\n'
 
                 input[0] = [
-                    [ id:'gcta_grm', part_gcta_job:1, nparts_gcta:2 ],
+                    [ id:'gcta_grm' ],
+                    2,
+                    1,
                     file('gcta_grm.mpfile'),
                     [
                         file(params.modules_testdata_base_path + 'genomics/homo_sapiens/popgen/plink_simulated.pgen', checkIfExists: true)
@@ -40,6 +40,10 @@ nextflow_process {
                 { assert process.success },
                 { assert process.out.grm_files.size() == 1 },
                 { assert process.out.grm_files.get(0).get(0).id == 'gcta_grm' },
+                { assert process.out.grm_files.get(0).get(0).keySet() == ['id'] as Set },
+                { assert process.out.grm_files.get(0).get(1).size() == 3 },
+                { assert process.out.grm_files.get(0).get(2) == 2 },
+                { assert process.out.grm_files.get(0).get(3) == 1 },
                 {
                     assert snapshot(
                         process.out.grm_files,
@@ -51,15 +55,15 @@ nextflow_process {
     }
 
     test("homo_sapiens popgen - plink1") {
-        config "./nextflow.config"
-
         when {
             process {
                 """
                 file('gcta_grm.mbfile').text = 'plink_simulated\\n'
 
                 input[0] = [
-                    [ id:'gcta_grm_bed', part_gcta_job:1, nparts_gcta:2 ],
+                    [ id:'gcta_grm_bed' ],
+                    2,
+                    1,
                     file('gcta_grm.mbfile'),
                     [
                         file(params.modules_testdata_base_path + 'genomics/homo_sapiens/popgen/plink_simulated.bed', checkIfExists: true)
@@ -81,6 +85,10 @@ nextflow_process {
                 { assert process.success },
                 { assert process.out.grm_files.size() == 1 },
                 { assert process.out.grm_files.get(0).get(0).id == 'gcta_grm_bed' },
+                { assert process.out.grm_files.get(0).get(0).keySet() == ['id'] as Set },
+                { assert process.out.grm_files.get(0).get(1).size() == 3 },
+                { assert process.out.grm_files.get(0).get(2) == 2 },
+                { assert process.out.grm_files.get(0).get(3) == 1 },
                 {
                     assert snapshot(
                         process.out.grm_files,
@@ -92,8 +100,6 @@ nextflow_process {
     }
 
     test("homo_sapiens popgen - plink1 - extract snp group") {
-        config "./nextflow.config"
-
         when {
             process {
                 """
@@ -107,7 +113,9 @@ nextflow_process {
                 file('snp_group_extract.txt').text = extractSnps
 
                 input[0] = [
-                    [ id:'gcta_grm_bed_extract', part_gcta_job:1, nparts_gcta:2 ],
+                    [ id:'gcta_grm_bed_extract' ],
+                    2,
+                    1,
                     file('gcta_grm_extract.mbfile'),
                     [
                         file(params.modules_testdata_base_path + 'genomics/homo_sapiens/popgen/plink_simulated.bed', checkIfExists: true)
@@ -119,7 +127,7 @@ nextflow_process {
                         file(params.modules_testdata_base_path + 'genomics/homo_sapiens/popgen/plink_simulated.fam', checkIfExists: true)
                     ]
                 ]
-                input[1] = [[ id:'snp_group_extract', snp_group:1 ], file('snp_group_extract.txt')]
+                input[1] = [[ id:'snp_group_extract' ], file('snp_group_extract.txt')]
                 """
             }
         }
@@ -129,6 +137,10 @@ nextflow_process {
                 { assert process.success },
                 { assert process.out.grm_files.size() == 1 },
                 { assert process.out.grm_files.get(0).get(0).id == 'gcta_grm_bed_extract' },
+                { assert process.out.grm_files.get(0).get(0).keySet() == ['id'] as Set },
+                { assert process.out.grm_files.get(0).get(1).size() == 3 },
+                { assert process.out.grm_files.get(0).get(2) == 2 },
+                { assert process.out.grm_files.get(0).get(3) == 1 },
                 {
                     assert snapshot(
                         process.out.grm_files,
@@ -139,17 +151,69 @@ nextflow_process {
         }
     }
 
+    test("homo_sapiens popgen - plink1 - default partition values") { // null partition inputs: the process should fall back to `--make-grm-part 1 1`
+        when {
+            process {
+                """
+                file('gcta_grm_default.mbfile').text = 'plink_simulated\\n'
+
+                input[0] = [
+                    [ id:'gcta_grm_bed_default' ],
+                    null,
+                    null,
+                    file('gcta_grm_default.mbfile'),
+                    [
+                        file(params.modules_testdata_base_path + 'genomics/homo_sapiens/popgen/plink_simulated.bed', checkIfExists: true)
+                    ],
+                    [
+                        file(params.modules_testdata_base_path + 'genomics/homo_sapiens/popgen/plink_simulated.bim', checkIfExists: true)
+                    ],
+                    [
+                        file(params.modules_testdata_base_path + 'genomics/homo_sapiens/popgen/plink_simulated.fam', checkIfExists: true)
+                    ]
+                ]
+                input[1] = [[ id:'snp_group0' ], []]
+                """
+            }
+        }
+
+        then {
+            assertAll(
+                { assert process.success },
+                { assert process.out.grm_files.size() == 1 },
+                { assert process.out.grm_files.get(0).get(0).id == 'gcta_grm_bed_default' },
+                { assert process.out.grm_files.get(0).get(0).keySet() == ['id'] as Set }, // meta must carry only `id`, no partition keys
+                { assert process.out.grm_files.get(0).get(1).size() == 3 }, // the .grm.id, .grm.bin and .grm.N.bin files
+                { // compare file basenames only (last '/'-separated path component); `part_1_1` shows the 1/1 default was used
+                    assert process.out.grm_files.get(0).get(1).collect { it.toString().tokenize('/').last() }.toSet() == [
+                        'gcta_grm_bed_default.part_1_1.grm.id',
+                        'gcta_grm_bed_default.part_1_1.grm.bin',
+                        'gcta_grm_bed_default.part_1_1.grm.N.bin'
+                    ] as Set
+                },
+                { assert process.out.grm_files.get(0).get(2) == null }, // nparts_gcta is emitted as received (null), not as the defaulted 1
+                { assert process.out.grm_files.get(0).get(3) == null }, // part_gcta_job is likewise emitted as received (null)
+                {
+                    assert snapshot( // only outputs whose name starts with 'versions' are snapshotted here
+                        process.out.findAll { key, val -> key.startsWith('versions') }
+                    ).match()
+                }
+            )
+        }
+    }
+
     test("homo_sapiens popgen - plink1 - stub") {
         options "-stub"
-        config "./nextflow.config"
 
         when {
             process {
                 """
                 file('gcta_grm.mbfile').text = 'plink_simulated\\n'
 
                 input[0] = [
-                    [ id:'gcta_grm_bed', part_gcta_job:1, nparts_gcta:2 ],
+                    [ id:'gcta_grm_bed' ],
+                    2,
+                    1,
                     file('gcta_grm.mbfile'),
                     [
                         file(params.modules_testdata_base_path + 'genomics/homo_sapiens/popgen/plink_simulated.bed', checkIfExists: true)