nf-core
diff --git a/‎modules/nf-core/gcta/makegrmpart/environment.yml‎
Lines changed: 7 additions & 0 deletions b/‎modules/nf-core/gcta/makegrmpart/environment.yml‎
Lines changed: 7 additions & 0 deletions
diff --git a/‎modules/nf-core/gcta/makegrmpart/main.nf‎
Lines changed: 48 additions & 0 deletions b/‎modules/nf-core/gcta/makegrmpart/main.nf‎
Lines changed: 48 additions & 0 deletions
diff --git a/‎modules/nf-core/gcta/makegrmpart/meta.yml‎
Lines changed: 118 additions & 0 deletions b/‎modules/nf-core/gcta/makegrmpart/meta.yml‎
Lines changed: 118 additions & 0 deletions
@@ -0,0 +1,7 @@
+---
+# yaml-language-server: $schema=https://raw.githubusercontent.com/nf-core/modules/master/modules/environment-schema.json
+# Conda environment definition for the GCTA_MAKEGRMPART module.
+channels:
+  # conda-forge is listed ahead of bioconda.
+  - conda-forge
+  - bioconda
+dependencies:
+  # GCTA is pinned to an exact release; the container images referenced in
+  # main.nf are tagged with the same 1.94.1 version.
+  - bioconda::gcta=1.94.1
@@ -0,0 +1,48 @@
+// Computes one partition of a GCTA genetic relationship matrix (GRM) by
+// running `gcta --make-grm-part` against a multi-file genotype manifest.
+//
+// Inputs:
+//   meta, nparts_gcta, part_gcta_job - sample metadata, total partition count
+//       and the partition to compute (both numbers fall back to 1 when unset)
+//   mfile                            - manifest handed to --mbfile / --mpfile
+//   bed_pgen, bim_pvar, fam_psam     - genotype file sets; only bed_pgen is
+//       inspected (to pick the manifest flag), the others are staged but not
+//       referenced on the command line
+//   meta2, snp_group_file            - optional SNP list passed to --extract
+// Outputs:
+//   grm_files     - the partition's *.grm.* files plus the partition inputs
+//   versions_gcta - process name, tool name and the parsed GCTA version
+process GCTA_MAKEGRMPART {
+    // Show the effective partition numbers rather than `null` when the
+    // optional inputs are unset.
+    tag "${meta.id}: part ${part_gcta_job ?: 1} of ${nparts_gcta ?: 1}"
+    label 'process_medium'
+    conda "${moduleDir}/environment.yml"
+    container "${workflow.containerEngine == 'singularity' && !task.ext.singularity_pull_docker_container
+        ? 'https://community-cr-prod.seqera.io/docker/registry/v2/blobs/sha256/46/46b0d05f0daa47561d87d2a9cac5e51edc2c78e26f1bbab439c688386241a274/data'
+        : 'community.wave.seqera.io/library/gcta:1.94.1--9bc35dc424fcf6e9'}"
+
+    input:
+    tuple val(meta), val(nparts_gcta), val(part_gcta_job), path(mfile), path(bed_pgen), path(bim_pvar), path(fam_psam)
+    tuple val(meta2), path(snp_group_file)
+
+    output:
+    tuple val(meta), path("*.part_${nparts}_${part}.grm.*"), val(nparts_gcta), val(part_gcta_job), emit: grm_files
+    tuple val("${task.process}"), val("gcta"), eval("gcta --version | sed -En 's/^[*] version v([0-9.]*).*/\\1/p'"), emit: versions_gcta, topic: versions
+
+    when:
+    task.ext.when == null || task.ext.when
+
+    script:
+    // `nparts` and `part` are assigned without `def` on purpose: the
+    // `grm_files` output glob interpolates them, and `def`-scoped script
+    // variables are not expected to be visible to the output block.
+    nparts = nparts_gcta ?: 1
+    def part_index = part_gcta_job ?: 1
+    // GCTA left-pads the partition index with zeros to the width of the
+    // partition count in its output names (e.g. `.part_250_001.grm.bin`), so
+    // the label used by the output glob must be padded the same way. The
+    // unpadded index is still what gets passed on the command line.
+    part = part_index.toString().padLeft(nparts.toString().length(), '0')
+    def extract_cmd = snp_group_file ? "--extract ${snp_group_file}" : ''
+    def extra_args = task.ext.args ?: ''
+    def prefix = task.ext.prefix ?: "${meta.id}"
+    // A single staged file is a bare path, several are a list; normalise to a
+    // list and use the first file's extension to choose the manifest flag.
+    def genotype_files = bed_pgen instanceof List ? bed_pgen : [bed_pgen]
+    def genotype_extension = genotype_files[0].name.tokenize('.').last()
+    def multi_file_flag = genotype_extension == 'pgen' ? '--mpfile' : '--mbfile'
+
+    """
+    gcta \\
+        ${multi_file_flag} ${mfile} \\
+        --make-grm-part ${nparts} ${part_index} \\
+        ${extract_cmd} \\
+        --thread-num ${task.cpus} \\
+        --out ${prefix} ${extra_args}
+    """
+
+    stub:
+    // Same naming rules as the real run, so the output glob matches the
+    // placeholder files created below.
+    nparts = nparts_gcta ?: 1
+    part = (part_gcta_job ?: 1).toString().padLeft(nparts.toString().length(), '0')
+    def prefix = task.ext.prefix ?: "${meta.id}"
+    """
+    touch ${prefix}.part_${nparts}_${part}.grm.id
+    touch ${prefix}.part_${nparts}_${part}.grm.bin
+    touch ${prefix}.part_${nparts}_${part}.grm.N.bin
+    """
+}
@@ -0,0 +1,118 @@
+# yaml-language-server: $schema=https://raw.githubusercontent.com/nf-core/modules/master/modules/meta-schema.json
+# Module identity and the keywords it is indexed under.
+name: gcta_makegrmpart
+description: Compute one partition of a GCTA genetic relationship matrix
+keywords:
+  - gcta
+  - genome-wide complex trait analysis
+  - grm
+  - genetic relationship matrix
+  - genetics
+# The single upstream tool wrapped by this module.
+tools:
+  - gcta:
+      description: GCTA is a tool for genome-wide complex trait analysis.
+      homepage: https://yanglab.westlake.edu.cn/software/gcta/
+      documentation: https://yanglab.westlake.edu.cn/software/gcta/static/gcta_doc_latest.pdf
+      tool_dev_url: https://github.com/jianyangqt/gcta
+      licence:
+        - GPL-3.0-only
+      identifier: biotools:gcta
+# Input channels, in the order the process declares them.
+input:
+  # Channel 1: partition coordinates together with the staged genotype set.
+  - - meta:
+        type: map
+        description: |
+          Groovy Map containing GRM-partition sample metadata
+          e.g. `[ id:'gcta_grm' ]`
+    - nparts_gcta:
+        type: integer
+        description: >-
+          Total number of GRM partitions requested via
+          `--make-grm-part`; defaults to `1` when `null`
+        default: 1
+    - part_gcta_job:
+        type: integer
+        description: >-
+          One-based index of the GRM partition to compute via
+          `--make-grm-part`; defaults to `1` when `null`
+        default: 1
+    - mfile:
+        type: file
+        description: >-
+          GCTA multi-input manifest consumed by `--mbfile` or
+          `--mpfile`
+        pattern: "*.{mbfile,mpfile,txt}"
+        ontologies:
+          - edam: "http://edamontology.org/format_2330"
+    - bed_pgen:
+        type: file
+        description: >-
+          Collection of PLINK primary genotype files referenced by the
+          multi-input manifest
+        pattern: "*.{bed,pgen}"
+        # No EDAM term is attached: format_3003 denotes the genome-annotation
+        # BED track format, which is unrelated to PLINK .bed/.pgen genotype
+        # files despite the shared extension.
+        ontologies: []
+    - bim_pvar:
+        type: file
+        description: >-
+          Collection of PLINK variant metadata files referenced by the
+          multi-input manifest
+        pattern: "*.{bim,pvar}"
+        ontologies: []
+    - fam_psam:
+        type: file
+        description: >-
+          Collection of PLINK sample metadata files referenced by the
+          multi-input manifest
+        pattern: "*.{fam,psam}"
+        ontologies: []
+  # Channel 2: optional SNP subset.
+  - - meta2:
+        type: map
+        description: |
+          Groovy Map containing SNP-selection metadata
+          e.g. `[ id:'snp_group1' ]`
+    - snp_group_file:
+        type: file
+        description: >-
+          Optional SNP extraction file passed to `--extract`; provide
+          `[]` when absent
+        pattern: "*.{txt,list}"
+        ontologies:
+          - edam: "http://edamontology.org/format_2330"
+# Output channels, keyed by the `emit:` names used in main.nf.
+output:
+  # GRM partition files, emitted alongside the partition inputs.
+  grm_files:
+    - - meta:
+          type: map
+          description: |
+            Groovy Map containing GRM-partition sample metadata
+            e.g. `[ id:'gcta_grm' ]`
+      - "*.part_${nparts}_${part}.grm.*":
+          type: file
+          description: >-
+            Partitioned GRM output files, including ID, binary matrix,
+            and sample-count matrix files
+          pattern: "*.part_${nparts}_${part}.grm.*"
+          ontologies: []
+      - nparts_gcta:
+          type: integer
+          description: >-
+            Total number of GRM partitions requested via
+            `--make-grm-part`
+      - part_gcta_job:
+          type: integer
+          description: >-
+            One-based index of the GRM partition computed via
+            `--make-grm-part`
+  # Version tuple; the keys below repeat the expressions declared in main.nf.
+  versions_gcta:
+    - - ${task.process}:
+          type: string
+          description: The process the versions were collected from
+      - gcta:
+          type: string
+          description: The tool name
+      - "gcta --version | sed -En 's/^[*] version v([0-9.]*).*/\\1/p'":
+          type: eval
+          description: The command used to generate the version of the tool
+# Topic channels the module publishes to. The `versions` entry repeats the
+# three elements of the `versions_gcta` output tuple declared above.
+topics:
+  versions:
+    - - ${task.process}:
+          type: string
+          description: The process the versions were collected from
+      - gcta:
+          type: string
+          description: The tool name
+      # Key is the version-extraction shell command itself, written as a
+      # double-quoted scalar.
+      - "gcta --version | sed -En 's/^[*] version v([0-9.]*).*/\\1/p'":
+          type: eval
+          description: The command used to generate the version of the tool
+# GitHub handles of the module's authors.
+authors:
+  - "@lyh970817"
+# GitHub handles of the module's maintainers.
+maintainers:
+  - "@lyh970817"