|
| 1 | +# yaml-language-server: $schema=https://raw.githubusercontent.com/nf-core/modules/master/modules/meta-schema.json |
| 2 | +name: "regenie_splitl0" |
| 3 | +description: Split REGENIE step 1 level-0 ridge-regression blocks into parallel jobs |
| 4 | +keywords: |
| 5 | + - regenie |
| 6 | + - gwas |
| 7 | + - association |
| 8 | + - genomics |
| 9 | + - parallel |
| 10 | +tools: |
| 11 | + - "regenie": |
| 12 | + description: "Regenie is a C++ program for whole genome regression modelling of large genome-wide association studies (GWAS)." |
| 13 | + homepage: "https://rgcgithub.github.io/regenie/" |
| 14 | + documentation: "https://rgcgithub.github.io/regenie/options/" |
| 15 | + tool_dev_url: "https://github.com/rgcgithub/regenie" |
| 16 | + doi: "10.1038/s41588-021-00870-7" |
| 17 | + licence: ["MIT"] |
| 18 | + identifier: "biotools:regenie" |
| 19 | + |
| 20 | +input: |
| 21 | + - - meta: |
| 22 | + type: map |
| 23 | + description: | |
| 24 | + Groovy Map containing genotype information |
| 25 | + Keep only the genotype analysis identifier in this map |
| 26 | + REGENIE consumes the staged basename of `plink_genotype_file` as the `--bed` or `--pgen` prefix, so the `.bed/.bim/.fam` or `.pgen/.pvar/.psam` files must share one basename |
| 27 | + e.g. `[ id:'cohort' ]` |
| 28 | + - plink_genotype_file: |
| 29 | + type: file |
| 30 | + description: PLINK primary genotype file in BED or PGEN format |
| 31 | + pattern: "*.{bed,pgen}" |
| 32 | + ontologies: |
| 33 | + - edam: "http://edamontology.org/format_3003" # BED |
| 34 | + - plink_variant_file: |
| 35 | + type: file |
| 36 | + description: PLINK variant metadata file in BIM or PVAR format |
| 37 | + pattern: "*.{bim,pvar,zst}" |
| 38 | + ontologies: [] |
| 39 | + - plink_sample_file: |
| 40 | + type: file |
| 41 | + description: PLINK sample metadata file in FAM or PSAM format |
| 42 | + pattern: "*.{fam,psam}" |
| 43 | + ontologies: [] |
| 44 | + - - meta2: |
| 45 | + type: map |
| 46 | + description: | |
| 47 | + Groovy Map containing genotype/sample information associated with the phenotype file input |
| 48 | + Use the same phenotype file and phenotype-selection arguments for all `regenie/splitl0`, `regenie/runl0`, and `regenie/runl1` jobs in the same chunked step 1 analysis |
| 49 | + e.g. `[ id:'plink_simulated' ]` |
| 50 | + - pheno: |
| 51 | + type: file |
| 52 | + description: Phenotype file passed to `--phenoFile` |
| 53 | + pattern: "*.{phe,pheno,txt,tsv}" |
| 54 | + ontologies: |
| 55 | + - edam: "http://edamontology.org/format_3475" # TSV |
| 56 | + - - meta3: |
| 57 | + type: map |
| 58 | + description: | |
| 59 | + Groovy Map containing genotype/sample information associated with the covariate input |
| 60 | + Use compatible covariate inputs for all stages in the same chunked step 1 analysis |
| 61 | + e.g. `[ id:'plink_simulated' ]` |
| 62 | + - covar: |
| 63 | + type: file |
| 64 | + optional: true |
| 65 | + description: Optional covariate file passed to `--covarFile`; provide `[]` when absent |
| 66 | + pattern: "*.{covar,cov,txt,tsv}" |
| 67 | + ontologies: |
| 68 | + - edam: "http://edamontology.org/format_3475" # TSV |
| 69 | + - bsize: |
| 70 | + type: integer |
| 71 | + description: Optional block size passed to `--bsize`; pass `[]` to use the module default of `1000` |
| 72 | + - n_jobs: |
| 73 | + type: integer |
| 74 | + description: Number of level-0 jobs requested with `--split-l0` |
| 75 | + |
| 76 | +output: |
| 77 | + master: |
| 78 | + - - meta: |
| 79 | + type: map |
| 80 | + description: | |
| 81 | + Groovy Map containing genotype/sample information |
| 82 | + e.g. `[ id:'plink_simulated' ]` |
| 83 | + - "*.master": |
| 84 | + type: file |
| 85 | + description: REGENIE split level-0 master file |
| 86 | + pattern: "*.master" |
| 87 | + ontologies: |
| 88 | + - edam: "http://edamontology.org/format_2330" # Text |
| 89 | + snplists: |
| 90 | + - - meta: |
| 91 | + type: map |
| 92 | + description: | |
| 93 | + Groovy Map containing genotype/sample information |
| 94 | + e.g. `[ id:'plink_simulated' ]` |
| 95 | + - "*_job*.snplist": |
| 96 | + type: file |
| 97 | + description: REGENIE per-job variant list files referenced by the master file |
| 98 | + pattern: "*_job*.snplist" |
| 99 | + ontologies: |
| 100 | + - edam: "http://edamontology.org/format_2330" # Text |
| 101 | + log: |
| 102 | + - - meta: |
| 103 | + type: map |
| 104 | + description: | |
| 105 | + Groovy Map containing genotype information |
| 106 | + e.g. `[ id:'plink_simulated' ]` |
| 107 | + - "*.log": |
| 108 | + type: file |
| 109 | + description: REGENIE split level-0 log file |
| 110 | + pattern: "*.log" |
| 111 | + ontologies: |
| 112 | + - edam: "http://edamontology.org/format_2330" # Text |
| 113 | + versions_regenie: |
| 114 | + - - "${task.process}": |
| 115 | + type: string |
| 116 | + description: The process the versions were collected from |
| 117 | + - "regenie": |
| 118 | + type: string |
| 119 | + description: The tool name |
| 120 | + - 'regenie --version 2>&1 | sed -n "1{s/^v//;s/\.gz$//;p}"': |
| 121 | + type: eval |
| 122 | + description: The command used to generate the version of the tool |
| 123 | + |
| 124 | +topics: |
| 125 | + versions: |
| 126 | + - - ${task.process}: |
| 127 | + type: string |
| 128 | + description: The process the versions were collected from |
| 129 | + - regenie: |
| 130 | + type: string |
| 131 | + description: The tool name |
| 132 | + - 'regenie --version 2>&1 | sed -n "1{s/^v//;s/\.gz$//;p}"': |
| 133 | + type: eval |
| 134 | + description: The command used to generate the version of the tool |
| 135 | + |
| 136 | +notes: | |
| 137 | + `task.ext.args` is passed directly to REGENIE and can be used for stage-consistent options such as `--phenoColList`, `--bt`, `--loocv`, or `--keep-l0`. |
| 138 | + The same phenotype file, phenotype-selection arguments, trait mode arguments such as `--bt`, and compatible genotype/covariate inputs must be used across `regenie/splitl0`, every matching `regenie/runl0` job, and `regenie/runl1`. |
| 139 | +authors: |
| 140 | + - "@lyh970817" |
| 141 | +maintainers: |
| 142 | + - "@lyh970817" |
| 143 | +containers: |
| 144 | + conda: |
| 145 | + linux_amd64: |
| 146 | + lock_file: "modules/nf-core/regenie/splitl0/.conda-lock/linux_amd64-bd-5d361f9fcb2f85cf_1.txt" |
| 147 | + docker: |
| 148 | + linux_amd64: |
| 149 | + build_id: "bd-5d361f9fcb2f85cf_1" |
| 150 | + name: "community.wave.seqera.io/library/regenie:4.1.2--5d361f9fcb2f85cf" |
| 151 | + scanId: "sc-cc9eb5ed5eb381dd_2" |
| 152 | + singularity: |
| 153 | + linux_amd64: |
| 154 | + build_id: "bd-7c121fb4ecd57890_1" |
| 155 | + name: "oras://community.wave.seqera.io/library/regenie:4.1.2--7c121fb4ecd57890" |
| 156 | + https: "https://community-cr-prod.seqera.io/docker/registry/v2/blobs/sha256/7a/7a05bf71ea09adc5ebf9f0c656c9b326c0f16ba8e4966914972e58313469a466/data" |
0 commit comments