@@ -143,9 +143,9 @@ rule fetch_inflate_ncbi_dataset_package:
143143 --filename {params.compressed_package_zip} \
144144 {params.api_key} \
145145 {params.gateway} \
146- && {params.unzip} \
147- -o {params.compressed_package_zip} \
148- -d results
146+ && {params.unzip} \
147+ -o {params.compressed_package_zip} \
148+ -d results
149149 fi
150150 """
151151
@@ -163,7 +163,7 @@ rule format_ncbi_dataset_report:
163163 --config-file {input.config} \
164164 --input {input.dataset_report} \
165165 --output {output.ncbi_dataset_tsv}
166- echo "Processed metadata file lines: $(wc -l < {output.ncbi_dataset_tsv})"
166+ echo "Processed metadata file lines: $(wc -l <{output.ncbi_dataset_tsv})"
167167 echo "Hash of output: $(md5sum {output.ncbi_dataset_tsv})"
168168 echo "Hash of sorted output: $(md5sum <(sort {output.ncbi_dataset_tsv}))"
169169 """
@@ -178,7 +178,7 @@ rule format_ncbi_dataset_sequences:
178178 """
179179 seqkit seq -w0 -i \
180180 {input.dataset_sequences} \
181- > {output.ncbi_dataset_sequences}
181+ >{output.ncbi_dataset_sequences}
182182 echo "Stats of NCBI dataset sequences: $(seqkit stats {output.ncbi_dataset_sequences})"
183183 echo "seqkit hash of NCBI dataset sequences: $(seqkit sum -a -s {output.ncbi_dataset_sequences})"
184184 echo "Plain hash of NCBI dataset sequences: $(md5sum {output.ncbi_dataset_sequences})"
@@ -198,9 +198,9 @@ if CHECK_ENA_DEPOSITION:
198198 shell :
199199 """
200200 python {input.script} \
201- --output-insdc-accessions {output.exclude_insdc_accessions} \
202- --log-level {params.log_level} \
203- --config-file {input.config} \
201+ --output-insdc-accessions {output.exclude_insdc_accessions} \
202+ --log-level {params.log_level} \
203+ --config-file {input.config}
204204 """
205205
206206 rule filter_out_loculus_depositions :
@@ -216,11 +216,11 @@ if CHECK_ENA_DEPOSITION:
216216 shell :
217217 """
218218 python {input.script} \
219- --input-metadata-tsv {input.ncbi_dataset_tsv} \
220- --exclude-insdc-accessions {input.exclude_insdc_accessions} \
221- --log-level {params.log_level} \
222- --config-file {input.config} \
223- --output-metadata-tsv {output.metadata_tsv} \
219+ --input-metadata-tsv {input.ncbi_dataset_tsv} \
220+ --exclude-insdc-accessions {input.exclude_insdc_accessions} \
221+ --log-level {params.log_level} \
222+ --config-file {input.config} \
223+ --output-metadata-tsv {output.metadata_tsv}
224224 """
225225
226226
@@ -260,7 +260,7 @@ if SEGMENTED and segment_detection_method == SegmentDetectionMethod.ALIGN:
260260 {input.sequences} \
261261 --output-tsv {output.results} \
262262 --server {params.dataset_server} \
263- --dataset-name {params.dataset_name} \
263+ --dataset-name {params.dataset_name}
264264 """
265265
266266 rule process_alignments :
@@ -281,10 +281,10 @@ if SEGMENTED and segment_detection_method == SegmentDetectionMethod.ALIGN:
281281 ),
282282 shell :
283283 """
284- python {input.script} \
285- {params.segment_paths} \
286- --output {output.merged}
287- """
284+ python {input.script} \
285+ {params.segment_paths} \
286+ --output {output.merged}
287+ """
288288
289289
290290if APPLY_MINIMIZER :
@@ -312,8 +312,8 @@ if APPLY_MINIMIZER:
312312 shell :
313313 """
314314 nextclade sort -m {input.minimizer} \
315- -r {output.results} {input.sequences} \
316- --max-score-gap 0.3 --min-score 0.05 --min-hits 2 --all-matches
315+ -r {output.results} {input.sequences} \
316+ --max-score-gap 0.3 --min-score 0.05 --min-hits 2 --all-matches
317317 """
318318
319319 rule parse_sort :
@@ -328,10 +328,10 @@ if APPLY_MINIMIZER:
328328 shell :
329329 """
330330 python {input.script} \
331- --config-file {input.config} \
332- --sort-results {input.sorted} \
333- --output {output.merged} \
334- --log-level {params.log_level} \
331+ --config-file {input.config} \
332+ --sort-results {input.sorted} \
333+ --output {output.merged} \
334+ --log-level {params.log_level}
335335 """
336336
337337
@@ -369,7 +369,7 @@ rule prepare_metadata:
369369 --sequence-hashes-file {input.sequence_hashes} \
370370 {params.segments} \
371371 --output {output.metadata} \
372- --log-level {params.log_level} \
372+ --log-level {params.log_level}
373373 """
374374
375375
@@ -418,22 +418,22 @@ if CALCULATE_GROUPS_OVERRIDE_JSON:
418418 shell :
419419 """
420420 if [[ "{params.use_mirror}" == "True" ]]; then
421- curl {params.mirror_url} -o {params.compressed_package_tzst} && \
422- mkdir -p {params.package} && \
423- tar xf {params.compressed_package_tzst} -C {params.package}
421+ curl {params.mirror_url} -o {params.compressed_package_tzst} \
422+ && mkdir -p {params.package} \
423+ && tar xf {params.compressed_package_tzst} -C {params.package}
424424 else
425425 datasets download genome taxon {params.taxon_id} \
426426 --assembly-source {wildcards.source} \
427427 --no-progressbar --dehydrated \
428428 --filename {params.compressed_package_zip} \
429429 {params.api_key} \
430430 {params.gateway} \
431- && {params.unzip} \
432- -o {params.compressed_package_zip} \
433- -d {params.package} \
434- && datasets rehydrate \
435- --directory {params.package} \
436- --no-progressbar
431+ && {params.unzip} \
432+ -o {params.compressed_package_zip} \
433+ -d {params.package} \
434+ && datasets rehydrate \
435+ --directory {params.package} \
436+ --no-progressbar
437437 fi
438438 touch {output.marker}
439439 """
@@ -453,11 +453,11 @@ if CALCULATE_GROUPS_OVERRIDE_JSON:
453453 shell :
454454 """
455455 python {input.script} \
456- --dataset-dir {params.genbank_dir} \
457- --dataset-dir {params.refseq_dir} \
458- --output-file {output.groups_json} \
459- --ignore-list {input.ignore_list} \
460- --config-file {input.config_file}
456+ --dataset-dir {params.genbank_dir} \
457+ --dataset-dir {params.refseq_dir} \
458+ --output-file {output.groups_json} \
459+ --ignore-list {input.ignore_list} \
460+ --config-file {input.config_file}
461461 """
462462
463463
@@ -474,10 +474,10 @@ if GROUPING_OVERRIDE_URL and CALCULATE_GROUPS_OVERRIDE_JSON:
474474 shell :
475475 """
476476 python {input.script} \
477- --groups {input.calculated} \
478- --groups {input.downloaded} \
479- --config-file {input.config} \
480- --output-file {output.groups_json}
477+ --groups {input.calculated} \
478+ --groups {input.downloaded} \
479+ --config-file {input.config} \
480+ --output-file {output.groups_json}
481481 """
482482
483483
@@ -560,8 +560,8 @@ rule heuristic_group_segments:
560560 --output-seq {output.sequences} \
561561 --log-level {params.log_level}
562562 if [ "{params.GROUPS_OVERRIDE_JSON}" = "true" ]; then
563- cat {input.metadata_grouped} >> {output.metadata}
564- cat {input.sequences_grouped} >> {output.sequences}
563+ cat {input.metadata_grouped} >>{output.metadata}
564+ cat {input.sequences_grouped} >>{output.sequences}
565565 fi
566566 """
567567
@@ -594,12 +594,12 @@ if FILTER:
594594 shell :
595595 """
596596 python {input.script} \
597- --input-seq {input.sequences} \
598- --output-seq {output.sequences} \
599- --input-metadata {input.metadata} \
600- --output-metadata {output.metadata} \
601- --log-level {params.log_level} \
602- --config-file {input.config} \
597+ --input-seq {input.sequences} \
598+ --output-seq {output.sequences} \
599+ --input-metadata {input.metadata} \
600+ --output-metadata {output.metadata} \
601+ --log-level {params.log_level} \
602+ --config-file {input.config}
603603 """
604604
605605
@@ -669,7 +669,7 @@ rule compare_hashes:
669669 --output-blocked {output.blocked} \
670670 --sampled-out-file {output.sampled_out} \
671671 --log-level {params.log_level} \
672- --subsample-fraction {params.subsample_fraction} \
672+ --subsample-fraction {params.subsample_fraction}
673673 """
674674
675675
@@ -711,7 +711,7 @@ rule prepare_files:
711711 --metadata-submit-prior-to-revoke-path {output.metadata_revoke} \
712712 --sequences-submit-path {output.sequences_submit} \
713713 --sequences-revise-path {output.sequences_revise} \
714- --sequences-submit-prior-to-revoke-path {output.sequences_revoke} \
714+ --sequences-submit-prior-to-revoke-path {output.sequences_revoke}
715715 """
716716
717717
@@ -723,7 +723,7 @@ rule sort_fasta:
723723 sorted = "results/{basename}_sorted.fasta" ,
724724 shell :
725725 """
726- seqkit sort -N --two-pass {input.sequences} | seqkit seq -w 0 > {output.sorted}
726+ seqkit sort -N --two-pass {input.sequences} | seqkit seq -w 0 >{output.sorted}
727727 """
728728
729729
@@ -735,11 +735,11 @@ rule sort_metadata:
735735 sorted = "results/{basename}_sorted.tsv" ,
736736 shell :
737737 """
738- columnNumber=$(awk -F'\\ t' '{{for(i=1;i<=NF;i++) if($i=="id") print i}}' {input.metadata});
738+ columnNumber=$(awk -F'\\ t' '{{for(i=1;i<=NF;i++) if($i=="id") print i}}' {input.metadata})
739739 if [ ${{columnNumber}} ]; then
740- (head -n 1 {input.metadata} && tail -n +2 {input.metadata} | sort -t$'\t ' -k${{columnNumber}},${{columnNumber}}) > {output.sorted}
740+ (head -n 1 {input.metadata} && tail -n +2 {input.metadata} | sort -t$'\t ' -k${{columnNumber}},${{columnNumber}}) >{output.sorted}
741741 else
742- cat {input.metadata} > {output.sorted}
742+ cat {input.metadata} >{output.sorted}
743743 fi
744744 """
745745
0 commit comments