Skip to content

Commit 35307c3

Browse files
authored
Merge pull request #147 from csoneson/minor-edits
Minor edits reviewed and approved
2 parents c9c6aae + 54d184f commit 35307c3

2 files changed

Lines changed: 6 additions & 140 deletions

File tree

joss/paper.bib

Lines changed: 4 additions & 138 deletions
Original file line numberDiff line numberDiff line change
@@ -1,33 +1,3 @@
1-
@article{tian2025designed,
2-
title={A designed synthetic microbiota provides insight to community function in Clostridioides difficile resistance},
3-
author={Tian, Shuchang and Kim, Min Soo and Zhao, Jingcheng and Heber, Kerim and Hao, Fuhua and Koslicki, David and Tian, Sangshan and Singh, Vishal and Patterson, Andrew D and Bisanz, Jordan E},
4-
journal={Cell Host \& Microbe},
5-
year={2025},
6-
doi={10.1016/j.chom.2025.02.007},
7-
publisher={Elsevier}
8-
}
9-
@article{hera2023deriving,
10-
title={Deriving confidence intervals for mutation rates across a wide range of evolutionary distances using FracMinHash},
11-
author={Hera, Mahmudur Rahman and Pierce-Ward, N Tessa and Koslicki, David},
12-
journal={Genome research},
13-
volume={33},
14-
number={7},
15-
pages={1061--1068},
16-
year={2023},
17-
doi={10.1101/gr.277651.123},
18-
publisher={Cold Spring Harbor Lab}
19-
}
20-
@article{blanca2022statistics,
21-
title={The statistics of k-mers from a sequence undergoing a simple mutation process without spurious matches},
22-
author={Blanca, Antonio and Harris, Robert S and Koslicki, David and Medvedev, Paul},
23-
journal={Journal of Computational Biology},
24-
volume={29},
25-
number={2},
26-
pages={155--168},
27-
year={2022},
28-
doi={10.1089/cmb.2021.0431},
29-
publisher={Mary Ann Liebert, Inc., publishers 140 Huguenot Street, 3rd Floor New~…}
30-
}
311
@article{irber2024sourmash,
322
title={sourmash v4: A multitool to quickly search, compare, and analyze genomic and metagenomic data sets},
333
author={Irber, Luiz and Pierce-Ward, N Tessa and Abuelanin, Mohamed and Alexander, Harriet and Anant, Abhishek and Barve, Keya and Baumler, Colton and Botvinnik, Olga and Brooks, Phillip and Dsouza, Daniel and others},
@@ -63,7 +33,6 @@ @article{ward2018metapoap
6333
publisher={Oxford University Press}
6434
}
6535

66-
6736
@article{marcelino2019metatranscriptomics,
6837
title={Metatranscriptomics as a tool to identify fungal species and subspecies in mixed communities--a proof of concept under laboratory conditions},
6938
author={Marcelino, Vanesa R and Irinyi, Laszlo and Eden, John-Sebastian and Meyer, Wieland and Holmes, Edward C and Sorrell, Tania C},
@@ -147,41 +116,6 @@ @article{meyer2022critical
147116
}
148117

149118
%USE CASE EXAMPLE REFERENCES
150-
@article{hayden2022genome,
151-
title={Genome capture sequencing selectively enriches bacterial DNA and enables genome-wide measurement of intrastrain genetic diversity in human infections},
152-
author={Hayden, Hillary S and Joshi, Snehal and Radey, Matthew C and Vo, Anh T and Forsberg, Cara and Morgan, Sarah J and Waalkes, Adam and Holmes, Elizabeth A and Klee, Sara M and Emond, Mary J and others},
153-
journal={Mbio},
154-
volume={13},
155-
number={5},
156-
pages={e01424--22},
157-
year={2022},
158-
doi={10.1128/mbio.01424-22},
159-
publisher={Am Soc Microbiol}
160-
}
161-
162-
@article{rajeev2023metagenome,
163-
title={Metagenome sequencing and recovery of 444 metagenome-assembled genomes from the biofloc aquaculture system},
164-
author={Rajeev, Meora and Jung, Ilsuk and Lim, Yeonjung and Kim, Suhyun and Kang, Ilnam and Cho, Jang-Cheon},
165-
journal={Scientific data},
166-
volume={10},
167-
number={1},
168-
pages={707},
169-
year={2023},
170-
doi={10.1038/s41597-023-02622-0},
171-
publisher={Nature Publishing Group UK London}
172-
}
173-
174-
@article{zhang2022cultivation,
175-
title={Cultivation and functional characterization of a deep-sea Lentisphaerae representative reveals its unique physiology and ecology},
176-
author={Zhang, Tianhang and Zheng, Rikuan and Liu, Rui and Li, Ronggui and Sun, Chaomin},
177-
journal={Frontiers in Marine Science},
178-
volume={9},
179-
pages={848136},
180-
year={2022},
181-
doi={10.3389/fmars.2022.848136},
182-
publisher={Frontiers Media SA}
183-
}
184-
185119
@article{schloss2020removal,
186120
title={Removal of rare amplicon sequence variants from 16S rRNA gene sequence surveys biases the interpretation of community structure data},
187121
author={Schloss, Patrick D},
@@ -191,18 +125,6 @@ @article{schloss2020removal
191125
publisher={Cold Spring Harbor Laboratory}
192126
}
193127

194-
@article{jia2022sequencing,
195-
title={Sequencing introduced false positive rare taxa lead to biased microbial community diversity, assembly, and interaction interpretation in amplicon studies},
196-
author={Jia, Yangyang and Zhao, Shengguo and Guo, Wenjie and Peng, Ling and Zhao, Fang and Wang, Lushan and Fan, Guangyi and Zhu, Yuanfang and Xu, Dayou and Liu, Guilin and others},
197-
journal={Environmental Microbiome},
198-
volume={17},
199-
number={1},
200-
pages={1--18},
201-
year={2022},
202-
doi={10.1186/s40793-022-00436-y},
203-
publisher={Springer}
204-
}
205-
206128
@article{kunin2008bioinformatician,
207129
title={A bioinformatician's guide to metagenomics},
208130
author={Kunin, Victor and Copeland, Alex and Lapidus, Alla and Mavromatis, Konstantinos and Hugenholtz, Philip},
@@ -217,7 +139,7 @@ @article{kunin2008bioinformatician
217139

218140
@article{schlaberg2017validation,
219141
title={Validation of metagenomic next-generation sequencing tests for universal pathogen detection},
220-
author={Schlaberg, Robert and Chiu, Charles Y and Miller, Steve and Procop, Gary W and Weinstock, George and Professional Practice Committee and Committee on Laboratory Practices of the American Society for Microbiology and Microbiology Resource Committee of the College of American Pathologists},
142+
author={Schlaberg, Robert and Chiu, Charles Y and Miller, Steve and Procop, Gary W and Weinstock, George and {Professional Practice Committee and Committee on Laboratory Practices of the American Society for Microbiology} and {Microbiology Resource Committee of the College of American Pathologists}},
221143
journal={Archives of Pathology and Laboratory Medicine},
222144
volume={141},
223145
number={6},
@@ -249,16 +171,6 @@ @article{marcelino2020ccmetagen
249171
publisher={Springer}
250172
}
251173

252-
%Schloss PD. Removal of rare amplicon sequence variants from 16s rrna gene sequence surveys biases the interpretation of community structure data. bioRxiv, 2020, preprint: not peer reviewed. https://doi.org/10.1101/2020.12.11.422279.
253-
254-
@article{Schloss,
255-
title={Removal of rare amplicon sequence variants from 16s rrna gene sequence surveys biases the interpretation of community structure data},
256-
author={Patrick D. Schloss},
257-
journal={bioRxiv},
258-
doi={10.1101/2020.12.11.422279},
259-
year={2020}
260-
}
261-
262174
@article{jia2022sequencing,
263175
title={Sequencing introduced false positive rare taxa lead to biased microbial community diversity, assembly, and interaction interpretation in amplicon studies},
264176
author={Jia, Yangyang and Zhao, Shengguo and Guo, Wenjie and Peng, Ling and Zhao, Fang and Wang, Lushan and Fan, Guangyi and Zhu, Yuanfang and Xu, Dayou and Liu, Guilin and others},
@@ -283,73 +195,27 @@ @article{jousset2017less
283195
publisher={Oxford University Press}
284196
}
285197

286-
@article{hu2022tenebrionibacter,
287-
title={Tenebrionibacter intestinalis gen. nov., sp. nov., a member of a novel genus of the family Enterobacteriaceae, isolated from the gut of the plastic-eating mealworm Tenebrio molitor L.},
288-
author={Hu, Lin and Yang, Yu},
289-
journal={International Journal of Systematic and Evolutionary Microbiology},
290-
volume={72},
291-
number={2},
292-
pages={005246},
293-
year={2022},
294-
doi={10.1099/ijsem.0.005246},
295-
publisher={Microbiology Society}
296-
}
297-
298-
@article{hardwick2018synthetic,
299-
title={Synthetic microbe communities provide internal reference standards for metagenome sequencing and analysis},
300-
author={Hardwick, Simon A and Chen, Wendy Y and Wong, Ted and Kanakamedala, Bindu S and Deveson, Ira W and Ongley, Sarah E and Santini, Nadia S and Marcellin, Esteban and Smith, Martin A and Nielsen, Lars K and others},
301-
journal={Nature communications},
302-
volume={9},
303-
number={1},
304-
pages={3096},
305-
year={2018},
306-
doi={10.1038/s41467-018-05555-0},
307-
publisher={Nature Publishing Group UK London}
308-
}
309-
310-
@article{singer2016next,
198+
@article{Singer2016MockCommunity,
311199
title={Next generation sequencing data of a defined microbial mock community},
312200
author={Singer, Esther and Andreopoulos, Bill and Bowers, Robert M and Lee, Janey and Deshpande, Shweta and Chiniquy, Jennifer and Ciobanu, Doina and Klenk, Hans-Peter and Zane, Matthew and Daum, Christopher and others},
313201
journal={Scientific data},
314202
volume={3},
315203
number={1},
316-
pages={1--8},
204+
pages={160081},
317205
year={2016},
318206
doi={10.1038/sdata.2016.81},
319207
publisher={Nature Publishing Group}
320208
}
321209

322-
@article{van2023synthetic,
323-
title={Synthetic microbial communities (SynComs) of the human gut: design, assembly, and applications},
324-
author={van Leeuwen, Pim T and Brul, Stanley and Zhang, Jianbo and Wortel, Meike T},
325-
journal={FEMS Microbiology Reviews},
326-
volume={47},
327-
number={2},
328-
pages={fuad012},
329-
year={2023},
330-
doi={10.1093/femsre/fuad012},
331-
publisher={Oxford University Press}
332-
}
333-
334210
@article{Irber2022FracMinHash,
335-
author = {Irber, Luiz C. and Brooks, Patrick T. and Reiter, Travis E. and Pierce-Ward, Nathan T. and Hera, M. R. and Koslicki, David and Brown, C. Titus},
211+
author = {Irber, Luiz and Brooks, Phillip T. and Reiter, Taylor E. and Pierce-Ward, N. Tessa and Hera, Mahmudur Rahman and Koslicki, David and Brown, C. Titus},
336212
title = {Lightweight compositional analysis of metagenomes with FracMinHash and minimum metagenome covers},
337213
journal = {bioRxiv},
338214
year = {2022},
339215
doi = {10.1101/2022.01.11.475838},
340216
url = {https://doi.org/10.1101/2022.01.11.475838}
341217
}
342218

343-
@article{Singer2016MockCommunity,
344-
author = {Singer, Esther and Bushnell, Brian and Coleman-Derr, Devin and Douglas, Gina M. and Bowman, Benjamin and Bowers, Robert M. and Levy, Adi and Gies, Esther and Cheng, Jan-Fang and Copeland, Alex and others},
345-
title = {Next generation sequencing data of a defined microbial mock community},
346-
journal = {Scientific Data},
347-
volume = {3},
348-
number = {1},
349-
pages = {1--8},
350-
year = {2016},
351-
publisher = {Nature Publishing Group}
352-
}
353219
@book{irber2020decentralizing,
354220
title={Decentralizing indices for genomic data},
355221
author={Irber Jr, Luiz Carlos},

joss/paper.md

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -64,7 +64,7 @@ Identifying genomes in metagenomics samples can be complicated by taxonomic prof
6464

6565
Accurately identifying low-abundance microbial communities remains a significant challenge in metagenomics. Current methods rely on arbitrary filter thresholds that, even when applied, produce results skewed by sequencing errors and evolutionary processes, compromising profiling accuracy and leading to misinterpretations [@schloss2020removal; @jia2022sequencing]. The lack of a systematic credibility framework can undermine researcher confidence, a problem compounded by incomplete reference databases and variable sequencing coverage depth.
6666

67-
Metagenomic methods depend on reference databases that are often incomplete and misaligned with taxonomic frameworks, leaving evolutionarily diverged microbes undetected and causing profiling inaccuracies [@kunin2008bioinformatician; @schlaberg2017validation; @loeffler2020improving; @marcelino2020ccmetagen]. Addressing this equires analytical frameworks that incorporate genome similarity metrics, though sequencing coverage depth presents an additional challenge to reliable microbial detection.
67+
Metagenomic methods depend on reference databases that are often incomplete and misaligned with taxonomic frameworks, leaving evolutionarily diverged microbes undetected and causing profiling inaccuracies [@kunin2008bioinformatician; @schlaberg2017validation; @loeffler2020improving; @marcelino2020ccmetagen]. Addressing this requires analytical frameworks that incorporate genome similarity metrics, though sequencing coverage depth presents an additional challenge to reliable microbial detection.
6868

6969
Sequence coverage depth—the portion of a microbe’s genome detected in a sample—is crucial for detecting low-abundance microbes, which are often misinterpreted as noise due to limited sequencing depth [@mande2012classification; @shakya2013comparative; @sczyrba2017critical; @meyer2022critical]. The lack of guidelines for biologically meaningful coverage depth thresholds introduces subjectivity, making dynamic coverage depth thresholds essential. Yet even with adequate coverage and reliable genome references, controlling statistical errors remains a major challenge.
7070

@@ -111,7 +111,7 @@ We present the three use case examples to demonstrate the application of YACHT f
111111

112112
**Low abundance samples:** YACHT can analyze metagenomic samples with low microbial DNA concentrations common in clinical and environmental studies. Using human skin metagenomic samples, we show that the ANI threshold and k-size markedly influence species specificity. See [Low abundance samples](https://github.com/KoslickiLab/YACHT/tree/main/use_case_examples/low_abundance_samples).
113113

114-
**Metagenomic-assembled genome (MAG) fishing:** Using a single MAG as a training reference database, YACHT searches for specific MAGs within a sample. Applied to two skin metagenomic samples, results shows detection is sensitive to sequencing depth, coverage, and parameter choice. See [MAG fishing](https://github.com/KoslickiLab/YACHT/tree/main/use_case_examples/MAG_fishing).
114+
**Metagenome-assembled genome (MAG) fishing:** Using a single MAG as a training reference database, YACHT searches for specific MAGs within a sample. Applied to two skin metagenomic samples, results show that detection is sensitive to sequencing depth, coverage, and parameter choice. See [MAG fishing](https://github.com/KoslickiLab/YACHT/tree/main/use_case_examples/MAG_fishing).
115115

116116
**Synthetic metagenomes:** YACHT verifies the presence of designed microbes in mock microbial communities. Higher ANI thresholds recover expected genomes while lower thresholds introduce false positives, demonstrating how ANI and minimum coverage parameters affect sensitivity and specificity. See [Synthetic metagenomes](https://github.com/KoslickiLab/YACHT/tree/main/use_case_examples/synthetic_metagenome).
117117

0 commit comments

Comments
 (0)