Skip to content

Commit

Permalink
chore: add ganon reference
Browse files Browse the repository at this point in the history
  • Loading branch information
Midnighter committed Jul 5, 2023
1 parent d0b4234 commit e7872d2
Show file tree
Hide file tree
Showing 2 changed files with 18 additions and 1 deletion.
17 changes: 17 additions & 0 deletions paper/paper.bib
Original file line number Diff line number Diff line change
Expand Up @@ -296,3 +296,20 @@ @book{van_rossum_python_1995
author = {Van Rossum, Guido and Drake Jr, Fred L},
year = {1995},
}

@article{piro_ganon_2020,
title = {ganon: precise metagenomics classification against large and up-to-date sets of reference sequences},
volume = {36},
issn = {1367-4803},
url = {https://doi.org/10.1093/bioinformatics/btaa458},
doi = {10.1093/bioinformatics/btaa458},
abstract = {The exponential growth of assembled genome sequences greatly benefits metagenomics studies. However, currently available methods struggle to manage the increasing amount of sequences and their frequent updates. Indexing the current RefSeq can take days and hundreds of GB of memory on large servers. Few methods address these issues thus far, and even though many can theoretically handle large amounts of references, time/memory requirements are prohibitive in practice. As a result, many studies that require sequence classification use often outdated and almost never truly up-to-date indices.Motivated by those limitations, we created ganon, a k-mer-based read classification tool that uses Interleaved Bloom Filters in conjunction with a taxonomic clustering and a k-mer counting/filtering scheme. Ganon provides an efficient method for indexing references, keeping them updated. It requires \<55 min to index the complete RefSeq of bacteria, archaea, fungi and viruses. The tool can further keep these indices up-to-date in a fraction of the time necessary to create them. Ganon makes it possible to query against very large reference sets and therefore it classifies significantly more reads and identifies more species than similar methods. When classifying a high-complexity CAMI challenge dataset against complete genomes from RefSeq, ganon shows strongly increased precision with equal or better sensitivity compared with state-of-the-art tools. With the same dataset against the complete RefSeq, ganon improved the F1-score by 65\% at the genus level. It supports taxonomy- and assembly-level classification, multiple indices and hierarchical classification.The software is open-source and available at: https://gitlab.com/rki\_bioinformatics/ganon.Supplementary data are available at Bioinformatics online.},
number = {Supplement\_1},
urldate = {2023-07-05},
journal = {Bioinformatics},
author = {Piro, Vitor C and Dadi, Temesgen H and Seiler, Enrico and Reinert, Knut and Renard, Bernhard Y},
month = jul,
year = {2020},
pages = {i12--i20},
file = {Piro et al (2020)_Bioinformatics.pdf:/home/moritz/Dropbox/References/Storage/Piro et al (2020)_Bioinformatics.pdf:application/pdf},
}
2 changes: 1 addition & 1 deletion paper/paper.md
Original file line number Diff line number Diff line change
Expand Up @@ -135,7 +135,7 @@ profiling tools and formats, and it is designed to be used as a
building block in metagenomic analysis workflows. At the time of writing, it is
able to read profiles from nine different profilers, namely Bracken
[@lu_bracken_2017], Centrifuge [@kim_centrifuge_2016], DIAMOND
[@buchfink_sensitive_2021], Kaiju [@menzel_fast_2016], Kraken2
[@buchfink_sensitive_2021], ganon [@piro_ganon_2020], Kaiju [@menzel_fast_2016], Kraken2
[@wood_improved_2019], KrakenUniq [@breitwieser_krakenuniq_2018], MALT/MEGAN6
[@huson_megan_2016; @vagene_salmonella_2018], MetaPhlAn
[@blanco-miguez_extending_2023],and mOTUs
Expand Down

0 comments on commit e7872d2

Please sign in to comment.