2024
Wijesekara, Yasas; Wu, Ling-Yi; Beeloo, Rick; Rozwalak, Piotr; Hauptfeld, Ernestina; Doijad, Swapnil P.; Dutilh, Bas E.; Kaderali, Lars
Jaeger: an accurate and fast deep-learning tool to detect bacteriophage sequences Journal Article
In: bioRxiv, 2024.
Abstract | BibTeX | Tags: Project 14, WP 1.1 Virus identification, WP 1.2 Host prediction
@article{Wijesekara2024,
title = {Jaeger: an accurate and fast deep-learning tool to detect bacteriophage sequences},
author = {Yasas Wijesekara and Ling-Yi Wu and Rick Beeloo and Piotr Rozwalak and Ernestina Hauptfeld and Swapnil P. Doijad and Bas E. Dutilh and Lars Kaderali},
year = {2024},
date = {2024-09-24},
journal = {bioRxiv},
abstract = {Viruses are integral to every biome on Earth, yet we still need a more comprehensive picture of their identity and global distribution. Global metagenomics sequencing efforts revealed the genomic content of tens of thousands of environmental samples, however identifying the viral sequences in these datasets remains challenging due to their vast genomic diversity. Here, we address identifying bacteriophage sequences in unlabeled sequencing data. In a recent benchmarking paper, we observed that existing deep-learning tools show a high true positive rate, but may also produce many false positives when confronted with divergent sequences. To tackle this challenge, we introduce Jaeger, a novel deep-learning method designed specifically for identifying bacteriophage genome fragments. Extensive benchmarking on the IMG/VR database and real-world metagenomes reveals Jaeger’s consistent high sensitivity (0.87) and precision (0.92). Applying Jaeger to over 16,000 metagenomic assemblies from the MGnify database yielded over five million putative phage contigs. On average, Jaeger is around 20 times faster than the other state-of-the-art methods. Jaeger is available at https://github.com/MGXlab/Jaeger.},
keywords = {Project 14, WP 1.1 Virus identification, WP 1.2 Host prediction},
pubstate = {published},
tppubtype = {article}
}
Trgovec-Greif, Lovro; Hellinger, Hans-Jörg; Mainguy, Jean; Pfundner, Alexander; Frishman, Dmitrij; Kiening, Michael; Webster, Nicole Suzanne; Laffy, Patrick William; Feichtinger, Michael; Rattei, Thomas
VOGDB—Database of Virus Orthologous Groups Journal Article
In: Viruses, vol. 16, iss. 8, pp. 1191, 2024.
Abstract | Links | BibTeX | Tags: Project 14, WP 1.1 Virus identification
@article{Trgovec-Greif2024,
title = {VOGDB—Database of Virus Orthologous Groups},
author = {Lovro Trgovec-Greif and Hans-Jörg Hellinger and Jean Mainguy and Alexander Pfundner and Dmitrij Frishman and Michael Kiening and Nicole Suzanne Webster and Patrick William Laffy and Michael Feichtinger and Thomas Rattei},
doi = {10.3390/v16081191},
year = {2024},
date = {2024-07-25},
urldate = {2024-07-25},
journal = {Viruses},
volume = {16},
issue = {8},
pages = {1191},
abstract = {Computational models of homologous protein groups are essential in sequence bioinformatics. Due to the diversity and rapid evolution of viruses, the grouping of protein sequences from virus genomes is particularly challenging. The low sequence similarities of homologous genes in viruses require specific approaches for sequence- and structure-based clustering. Furthermore, the annotation of virus genomes in public databases is not as consistent and up to date as for many cellular genomes. To tackle these problems, we have developed VOGDB, which is a database of virus orthologous groups. VOGDB is a multi-layer database that progressively groups viral genes into groups connected by increasingly remote similarity. The first layer is based on pair-wise sequence similarities, the second layer is based on the sequence profile alignments, and the third layer uses predicted protein structures to find the most remote similarity. VOGDB groups allow for more sensitive homology searches of novel genes and increase the chance of predicting annotations or inferring phylogeny. VOGD B uses all virus genomes from RefSeq and partially reannotates them. VOGDB is updated with every RefSeq release. The unique feature of VOGDB is the inclusion of both prokaryotic and eukaryotic viruses in the same clustering process, which makes it possible to explore old evolutionary relationships of the two groups. VOGDB is freely available at vogdb.org under the CC BY 4.0 license.},
keywords = {Project 14, WP 1.1 Virus identification},
pubstate = {published},
tppubtype = {article}
}
2021
Goettsch, Winfried; Beerenwinkel, Niko; Deng, Li; Dölken, Lars; Dutilh, Bas E.; Erhard, Florian; Kaderali, Lars; von Kleist, Max; Marquet, Roland; Matthijnssens, Jelle; McCallin, Shawna; McMahon, Dino; Rattei, Thomas; van Rij, Ronald P.; Robertson, David L.; Schwemmle, Martin; Stern-Ginossar, Noam; Marz, Manja
ITN -- VIROINF: Understanding (Harmful) Virus-Host Interactions by Linking Virology and Bioinformatics Journal Article
In: Viruses, vol. 13, no. 5, pp. 766, 2021.
Abstract | Links | BibTeX | Tags: Project 01, Project 02, Project 03, Project 04, Project 05, Project 06, Project 07, Project 08, Project 09, Project 10, Project 11, Project 12, Project 13, Project 14, Project 15, WP 1.1 Virus identification, WP 1.2 Host prediction, WP 1.3 Virus-host interactions, WP 1.4 Virus regulation, WP 1.5 Virus products, WP 2.1 Microevolution: Virus quasispecies, WP 2.2 Macroevolution: Natural selection of viruses
@article{nokey,
title = {ITN -- VIROINF: Understanding (Harmful) Virus-Host Interactions by Linking Virology and Bioinformatics},
author = {Winfried Goettsch and Niko Beerenwinkel and Li Deng and Lars Dölken and Bas E. Dutilh and Florian Erhard and Lars Kaderali and Max von Kleist and Roland Marquet and Jelle Matthijnssens and Shawna McCallin and Dino McMahon and Thomas Rattei and Ronald P. {van Rij} and David L. Robertson and Martin Schwemmle and Noam Stern-Ginossar and Manja Marz},
doi = {10.3390/v13050766},
year = {2021},
date = {2021-04-27},
urldate = {2021-04-27},
journal = {Viruses},
volume = {13},
number = {5},
pages = {766},
abstract = {Many recent studies highlight the fundamental importance of viruses. Besides their important role as human and animal pathogens, their beneficial, commensal or harmful functions are poorly understood. By developing and applying tailored bioinformatical tools in important virological models, the Marie Skłodowska-Curie Initiative International Training Network VIROINF will provide a better understanding of viruses and the interaction with their hosts. This will open the door to validate methods of improving viral growth, morphogenesis and development, as well as to control strategies against unwanted microorganisms. The key feature of VIROINF is its interdisciplinary nature, which brings together virologists and bioinformaticians to achieve common goals.},
keywords = {Project 01, Project 02, Project 03, Project 04, Project 05, Project 06, Project 07, Project 08, Project 09, Project 10, Project 11, Project 12, Project 13, Project 14, Project 15, WP 1.1 Virus identification, WP 1.2 Host prediction, WP 1.3 Virus-host interactions, WP 1.4 Virus regulation, WP 1.5 Virus products, WP 2.1 Microevolution: Virus quasispecies, WP 2.2 Macroevolution: Natural selection of viruses},
pubstate = {published},
tppubtype = {article}
}