@comment{Journal article in Cell Reports 39(12), 2022. Author list ends with the consortium as a corporate author (kept braced so it is parsed as one name). LaTeX-special characters in printed fields are escaped.}
@article{46ec64a7f7784739944b14e78024c49c,
  author    = {Fremin, Brayon J.
               and Bhatt, Ami S.
               and Kyrpides, Nikos C.
               and Sengupta, Aditi
               and Sczyrba, Alexander
               and {da Silva}, Aline Maria
               and Buchan, Alison
               and Gaudin, Amelie
               and Brune, Andreas
               and Hirsch, Ann M.
               and Neumann, Anthony
               and Shade, Ashley
               and Visel, Axel
               and Campbell, Barbara
               and Baker, Brett
               and Hedlund, Brian P.
               and Crump, Byron C.
               and Currie, Cameron
               and Kelly, Charlene
               and Craft, Chris
               and Hazard, Christina
               and Francis, Christopher
               and Schadt, Christopher W.
               and Averill, Colin
               and Mobilian, Courtney
               and Buckley, Dan
               and Hunt, Dana
               and Noguera, Daniel
               and Beck, David
               and Valentine, David L.
               and Walsh, David
               and Sumner, Dawn
               and Lymperopoulou, Despoina
               and Bhaya, Devaki
               and Bryant, Donald A.
               and Morrison, Elise
               and Brodie, Eoin
               and Young, Erica
               and Lilleskov, Erik
               and H{\"o}gfors-R{\"o}nnholm, Eva
               and Chen, Feng
               and Stewart, Frank
               and Nicol, Graeme W.
               and Teeling, Hanno
               and Beller, Harry R.
               and Dionisi, Hebe
               and Liao, Hui-ling
               and Beman, J. Michael
               and Stegen, James
               and Mock, Thomas
               and {Global Phage Small Open Reading Frame (GP-SmORF) Consortium}},
  title     = {Thousands of small, novel genes predicted in global phage genomes},
  journal   = {Cell Reports},
  year      = {2022},
  month     = jun,
  day       = {21},
  volume    = {39},
  number    = {12},
  doi       = {10.1016/j.celrep.2022.110984},
  issn      = {2211-1247},
  publisher = {Cell Press},
  language  = {English},
  keywords  = {CP: Microbiology, MetaRibo-Seq, comparative genomics, gene families, microbiome, phage, sORFs, small genes},
  abstract  = {Small genes ($<$150 nucleotides) have been systematically overlooked in phage genomes. We employ a large-scale comparative genomics approach to predict $>$40,000 small-gene families in $\sim$2.3 million phage genome contigs. We find that small genes in phage genomes are approximately 3-fold more prevalent than in host prokaryotic genomes. Our approach enriches for small genes that are translated in microbiomes, suggesting the small genes identified are coding. More than 9,000 families encode potentially secreted or transmembrane proteins, more than 5,000 families encode predicted anti-CRISPR proteins, and more than 500 families encode predicted antimicrobial proteins. By combining homology and genomic-neighborhood analyses, we reveal substantial novelty and diversity within phage biology, including small phage genes found in multiple host phyla, small genes encoding proteins that play essential roles in host infection, and small genes that share genomic neighborhoods and whose encoded proteins may share related functions.},
  note      = {Funding Information: The work conducted by the U.S. Department of Energy Joint Genome Institute, a DOE Office of Science User Facility, is supported by the Office of Science of the U.S. Department of Energy under contract no. DE-AC02-05CH11231. Computing costs were also supported via NIH S10 Shared Instrumentation Grant (1S10OD02014101), NIH R01 \#AI148623--01, A Sloan Foundation Fellowship, and Damon Runyon Clinical Investigator Award to A.S.B. Sample collection costs were supported by NSF grants 1826734 and 1441717 as well as Simons Foundation grant 827839.},
}