% Journal article: Microbiome Preterm Birth DREAM Challenge (Cell Reports Medicine, vol. 5, no. 1).
% The first author is a collective (consortium) name and is double-braced so it is kept as one unit.
% NOTE(review): no pages / article-number field is present in this record; confirm against the
% publisher record and add one if available.
@article{f738640d5ce6492a91c9fb326670097f,
  author   = {{The Preterm Birth DREAM Community}
              and Golob, Jonathan L.
              and Oskotsky, Tomiko T.
              and Tang, Alice S.
              and Roldan, Alennie
              and Chung, Verena
              and Ha, Connie W. Y.
              and Wong, Ronald J.
              and Flynn, Kaitlin J.
              and Parraga-Leo, Antonio
              and Wibrand, Camilla
              and Minot, Samuel S.
              and Oskotsky, Boris
              and Andreoletti, Gaia
              and Kosti, Idit
              and Bletz, Julie
              and Nelson, Amber
              and Gao, Jifan
              and Wei, Zhoujingpeng
              and Chen, Guanhua
              and Tang, Zheng Zheng
              and Novielli, Pierfrancesco
              and Romano, Donato
              and Pantaleo, Ester
              and Amoroso, Nicola
              and Monaco, Alfonso
              and Vacca, Mirco
              and {De Angelis}, Maria
              and Bellotti, Roberto
              and Tangaro, Sabina
              and Kuntzleman, Abigail
              and Bigcraft, Isaac
              and Techtmann, Stephen
              and Bae, Daehun
              and Kim, Eunyoung
              and Jeon, Jongbum
              and Joe, Soobok
              and Theis, Kevin R.
              and Ng, Sherrianne
              and Lee, Yun S.
              and Diaz-Gimeno, Patricia
              and Bennett, Phillip R.
              and MacIntyre, David A.
              and Stolovitzky, Gustavo
              and Lynch, Susan V.
              and Albrecht, Jake
              and Gomez-Lopez, Nardhy
              and Romero, Roberto
              and Stevenson, David K.
              and Aghaeepour, Nima
              and Tarca, Adi L.
              and Costello, James C.
              and Sirota, Marina},
  title    = {Microbiome preterm birth {DREAM} challenge: Crowdsourcing machine learning approaches to advance preterm birth research},
  journal  = {Cell Reports Medicine},
  year     = {2023},
  volume   = {5},
  number   = {1},
  issn     = {2666-3791},
  doi      = {10.1016/j.xcrm.2023.101350},
  language = {English},
  keywords = {16S harmonization, crowdsourced, DREAM challenge, machine learning, microbiome, predictive modeling, preterm birth, vaginal microbiome},
  abstract = {Every year, 11\% of infants are born preterm with significant health consequences, with the vaginal microbiome a risk factor for preterm birth. We crowdsource models to predict (1) preterm birth (PTB; <37 weeks) or (2) early preterm birth (ePTB; <32 weeks) from 9 vaginal microbiome studies representing 3,578 samples from 1,268 pregnant individuals, aggregated from public raw data via phylogenetic harmonization. The predictive models are validated on two independent unpublished datasets representing 331 samples from 148 pregnant individuals. The top-performing models (among 148 and 121 submissions from 318 teams) achieve area under the receiver operator characteristic (AUROC) curve scores of 0.69 and 0.87 predicting PTB and ePTB, respectively. Alpha diversity, VALENCIA community state types, and composition are important features in the top-performing models, most of which are tree-based methods. This work is a model for translation of microbiome data into clinically relevant predictive models and to better understand preterm birth.},
  note     = {Publisher Copyright: {\textcopyright} 2023 The Authors},
}