@article {Casti{\~n}eira1367, author = {David Casti{\~n}eira and Katherine R Schlosser and Alon Geva and Amir R Rahmani and Gaston Fiore and Brian K Walsh and Craig D Smallwood and John H Arnold and Mauricio Santillana}, title = {Adding Continuous Vital Sign Information to Static Clinical Data Improves the Prediction of Length of Stay After Intubation: A Data-Driven Machine Learning Approach}, volume = {65}, number = {9}, pages = {1367--1377}, year = {2020}, doi = {10.4187/respcare.07561}, publisher = {Respiratory Care}, abstract = {BACKGROUND: Bedside monitors in the ICU routinely measure and collect patients{\textquoteright} physiologic data in real time to continuously assess the health status of patients who are critically ill. With the advent of increased computational power and the ability to store and rapidly process big data sets in recent years, these physiologic data show promise in identifying specific outcomes and/or events during patients{\textquoteright} ICU hospitalization.METHODS: We introduced a methodology designed to automatically extract information from continuous-in-time vital sign data collected from bedside monitors to predict if a patient will experience a prolonged stay (length of stay) on mechanical ventilation, defined as \>4 d, in a pediatric ICU.RESULTS: Continuous-in-time vital signs information and clinical history data were retrospectively collected for 284 ICU subjects from their first 24 h on mechanical ventilation from a medical-surgical pediatric ICU at Boston Children{\textquoteright}s Hospital. Multiple machine learning models were trained on multiple subsets of these subjects to predict the likelihood that each of these subjects would experience a long stay. We evaluated the predictive power of our models strictly on unseen hold-out validation sets of subjects. Our methodology achieved model performance of \>83\% (area under the curve) by using only vital sign information as input, and performances of 90\% (area under the curve) by combining vital sign information with subjects{\textquoteright} static clinical data readily available in electronic health records. We implemented this approach on 300 independently trained experiments with different choices of training and hold-out validation sets to ensure the consistency and robustness of our results in our study sample. The predictive power of our approach outperformed recent efforts that used deep learning to predict a similar task.CONCLUSIONS: Our proposed workflow may prove useful in the design of scalable approaches for real-time predictive systems in ICU environments, exploiting real-time vital sign information from bedside monitors. (ClinicalTrials.gov registration NCT02184208.)}, issn = {0020-1324}, URL = {https://rc.rcjournal.com/content/65/9/1367}, eprint = {https://rc.rcjournal.com/content/65/9/1367.full.pdf}, journal = {Respiratory Care} }