@prefix this: . @prefix sub: . @prefix np: . @prefix dct: . @prefix nt: . @prefix npx: . @prefix xsd: . @prefix rdfs: . @prefix orcid: . @prefix prov: . @prefix foaf: . sub:Head { this: a np:Nanopublication; np:hasAssertion sub:assertion; np:hasProvenance sub:provenance; np:hasPublicationInfo sub:pubinfo . } sub:assertion { a , ; dct:creator orcid:0009-0001-1115-9741; dct:publisher ; rdfs:comment "This research investigates the impact of missing data on the performance of machine learning algorithms, with a particular focus on the MIMIC-IV dataset. This project aims to investigate the extent to which missing data negatively impacts the training of machine learning algorithms, and whether demographic groups with a higher proportion of missing data (i.e.,ethnicity) have lower predictive accuracy. Using advanced machine learning and data analysis techniques, our results highlight important considerations related to missing data in medical datasets and provide useful insights for improving predictive modeling and decision support systems in clinical practice offers. Major findings:This investigation leveraged the MIMIC-IV v2.2 dataset—containing de-identified data from 73,141 ICU admissions at Beth Israel Deaconess Medical Center—to study the impact of missing data on machine learning. The research found that while electronic health records (EHRs) offer massive clinical datasets, they are often non-standardized and riddled with missing values. By predicting hospital Length of Stay (LOS), the study showed that as data is missing \"not at random,\" algorithm performance (measured by RMSE) degrades. Specifically, when datasets were intentionally biased to have more missing entries for certain racial groups (Asian, Black, Hispanic, etc.), the predictive error for those specific groups increased in 83% of \"aggressive\" data removal tests. This highlights that simply imputing or completing missing data can entrench existing healthcare inequities."; rdfs:label "Addressing the Challenge of Missing Medical Data in Healthcare Analytics: A Focus on Machine Learning Predictions for ICU Length of Stay"; ; this:; "mahmad.isaq@outlook.com"; "2024"; "2023" . } sub:provenance { sub:assertion prov:wasAttributedTo orcid:0009-0008-8411-2742 . } sub:pubinfo { orcid:0009-0008-8411-2742 foaf:name "Emily Regalado" . this: dct:created "2026-01-14T05:53:32.919Z"^^xsd:dateTime; dct:creator orcid:0009-0008-8411-2742; dct:license ; npx:introduces ; npx:wasCreatedAt ; nt:wasCreatedFromProvenanceTemplate ; nt:wasCreatedFromPubinfoTemplate , ; nt:wasCreatedFromTemplate . sub:sig npx:hasAlgorithm "RSA"; npx:hasPublicKey "MIIBIjANBgkqhkiG9w0BAQEFAAOCAQ8AMIIBCgKCAQEAxzr6UBGMW6c8tegz0babaledWUEQ0PLDE4tp7Iinbe2DZtAtY5JUptKYuStWDZx+QER4808P8dejNWRnBDzgthYJm/AyNSXflHSJhz2+NC+h7RylOLxbwLEQocmyKKiYxa2gT85m6ajVL2M6TnfG67nnK+K2f7iCGL6wYXRITD1q+7+5SWqBdDXIV921W4IKWaD2GJk+NRBoOqQhbsrk8Tn5XsNd7DMYVHk47oMDGbeBnrOIoRPsbBgAcoCsxxhiB9yN6Lf8EUbnlXVEDzJuZk048L1BDZL+6nkA8btTQGP2ijUFWA7rTrod3LjUDQWLZS95njjl867dtmv/znYkzwIDAQAB"; npx:hasSignature "ew01BbW15Sne2LHMMUh5OFGNSNoEiFOf0YvAGWbToB5SlqhFDy27lOOt4ByCI2tJ2ElqcYWl+GfHFJt0FFR7ET5ZU65hxRrqNjVqz1hMXZhcqdHpEgJYOxKUoOHz4QfRs6uvreJlW33Pol9XIAxJ89jCJuhUVP2HbkF9e83wK/39Q9OAFi1kOqI3iPIXlM3ZOopFBF4/yy56kbesc7MZIKN6uMBry6913XNy3PpLkMDGpwCh2dfFA3osGCuG1qQdYHaIFTfW9o+55xDtxM0yt8WCZMYhdobhYlb0NPya2Gh5TwoQ0BKGX6c4SquQyPXXIqQ2L7SsMXNrZsarPqiH7w=="; npx:hasSignatureTarget this:; npx:signedBy orcid:0009-0008-8411-2742 . }