<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Pediatr Parent</journal-id><journal-id journal-id-type="publisher-id">pediatrics</journal-id><journal-id journal-id-type="index">30</journal-id><journal-title>JMIR Pediatrics and Parenting</journal-title><abbrev-journal-title>JMIR Pediatr Parent</abbrev-journal-title><issn pub-type="epub">2561-6722</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v9i1e76712</article-id><article-id pub-id-type="doi">10.2196/76712</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Modeling Zero-Dose Children in Ethiopia: A Machine Learning Perspective on Model Performance and Predictor Variables</article-title></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name name-style="western"><surname>Endehabtu</surname><given-names>Berhanu Fikadie</given-names></name><degrees>MPH</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Alemu</surname><given-names>Kassahun</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff2">2</xref><xref ref-type="aff" rid="aff3">3</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Mengiste</surname><given-names>Shegaw Anagaw</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff4">4</xref></contrib><contrib contrib-type="author"><name 
name-style="western"><surname>Zelalem</surname><given-names>Meseret</given-names></name><degrees>MD</degrees><xref ref-type="aff" rid="aff5">5</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Gullslett</surname><given-names>Monika Knudsen</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff6">6</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Tilahun</surname><given-names>Binyam</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="aff" rid="aff2">2</xref></contrib></contrib-group><aff id="aff1"><institution>Department of Health Informatics, Institute of Public Health, College of Medicine and Health Sciences, University of Gondar</institution><addr-line>Gondar</addr-line><country>Ethiopia</country></aff><aff id="aff2"><institution>Center for Digital Health and Implementation Science, University of Gondar</institution><addr-line>Gondar</addr-line><country>Ethiopia</country></aff><aff id="aff3"><institution>Department of Epidemiology and Biostatistics, Institute of Public Health, College of Medicine and Health Sciences, University of Gondar</institution><addr-line>Gondar</addr-line><country>Ethiopia</country></aff><aff id="aff4"><institution>School of Business, University of South-Eastern Norway</institution><addr-line>Drammen</addr-line><country>Norway</country></aff><aff id="aff5"><institution>Department of Pediatrics and Child Health, University of Gondar</institution><addr-line>Gondar</addr-line><country>Ethiopia</country></aff><aff id="aff6"><institution>Norwegian Centre for E-health Research, University Hospital of North Norway</institution><addr-line>Troms&#x00F8;</addr-line><country>Norway</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Badawy</surname><given-names>Sherif</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name 
name-style="western"><surname>Pabon-Rodriguez</surname><given-names>Felix</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Adisu</surname><given-names>Molalign</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Meng</surname><given-names>Nan</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Berhanu Fikadie Endehabtu, MPH, Department of Health Informatics, Institute of Public Health, College of Medicine and Health Sciences, University of Gondar, Gondar, 196, Ethiopia, 251 921013129; <email>berhanufikadie@gmail.com</email></corresp></author-notes><pub-date pub-type="collection"><year>2026</year></pub-date><pub-date pub-type="epub"><day>2</day><month>2</month><year>2026</year></pub-date><volume>9</volume><elocation-id>e76712</elocation-id><history><date date-type="received"><day>29</day><month>04</month><year>2025</year></date><date date-type="rev-recd"><day>18</day><month>09</month><year>2025</year></date><date date-type="accepted"><day>14</day><month>10</month><year>2025</year></date></history><copyright-statement>&#x00A9; Berhanu Fikadie Endehabtu, Kassahun Alemu, Shegaw Anagaw Mengiste, Meseret Zelalem, Monika Knudsen Gullslett, Binyam Tilahun. Originally published in JMIR Pediatrics and Parenting (<ext-link ext-link-type="uri" xlink:href="https://pediatrics.jmir.org">https://pediatrics.jmir.org</ext-link>), 2.2.2026. 
</copyright-statement><copyright-year>2026</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Pediatrics and Parenting, is properly cited. The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://pediatrics.jmir.org">https://pediatrics.jmir.org</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://pediatrics.jmir.org/2026/1/e76712"/><abstract><sec><title>Background</title><p>Despite progress in childhood vaccination, many children in low- and middle-income countries, including Ethiopia, remain unvaccinated, presenting a significant public health challenge. The Immunization Agenda 2030 (IA2030) seeks to halve the number of unvaccinated children by identifying at-risk populations, but effective strategies are limited. This study leverages machine learning (ML) to identify Ethiopian children aged 12-35 months who are at higher risk of being zero dose (ZD). By analyzing demographic, socioeconomic, and health care access data, the study developed predictive models using different algorithms. 
The findings aim to inform targeted interventions, ultimately improving vaccination coverage and health outcomes.</p></sec><sec><title>Objective</title><p>This study aimed to develop an ML model to predict ZD children and to identify the most influential predictors of ZD in Ethiopia.</p></sec><sec sec-type="methods"><title>Methods</title><p>We examined how well the predictive algorithms can characterize a child at risk of being ZD based on predictor variables sourced from the recent National Immunization Evaluation Survey data. We applied supervised ML algorithms with the survey datasets, which included 13,666 children aged 12-35 months. Model performance was assessed using accuracy, area under the curve, precision, recall, and <italic>F</italic><sub>1</sub>-score. We applied Shapley Additive analysis to identify the most important predictors.</p></sec><sec sec-type="results"><title>Results</title><p>The Light Gradient Boosting Machine (LGBM), Random Forest, Extreme Gradient Boosting (XGBoost), and AdaBoost classifiers effectively identified most ZD children as being at high risk. Among these, LGBM demonstrated the best performance, achieving an accuracy of 93%, an area under the curve of 97%, a precision of 94%, and a recall of 91%. The most significant features impacting the model included poor perception of vaccination benefits, lack of antenatal care utilization, distance from immunization services, and absence of maternal tetanus toxoid vaccinations.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>The developed ML models effectively predict children at risk of being ZD, with the LGBM model showing the best performance. This model can guide targeted interventions to reduce ZD prevalence and address vaccination inequities. Key predictors include access to immunization sites, maternal health service utilization, and perceptions of immunization benefits. 
By focusing on these vulnerable groups, public health efforts can tackle disparities in vaccination coverage. Enhancing maternal care, raising caregiver awareness, and improving immunization access through outreach can significantly reduce the number of ZD children.</p></sec></abstract><kwd-group><kwd>modeling</kwd><kwd>zero dose</kwd><kwd>children</kwd><kwd>machine learning</kwd><kwd>Ethiopia</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><p>Child immunization is a cornerstone of public health, essential for safeguarding against life-threatening diseases and promoting the health of future generations [<xref ref-type="bibr" rid="ref1">1</xref>]. Globally, significant advancements have been made in immunization programs, resulting in higher coverage rates [<xref ref-type="bibr" rid="ref2">2</xref>] and a corresponding decline in vaccine-preventable disease [<xref ref-type="bibr" rid="ref3">3</xref>]. However, as of 2023, approximately 14.5 million children worldwide had not received the first dose of a diphtheria, tetanus, and pertussis-containing vaccine (DTP1) [<xref ref-type="bibr" rid="ref4">4</xref>], a widely used indicator of access to immunization services [<xref ref-type="bibr" rid="ref5">5</xref>]. This high number of zero-dose (ZD) children continues to be a pressing issue, intensifying health inequalities and heightening the likelihood of vaccine-preventable disease outbreaks [<xref ref-type="bibr" rid="ref6">6</xref>]. These ZD children remain at high risk, creating considerable hurdles for public health efforts [<xref ref-type="bibr" rid="ref7">7</xref>-<xref ref-type="bibr" rid="ref9">9</xref>].</p><p>A substantial portion of these ZD children, about 60%, are concentrated in 10 low- and middle-income countries, including Ethiopia. 
Despite notable achievements in improving immunization coverage in Ethiopia, the country ranks third globally for ZD children, following Nigeria and India, accounting for 6% of the world&#x2019;s total [<xref ref-type="bibr" rid="ref4">4</xref>].</p><p>Addressing the issue of children at risk of becoming ZD has emerged as a priority on both national and global agendas [<xref ref-type="bibr" rid="ref10">10</xref>]. The Immunization Agenda 2030 (IA2030), endorsed by the World Health Assembly in November 2020, aims to reduce the number of ZD children by ensuring that every child is reached by 2030 [<xref ref-type="bibr" rid="ref5">5</xref>]. However, effectively identifying and reaching these at-risk children poses significant operational challenges, and little is known about what strategies perform best.</p><p>Research in Ethiopia has identified various predictors of low immunization uptake, including low education levels and low wealth index [<xref ref-type="bibr" rid="ref11">11</xref>-<xref ref-type="bibr" rid="ref13">13</xref>], rural residence [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref14">14</xref>], limited access to health services [<xref ref-type="bibr" rid="ref15">15</xref>,<xref ref-type="bibr" rid="ref16">16</xref>], lack of antenatal care (ANC) and postnatal care (PNC) [<xref ref-type="bibr" rid="ref13">13</xref>,<xref ref-type="bibr" rid="ref15">15</xref>-<xref ref-type="bibr" rid="ref18">18</xref>], home deliveries [<xref ref-type="bibr" rid="ref13">13</xref>-<xref ref-type="bibr" rid="ref16">16</xref>], absence of maternal tetanus toxoid (TT) vaccination [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref19">19</xref>], and poor caregiver knowledge [<xref ref-type="bibr" rid="ref16">16</xref>]. 
However, there is a lack of evidence regarding how well these factors predict ZD status specifically and which factors are most relevant for optimal prediction.</p><p>Recent advancements in data science, coupled with available routine immunization data, present new opportunities to identify and reach at-risk children at both subnational and individual levels. Developing a robust algorithm to predict ZD children based on a set of variables could provide a valuable foundation for tailored interventions. Machine learning (ML) has emerged as a transformative tool in public health research and is particularly suited for this task because it can capture complex relationships and interactions between variables [<xref ref-type="bibr" rid="ref20">20</xref>-<xref ref-type="bibr" rid="ref22">22</xref>]. Unlike traditional statistical methods that rely on predefined hypotheses, ML models can autonomously identify patterns and relationships within large datasets by learning from data rather than making prior assumptions [<xref ref-type="bibr" rid="ref20">20</xref>,<xref ref-type="bibr" rid="ref23">23</xref>,<xref ref-type="bibr" rid="ref24">24</xref>]. This capability is particularly useful for multifactorial issues such as immunization uptake [<xref ref-type="bibr" rid="ref25">25</xref>].</p><p>Rule-based ML models can uncover hidden relationships among determinants of ZD children in large datasets, often represented through &#x201C;if-then&#x201D; statements that illustrate connections between variables [<xref ref-type="bibr" rid="ref26">26</xref>]. This application of ML bridges the gap between theoretical research and practical applications, leading to advancements in the health care field [<xref ref-type="bibr" rid="ref27">27</xref>].</p><p>This study aims to use ML algorithms to predict which Ethiopian children aged 12-35 months are at higher risk of being ZD and assess the predictive capabilities of the developed models. 
Findings from this study may provide actionable insights for policy makers and immunization program actors, informing the development of targeted strategies to effectively identify and reach those most at-risk children.</p></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Study Design</title><p>The data for this study were sourced from the recent National Immunization Evaluation Survey in Ethiopia, which provides nationwide representation [<xref ref-type="bibr" rid="ref28">28</xref>]. The survey included 11 regions and the 2 city administrations. A 2-stage stratified cluster sampling technique was used to select participants. The first stage is the enumeration areas (EAs), which served as clusters, randomly chosen with an urban-rural stratification approach, and the second stage is households within each EA. Sampling frames were prepared for each region and city administrations by the Ethiopian Statistical Services. The number of EAs required per region and city administration was determined based on the size within the stratum (study regions) and proportion of the Ethiopia population living in urban and rural areas (21.4% urban and 78.6% rural). A total of 468 EAs were randomly selected, comprising 100 from urban areas and 368 from rural regions, resulting in a total sample size of approximately 13,666 households with children aged 12&#x2010;35 months.</p><p>We extracted information on immunization status for children aged 12&#x2010;35 months. The vaccination status of children was assessed using 3 sources of information: caregiver reports, home-based vaccination cards, and facility-based records, following World Health Organization guidelines [<xref ref-type="bibr" rid="ref29">29</xref>]. If a mother or a caregiver presented an immunization card, the child&#x2019;s vaccination status was assessed from that card. 
In cases where the card was unavailable, data collectors were instructed to verify the information at the nearest health facility if the caregiver reported that their child had been vaccinated. The mother&#x2019;s or caregiver&#x2019;s self-reports were considered only when neither the immunization card nor the facility records were available.</p><p>Using the operational definition set by Gavi, we defined a ZD status variable for each child, which is set to 1 if the child did not receive the first dose of the diphtheria, tetanus, and pertussis-containing vaccine (DTP1), and set to 0 otherwise [<xref ref-type="bibr" rid="ref30">30</xref>,<xref ref-type="bibr" rid="ref31">31</xref>].</p><p>We included a set of predictor variables or features to capture characteristics that have been associated with ZD status (<xref ref-type="table" rid="table1">Table 1</xref>). The factors influencing the outcome of interest are grouped into 3 groups: socioeconomic and demographic variables, health service utilization, and perceptions and attitudes. The first group of socioeconomic and demographic variables encompasses individual, household, and community-level characteristics that may affect the outcome of interest. The second group, health service utilization, represents the access to and use of various health care services, which can impact immunization status. The third category focuses on the perceptions or attitudes that individuals or caregivers have toward the benefits of immunization. 
All 3 categories of variables were gathered during the survey.</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>The predictor variables used for analysis were extracted from the recent National Immunization Evaluation Survey in Ethiopia, 2023.</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Category</td><td align="left" valign="bottom">Description</td><td align="left" valign="bottom">Response/type of data</td></tr></thead><tbody><tr><td align="left" valign="top">Socioeconomic and demographic factor</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Residency</td><td align="left" valign="top">Type of living arrangement</td><td align="left" valign="top">Categorical (urban and rural)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Region</td><td align="left" valign="top">Geographic area of residence</td><td align="left" valign="top">Nominal (eg, Afar, Amhara...)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Religion</td><td align="left" valign="top">Cultural beliefs influencing health behaviors</td><td align="left" valign="top">Nominal or categorical (orthodox, Muslim, protestant, and others)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Marital status</td><td align="left" valign="top">Relationship status of the mother or the caregiver</td><td align="left" valign="top">Categorical (married and living together, married, married but not living together, and not in marital union)</td></tr><tr><td align="left" valign="top"><named-content 
content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Mother&#x2019;s or caregiver&#x2019;s educational status</td><td align="left" valign="top">Level of formal education attained</td><td align="left" valign="top">Categorical (no, primary, secondary, and higher education)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Occupation of mothers or caregivers</td><td align="left" valign="top">Employment status and type of work</td><td align="left" valign="top">Nominal categorical data</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Birth order</td><td align="left" valign="top">Position of a child in relation to their siblings within a family</td><td align="left" valign="top">Categorical (first, second, third, and fourth and above)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Wealth index</td><td align="left" valign="top">Measures economic status</td><td align="left" valign="top">Categorical (poor, middle, and rich)</td></tr><tr><td align="left" valign="top">Health service utilization</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>ANC<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup> follow-up</td><td align="left" valign="top">History of ANC visits for the index child</td><td align="left" valign="top">Categorical (Yes/No)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>History of maternal tetanus diphtheria vaccine</td><td align="left" valign="top">Previous vaccinations received</td><td align="left" valign="top">Categorical (Yes/No)</td></tr><tr><td align="left" 
valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Distance to immunization site</td><td align="left" valign="top">Perceived impact of distance on immunization access</td><td align="left" valign="top">Categorical (&#x201C;big problem,&#x201D; &#x201C;not a problem&#x201D;)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Place of delivery</td><td align="left" valign="top">Location where the child was born</td><td align="left" valign="top">Categorical (Home/Facility)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Postnatal care</td><td align="left" valign="top">Follow-up care received after childbirth</td><td align="left" valign="top">Categorical (Yes/No)</td></tr><tr><td align="left" valign="top">Perceptions and attitudes</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Mother&#x2019;s or caregiver&#x2019;s perceived benefits on immunization</td><td align="left" valign="top">Beliefs regarding the advantages of vaccination</td><td align="left" valign="top">Was Likert (categorized into poor or good)</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Trust in health care provider</td><td align="left" valign="top">The belief of mothers or caregivers on the services provided</td><td align="left" valign="top">Categorized into poor or good</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>ANC: antenatal care.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s2-2"><title>Data Preprocessing and Transformation</title><p>We implemented several preprocessing steps to enhance model performance. 
First, we addressed missing values in the independent variables using the k-nearest neighbor approach. We then transformed categorical variables into numerical format through one-hot encoding, which is essential for preparing data for ML models. To standardize feature ranges, we applied minimum-maximum scaling and mean normalization, ensuring comparability among features (<xref ref-type="fig" rid="figure1">Figure 1</xref>).</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>Data preparation and analysis steps for zero-dose children prediction. AUC: area under the curve; LGBM: Light Gradient Boosting Machine.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="pediatrics_v9i1e76712_fig01.png"/></fig><p>We applied sampling weights as instance weights during the training process for all algorithms. This was done by using the sample_weight parameter in the model&#x2019;s fitting functions, which adjusts the influence of each observation based on its probability of selection.</p><p>Next, we conducted a correlation analysis to identify and remove highly correlated features, thereby reducing multicollinearity and enhancing model robustness. Our correlation matrix showed a strong relation between parity and birth order (<xref ref-type="fig" rid="figure2">Figure 2</xref>), leading us to compute mutual information scores for each variable (<xref ref-type="fig" rid="figure3">Figure 3</xref>). This analysis highlighted ANC utilization and TT vaccination as significant predictors, while features such as marital status were excluded due to their minimal information value. Consequently, we retained birth order and omitted parity based on their scores.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Correlation analysis matrix for predictor variables for zero-dose children, Ethiopia, 2023. 
ANC: antenatal care; PNC: postnatal care; TT: tetanus toxoid.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="pediatrics_v9i1e76712_fig02.png"/></fig><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Mutual information score of predictor variables for zero-dose children, Ethiopia, 2023. ANC: antenatal care; PNC: postnatal care.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="pediatrics_v9i1e76712_fig03.png"/></fig><p>For dimensionality reduction, we used Forward Selection, Backward Elimination, and Recursive Feature Elimination methods. We opted for Recursive Feature Elimination due to its effectiveness in identifying the most significant predictors while simplifying the dataset. To address class imbalance, we applied the Synthetic Minority Oversampling Technique, which balanced the dataset from an initial skew of 82% majority and 18% minority to an equal distribution. This balancing supports the development of robust predictive models and mitigates bias toward the majority class (<xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p></sec><sec id="s2-3"><title>Model Development</title><p>After the preprocessing, we split the dataset into 80% for training and 20% for testing (<xref ref-type="fig" rid="figure1">Figure 1</xref>). To avoid overfitting and underfitting, we applied 10-fold cross-validation, dividing the data into 10 folds and using one fold for validation while training on the others. The final performance is averaged across all folds.</p><p>The outcome variable, known as the class, is a binary variable indicating ZD status. A ZD status of 1 denotes a ZD child, while 0 indicates a non-ZD child. 
We applied supervised learning algorithms to develop a model from the training data to accurately predict this outcome in the test data.</p><p>Given the categorical nature of the outcome variable, we used 7 classical classification algorithms: AdaBoost Classifier [<xref ref-type="bibr" rid="ref32">32</xref>], Logistic Regression [<xref ref-type="bibr" rid="ref33">33</xref>], Naive Bayes, Random Forest (RF) [<xref ref-type="bibr" rid="ref34">34</xref>], Light Gradient Boosting Machine (LGBM) [<xref ref-type="bibr" rid="ref35">35</xref>], Extreme Gradient Boosting (XGBoost) [<xref ref-type="bibr" rid="ref35">35</xref>], and Decision Tree [<xref ref-type="bibr" rid="ref36">36</xref>]. These models generate a predicted score between 0 and 1 for each child, which is then classified as ZD or non-ZD based on a defined threshold. Following the initial model comparison, hyperparameter tuning was conducted to further optimize the performance of the best-performing algorithm using a RandomizedSearchCV with cross-validation. The search involved 100 iterations with each hyperparameter combination evaluated using 5-fold cross-validation. Finally, the performance of each model was tested before and after balancing the dataset to choose the best predictive model. The model comparison was carried out using the balanced dataset.</p></sec><sec id="s2-4"><title>Model Evaluation</title><p>We evaluated model performance using both train-test split and cross-validation techniques, emphasizing both discrimination and calibration metrics to compare our classification of ZD status against the true ZD status of each child. Discrimination metrics included accuracy, precision, recall (sensitivity), <italic>F</italic><sub>1</sub>-score, and area under the curve and area under the receiver operating characteristic curve. 
Accuracy reflects the proportion of correctly classified instances among all tested cases [<xref ref-type="bibr" rid="ref37">37</xref>], while precision indicates the ratio of true-positive predictions to all positive predictions [<xref ref-type="bibr" rid="ref38">38</xref>]. Recall measures the proportion of actual positive cases that the model successfully identifies [<xref ref-type="bibr" rid="ref39">39</xref>], and the <italic>F</italic><sub>1</sub>-score provides a balanced assessment of model performance, particularly useful in scenarios with class imbalances. In our application, as the objective is to assess the ability of a model to distinguish between positive and negative classes, area under the curve and area under the receiver operating characteristic curve emerged as the most critical measure, as it evaluates the model&#x2019;s ability to effectively distinguish between positive and negative classes by analyzing the trade-off between sensitivity and specificity [<xref ref-type="bibr" rid="ref40">40</xref>].</p><p>In addition to discrimination metrics, we performed calibration to examine how well the predicted probabilities align with actual outcomes. While a model can demonstrate good discrimination, it may still exhibit biases in its risk predictions [<xref ref-type="bibr" rid="ref41">41</xref>]. Calibration is essential to ensure that predicted probabilities accurately reflect the likelihood of outcomes. To visualize this alignment, we used calibration curves, which plot predicted probabilities against observed results (<xref ref-type="fig" rid="figure4">Figure 4</xref>). 
An ideally calibrated model would form a 45-degree diagonal line, signifying that predicted probabilities correspond closely to actual outcomes [<xref ref-type="bibr" rid="ref42">42</xref>].</p><fig position="float" id="figure4"><label>Figure 4.</label><caption><p>Calibration plot.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="pediatrics_v9i1e76712_fig04.png"/></fig></sec><sec id="s2-5"><title>Important Feature Selection</title><p>Our second objective is to identify the most important predictors of ZD children. To achieve this, we used the best-performing ML model to determine the key features associated with identifying ZD cases. We used a unified framework developed by Lundberg and Lee [<xref ref-type="bibr" rid="ref43">43</xref>], known as SHAP (SHapley Additive Explanations). This approach is based on Shapley values from cooperative game theory, which assign a value to each feature based on its contribution to the prediction, taking into account all possible combinations of features [<xref ref-type="bibr" rid="ref44">44</xref>]. A waterfall plot is then created to visualize the cumulative effect of individual features on specific predictions, illustrating how each feature influences the final output. In addition, a beeswarm plot summarizes the distribution of SHAP values across multiple instances, revealing the variability and significance of feature contributions.</p></sec><sec id="s2-6"><title>Rule Generation</title><p>We used rule mining techniques to uncover patterns and relationships within our dataset. We used association rule mining to identify correlations between features using the Apriori algorithm [<xref ref-type="bibr" rid="ref45">45</xref>]. 
In addition, we applied classification rule mining to generate rules that predict class labels, aiding in the identification of key predictors for ZD children, and explored sequential rule mining to capture temporal patterns where relevant. Following the mining process, we generated actionable insights by formulating human-readable rules that outline conditions (antecedents) and outcomes (consequents) [<xref ref-type="bibr" rid="ref46">46</xref>]. We assessed the quality of these rules using metrics such as confidence and lift to ensure their reliability and relevance [<xref ref-type="bibr" rid="ref47">47</xref>].</p></sec><sec id="s2-7"><title>Ethical Considerations</title><p>The research was implemented in compliance with national and international ethical principles. The University of Gondar provided ethical approval (CMHSSH-UOG IRERC/3/7/2024) to conduct this analysis. For this analysis, we used existing data that had been collected with primary consent. We used deidentified data (summary data without individuals&#x2019; identity) to ensure confidentiality. We followed the international standard of strengthening the reporting of cross-sectional studies in epidemiology.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Children&#x2019;s and Mothers&#x2019; or Caregivers&#x2019; Characteristics</title><p>A total of 13,666 samples of children aged from 12 to 35 months were included for analysis. Nearly 57% (7727/13,666) of the children were aged 24&#x2010;35 months. The majority (10,204/13,666, 74.7%) of the children were from mothers or caregivers who live in rural areas. Half (6986/13,666, 51.1%) of the children were born to mothers who had no formal education. More than half (6757/12,419, 54.4%) of the children were from mothers who had no PNC follow-up for the index children. 
The details are shown in <xref ref-type="table" rid="table2">Table 2</xref>.</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Sociodemographic and economic characteristics of mothers or caregivers of children aged 12&#x2010;35 months in Ethiopia, 2023 (N=13,666).</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Variables</td><td align="left" valign="bottom">Frequency</td><td align="left" valign="bottom">Percentage</td></tr></thead><tbody><tr><td align="left" valign="top">Age of the child</td><td align="left" valign="top" colspan="2"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>12&#x2010;23 months</td><td align="left" valign="top">5934</td><td align="left" valign="top">43.5</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>24&#x2010;35 months</td><td align="left" valign="top">7727</td><td align="left" valign="top">56.5</td></tr><tr><td align="left" valign="top">Place of residency</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Rural</td><td align="left" valign="top">10,204</td><td align="left" valign="top">74.7</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Urban</td><td align="left" valign="top">3462</td><td align="left" valign="top">25.3</td></tr><tr><td align="left" valign="top">Religion</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Orthodox</td><td align="left" valign="top">4430</td><td align="left" valign="top">32.4</td></tr><tr><td align="left" 
valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Muslim</td><td align="left" valign="top">6158</td><td align="left" valign="top">45.2</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Protestant</td><td align="left" valign="top">2944</td><td align="left" valign="top">21.5</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Others<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup></td><td align="left" valign="top">134</td><td align="left" valign="top">1.0</td></tr><tr><td align="left" valign="top">Educational status</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>No education</td><td align="left" valign="top">6986</td><td align="left" valign="top">51.1</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Primary</td><td align="left" valign="top">3870</td><td align="left" valign="top">28.3</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Secondary</td><td align="left" valign="top">1798</td><td align="left" valign="top">13.2</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>College and above</td><td align="left" valign="top">1012</td><td align="left" valign="top">7.4</td></tr><tr><td align="left" valign="top">Wealth status</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Poor</td><td align="left" valign="top">4558</td><td align="left" 
valign="top">33.4</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Middle</td><td align="left" valign="top">4566</td><td align="left" valign="top">33.4</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Richer</td><td align="left" valign="top">4542</td><td align="left" valign="top">33.2</td></tr><tr><td align="left" valign="top">Marital status</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Married and living together</td><td align="left" valign="top">12,765</td><td align="left" valign="top">93.4</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Married but not living together</td><td align="left" valign="top">352</td><td align="left" valign="top">2.6</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Not in marital union</td><td align="left" valign="top">549</td><td align="left" valign="top">4.0</td></tr><tr><td align="left" valign="top">Birth order</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>First</td><td align="left" valign="top">4043</td><td align="left" valign="top">29.6</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Second</td><td align="left" valign="top">4830</td><td align="left" valign="top">35.3</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Third</td><td align="left" valign="top">2639</td><td align="left" 
valign="top">19.3</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Fourth and above</td><td align="left" valign="top">2154</td><td align="left" valign="top">15.8</td></tr><tr><td align="left" valign="top">Parity</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Primipara</td><td align="left" valign="top">2499</td><td align="left" valign="top">20.1</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Multipara (2-4)</td><td align="left" valign="top">6573</td><td align="left" valign="top">52.9</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Grand multipara (5+)</td><td align="left" valign="top">3346</td><td align="left" valign="top">27.0</td></tr><tr><td align="left" valign="top">Perceived distance to health facility</td><td align="left" valign="top" colspan="2"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Big problem</td><td align="left" valign="top">5251</td><td align="left" valign="top">38.4</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Not big problem</td><td align="left" valign="top">8415</td><td align="left" valign="top">61.6</td></tr><tr><td align="left" valign="top">Perceived benefit on immunization</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Poor</td><td align="left" valign="top">2502</td><td align="left" valign="top">19.3</td></tr><tr><td align="left" valign="top"><named-content 
content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Good</td><td align="left" valign="top">10,471</td><td align="left" valign="top">80.7</td></tr><tr><td align="left" valign="top">ANC<sup><xref ref-type="table-fn" rid="table2fn2">b</xref></sup> visit</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Yes</td><td align="left" valign="top">10,345</td><td align="left" valign="top">83.3</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>No</td><td align="left" valign="top">2074</td><td align="left" valign="top">16.7</td></tr><tr><td align="left" valign="top">Place of delivery</td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Home</td><td align="left" valign="top">3807</td><td align="left" valign="top">30.6</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Health facility</td><td align="left" valign="top">8612</td><td align="left" valign="top">69.4</td></tr><tr><td align="left" valign="top">PNC<sup><xref ref-type="table-fn" rid="table2fn3">c</xref></sup></td><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Yes</td><td align="left" valign="top">5662</td><td align="left" valign="top">45.6</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>No</td><td align="left" valign="top">6757</td><td align="left" valign="top">54.4</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>Others: Catholic, 
traditional, and others.</p></fn><fn id="table2fn2"><p><sup>b</sup>ANC: antenatal care.</p></fn><fn id="table2fn3"><p><sup>c</sup>PNC: postnatal care.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-2"><title>ZD Prevalence</title><p>The overall prevalence of ZD in Ethiopia was 18% (95% CI 17.4%&#x2010;18.7%). There were regional variations in the prevalence of ZD children. The highest prevalence was observed in Somali (38.8%) and Afar (34.2%), followed by Oromia (22.7%), whereas the lowest prevalence was observed in Addis Ababa (0.8%) and Dire Dawa (5%) (<xref ref-type="fig" rid="figure5">Figure 5</xref>).</p><fig position="float" id="figure5"><label>Figure 5.</label><caption><p>Distribution of zero-dose children aged 12&#x2010;35 months across regions in Ethiopia, 2023. SNNP: Southern Nations, Nationalities, and Peoples'.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="pediatrics_v9i1e76712_fig05.png"/></fig></sec><sec id="s3-3"><title>Performance of the Prediction Models</title><p>Seven ML algorithms were used to predict ZD status in Ethiopia, with the LGBM yielding the best performance for both unbalanced and balanced datasets (<xref ref-type="table" rid="table3">Table 3</xref>). It achieved accuracies of 89% and 93% for the unbalanced and balanced datasets, respectively. Most models showed improved accuracy when applied to the balanced dataset, except for Logistic Regression and Naive Bayes. After balancing the data, both XGBoost and LGBM reached an accuracy of 93%. 
Notably, the LGBM classifier excelled in terms of area under the curve (AUC) (98%) and sensitivity (92%).</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Model performance comparison before and after dataset balancing for predicting zero-dose children in Ethiopia, 2023.</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Models and dataset</td><td align="left" valign="bottom">Accuracy (%)</td><td align="left" valign="bottom">AUC<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup> (%)</td><td align="left" valign="bottom">Precision (%)</td><td align="left" valign="bottom">Sensitivity</td><td align="left" valign="bottom"><italic>F</italic><sub>1</sub>-score</td></tr></thead><tbody><tr><td align="left" valign="top">Logistic Regression</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Unbalanced</td><td align="left" valign="top">88</td><td align="left" valign="top">88</td><td align="left" valign="top">77</td><td align="left" valign="top">48</td><td align="left" valign="top">59</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Balanced</td><td align="left" valign="top">81</td><td align="left" valign="top">89</td><td align="left" valign="top">83</td><td align="left" valign="top">77</td><td align="left" valign="top">80</td></tr><tr><td align="left" valign="top">Na&#x00EF;ve Bayes</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Unbalanced</td><td 
align="left" valign="top">85</td><td align="left" valign="top">87</td><td align="left" valign="top">59</td><td align="left" valign="top">63</td><td align="left" valign="top">61</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Balanced</td><td align="left" valign="top">79</td><td align="left" valign="top">87</td><td align="left" valign="top">82</td><td align="left" valign="top">73</td><td align="left" valign="top">77</td></tr><tr><td align="left" valign="top">LGBM<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup> Classifier</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Unbalanced</td><td align="left" valign="top">89</td><td align="left" valign="top">88</td><td align="left" valign="top">79</td><td align="left" valign="top">53</td><td align="left" valign="top">63</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Balanced</td><td align="left" valign="top">93</td><td align="left" valign="top">97</td><td align="left" valign="top">94</td><td align="left" valign="top">91</td><td align="left" valign="top">92</td></tr><tr><td align="left" valign="top">DT<sup><xref ref-type="table-fn" rid="table3fn3">c</xref></sup> Classifier</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Unbalanced</td><td align="left" valign="top">86</td><td align="left" valign="top">75</td><td align="left" valign="top">64</td><td align="left" valign="top">51</td><td 
align="left" valign="top">57</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Balanced</td><td align="left" valign="top">89</td><td align="left" valign="top">91</td><td align="left" valign="top">90</td><td align="left" valign="top">87</td><td align="left" valign="top">88</td></tr><tr><td align="left" valign="top">Random Forest Classifier</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Unbalanced</td><td align="left" valign="top">87</td><td align="left" valign="top">85</td><td align="left" valign="top">70</td><td align="left" valign="top">52</td><td align="left" valign="top">61</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Balanced</td><td align="left" valign="top">91</td><td align="left" valign="top">96</td><td align="left" valign="top">91</td><td align="left" valign="top">90</td><td align="left" valign="top">91</td></tr><tr><td align="left" valign="top">XGBoost Classifier</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Unbalanced</td><td align="left" valign="top">88</td><td align="left" valign="top">87</td><td align="left" valign="top">75</td><td align="left" valign="top">52</td><td align="left" valign="top">61</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Balanced</td><td align="left" valign="top">93</td><td align="left" valign="top">97</td><td align="left" 
valign="top">94</td><td align="left" valign="top">90</td><td align="left" valign="top">92</td></tr><tr><td align="left" valign="top">AdaBoost Classifier</td><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/><td align="left" valign="top"/></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Unbalanced</td><td align="left" valign="top">88</td><td align="left" valign="top">88</td><td align="left" valign="top">77</td><td align="left" valign="top">46</td><td align="left" valign="top">58</td></tr><tr><td align="left" valign="top"><named-content content-type="indent">&#x00A0;&#x00A0;&#x00A0;&#x00A0;</named-content>Balanced</td><td align="left" valign="top">88</td><td align="left" valign="top">95</td><td align="left" valign="top">89</td><td align="left" valign="top">86</td><td align="left" valign="top">87</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>AUC: area under the curve.</p></fn><fn id="table3fn2"><p><sup>b</sup>LGBM: Light Gradient Boosting Machine.</p></fn><fn id="table3fn3"><p><sup>c</sup>DT: Decision Tree.</p></fn></table-wrap-foot></table-wrap><p>Overall, while all ML models performed well on both datasets, those trained on balanced data, especially XGBoost and LGBM, proved to be more effective in identifying ZD children due to their higher recall and AUC. A comprehensive comparison of the ML algorithms used for ZD children is detailed in <xref ref-type="table" rid="table3">Table 3</xref>. After hyperparameter optimization, the LGBM model achieved robust performance, with an accuracy of 92.4%, an AUC of 97.4%, a precision of 93.2%, and a recall of 90.9%. 
The details are shown in <xref ref-type="table" rid="table4">Table 4</xref>.</p><table-wrap id="t4" position="float"><label>Table 4.</label><caption><p>Model performance after hyperparameter tuning for predicting zero-dose children in Ethiopia, 2023.</p></caption><table id="table4" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Model</td><td align="left" valign="bottom">Accuracy (%)</td><td align="left" valign="bottom">AUC<sup><xref ref-type="table-fn" rid="table4fn1">a</xref></sup> (%)</td><td align="left" valign="bottom">Precision (%)</td><td align="left" valign="bottom">Recall (%)</td><td align="left" valign="bottom"><italic>F</italic><sub>1</sub>-score (%)</td></tr></thead><tbody><tr><td align="left" valign="top">Logistic Regression</td><td align="left" valign="top">80.8</td><td align="left" valign="top">89.1</td><td align="left" valign="top">82.5</td><td align="left" valign="top">76.9</td><td align="left" valign="top">79.6</td></tr><tr><td align="left" valign="top">Naive Bayes</td><td align="left" valign="top">79.1</td><td align="left" valign="top">87.3</td><td align="left" valign="top">82</td><td align="left" valign="top">73.1</td><td align="left" valign="top">77.3</td></tr><tr><td align="left" valign="top">Random Forest</td><td align="left" valign="top">91.6</td><td align="left" valign="top">96.7</td><td align="left" valign="top">91.9</td><td align="left" valign="top">90.6</td><td align="left" valign="top">91.3</td></tr><tr><td align="left" valign="top">XGBoost</td><td align="left" valign="top">92.2</td><td align="left" valign="top">97.3</td><td align="left" valign="top">93.9</td><td align="left" valign="top">89.8</td><td align="left" valign="top">91.8</td></tr><tr><td align="left" valign="top">AdaBoost</td><td align="left" valign="top">89.6</td><td align="left" valign="top">96.2</td><td align="left" valign="top">90.6</td><td align="left" valign="top">87.8</td><td align="left" valign="top">89.2</td></tr><tr><td align="left" 
valign="top">LGBM<sup><xref ref-type="table-fn" rid="table4fn2">b</xref></sup></td><td align="left" valign="top">92.4</td><td align="left" valign="top">97.4</td><td align="left" valign="top">93.2</td><td align="left" valign="top">90.9</td><td align="left" valign="top">92.1</td></tr><tr><td align="left" valign="top">Decision Tree</td><td align="left" valign="top">89.9</td><td align="left" valign="top">94.5</td><td align="left" valign="top">89.5</td><td align="left" valign="top">89.7</td><td align="left" valign="top">89.6</td></tr></tbody></table><table-wrap-foot><fn id="table4fn1"><p><sup>a</sup>AUC: area under the curve.</p></fn><fn id="table4fn2"><p><sup>b</sup>LGBM: Light Gradient Boosting Machine.</p></fn></table-wrap-foot></table-wrap><p>After parameter tuning, the models were further evaluated using 10-fold cross-validation, where XGBoost and LGBM demonstrated comparable accuracies of 93% (<xref ref-type="fig" rid="figure6">Figure 6</xref>).</p><fig position="float" id="figure6"><label>Figure 6.</label><caption><p>Accuracy of models in 10-fold cross-validation after balancing the dataset for predicting zero-dose children in Ethiopia, 2023. LGBM: Light Gradient Boosting Machine.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="pediatrics_v9i1e76712_fig06.png"/></fig></sec><sec id="s3-4"><title>Predicting ZD</title><p>After building the model by using the training dataset, the performance of the LGBM model was evaluated on the testing dataset. Of 2181 ZD children, the model predicted 1991 children correctly (true positive), and out of 2300 non-ZD children, the model predicted 2175 children correctly (true negative). However, the model incorrectly classified 190 ZD samples as non-ZD (false negative) and 125 non-ZD samples as ZD (false positive). The Matthews correlation coefficient was <italic>r</italic>=0.85, and Cohen &#x03BA; was 0.85. 
Overall, the model predicted with an accuracy of 93%, recall of 91%, <italic>F</italic><sub>1</sub>-score of 92%, and precision of 94% on the test data.</p></sec><sec id="s3-5"><title>Feature Importance</title><p>The SHAP analysis identified the mother&#x2019;s or caregiver&#x2019;s perception of the benefit of immunization (+1.13), the distance to the immunization site (+0.88), whether the mother received ANC (+0.55), whether the mother received TT (+0.42), and trust in health providers (+0.41) as the most important features, followed by place of residence (+0.35) and PNC visit (+0.25). Wealth index, birth order, and place of delivery were the features with low importance (<xref ref-type="fig" rid="figure7">Figure 7</xref>).</p><fig position="float" id="figure7"><label>Figure 7.</label><caption><p>Important features for predicting zero-dose children in Ethiopia, 2023. ANC: antenatal care; PNC: postnatal care; SHAP: SHapley Additive Explanations.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="pediatrics_v9i1e76712_fig07.png"/></fig><p>The waterfall chart demonstrates how various factors influence the prediction of ZD vaccination status, starting from a baseline expected value (<italic>E</italic>[<italic>f</italic>(<italic>X</italic>)]=0.023) and culminating in a final prediction (<italic>f</italic>(<italic>x</italic>)=4.655), indicating that the child is ZD. This indicates that poor perceptions of vaccination benefits, long distances to immunization sites, lack of antenatal and postnatal care visits, absence of TT vaccination, and low trust in health care providers are positively correlated with ZD. 
Conversely, being in a medium wealth index and having a third birth order are negatively correlated with ZD (<xref ref-type="fig" rid="figure8">Figure 8</xref>).</p><fig position="float" id="figure8"><label>Figure 8.</label><caption><p>Waterfall plot of the first observation for predicting zero-dose children in Ethiopia, 2023. ANC: antenatal care; PNC: postnatal care.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="pediatrics_v9i1e76712_fig08.png"/></fig><p>As shown in <xref ref-type="fig" rid="figure9">Figure 9</xref>, the beeswarm plot illustrates the impact of various predictor variables on ZD status, with distinct colors representing risk levels: red dots indicate high-risk values, while blue dots denote low-risk values for the predictor variables. The perception feature exhibits a wide range of SHAP values, highlighting its significant influence on the model&#x2019;s predictions. A poor perception of the benefits of vaccination notably increases the likelihood of a child being classified as ZD. In addition, distance from health care facilities is strongly associated with ZD status, where greater distances correlate with a higher likelihood of being unvaccinated. Other contributing factors include a lack of ANC visits, PNC visits, TT vaccination, low wealth index, low trust in health care providers, and home delivery, all of which contribute to the prediction of the positive class (ZD).</p><fig position="float" id="figure9"><label>Figure 9.</label><caption><p>Zero-dose predictors for Light Gradient Boosting Machine model. SHAP summary plot of top predictors. 
ANC: antenatal care; PNC: postnatal care; SHAP: SHapley Additive Explanations.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="pediatrics_v9i1e76712_fig09.png"/></fig></sec><sec id="s3-6"><title>Rule Generation</title><p>The rule generation process was done based on important attributes selected by the best-performing ML model, LGBM. Moving beyond individual feature importance, we used association rule mining to identify complex, multifactorial profiles of ZD children and to rigorously validate the interactions suggested by the SHAP analysis. This generated a set of human-interpretable &#x201C;if-then&#x201D; rules, each validated by key metrics: support (prevalence of the rule in the data), confidence (conditional probability of the outcome), and lift (strength of the association above random chance). The strongest rule (rule 1: lift = 2.17, confidence = 0.90) indicates that children whose caregivers live far from a health facility and have a poor perception of vaccination benefits have a 90% probability of being ZD, a risk 2.17 times higher than random. Rule 2 (confidence = 0.81) shows that combining distance with a lack of ANC and poor trust in providers creates another high-risk pathway, while rule 5 (confidence = 0.79) highlights the potent combination of no tetanus vaccination, no ANC, and distance. Crucially, these rules reveal critical synergies: while SHAP identified &#x201C;distance&#x201D; and &#x201C;ANC&#x201D; as top individual predictors, rule mining quantified how their combination with other factors (eg, rule 8: no ANC + Far distance, confidence = 0.72) creates a risk profile with a distinctly high probability of the outcome. 
This provides programmatically actionable insights, demonstrating that interventions must target these intersecting barriers simultaneously rather than in isolation to effectively reach ZD children. A total of 9 association rules were generated, and the details of the rules are shown in <xref ref-type="other" rid="box1">Textbox 1</xref>.</p><boxed-text id="box1"><title> Rule generation and knowledge extraction.</title><p>##Rule## 1: Distance from facility_far, Perception in benefit_Poor -&#x003E; Zerodose_Yes</p><p>Support: 0.10897435897435898, Lift: 2.1738917080243128, Confidence: 0.9037974683544304</p><p>##Rule## 2: Distance from facility_far, Trust in healthcare provider_Poor, Anc visit_No -&#x003E; Zerodose_Yes</p><p>Support: 0.10134310134310134, Lift: 1.947695283120232, Confidence: 0.8097560975609757</p><p>##Rule## 3: Perception in benefit_Poor -&#x003E; Zerodose_Yes</p><p>Support: 0.15262515262515264, Lift: 1.9211552265274243, Confidence: 0.7987220447284347</p><p>##Rule## 4: Perception in benefit_Poor, Place Residence_rural -&#x003E; Zerodose_Yes</p><p>Support: 0.10103785103785104, Lift: 1.9138215859030838, Confidence: 0.795673076923077</p><p>##Rule## 5: Received TT_No, Distance from facility_far, Anc visit_No -&#x003E; Zerodose_Yes</p><p>Support: 0.13064713064713065, Lift: 1.9099490817552491, Confidence: 0.7940630797773656</p><p>##Rule## 6: Received TT_No, Distance from facility_far, Place delivery_Home -&#x003E; Zerodose_Yes</p><p>Support: 0.12606837606837606, Lift: 1.7738986784140967, Confidence: 0.7374999999999999</p><p>##Rule## 7: PNC visit_Yes, Distance from facility_far, Anc visit_No -&#x003E; Zerodose_Yes</p><p>Support: 0.10073260073260074, Lift: 1.7406677486668212, Confidence: 0.7236842105263158</p><p>##Rule## 8: Distance from facility_far, Anc visit_No -&#x003E; Zerodose_Yes</p><p>Support: 0.17918192918192918, Lift: 1.736658159533137, Confidence: 0.7220172201722017</p><p>##Rule## 9: Distance from facility_far, Anc visit_No, Place Residence_rural 
-&#x003E; Zerodose_Yes</p><p>Support: 0.1108058608058608, Lift: 1.7019862431408919, Confidence: 0.7076023391812866</p></boxed-text></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>Using the data from the most recent National Immunization Evaluation Survey in Ethiopia, we applied different supervised machine learning algorithms to assess how well the models predict whether a child is likely to be ZD and to identify the important predictor variables. We trained and compared 7 ML classifiers on both unbalanced and balanced datasets, using a train-test split, hyperparameter tuning, and 10-fold cross-validation for robust evaluation. A variety of socioeconomic, demographic, and health-related factors were included to enhance the model&#x2019;s predictions and facilitate important feature selection.</p><p>Our findings demonstrate that these ML algorithms are effective in identifying children at high risk of being ZD. Among the 7 models tested, LGBM emerged as the top performer, achieving an AUC of 97.4%, recall of 90.9%, accuracy of 92.4%, precision of 93.2%, and an <italic>F</italic><sub>1</sub>-score of 92.1%. These evaluation metrics underscore the model&#x2019;s strong capability in predicting ZD children. The high AUC indicates the model&#x2019;s effectiveness in distinguishing between children who receive immunization services and those who do not. Notably, a recall of 90.9% signifies that the model successfully identifies 90.9% of ZD children, who are often at greater risk for missing vaccines and vaccine-preventable diseases.</p><p>In addition to LGBM, the XGBoost and RF algorithms also performed well, achieving accuracies of 92.2% and 91.6%, respectively. These results are consistent with previous studies that recognized XGBoost [<xref ref-type="bibr" rid="ref48">48</xref>] and RF [<xref ref-type="bibr" rid="ref49">49</xref>] as top performers in similar contexts. 
While these metrics indicate robust performance for critical health issues such as immunization, it is crucial to validate the model in real-world settings. Such testing will enhance its utility as a tool for guiding public health initiatives aimed at increasing vaccination rates and improving access to essential health care services for unvaccinated children.</p><p>Using an ML model, health care workers can pinpoint specific households and communities with ZD children, allowing them to shift from broad campaigns to targeted household visits. By leveraging the model&#x2019;s insights on local perceptions and socioeconomic barriers, they can tailor their communication and services, such as setting up mobile clinics, to overcome specific challenges and efficiently use scarce resources, ensuring that vaccines reach those most in need.</p><p>The second objective of the study was to identify important attributes that could predict ZD among children aged 12&#x2010;35 months. Using SHAP analysis, the study found that perception of immunization benefit, ANC utilization, distance from vaccination site, maternal TT vaccination status, and trust in health providers were the most important features to identify at-risk children for ZD.</p><p>The top predictor was poor maternal perception with a SHAP value of 1.13 (<xref ref-type="fig" rid="figure7">Figure 7</xref>). This indicates that a negative perception of mothers or caregivers increases the likelihood of a child being ZD, likely because parental beliefs directly influence health care decisions regarding vaccination. This finding aligns with previous studies showing that parental beliefs and attitudes significantly affect a child&#x2019;s vaccination status [<xref ref-type="bibr" rid="ref50">50</xref>,<xref ref-type="bibr" rid="ref51">51</xref>].</p><p>ANC utilization was another important feature, with a SHAP value of 0.55, indicating that a lack of ANC is strongly linked to a child being ZD. 
This finding is in line with previous similar studies [<xref ref-type="bibr" rid="ref48">48</xref>,<xref ref-type="bibr" rid="ref52">52</xref>,<xref ref-type="bibr" rid="ref53">53</xref>]. This could be because ANC visits enable mothers to access integrated health services, receive information on immunization schedules, build trust in the health system, and improve their adherence to health services [<xref ref-type="bibr" rid="ref54">54</xref>-<xref ref-type="bibr" rid="ref56">56</xref>].</p><p>In addition, the study found several other important predictors. Maternal TT vaccination was a key factor; mothers who received the TT vaccine were more likely to have their children vaccinated, a finding consistent with studies from Sudan and Bangladesh [<xref ref-type="bibr" rid="ref57">57</xref>,<xref ref-type="bibr" rid="ref58">58</xref>]. Postnatal care visit was another important predictor. This service likely helps mothers gain a better understanding of the importance of vaccination and of feeding practices, thus reducing missed vaccinations [<xref ref-type="bibr" rid="ref59">59</xref>,<xref ref-type="bibr" rid="ref60">60</xref>]. In addition, maternal education was an important predictor, with uneducated mothers having a higher risk of ZD children than those with at least a primary education, reinforcing the known link between maternal literacy, including primary education, and vaccination rates. This finding is in line with previous research linking maternal literacy to vaccination completeness [<xref ref-type="bibr" rid="ref61">61</xref>-<xref ref-type="bibr" rid="ref65">65</xref>]. Another finding of this study came from rule mining and generation. Using association rule mining with the Apriori algorithm, the study uncovered strong relationships between various socioeconomic, demographic, and health-related factors and ZD status. 
Key determinants, including distance from health facility, perception of vaccination benefits, trust in health care providers, ANC, place of delivery, place of residency, and TT vaccines, were the most important features predicting ZD. Confidence levels for these findings ranged from 71% to 90%, indicating robust associations.</p><p>Findings from association rule 1 indicated that the probability of a child being ZD would be 90% if the mothers or caregivers were far from the health facility and had poor perception of immunization. This may be because mothers or caregivers who are far from the facility may not have access to health education directly or indirectly, affecting health-seeking behavior and health service utilization such as vaccination. The second rule also included poor trust in health care providers and lack of ANC visits as predictors for ZD. The probability of a child being ZD would be 81% if mothers or caregivers lived far from a health facility, had poor trust in providers, and had no ANC follow-up for the index child.</p></sec><sec id="s4-2"><title>Strengths and Limitations</title><p>This study had several strengths worth mentioning. We used national-level survey data from 463 EAs, ensuring generalizability across the country and providing a current snapshot of the ZD situation. A key strength is that our analysis uses various ML algorithms from the field of data science, which significantly aids in identifying and targeting ZD children more effectively. These advanced analytical techniques allow us to process large datasets and uncover insights that may not be immediately apparent through traditional methods. At the same time, this study identified the risk factors of ZD that may help policy makers and planners to design tailored interventions to identify and reach the unvaccinated children.</p><p>This study was subject to some limitations. 
First, although we used national-level data, we did not include data from the Tigray region, which is one of the administrative regions of the country, due to security issues. Second, the study did not include health system side predictors such as availability of vaccination supplies and vaccines. Finally, we could not do external validation for the models due to the lack of real-world data.</p></sec><sec id="s4-3"><title>Conclusions</title><p>The developed ML models effectively predict children at risk of being ZD and identify associated risk factors. Among these models, the LGBM model demonstrated the best performance in predicting ZD children. Key features linked to ZD status include access to immunization sites, maternal health service utilization (such as antenatal and postnatal care, place of delivery, and TT vaccination), and perceptions regarding immunization.</p><p>By implementing ML models, public health interventions can be more precisely targeted at the most vulnerable groups. This approach may address inequities in vaccination coverage by identifying specific sociodemographic, economic, and health-related factors associated with ZD children. Consequently, it aids in the formulation and implementation of effective policies and strategies to improve vaccination rates. Strengthening the continuum of care for mothers, raising awareness among caregivers, and improving immunization access through outreach strategies may help in reducing the high burden of ZD children.</p></sec></sec></body><back><ack><p>The authors would like to thank the University of Gondar for the unwavering support. 
In addition, the authors extend their sincere thanks to the Ministry of Health of Ethiopia for granting them access to the data that were critical for their study.</p></ack><notes><sec><title>Funding</title><p>No external financial support or grants were received from any public, commercial, or not-for-profit entities for the research, authorship, or publication of this article.</p></sec><sec><title>Data Availability</title><p>The datasets generated or analyzed during this study are available from the corresponding author on reasonable request.</p></sec></notes><fn-group><fn fn-type="con"><p>BFE, KA, SAM, MZ, MKG, and BT conceptualized and designed the study. All authors contributed significantly to the analysis and interpretation of the results. The original draft was written by BFE and reviewed by all authors, who also provided critical revisions for important intellectual content. Each author has read and approved the final manuscript. They have agreed to take personal responsibility for their contributions and to ensure that any questions regarding the accuracy or integrity of any part of the work, even if they were not directly involved, are properly investigated and documented in the literature.</p></fn><fn fn-type="conflict"><p>None declared.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">ANC</term><def><p>antenatal care</p></def></def-item><def-item><term id="abb2">AUC</term><def><p>area under the curve</p></def></def-item><def-item><term id="abb3">DPT</term><def><p>diphtheria, tetanus, and pertussis</p></def></def-item><def-item><term id="abb4">EA</term><def><p>enumeration area</p></def></def-item><def-item><term id="abb5">LGBM</term><def><p>Light Gradient Boosting Machine</p></def></def-item><def-item><term id="abb6">ML</term><def><p>machine learning</p></def></def-item><def-item><term id="abb7">RF</term><def><p>Random Forest</p></def></def-item><def-item><term id="abb8">SHAP</term><def><p>SHapley Additive 
Explanations</p></def></def-item><def-item><term id="abb9">TT</term><def><p>tetanus toxoid</p></def></def-item><def-item><term id="abb10">XGBoost</term><def><p>Extreme Gradient Boosting</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Clark</surname><given-names>H</given-names> </name><name name-style="western"><surname>Coll-Seck</surname><given-names>AM</given-names> </name><name name-style="western"><surname>Banerjee</surname><given-names>A</given-names> </name><etal/></person-group><article-title>A future for the world&#x2019;s children? A WHO&#x2013;UNICEF&#x2013;Lancet Commission</article-title><source>Lancet</source><year>2020</year><month>02</month><day>22</day><volume>395</volume><issue>10224</issue><fpage>605</fpage><lpage>658</lpage><pub-id pub-id-type="doi">10.1016/S0140-6736(19)32540-1</pub-id><pub-id pub-id-type="medline">32085821</pub-id></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kaur</surname><given-names>G</given-names> </name><name name-style="western"><surname>Danovaro-Holliday</surname><given-names>MC</given-names> </name><name name-style="western"><surname>Mwinnyaa</surname><given-names>G</given-names> </name><etal/></person-group><article-title>Routine vaccination coverage&#x2014;worldwide, 2022</article-title><source>MMWR Morb Mortal Wkly Rep</source><year>2023</year><month>10</month><day>27</day><volume>72</volume><issue>43</issue><fpage>1155</fpage><lpage>1161</lpage><pub-id pub-id-type="doi">10.15585/mmwr.mm7243a1</pub-id><pub-id pub-id-type="medline">37883326</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name 
name-style="western"><surname>Sharrow</surname><given-names>D</given-names> </name><name name-style="western"><surname>Hug</surname><given-names>L</given-names> </name><name name-style="western"><surname>You</surname><given-names>D</given-names> </name><etal/></person-group><article-title>Global, regional, and national trends in under-5 mortality between 1990 and 2019 with scenario-based projections until 2030: a systematic analysis by the UN Inter-agency Group for Child Mortality Estimation</article-title><source>Lancet Glob Health</source><year>2022</year><month>02</month><volume>10</volume><issue>2</issue><fpage>e195</fpage><lpage>e206</lpage><pub-id pub-id-type="doi">10.1016/S2214-109X(21)00515-5</pub-id><pub-id pub-id-type="medline">35063111</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="web"><article-title>WHO/UNICEF estimates of national immunization coverage</article-title><source>World Health Organization</source><year>2023</year><month>09</month><access-date>2026-01-19</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.who.int/news-room/questions-and-answers/item/who-unicef-estimates-of-national-immunization-coverage">https://www.who.int/news-room/questions-and-answers/item/who-unicef-estimates-of-national-immunization-coverage</ext-link></comment></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="report"><article-title>Immunization Agenda 2030: a global strategy to leave no one behind</article-title><year>2020</year><access-date>2024-11-22</access-date><publisher-name>World Health Organization</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://www.who.int/publications/m/item/immunization-agenda-2030-a-global-strategy-to-leave-no-one-behind">https://www.who.int/publications/m/item/immunization-agenda-2030-a-global-strategy-to-leave-no-one-behind</ext-link></comment></nlm-citation></ref><ref id="ref6"><label>6</label><nlm-citation 
citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Restrepo-M&#x00E9;ndez</surname><given-names>MC</given-names> </name><name name-style="western"><surname>Barros</surname><given-names>AJ</given-names> </name><name name-style="western"><surname>Wong</surname><given-names>KL</given-names> </name><etal/></person-group><article-title>Inequalities in full immunization coverage: trends in low- and middle-income countries</article-title><source>Bull World Health Organ</source><year>2016</year><month>11</month><day>1</day><volume>94</volume><issue>11</issue><fpage>794</fpage><lpage>805B</lpage><pub-id pub-id-type="doi">10.2471/BLT.15.162172</pub-id><pub-id pub-id-type="medline">27821882</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ozawa</surname><given-names>S</given-names> </name><name name-style="western"><surname>Yemeke</surname><given-names>TT</given-names> </name><name name-style="western"><surname>Evans</surname><given-names>DR</given-names> </name><name name-style="western"><surname>Pallas</surname><given-names>SE</given-names> </name><name name-style="western"><surname>Wallace</surname><given-names>AS</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>BY</given-names> </name></person-group><article-title>Defining hard-to-reach populations for vaccination</article-title><source>Vaccine (Auckl)</source><year>2019</year><month>09</month><volume>37</volume><issue>37</issue><fpage>5525</fpage><lpage>5534</lpage><pub-id pub-id-type="doi">10.1016/j.vaccine.2019.06.081</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Johri</surname><given-names>M</given-names> </name><name 
name-style="western"><surname>Rajpal</surname><given-names>S</given-names> </name><name name-style="western"><surname>Subramanian</surname><given-names>SV</given-names> </name></person-group><article-title>Progress in reaching unvaccinated (zero-dose) children in India, 1992-2016: a multilevel, geospatial analysis of repeated cross-sectional surveys</article-title><source>Lancet Glob Health</source><year>2021</year><month>12</month><volume>9</volume><issue>12</issue><fpage>e1697</fpage><lpage>e1706</lpage><pub-id pub-id-type="doi">10.1016/S2214-109X(21)00349-1</pub-id><pub-id pub-id-type="medline">34798029</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Johri</surname><given-names>M</given-names> </name><name name-style="western"><surname>Ng</surname><given-names>ES</given-names> </name><name name-style="western"><surname>Sharkey</surname><given-names>A</given-names> </name><name name-style="western"><surname>Bosson-Rieutort</surname><given-names>D</given-names> </name><name name-style="western"><surname>Kone</surname><given-names>GK</given-names> </name><name name-style="western"><surname>Subramanian</surname><given-names>SV</given-names> </name></person-group><article-title>Effects of zero-dose vaccination status in early childhood and level of community socioeconomic development on learning attainment in preadolescence in India: a population-based cohort study</article-title><source>BMJ Public Health</source><year>2023</year><month>11</month><volume>1</volume><issue>1</issue><fpage>e000022</fpage><pub-id pub-id-type="doi">10.1136/bmjph-2023-000022</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chopra</surname><given-names>M</given-names> </name><name 
name-style="western"><surname>Bhutta</surname><given-names>Z</given-names> </name><name name-style="western"><surname>Chang Blanc</surname><given-names>D</given-names> </name><etal/></person-group><article-title>Addressing the persistent inequities in immunization coverage</article-title><source>Bull World Health Organ</source><year>2020</year><month>02</month><day>1</day><volume>98</volume><issue>2</issue><fpage>146</fpage><lpage>148</lpage><pub-id pub-id-type="doi">10.2471/BLT.19.241620</pub-id><pub-id pub-id-type="medline">32015586</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Teferi</surname><given-names>E</given-names> </name></person-group><article-title>Factors influencing coverage and key challenges to achieving targets of routine immunization in Africa: a systematic review</article-title><source>Ethiop J Pediatr Child Health</source><year>2016</year><access-date>2024-11-20</access-date><volume>12</volume><issue>2</issue><fpage>34</fpage><lpage>45</lpage><comment><ext-link ext-link-type="uri" xlink:href="https://ejpch.net/index.php/ejpch/article/view/89">https://ejpch.net/index.php/ejpch/article/view/89</ext-link></comment></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nour</surname><given-names>TY</given-names> </name><name name-style="western"><surname>Farah</surname><given-names>AM</given-names> </name><name name-style="western"><surname>Ali</surname><given-names>OM</given-names> </name><name name-style="western"><surname>Osman</surname><given-names>MO</given-names> </name><name name-style="western"><surname>Aden</surname><given-names>MA</given-names> </name><name name-style="western"><surname>Abate</surname><given-names>KH</given-names> </name></person-group><article-title>Predictors of immunization 
coverage among 12&#x2013;23&#x2009;month old children in Ethiopia: systematic review and meta-analysis</article-title><source>BMC Public Health</source><year>2020</year><month>12</month><volume>20</volume><issue>1</issue><fpage>1</fpage><lpage>19</lpage><pub-id pub-id-type="doi">10.1186/s12889-020-09890-0</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tamir</surname><given-names>TT</given-names> </name><name name-style="western"><surname>Zegeye</surname><given-names>AF</given-names> </name><name name-style="western"><surname>Mekonen</surname><given-names>EG</given-names> </name><etal/></person-group><article-title>Prevalence, spatial variation and determinants of zero-dose children in Ethiopia: spatial and multilevel analyses</article-title><source>Public Health (Fairfax)</source><year>2024</year><month>11</month><volume>236</volume><fpage>365</fpage><lpage>372</lpage><pub-id pub-id-type="doi">10.1016/j.puhe.2024.09.011</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Yadita</surname><given-names>ZS</given-names> </name><name name-style="western"><surname>Ayehubizu</surname><given-names>LM</given-names> </name></person-group><article-title>Full immunization coverage and associated factors among children aged 12-23 months in Somali Region, Eastern Ethiopia</article-title><source>PLoS One</source><year>2021</year><volume>16</volume><issue>12</issue><fpage>e0260258</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0260258</pub-id><pub-id pub-id-type="medline">34874949</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Biset</surname><given-names>G</given-names> </name><name 
name-style="western"><surname>Woday</surname><given-names>A</given-names> </name><name name-style="western"><surname>Mihret</surname><given-names>S</given-names> </name><name name-style="western"><surname>Tsihay</surname><given-names>M</given-names> </name></person-group><article-title>Full immunization coverage and associated factors among children age 12-23 months in Ethiopia: systematic review and meta-analysis of observational studies</article-title><source>Hum Vaccin Immunother</source><year>2021</year><month>07</month><day>3</day><volume>17</volume><issue>7</issue><fpage>2326</fpage><lpage>2335</lpage><pub-id pub-id-type="doi">10.1080/21645515.2020.1870392</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Girmay</surname><given-names>A</given-names> </name><name name-style="western"><surname>Dadi</surname><given-names>AF</given-names> </name></person-group><article-title>Full immunization coverage and associated factors among children aged 12-23 months in a hard-to-reach areas of Ethiopia</article-title><source>Int J Pediatr</source><year>2019</year><volume>2019</volume><fpage>1924941</fpage><pub-id pub-id-type="doi">10.1155/2019/1924941</pub-id><pub-id pub-id-type="medline">31263502</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gurmu</surname><given-names>E</given-names> </name><name name-style="western"><surname>Etana</surname><given-names>D</given-names> </name></person-group><article-title>Factors influencing children&#x2019;s full immunization in Ethiopia</article-title><source>Afr Popul Stud</source><year>2016</year><volume>30</volume><fpage>2</fpage><pub-id pub-id-type="doi">10.11564/30-2-813</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation 
citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Asresie</surname><given-names>MB</given-names> </name><name name-style="western"><surname>Dagnew</surname><given-names>GW</given-names> </name><name name-style="western"><surname>Bekele</surname><given-names>YA</given-names> </name></person-group><article-title>Changes in immunization coverage and contributing factors among children aged 12-23 months from 2000 to 2019, Ethiopia: multivariate decomposition analysis</article-title><source>PLoS One</source><year>2023</year><volume>18</volume><issue>9</issue><fpage>e0291499</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0291499</pub-id><pub-id pub-id-type="medline">37703252</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Nozaki</surname><given-names>I</given-names> </name><name name-style="western"><surname>Hachiya</surname><given-names>M</given-names> </name><name name-style="western"><surname>Kitamura</surname><given-names>T</given-names> </name></person-group><article-title>Factors influencing basic vaccination coverage in Myanmar: secondary analysis of 2015 Myanmar demographic and health survey data</article-title><source>BMC Public Health</source><year>2019</year><month>02</month><day>28</day><volume>19</volume><issue>1</issue><fpage>242</fpage><pub-id pub-id-type="doi">10.1186/s12889-019-6548-0</pub-id><pub-id pub-id-type="medline">30819127</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Song</surname><given-names>X</given-names> </name><name name-style="western"><surname>Mitnitski</surname><given-names>A</given-names> </name><name name-style="western"><surname>Cox</surname><given-names>J</given-names> </name><name 
name-style="western"><surname>Rockwood</surname><given-names>K</given-names> </name></person-group><article-title>Comparison of machine learning techniques with classical statistical models in predicting health outcomes</article-title><source>Stud Health Technol Inform</source><year>2004</year><volume>107</volume><issue>Pt 1</issue><fpage>736</fpage><lpage>740</lpage><pub-id pub-id-type="medline">15360910</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Bonaccorso</surname><given-names>G</given-names> </name></person-group><source>Machine Learning Algorithms: Popular Algorithms for Data Science and Machine Learning</source><year>2018</year><access-date>2024-11-22</access-date><publisher-name>Packt Publishing Ltd</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://cir.nii.ac.jp/crid/1130000794529220864">https://cir.nii.ac.jp/crid/1130000794529220864</ext-link></comment></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sarker</surname><given-names>IH</given-names> </name></person-group><article-title>Machine learning: algorithms, real-world applications and research directions</article-title><source>SN Comput Sci</source><year>2021</year><volume>2</volume><issue>3</issue><fpage>160</fpage><pub-id pub-id-type="doi">10.1007/s42979-021-00592-x</pub-id><pub-id pub-id-type="medline">33778771</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Agrawal</surname><given-names>R</given-names> </name><name name-style="western"><surname>Imieli&#x0144;ski</surname><given-names>T</given-names> </name><name name-style="western"><surname>Swami</surname><given-names>A</given-names> 
</name></person-group><article-title>Mining association rules between sets of items in large databases</article-title><conf-name>Proceedings of the 1993 ACM SIGMOD International Conference on Management of Data</conf-name><conf-date>Jun 1, 1993</conf-date><conf-loc>Washington, DC</conf-loc><fpage>207</fpage><lpage>216</lpage><pub-id pub-id-type="doi">10.1145/170035.170072</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cheong</surname><given-names>Q</given-names> </name><name name-style="western"><surname>Au-Yeung</surname><given-names>M</given-names> </name><name name-style="western"><surname>Quon</surname><given-names>S</given-names> </name><name name-style="western"><surname>Concepcion</surname><given-names>K</given-names> </name><name name-style="western"><surname>Kong</surname><given-names>JD</given-names> </name></person-group><article-title>Predictive modeling of vaccination uptake in US counties: a machine learning-based approach</article-title><source>J Med Internet Res</source><year>2021</year><month>11</month><day>25</day><volume>23</volume><issue>11</issue><fpage>e33231</fpage><pub-id pub-id-type="doi">10.2196/33231</pub-id><pub-id pub-id-type="medline">34751650</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Carrieri</surname><given-names>V</given-names> </name><name name-style="western"><surname>Lagravinese</surname><given-names>R</given-names> </name><name name-style="western"><surname>Resce</surname><given-names>G</given-names> </name></person-group><article-title>Predicting vaccine hesitancy from area-level indicators: a machine learning approach</article-title><source>Health 
Econ</source><year>2021</year><month>12</month><volume>30</volume><issue>12</issue><fpage>3248</fpage><lpage>3256</lpage><pub-id pub-id-type="doi">10.1002/hec.4430</pub-id><pub-id pub-id-type="medline">34523180</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Avirappattu</surname><given-names>G</given-names> </name><name name-style="western"><surname>Pach Iii</surname><given-names>A</given-names> </name><name name-style="western"><surname>Locklear</surname><given-names>CE</given-names> </name><name name-style="western"><surname>Briggs</surname><given-names>AQ</given-names> </name></person-group><article-title>An optimized machine learning model for identifying socio-economic, demographic and health-related variables associated with low vaccination levels that vary across ZIP codes in California</article-title><source>Prev Med Rep</source><year>2022</year><month>08</month><volume>28</volume><fpage>101858</fpage><pub-id pub-id-type="doi">10.1016/j.pmedr.2022.101858</pub-id><pub-id pub-id-type="medline">35706686</pub-id></nlm-citation></ref><ref id="ref27"><label>27</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Zhang</surname><given-names>A</given-names> </name><name name-style="western"><surname>Xing</surname><given-names>L</given-names> </name><name name-style="western"><surname>Zou</surname><given-names>J</given-names> </name><name name-style="western"><surname>Wu</surname><given-names>JC</given-names> </name></person-group><article-title>Shifting machine learning for healthcare from development to deployment and from models to data</article-title><source>Nat Biomed Eng</source><year>2022</year><month>12</month><volume>6</volume><issue>12</issue><fpage>1330</fpage><lpage>1345</lpage><pub-id pub-id-type="doi">10.1038/s41551-022-00898-y</pub-id><pub-id 
pub-id-type="medline">35788685</pub-id></nlm-citation></ref><ref id="ref28"><label>28</label><nlm-citation citation-type="report"><article-title>National immunization program evaluation research in Ethiopia</article-title><year>2024</year><access-date>2025-06-29</access-date><publisher-name>Consortium of CBMP Universities</publisher-name><comment><ext-link ext-link-type="uri" xlink:href="https://www.scribd.com/document/875138308">https://www.scribd.com/document/875138308</ext-link></comment></nlm-citation></ref><ref id="ref29"><label>29</label><nlm-citation citation-type="web"><article-title>World Health Organization vaccination coverage cluster surveys: reference manual</article-title><source>World Health Organization</source><year>2018</year><access-date>2024-11-23</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.who.int/publications/i/item/WHO-IVB-18.09">https://www.who.int/publications/i/item/WHO-IVB-18.09</ext-link></comment></nlm-citation></ref><ref id="ref30"><label>30</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Wonodi</surname><given-names>C</given-names> </name><name name-style="western"><surname>Farrenkopf</surname><given-names>BA</given-names> </name></person-group><article-title>Defining the zero dose child: a comparative analysis of two approaches and their impact on assessing the zero dose burden and vulnerability profiles across 82 low- and middle-income countries</article-title><source>Vaccines (Basel)</source><year>2023</year><month>09</month><day>28</day><volume>11</volume><issue>10</issue><fpage>1543</fpage><pub-id pub-id-type="doi">10.3390/vaccines11101543</pub-id><pub-id pub-id-type="medline">37896946</pub-id></nlm-citation></ref><ref id="ref31"><label>31</label><nlm-citation citation-type="web"><article-title>Zero dose children and missed communities</article-title><source>Gavi</source><access-date>2026-01-19</access-date><comment><ext-link 
ext-link-type="uri" xlink:href="https://www.gavi.org/our-alliance/strategy/phase-5-2021-2025/equity-goal/zero-dose-children-missed-communities">https://www.gavi.org/our-alliance/strategy/phase-5-2021-2025/equity-goal/zero-dose-children-missed-communities</ext-link></comment></nlm-citation></ref><ref id="ref32"><label>32</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Schapire</surname><given-names>RE</given-names> </name><name name-style="western"><surname>Freund</surname><given-names>Y</given-names> </name></person-group><article-title>Boosting: foundations and algorithms</article-title><source>Kybernetes</source><year>2013</year><month>01</month><day>4</day><volume>42</volume><issue>1</issue><fpage>164</fpage><lpage>166</lpage><pub-id pub-id-type="doi">10.1108/03684921311295547</pub-id></nlm-citation></ref><ref id="ref33"><label>33</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>le Cessie</surname><given-names>S</given-names> </name><name name-style="western"><surname>van Houwelingen</surname><given-names>JC</given-names> </name></person-group><article-title>Ridge estimators in logistic regression</article-title><source>Appl Stat</source><year>1992</year><volume>41</volume><issue>1</issue><fpage>191</fpage><pub-id pub-id-type="doi">10.2307/2347628</pub-id></nlm-citation></ref><ref id="ref34"><label>34</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Pal</surname><given-names>M</given-names> </name></person-group><article-title>Random forest classifier for remote sensing classification</article-title><source>Int J Remote Sens</source><year>2005</year><month>01</month><volume>26</volume><issue>1</issue><fpage>217</fpage><lpage>222</lpage><pub-id pub-id-type="doi">10.1080/01431160412331269698</pub-id></nlm-citation></ref><ref 
id="ref35"><label>35</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Chen</surname><given-names>T</given-names> </name><name name-style="western"><surname>Guestrin</surname><given-names>C</given-names> </name></person-group><article-title>XGBoost: a scalable tree boosting system</article-title><conf-name>Proceedings of the 22nd ACM SIGKDD International Conference on Knowledge Discovery and Data Mining</conf-name><conf-date>Aug 13-17, 2016</conf-date><conf-loc>San Francisco, CA</conf-loc><fpage>785</fpage><lpage>794</lpage><pub-id pub-id-type="doi">10.1145/2939672.2939785</pub-id></nlm-citation></ref><ref id="ref36"><label>36</label><nlm-citation citation-type="book"><person-group person-group-type="author"><name name-style="western"><surname>Breiman</surname><given-names>L</given-names> </name><name name-style="western"><surname>Friedman</surname><given-names>J</given-names> </name><name name-style="western"><surname>Olshen</surname><given-names>RA</given-names> </name><name name-style="western"><surname>Stone</surname><given-names>CJ</given-names> </name></person-group><source>Classification and Regression Trees</source><year>2017</year><publisher-name>Routledge</publisher-name><pub-id pub-id-type="doi">10.1201/9781315139470</pub-id></nlm-citation></ref><ref id="ref37"><label>37</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>&#x0160;imundi&#x0107;</surname><given-names>AM</given-names> </name></person-group><article-title>Measures of diagnostic accuracy: basic definitions</article-title><source>EJIFCC</source><year>2009</year><month>01</month><volume>19</volume><issue>4</issue><fpage>203</fpage><lpage>211</lpage><pub-id pub-id-type="medline">27683318</pub-id></nlm-citation></ref><ref id="ref38"><label>38</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name 
name-style="western"><surname>Flach</surname><given-names>P</given-names> </name><name name-style="western"><surname>Kull</surname><given-names>M</given-names> </name></person-group><article-title>Precision-recall-gain curves: PR analysis done right</article-title><source>Adv Neural Inf Process Syst</source><year>2015</year><access-date>2024-11-23</access-date><volume>28</volume><comment><ext-link ext-link-type="uri" xlink:href="https://proceedings.neurips.cc/paper_files/paper/2015/hash/33e8075e9970de0cfea955afd4644bb2-Abstract.html">https://proceedings.neurips.cc/paper_files/paper/2015/hash/33e8075e9970de0cfea955afd4644bb2-Abstract.html</ext-link></comment></nlm-citation></ref><ref id="ref39"><label>39</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Santini</surname><given-names>A</given-names> </name><name name-style="western"><surname>Man</surname><given-names>A</given-names> </name><name name-style="western"><surname>Void&#x0103;zan</surname><given-names>S</given-names> </name></person-group><article-title>Accuracy of diagnostic tests</article-title><source>J Crit Care Med</source><year>2021</year><month>07</month><day>1</day><volume>7</volume><issue>3</issue><fpage>241</fpage><lpage>248</lpage><pub-id pub-id-type="doi">10.2478/jccm-2021-0022</pub-id></nlm-citation></ref><ref id="ref40"><label>40</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kumar</surname><given-names>R</given-names> </name><name name-style="western"><surname>Indrayan</surname><given-names>A</given-names> </name></person-group><article-title>Receiver operating characteristic (ROC) curve for medical researchers</article-title><source>Indian Pediatr</source><year>2011</year><month>04</month><volume>48</volume><issue>4</issue><fpage>277</fpage><lpage>287</lpage><pub-id pub-id-type="doi">10.1007/s13312-011-0055-4</pub-id><pub-id 
pub-id-type="medline">21532099</pub-id></nlm-citation></ref><ref id="ref41"><label>41</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Collins</surname><given-names>GS</given-names> </name><name name-style="western"><surname>Reitsma</surname><given-names>JB</given-names> </name><name name-style="western"><surname>Altman</surname><given-names>DG</given-names> </name><name name-style="western"><surname>Moons</surname><given-names>KGM</given-names> </name><collab>TRIPOD Group</collab></person-group><article-title>Transparent reporting of a multivariable prediction model for individual prognosis or diagnosis (TRIPOD): the TRIPOD statement. The TRIPOD Group</article-title><source>Circulation</source><year>2015</year><month>01</month><day>13</day><volume>131</volume><issue>2</issue><fpage>211</fpage><lpage>219</lpage><pub-id pub-id-type="doi">10.1161/CIRCULATIONAHA.114.014508</pub-id><pub-id pub-id-type="medline">25561516</pub-id></nlm-citation></ref><ref id="ref42"><label>42</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Huang</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Li</surname><given-names>W</given-names> </name><name name-style="western"><surname>Macheret</surname><given-names>F</given-names> </name><name name-style="western"><surname>Gabriel</surname><given-names>RA</given-names> </name><name name-style="western"><surname>Ohno-Machado</surname><given-names>L</given-names> </name></person-group><article-title>A tutorial on calibration measurements and calibration models for clinical prediction models</article-title><source>J Am Med Inform Assoc</source><year>2020</year><month>04</month><day>1</day><volume>27</volume><issue>4</issue><fpage>621</fpage><lpage>633</lpage><pub-id pub-id-type="doi">10.1093/jamia/ocz228</pub-id></nlm-citation></ref><ref 
id="ref43"><label>43</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Lundberg</surname><given-names>SM</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>SI</given-names> </name></person-group><article-title>A unified approach to interpreting model predictions</article-title><year>2017</year><access-date>2026-01-25</access-date><conf-name>Proceedings of the 31st International Conference on Neural Information Processing Systems</conf-name><conf-date>Dec 4-9, 2017</conf-date><conf-loc>Long Beach, CA</conf-loc><publisher-name>Curran Associates Inc</publisher-name><fpage>4768</fpage><lpage>4777</lpage><comment><ext-link ext-link-type="uri" xlink:href="https://proceedings.neurips.cc/paper/2017/hash/8a20a8621978632d76c43dfd28b67767-Abstract.html">https://proceedings.neurips.cc/paper/2017/hash/8a20a8621978632d76c43dfd28b67767-Abstract.html</ext-link></comment></nlm-citation></ref><ref id="ref44"><label>44</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Bifarin</surname><given-names>OO</given-names> </name></person-group><article-title>Interpretable machine learning with tree-based SHapley Additive Explanations: application to metabolomics datasets for binary classification</article-title><source>PLoS One</source><year>2023</year><volume>18</volume><issue>5</issue><fpage>e0284315</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0284315</pub-id><pub-id pub-id-type="medline">37141218</pub-id></nlm-citation></ref><ref id="ref45"><label>45</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Altaf</surname><given-names>W</given-names> </name><name name-style="western"><surname>Shahbaz</surname><given-names>M</given-names> </name><name name-style="western"><surname>Guergachi</surname><given-names>A</given-names> 
</name></person-group><article-title>Applications of association rule mining in health informatics: a survey</article-title><source>Artif Intell Rev</source><year>2017</year><month>03</month><volume>47</volume><issue>3</issue><fpage>313</fpage><lpage>340</lpage><pub-id pub-id-type="doi">10.1007/s10462-016-9483-9</pub-id></nlm-citation></ref><ref id="ref46"><label>46</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Khare</surname><given-names>S</given-names> </name><name name-style="western"><surname>Gupta</surname><given-names>D</given-names> </name></person-group><article-title>Association rule analysis in cardiovascular disease</article-title><conf-name>2016 Second International Conference on Cognitive Computing and Information Processing (CCIP)</conf-name><conf-date>Aug 12-13, 2016</conf-date><conf-loc>Mysuru, India</conf-loc><fpage>1</fpage><lpage>6</lpage><pub-id pub-id-type="doi">10.1109/CCIP.2016.7802881</pub-id></nlm-citation></ref><ref id="ref47"><label>47</label><nlm-citation citation-type="confproc"><person-group person-group-type="author"><name name-style="western"><surname>Agrawal</surname><given-names>R</given-names> </name><name name-style="western"><surname>Srikant</surname><given-names>R</given-names> </name></person-group><article-title>Fast algorithms for mining association rules</article-title><year>1994</year><access-date>2024-11-24</access-date><conf-name>Proceedings of the 20th International Conference on Very Large Data Bases</conf-name><conf-date>Sep 12-15, 1994</conf-date><conf-loc>Santiago, Chile</conf-loc><fpage>487</fpage><lpage>499</lpage><comment><ext-link ext-link-type="uri" xlink:href="https://www.columbia.edu/~rd2537/docu/apriori(abstract).pdf">https://www.columbia.edu/~rd2537/docu/apriori(abstract).pdf</ext-link></comment></nlm-citation></ref><ref id="ref48"><label>48</label><nlm-citation citation-type="journal"><person-group 
person-group-type="author"><name name-style="western"><surname>Tadese</surname><given-names>ZB</given-names> </name><name name-style="western"><surname>Nigatu</surname><given-names>AM</given-names> </name><name name-style="western"><surname>Yehuala</surname><given-names>TZ</given-names> </name><name name-style="western"><surname>Sebastian</surname><given-names>Y</given-names> </name></person-group><article-title>Prediction of incomplete immunization among under-five children in East Africa from recent demographic and health surveys: a machine learning approach</article-title><source>Sci Rep</source><year>2024</year><month>05</month><day>21</day><volume>14</volume><issue>1</issue><fpage>11529</fpage><pub-id pub-id-type="doi">10.1038/s41598-024-62641-8</pub-id><pub-id pub-id-type="medline">38773175</pub-id></nlm-citation></ref><ref id="ref49"><label>49</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chandir</surname><given-names>S</given-names> </name><name name-style="western"><surname>Siddiqi</surname><given-names>DA</given-names> </name><name name-style="western"><surname>Hussain</surname><given-names>OA</given-names> </name><etal/></person-group><article-title>Using predictive analytics to identify children at high risk of defaulting from a routine immunization program: feasibility study</article-title><source>JMIR Public Health Surveill</source><year>2018</year><month>09</month><day>4</day><volume>4</volume><issue>3</issue><fpage>e63</fpage><pub-id pub-id-type="doi">10.2196/publichealth.9681</pub-id><pub-id pub-id-type="medline">30181112</pub-id></nlm-citation></ref><ref id="ref50"><label>50</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chambongo</surname><given-names>PE</given-names> </name><name name-style="western"><surname>Nguku</surname><given-names>P</given-names> </name><name 
name-style="western"><surname>Wasswa</surname><given-names>P</given-names> </name><name name-style="western"><surname>Semali</surname><given-names>I</given-names> </name></person-group><article-title>Community vaccine perceptions and its role on vaccination uptake among children aged 12-23 months in the Ileje District, Tanzania: a cross section study</article-title><source>Pan Afr Med J</source><year>2016</year><volume>23</volume><fpage>162</fpage><pub-id pub-id-type="doi">10.11604/pamj.2016.23.162.8925</pub-id><pub-id pub-id-type="medline">27303578</pub-id></nlm-citation></ref><ref id="ref51"><label>51</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Puri</surname><given-names>YE</given-names> </name><name name-style="western"><surname>Murti</surname><given-names>B</given-names> </name><name name-style="western"><surname>Demartoto</surname><given-names>A</given-names> </name></person-group><article-title>Analysis of the effect of maternal perception on completeness of child immunization status with health belief model</article-title><source>J Health Promot Behav</source><year>2016</year><volume>01</volume><issue>3</issue><fpage>211</fpage><lpage>222</lpage><pub-id pub-id-type="doi">10.26911/thejhpb.2016.01.03.08</pub-id></nlm-citation></ref><ref id="ref52"><label>52</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Demsash</surname><given-names>AW</given-names> </name><name name-style="western"><surname>Chereka</surname><given-names>AA</given-names> </name><name name-style="western"><surname>Walle</surname><given-names>AD</given-names> </name><name name-style="western"><surname>Kassie</surname><given-names>SY</given-names> </name><name name-style="western"><surname>Bekele</surname><given-names>F</given-names> </name><name name-style="western"><surname>Bekana</surname><given-names>T</given-names> 
</name></person-group><article-title>Machine learning algorithms&#x2019; application to predict childhood vaccination among children aged 12&#x2013;23 months in Ethiopia: evidence 2016 Ethiopian Demographic and Health Survey dataset</article-title><source>PLoS One</source><year>2023</year><volume>18</volume><issue>10</issue><fpage>e0288867</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0288867</pub-id></nlm-citation></ref><ref id="ref53"><label>53</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Biswas</surname><given-names>A</given-names> </name><name name-style="western"><surname>Tucker</surname><given-names>J</given-names> </name><name name-style="western"><surname>Bauhoff</surname><given-names>S</given-names> </name></person-group><article-title>Performance of predictive algorithms in estimating the risk of being a zero-dose child in India, Mali and Nigeria</article-title><source>BMJ Glob Health</source><year>2023</year><month>10</month><volume>8</volume><issue>10</issue><fpage>e012836</fpage><pub-id pub-id-type="doi">10.1136/bmjgh-2023-012836</pub-id><pub-id pub-id-type="medline">37821114</pub-id></nlm-citation></ref><ref id="ref54"><label>54</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dixit</surname><given-names>P</given-names> </name><name name-style="western"><surname>Dwivedi</surname><given-names>LK</given-names> </name><name name-style="western"><surname>Ram</surname><given-names>F</given-names> </name></person-group><article-title>Strategies to improve child immunization via antenatal care visits in India: a propensity score matching analysis</article-title><source>PLoS One</source><year>2013</year><volume>8</volume><issue>6</issue><fpage>e66175</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0066175</pub-id><pub-id pub-id-type="medline">23824555</pub-id></nlm-citation></ref><ref 
id="ref55"><label>55</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Jiao</surname><given-names>B</given-names> </name><name name-style="western"><surname>Iversen</surname><given-names>I</given-names> </name><name name-style="western"><surname>Sato</surname><given-names>R</given-names> </name><etal/></person-group><article-title>Association between achieving adequate antenatal care and health-seeking behaviors: a study of demographic and health surveys in 47 low- and middle-income countries</article-title><source>PLoS Med</source><year>2024</year><month>07</month><volume>21</volume><issue>7</issue><fpage>e1004421</fpage><pub-id pub-id-type="doi">10.1371/journal.pmed.1004421</pub-id><pub-id pub-id-type="medline">38968303</pub-id></nlm-citation></ref><ref id="ref56"><label>56</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Krishnamoorthy</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Rehman</surname><given-names>T</given-names> </name></person-group><article-title>Impact of antenatal care visits on childhood immunization: a propensity score-matched analysis using nationally representative survey</article-title><source>Fam Pract</source><year>2022</year><month>07</month><day>19</day><volume>39</volume><issue>4</issue><fpage>603</fpage><lpage>609</lpage><pub-id pub-id-type="doi">10.1093/fampra/cmab124</pub-id><pub-id pub-id-type="medline">34564727</pub-id></nlm-citation></ref><ref id="ref57"><label>57</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ibrahim</surname><given-names>ZA</given-names> </name><name name-style="western"><surname>Sabahelzain</surname><given-names>MM</given-names> </name><name name-style="western"><surname>Elhadi</surname><given-names>YAM</given-names> </name><name 
name-style="western"><surname>Malande</surname><given-names>OO</given-names> </name><name name-style="western"><surname>Babiker</surname><given-names>S</given-names> </name></person-group><article-title>Predictors of tetanus vaccine uptake among pregnant women in Khartoum State, Sudan: a hospital-based cross-sectional study</article-title><source>Vaccines (Basel)</source><year>2023</year><month>07</month><day>21</day><volume>11</volume><issue>7</issue><fpage>1268</fpage><pub-id pub-id-type="doi">10.3390/vaccines11071268</pub-id><pub-id pub-id-type="medline">37515083</pub-id></nlm-citation></ref><ref id="ref58"><label>58</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Amin</surname><given-names>MB</given-names> </name><name name-style="western"><surname>Roy</surname><given-names>N</given-names> </name><name name-style="western"><surname>Meem</surname><given-names>AE</given-names> </name><name name-style="western"><surname>Hossain</surname><given-names>E</given-names> </name><name name-style="western"><surname>Aktarujjaman</surname><given-names>M</given-names> </name></person-group><article-title>Trends and determinants of taking tetanus toxoid vaccine among women during last pregnancy in Bangladesh: country representative survey from 2006 to 2019</article-title><source>PLoS One</source><year>2022</year><volume>17</volume><issue>10</issue><fpage>e0276417</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0276417</pub-id></nlm-citation></ref><ref id="ref59"><label>59</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Laryea</surname><given-names>DO</given-names> </name><name name-style="western"><surname>Abbeyquaye Parbie</surname><given-names>E</given-names> </name><name name-style="western"><surname>Frimpong</surname><given-names>E</given-names> </name></person-group><article-title>Timeliness of childhood vaccine uptake 
among children attending a tertiary health service facility-based immunisation clinic in Ghana</article-title><source>BMC Public Health</source><year>2014</year><month>01</month><day>29</day><volume>14</volume><fpage>90</fpage><pub-id pub-id-type="doi">10.1186/1471-2458-14-90</pub-id><pub-id pub-id-type="medline">24476339</pub-id></nlm-citation></ref><ref id="ref60"><label>60</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sarker</surname><given-names>AR</given-names> </name><name name-style="western"><surname>Akram</surname><given-names>R</given-names> </name><name name-style="western"><surname>Ali</surname><given-names>N</given-names> </name><name name-style="western"><surname>Chowdhury</surname><given-names>ZI</given-names> </name><name name-style="western"><surname>Sultana</surname><given-names>M</given-names> </name></person-group><article-title>Coverage and determinants of full immunization: vaccination coverage among Senegalese children</article-title><source>Medicina</source><year>2019</year><volume>55</volume><issue>8</issue><fpage>480</fpage><pub-id pub-id-type="doi">10.3390/medicina55080480</pub-id></nlm-citation></ref><ref id="ref61"><label>61</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Acharya</surname><given-names>P</given-names> </name><name name-style="western"><surname>Kismul</surname><given-names>H</given-names> </name><name name-style="western"><surname>Mapatano</surname><given-names>MA</given-names> </name><name name-style="western"><surname>Hatl&#x00F8;y</surname><given-names>A</given-names> </name></person-group><article-title>Individual- and community-level determinants of child immunization in the Democratic Republic of Congo: a multilevel analysis</article-title><source>PLoS One</source><year>2018</year><volume>13</volume><issue>8</issue><fpage>e0202742</fpage><pub-id 
pub-id-type="doi">10.1371/journal.pone.0202742</pub-id><pub-id pub-id-type="medline">30138459</pub-id></nlm-citation></ref><ref id="ref62"><label>62</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Rauniyar</surname><given-names>SK</given-names> </name><name name-style="western"><surname>Munkhbat</surname><given-names>E</given-names> </name><name name-style="western"><surname>Ueda</surname><given-names>P</given-names> </name><name name-style="western"><surname>Yoneoka</surname><given-names>D</given-names> </name><name name-style="western"><surname>Shibuya</surname><given-names>K</given-names> </name><name name-style="western"><surname>Nomura</surname><given-names>S</given-names> </name></person-group><article-title>Timeliness of routine vaccination among children and determinants associated with age-appropriate vaccination in Mongolia</article-title><source>Heliyon</source><year>2020</year><month>09</month><volume>6</volume><issue>9</issue><fpage>e04898</fpage><pub-id pub-id-type="doi">10.1016/j.heliyon.2020.e04898</pub-id><pub-id pub-id-type="medline">32995607</pub-id></nlm-citation></ref><ref id="ref63"><label>63</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Budu</surname><given-names>E</given-names> </name><name name-style="western"><surname>Darteh</surname><given-names>EKM</given-names> </name><name name-style="western"><surname>Ahinkorah</surname><given-names>BO</given-names> </name><name name-style="western"><surname>Seidu</surname><given-names>AA</given-names> </name><name name-style="western"><surname>Dickson</surname><given-names>KS</given-names> </name></person-group><article-title>Trend and determinants of complete vaccination coverage among children aged 12-23 months in Ghana: analysis of data from the 1998 to 2014 Ghana Demographic and Health Surveys</article-title><source>PLoS 
One</source><year>2020</year><volume>15</volume><issue>10</issue><fpage>e0239754</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0239754</pub-id></nlm-citation></ref><ref id="ref64"><label>64</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Noh</surname><given-names>JW</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>YM</given-names> </name><name name-style="western"><surname>Akram</surname><given-names>N</given-names> </name><etal/></person-group><article-title>Factors affecting complete and timely childhood immunization coverage in Sindh, Pakistan; a secondary analysis of cross-sectional survey data</article-title><source>PLoS One</source><year>2018</year><volume>13</volume><issue>10</issue><fpage>e0206766</fpage><pub-id pub-id-type="doi">10.1371/journal.pone.0206766</pub-id></nlm-citation></ref><ref id="ref65"><label>65</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Sarker</surname><given-names>AR</given-names> </name><name name-style="western"><surname>Akram</surname><given-names>R</given-names> </name><name name-style="western"><surname>Ali</surname><given-names>N</given-names> </name><name name-style="western"><surname>Sultana</surname><given-names>M</given-names> </name></person-group><article-title>Coverage and factors associated with full immunisation among children aged 12&#x2013;59 months in Bangladesh: insights from the nationwide cross-sectional demographic and health survey</article-title><source>BMJ Open</source><year>2019</year><month>07</month><volume>9</volume><issue>7</issue><fpage>e028020</fpage><pub-id pub-id-type="doi">10.1136/bmjopen-2018-028020</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Zero-dose status among children aged 12&#x2010;35 months in Ethiopia, before and after 
data balancing, using the 2023 survey dataset. SMOTE: Synthetic Minority Oversampling Technique.</p><media xlink:href="pediatrics_v9i1e76712_app1.png" xlink:title="PNG File, 162 KB"/></supplementary-material></app-group></back></article>