<?xml version="1.0" encoding="UTF-8"?><!DOCTYPE article PUBLIC "-//NLM//DTD Journal Publishing DTD v2.0 20040830//EN" "journalpublishing.dtd"><article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" dtd-version="2.0" xml:lang="en" article-type="research-article"><front><journal-meta><journal-id journal-id-type="nlm-ta">JMIR Nursing</journal-id><journal-id journal-id-type="publisher-id">nursing</journal-id><journal-id journal-id-type="index">33</journal-id><journal-title>JMIR Nursing</journal-title><abbrev-journal-title>JMIR Nursing</abbrev-journal-title><issn pub-type="epub">2562-7600</issn><publisher><publisher-name>JMIR Publications</publisher-name><publisher-loc>Toronto, Canada</publisher-loc></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">v9i1e94450</article-id><article-id pub-id-type="doi">10.2196/94450</article-id><article-categories><subj-group subj-group-type="heading"><subject>Original Paper</subject></subj-group></article-categories><title-group><article-title>Explainable AI for Equitable Nurse Scheduling: Pragmatic Pre-Post Implementation Study</article-title></title-group><contrib-group><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Shia</surname><given-names>Ben-Chang</given-names></name><degrees>Prof Dr, PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Peng</surname><given-names>Szu-Ming</given-names></name><degrees>PhD</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author" equal-contrib="yes"><name name-style="western"><surname>Zhang</surname><given-names>Qui-Yang</given-names></name><degrees>PGDM</degrees><xref ref-type="aff" rid="aff1">1</xref><xref ref-type="fn" 
rid="equal-contrib1">*</xref></contrib><contrib contrib-type="author"><name name-style="western"><surname>Lo</surname><given-names>Chiung-Yun</given-names></name><degrees>BSN, MHA</degrees><xref ref-type="aff" rid="aff2">2</xref></contrib><contrib contrib-type="author" corresp="yes" equal-contrib="yes"><name name-style="western"><surname>Wang</surname><given-names>Sheng-Ru</given-names></name><degrees>MD, EMBA</degrees><xref ref-type="aff" rid="aff3">3</xref><xref ref-type="fn" rid="equal-contrib1">*</xref></contrib></contrib-group><aff id="aff1"><institution>Graduate Institute of Business Administration, College of Management, Fu Jen Catholic University</institution><addr-line>New Taipei City</addr-line><country>Taiwan</country></aff><aff id="aff2"><institution>Deputy Director of Teaching and Research Department, St. Paul&#x2019;s Hospital</institution><addr-line>Taoyuan City</addr-line><country>Taiwan</country></aff><aff id="aff3"><institution>Department of Pediatric Emergency, Fu Jen Catholic University Hospital</institution><addr-line>No. 69, Sec. 1, Gui-zi Road, Taishan Dist.</addr-line><addr-line>New Taipei City</addr-line><country>Taiwan</country></aff><contrib-group><contrib contrib-type="editor"><name name-style="western"><surname>Borycki</surname><given-names>Elizabeth</given-names></name></contrib></contrib-group><contrib-group><contrib contrib-type="reviewer"><name name-style="western"><surname>Lin</surname><given-names>Bertrand M T</given-names></name></contrib><contrib contrib-type="reviewer"><name name-style="western"><surname>Koruca</surname><given-names>Halil</given-names></name></contrib></contrib-group><author-notes><corresp>Correspondence to Sheng-Ru Wang, MD, EMBA, Department of Pediatric Emergency, Fu Jen Catholic University Hospital, No. 69, Sec. 
1, Gui-zi Road, Taishan Dist., New Taipei City, 24352, Taiwan, 886 0926189605; <email>wang.clinic@gmail.com</email></corresp><fn fn-type="equal" id="equal-contrib1"><label>*</label><p>these authors contributed equally</p></fn></author-notes><pub-date pub-type="collection"><year>2026</year></pub-date><pub-date pub-type="epub"><day>2</day><month>7</month><year>2026</year></pub-date><volume>9</volume><elocation-id>e94450</elocation-id><history><date date-type="received"><day>01</day><month>03</month><year>2026</year></date><date date-type="rev-recd"><day>06</day><month>04</month><year>2026</year></date><date date-type="accepted"><day>05</day><month>05</month><year>2026</year></date></history><copyright-statement>&#x00A9; Ben-Chang Shia, Szu-Ming Peng, Qui-Yang Zhang, Chiung-Yun Lo, Sheng-Ru Wang. Originally published in JMIR Nursing (<ext-link ext-link-type="uri" xlink:href="https://nursing.jmir.org">https://nursing.jmir.org</ext-link>), 2.7.2026. </copyright-statement><copyright-year>2026</copyright-year><license license-type="open-access" xlink:href="https://creativecommons.org/licenses/by/4.0/"><p>This is an open-access article distributed under the terms of the Creative Commons Attribution License (<ext-link ext-link-type="uri" xlink:href="https://creativecommons.org/licenses/by/4.0/">https://creativecommons.org/licenses/by/4.0/</ext-link>), which permits unrestricted use, distribution, and reproduction in any medium, provided the original work, first published in JMIR Nursing, is properly cited. 
The complete bibliographic information, a link to the original publication on <ext-link ext-link-type="uri" xlink:href="https://nursing.jmir.org/">https://nursing.jmir.org/</ext-link>, as well as this copyright and license information must be included.</p></license><self-uri xlink:type="simple" xlink:href="https://nursing.jmir.org/2026/1/e94450"/><abstract><sec><title>Background</title><p>Inequitable and time-consuming shift scheduling contributes to nurse burnout, dissatisfaction, and turnover. In Taiwan, annual nurse turnover reaches 11.6%, with rigid 3-shift systems and unfair workload distribution frequently cited as key drivers. Although artificial intelligence (AI) scheduling tools exist, most lack transparency and do not formally address algorithmic bias, limiting clinical adoption.</p></sec><sec><title>Objective</title><p>This study aimed to design, deploy, and evaluate a transparent, fairness-audited, explainable AI&#x2013;enabled nurse scheduling decision support system (XAI-NSDSS) to reduce administrative burden, eliminate experience-based algorithmic bias, and enhance staff acceptance in a real-world hospital setting.</p></sec><sec sec-type="methods"><title>Methods</title><p>A pragmatic before-after implementation study was conducted at a 671-bed teaching hospital in Taiwan (January-December 2023), involving 8 departments and 156 nurses (42 novice, 78 midlevel, and 36 experienced). A 6-month manual scheduling baseline (January-June 2023) was compared with a 6-month AI-assisted period (July-December 2023). The XAI-NSDSS integrates a random forest workload prediction model (<italic>R</italic>&#x00B2;=0.887), Shapley Additive Explanations&#x2013;based explainability, a hybrid integer programming and binary differential evolution (IP+ BDE) optimizer, and a multidimensional fairness monitoring dashboard. 
A formal weight sensitivity analysis (WSA) was conducted across 7 prespecified weight configurations using full-factorial repeated-measures ANOVA to assess outcome robustness. Primary outcomes were scheduling time, error rate, and user satisfaction. Statistical analyses used linear mixed effects models (LMMs) and generalized estimating equations (GEE) with department as a random effect.</p></sec><sec sec-type="results"><title>Results</title><p>Monthly scheduling time decreased by 81.2% (from mean 32.0, SD 8.0 hours to mean 6.0, SD 2.0 hours; <italic>P</italic>&#x003C;.001; Cohen <italic>d</italic>=4.33) and error rate decreased by 73.8% (from mean 18.3%, SD 4.3% to mean 4.8%, SD 1.2%; <italic>P</italic>&#x003C;.001; Cohen <italic>d</italic>=4.12). Nurse satisfaction improved from a mean of 3.2 (SD 0.8) to a mean of 4.4 (SD 0.6; <italic>P</italic>&#x003C;.001), with 148 out of 156 nurses (94.9%) adopting the system by Month 3. Preexisting experience-based bias was fully eliminated: workload coefficient of variation (CV) decreased 50% (from 0.18 to 0.09; <italic>P</italic>&#x003C;.001), disparate impact ratios normalized from 1.35&#x2010;1.56 to 1.01&#x2010;1.04, and preference satisfaction equity was achieved across experience tiers (ANOVA <italic>P</italic>=.38). Among 156 nurses, 82 (52.6%) regularly engaged with Shapley Additive Explanations; this engagement was positively associated with satisfaction (Pearson <italic>r</italic>=0.456; <italic>P</italic>&#x003C;.001). 
The WSA across 7 configurations confirmed that the consensus-derived default weights achieved the highest composite quality score (mean 82.1, SD 3.2) and that disparate impact ratios remained within the 0.80&#x2010;1.25 fairness threshold across all configurations (<italic>P</italic>=.12), demonstrating structural robustness of the fairness-auditing module.</p></sec><sec sec-type="conclusions"><title>Conclusions</title><p>This study presents the first longitudinally validated explainable AI implementation framework for nurse scheduling with formal algorithmic fairness auditing and WSA. The XAI-NSDSS framework is replicable, scalable, and provides a practical blueprint for responsible AI adoption in health care workforce governance, with fairness guarantees that are robust to institutional customization of optimization priorities.</p></sec></abstract><kwd-group><kwd>nurse scheduling</kwd><kwd>workload equity</kwd><kwd>explainable artificial intelligence</kwd><kwd>algorithmic fairness</kwd><kwd>implementation science</kwd><kwd>decision support systems</kwd><kwd>workforce management</kwd></kwd-group></article-meta></front><body><sec id="s1" sec-type="intro"><title>Introduction</title><sec id="s1-1"><title>Background and Rationale</title><p>The global nursing workforce crisis is one of the most pressing challenges in modern health care. The World Health Organization (WHO) projects a shortage of 5.9 million nurses by 2030, with high-income countries experiencing turnover exceeding 15% annually [<xref ref-type="bibr" rid="ref1">1</xref>]. In Taiwan, the annual nursing turnover rate reached a 10-year high of 11.6%, with scheduling-related dissatisfaction identified as a leading contributor to burnout and early career exit [<xref ref-type="bibr" rid="ref2">2</xref>,<xref ref-type="bibr" rid="ref3">3</xref>]. 
Inefficient scheduling creates a vicious cycle; unfair shift distribution increases fatigue, which accelerates attrition, which further strains remaining staff.</p><p>Nurse scheduling is a complex combinatorial optimization problem requiring simultaneous consideration of regulatory constraints (labor laws and union agreements), operational requirements (shift coverage and skill mix), and individual staff preferences (time-off requests and work-life balance) [<xref ref-type="bibr" rid="ref4">4</xref>]. Traditional manual scheduling is time-intensive, error-prone, and chronically fails to achieve fair workload distribution, particularly disadvantaging novice nurses who lack institutional leverage to negotiate favorable assignments [<xref ref-type="bibr" rid="ref5">5</xref>].</p></sec><sec id="s1-2"><title>Gaps in Existing AI Scheduling Systems</title><p>Artificial intelligence (AI) and operations research approaches have shown promise in nurse scheduling. Recent implementations include mixed integer programming heuristics [<xref ref-type="bibr" rid="ref6">6</xref>], genetic algorithms [<xref ref-type="bibr" rid="ref7">7</xref>], and machine learning&#x2013;based prediction models [<xref ref-type="bibr" rid="ref8">8</xref>]. 
However, a systematic review of the literature reveals four persistent, unresolved gaps:</p><list list-type="order"><list-item><p>Opacity and lack of explainability: most systems operate as &#x201C;black boxes,&#x201D; generating schedules without interpretable rationale, a critical barrier to trust in high-accountability health care environments [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>].</p></list-item><list-item><p>Absence of formal fairness auditing: while scheduling optimization papers frequently mention equity as an objective, formal auditing of algorithmic bias using established fairness metrics (eg, disparate impact ratios) remains virtually absent from the literature [<xref ref-type="bibr" rid="ref11">11</xref>].</p></list-item><list-item><p>Insufficient real-world longitudinal validation: the majority of published systems are evaluated on simulated or retrospective datasets. Prospective, hospital-based evaluations are rare, limiting evidence for practical adoption [<xref ref-type="bibr" rid="ref12">12</xref>,<xref ref-type="bibr" rid="ref13">13</xref>].</p></list-item><list-item><p>Neglect of user trust mechanisms: system design rarely accounts for how transparency features influence actual adoption behavior, creating a gap between algorithmic performance and clinical uptake [<xref ref-type="bibr" rid="ref14">14</xref>,<xref ref-type="bibr" rid="ref15">15</xref>].</p></list-item></list></sec><sec id="s1-3"><title>Study Objectives and Contributions</title><p>This study directly addresses all 4 gaps through the design, deployment, and 12-month evaluation (6-mo pre- and 6-mo postimplementation) of the explainable AI&#x2013;enabled nurse scheduling decision support system (XAI-NSDSS) at a 671-bed tertiary referral hospital in Taiwan. 
The aim of this study was to demonstrate that a single integrated framework can simultaneously achieve operational efficiency, provable algorithmic equity, and clinician trust through explainability. Specific contributions are as follows:</p><list list-type="order"><list-item><p>Framework contribution: among the first end-to-end explainable artificial intelligence (XAI) implementation frameworks for nurse scheduling integrating Shapley Additive Explanations (SHAP)&#x2013;based explainability, formal optimization, and a multidimensional algorithmic fairness monitoring system.</p></list-item><list-item><p>Empirical contribution: prospective real-world evidence from 156 nurses across 8 departments over 12 months, among the largest single-site longitudinal evaluations of an XAI nurse scheduling system reported to date.</p></list-item><list-item><p>Fairness contribution: formal documentation and complete elimination of preexisting experience-based algorithmic bias using disparate impact ratios, Gini coefficients, and ANOVA-based equity testing.</p></list-item><list-item><p>Trust mechanism contribution: empirical evidence that SHAP engagement (82/156 nurses, 52.6%) is positively associated with satisfaction (<italic>r</italic>=0.456; <italic>P</italic>&#x003C;.001), positioning explainability as a functional organizational intervention.</p></list-item><list-item><p>Implementation science contribution: actionable guidelines for change management, governance, and phased rollout based on observed adoption patterns, learning curves, and organizational barriers.</p></list-item></list></sec></sec><sec id="s2" sec-type="methods"><title>Methods</title><sec id="s2-1"><title>Study Setting and Design</title><p>This pragmatic before-after implementation study was conducted at Fu Jen Catholic University Hospital, a 671-bed tertiary referral hospital in New Taipei City, Taiwan, from January to December 2023. 
The XAI-NSDSS was deployed across 8 nursing departments&#x2014;medical, surgical, intensive care, emergency, pediatrics, obstetrics, oncology, and geriatrics&#x2014;serving 156 nurses (42 novice [&#x003C;3 y experience], 78 midlevel [3&#x2010;10 y], and 36 experienced [&#x003E;10 y]).</p><p>We used a mixed methods evaluation design with a 6-month preimplementation baseline (manual scheduling; January-June 2023) compared to a 6-month postimplementation period (AI-assisted scheduling; July-December 2023). Randomization was not feasible due to the hospital-wide nature of the intervention and risk of cross-contamination; the large effect sizes observed (Cohen <italic>d</italic>&#x003E;4) and consistency across all 8 departments strengthen confidence in attribution. This study is reported in accordance with the Standards for Quality Improvement Reporting Excellence (SQUIRE 2.0) guidelines.</p></sec><sec id="s2-2"><title>Participants and Eligibility</title><p>All registered nurses employed in the participating departments during the study period were eligible for inclusion. Exclusion criteria included (1) nurses on extended leave (&#x003E;4 consecutive weeks), (2) temporary or agency staff without permanent employment contracts, and (3) nurses in administrative roles without direct patient care responsibilities. Of 162 eligible nurses, 156 (96.3%) participated in the full 12-month study period. 
Six nurses were excluded due to maternity leave (n=3), resignation (n=2), or transfer to nonparticipating departments (n=1).</p></sec><sec id="s2-3"><title>System Architecture and Decision Pipeline</title><p>The XAI-NSDSS uses a modular 5-layer architecture (<xref ref-type="fig" rid="figure1">Figure 1</xref>; detailed in Section S2.1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>): (1) user interface layer&#x2014;mobile-responsive dashboards (React.js 18.2.0; Meta Platforms, Inc); (2) AI engine layer&#x2014;random forest regressors (scikit-learn 1.3.0; scikit-learn developers) for workload capacity prediction; (3) explainability module&#x2014;SHAP TreeExplainer (shap v0.42.1; Scott Lundberg); (4) optimization layer&#x2014;hybrid integer programming (IP; Gurobi 10.0.3; Gurobi Optimization, LLC)+binary differential evolution (BDE); and (5) data layer&#x2014;PostgreSQL (15.3; PostgreSQL Global Development Group) with TimescaleDB (Tiger Data) and storage encrypted using the Advanced Encryption Standard with a 256-bit key.</p><fig position="float" id="figure1"><label>Figure 1.</label><caption><p>System architecture diagram. AI: artificial intelligence; SHAP: Shapley Additive Explanations.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="nursing_v9i1e94450_fig01.png"/></fig></sec><sec id="s2-4"><title>XAI Components</title><sec id="s2-4-1"><title>SHAP-Enhanced Workload Prediction</title><p>Random forest regressors (200 trees, max_depth=15, min_samples_split=10, max_features=&#x201C;sqrt&#x201D;) predicted nurse workload capacity scores based on 18 input features spanning demographic characteristics, workload indicators, fatigue metrics, and preference alignment (Table S1 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). All continuous features were standardized using min-max normalization prior to model training. Models were trained on 1872 nurse-quarter observations (2021&#x2010;2023) with 70/15/15 train/validation/test splits. 
Test-set performance was <italic>R</italic>&#x00B2;=0.887, mean absolute error (MAE)=5.1, and root-mean-square error (RMSE)=7.4. SHAP TreeExplainer values provided both global feature importance rankings and local, assignment-level explanations displayed to each nurse [<xref ref-type="bibr" rid="ref16">16</xref>].</p></sec><sec id="s2-4-2"><title>2D Assignment Logic</title><p>A 2D assignment framework balances professionalism scores (weighted composite of performance evaluations, certifications, and experience; S2.2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>) with fatigue indicators (consecutive shifts, overtime hours, night shift frequency, and recovery time). Exponential penalty functions capture the nonlinear clinical risk of accumulated fatigue. The key terms are defined as:</p><p>Professionalism score = 0.35 &#x00D7; Performance_Evaluation + 0.25 &#x00D7; Experience_Normalized + 0.20 &#x00D7; Certifications + 0.15 &#x00D7; Patient_Satisfaction + 0.05 &#x00D7; Peer_Collaboration</p><p>Fatigue score = 0.30 &#x00D7; Consecutive_Shifts_Penalty + 0.25 &#x00D7; Overtime_Penalty + 0.20 &#x00D7; Night_Shift_Penalty + 0.15 &#x00D7; Recovery_Deficit + 0.10 &#x00D7; Weekend_Penalty</p><p>where penalty functions follow exponential forms (eg, Consecutive_Shifts_Penalty = min[100, 10 &#x00D7; e^(0.3 &#x00D7; consecutive_shifts)]) to reflect the nonlinear accumulation of clinical risk.</p></sec></sec><sec id="s2-5"><title>Optimization Methodology</title><sec id="s2-5-1"><title>Hybrid IP+BDE Approach</title><p>Let x_ijs &#x2208; {0,1} denote whether nurse i (i &#x2208; N, |N|=156) is assigned to shift s (s &#x2208; S={day, evening, night, off}) on day j (j &#x2208; D={1,...,30}). 
The IP model enforces the following hard constraints, which carry zero tolerance for violation:</p><list list-type="bullet"><list-item><p>Coverage: &#x03A3;&#x1D62; x_ijs &#x2265; R_js for all j &#x2208; D, s &#x2208; S (minimum staffing requirements per shift)</p></list-item><list-item><p>One shift per day: &#x03A3;<sub>s</sub> x_ijs &#x2264; 1 for all i &#x2208; N, j &#x2208; D</p></list-item><list-item><p>Maximum consecutive shifts: &#x03A3;_{k=j}^{j+5} &#x03A3;_{s&#x2260;off} x_iks &#x2264; 5 for all i &#x2208; N, j &#x2208; D</p></list-item><list-item><p>Minimum rest: x_{i,j,night} + x_{i,j+1,day} &#x2264; 1 for all i, j (ensuring &#x2265;11 h intershift rest)</p></list-item><list-item><p>Skill mix: &#x03A3;&#x1D62; (q_ik &#x00D7; x_ijs) &#x2265; Q_jsk for all j, s, k (minimum qualified staff per specialty)</p></list-item></list><p>These constraints are implemented as strict mathematical constraints within the IP model (Gurobi 10.0.3), guaranteeing 100% compliance in all generated schedules. The BDE component then minimizes the following multiobjective penalty-based fitness function after IP feasibility repair:</p><disp-formula id="equWL1"><mml:math id="eqn1"><mml:mstyle displaystyle="true" scriptlevel="0"><mml:mrow><mml:msub><mml:mi mathvariant="normal">F</mml:mi><mml:mtext>schedule</mml:mtext></mml:msub><mml:mo>=</mml:mo><mml:msub><mml:mi>&#x03BB;</mml:mi><mml:mn>1</mml:mn></mml:msub><mml:mo>&#x22C5;</mml:mo><mml:msub><mml:mi mathvariant="normal">C</mml:mi><mml:mtext>hard</mml:mtext></mml:msub><mml:mo>+</mml:mo><mml:msub><mml:mi>&#x03BB;</mml:mi><mml:mn>2</mml:mn></mml:msub><mml:mo>&#x22C5;</mml:mo><mml:msub><mml:mi mathvariant="normal">C</mml:mi><mml:mtext>soft</mml:mtext></mml:msub><mml:mo>+</mml:mo><mml:msub><mml:mi>&#x03BB;</mml:mi><mml:mn>3</mml:mn></mml:msub><mml:mo>&#x22C5;</mml:mo><mml:msub><mml:mi mathvariant="normal">P</mml:mi><mml:mtext>unmet</mml:mtext></mml:msub><mml:mo>+</mml:mo><mml:msub><mml:mi>&#x03BB;</mml:mi><mml:mn>4</mml:mn></mml:msub><mml:mo>&#x22C5;</mml:mo><mml:msub><mml:mi mathvariant="normal">W</mml:mi><mml:mtext>imbalance</mml:mtext></mml:msub><mml:mo>+</mml:mo><mml:msub><mml:mi>&#x03BB;</mml:mi><mml:mn>5</mml:mn></mml:msub><mml:mo>&#x22C5;</mml:mo><mml:msub><mml:mi mathvariant="normal">F</mml:mi><mml:mtext>total</mml:mtext></mml:msub></mml:mrow></mml:mstyle></mml:math></disp-formula><p>where C_hard is the count of IP hard-constraint violations in the BDE trial vector, used only as a barrier function; C_soft is the sum of weekend and night-shift fairness violations across all nurse pairs; P_unmet = &#x03A3;&#x1D62; &#x03A3;<sub>j</sub> &#x03A3;<sub>s</sub>(1 &#x2212; match_ijs) &#x00D7; preference_strength_ijs; W_imbalance = Var(monthly_hours) + Var(weekend_shifts) + Var(night_shifts) across all nurses; and F_total = &#x03A3;&#x1D62; &#x03A3;<sub>j</sub> &#x03A3;<sub>s</sub> fatigue_score(i,j) &#x00D7; x_ijs.</p><p>The penalty-scale coefficients were set as &#x03BB;&#x2081;=1000, &#x03BB;&#x2082;=100, &#x03BB;&#x2083;=50, &#x03BB;&#x2084;=30, &#x03BB;&#x2085;=20, calibrated through stakeholder consultation and validated via Pareto frontier analysis.</p><p>Importantly, the &#x03BB;&#x2081;=1000 
penalty in the BDE fitness function serves exclusively as a barrier function to prevent BDE from exploring infeasible regions, not as a relaxation of hard constraints. All BDE trial solutions with C_hard&#x003E;0 are repaired to feasibility by the IP solver prior to fitness evaluation, ensuring hard constraints remain inviolable. The W_imbalance term acts as a proxy for demographic equity by minimizing variance in shift allocation across all nurses; post hoc disparate impact ratio analysis confirmed that this proxy effectively eliminated experience-based disparities (see the Fairness and Equity Analysis section and <xref ref-type="table" rid="table1">Table 1</xref>).</p><table-wrap id="t1" position="float"><label>Table 1.</label><caption><p>Undesirable shift distribution by experience level. Expected proportion of novice nurses: 26.9% (42/156 nurses). Acceptable disparate impact range: 0.80&#x2010;1.20 [<xref ref-type="bibr" rid="ref11">11</xref>].</p></caption><table id="table1" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Shift type</td><td align="left" valign="bottom">Preimplementation: novice actual, % (n/N)<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup></td><td align="left" valign="bottom">Preimplementation: DIR<sup><xref ref-type="table-fn" rid="table1fn2">b</xref></sup></td><td align="left" valign="bottom">Postimplementation: novice actual, % (n/N)<sup><xref ref-type="table-fn" rid="table1fn1">a</xref></sup></td><td align="left" valign="bottom">Postimplementation: DIR</td></tr></thead><tbody><tr><td align="left" valign="top">Night shifts</td><td align="char" char="." valign="top">42.1 (69/164)</td><td align="char" char="." valign="top">1.56<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup></td><td align="char" char="." valign="top">27.4 (49/179)</td><td align="char" char="." valign="top">1.02</td></tr><tr><td align="left" valign="top">Weekend shifts</td><td align="char" char="." 
valign="top">38.5 (69/179)</td><td align="char" char="." valign="top">1.43<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup></td><td align="char" char="." valign="top">28.0 (49/175)</td><td align="char" char="." valign="top">1.04</td></tr><tr><td align="left" valign="top">Overtime shifts</td><td align="char" char="." valign="top">37.1 (69/186)</td><td align="char" char="." valign="top">1.38<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup></td><td align="char" char="." valign="top">27.4 (49/179)</td><td align="char" char="." valign="top">1.02</td></tr><tr><td align="left" valign="top">Consecutive night shifts</td><td align="char" char="." valign="top">36.3 (69/190)</td><td align="char" char="." valign="top">1.35<sup><xref ref-type="table-fn" rid="table1fn3">c</xref></sup></td><td align="char" char="." valign="top">27.2 (49/180)</td><td align="char" char="." valign="top">1.01</td></tr></tbody></table><table-wrap-foot><fn id="table1fn1"><p><sup>a</sup>n/N denotes novice-assigned undesirable shift events divided by total events in each category; denominators therefore vary across categories.</p></fn><fn id="table1fn2"><p><sup>b</sup>DIR: disparate impact ratio.</p></fn><fn id="table1fn3"><p><sup>c</sup>Preimplementation violation of four-fifths fairness threshold (<italic>P</italic>&#x003C;.05 for all 4 categories).</p></fn></table-wrap-foot></table-wrap><p>The hybrid strategy exploits complementary strengths; IP guarantees hard constraint satisfaction (coverage, rest periods, consecutive shift limits, and skill mix), while BDE explores the feasible solution space to maximize preference satisfaction and workload equity. Computation averaged 12.7 minutes per monthly schedule. 
Full pseudocode is provided in S2.3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p></sec><sec id="s2-5-2"><title>Multiobjective Optimization Module</title><p>The scheduling optimizer balances five competing objectives: (1) workload equity (minimizing coefficient of variation [CV] in shift assignments), (2) preference satisfaction (maximizing alignment with stated shift preferences), (3) skill-mix adequacy (ensuring appropriate distribution of experience levels across shifts), (4) regulatory compliance (satisfying labor law constraints on consecutive shifts and rest periods), and (5) operational efficiency (minimizing understaffing and overstaffing events).</p><p>The composite objective function is formulated as a weighted linear scalarization:</p><p><inline-formula><mml:math id="ieqn1"><mml:mstyle><mml:mrow><mml:mstyle displaystyle="false"><mml:mrow><mml:mi mathvariant="normal">F</mml:mi></mml:mrow><mml:mo>=</mml:mo><mml:msub><mml:mrow><mml:mi mathvariant="normal">W</mml:mi></mml:mrow><mml:mn>1</mml:mn></mml:msub><mml:mo>&#x22C5;</mml:mo><mml:msub><mml:mrow><mml:mi mathvariant="normal">f</mml:mi></mml:mrow><mml:mn>1</mml:mn></mml:msub><mml:mo>+</mml:mo><mml:msub><mml:mrow><mml:mi mathvariant="normal">W</mml:mi></mml:mrow><mml:mn>2</mml:mn></mml:msub><mml:mo>&#x22C5;</mml:mo><mml:msub><mml:mrow><mml:mi mathvariant="normal">f</mml:mi></mml:mrow><mml:mn>2</mml:mn></mml:msub><mml:mo>+</mml:mo><mml:msub><mml:mrow><mml:mi mathvariant="normal">W</mml:mi></mml:mrow><mml:mn>3</mml:mn></mml:msub><mml:mo>&#x22C5;</mml:mo><mml:msub><mml:mrow><mml:mi mathvariant="normal">f</mml:mi></mml:mrow><mml:mn>3</mml:mn></mml:msub><mml:mo>+</mml:mo><mml:msub><mml:mrow><mml:mi mathvariant="normal">W</mml:mi></mml:mrow><mml:mn>4</mml:mn></mml:msub><mml:mo>&#x22C5;</mml:mo><mml:msub><mml:mrow><mml:mi mathvariant="normal">f</mml:mi></mml:mrow><mml:mn>4</mml:mn></mml:msub><mml:mo>+</mml:mo><mml:msub><mml:mrow><mml:mi 
mathvariant="normal">W</mml:mi></mml:mrow><mml:mn>5</mml:mn></mml:msub><mml:mo>&#x22C5;</mml:mo><mml:msub><mml:mrow><mml:mi mathvariant="normal">f</mml:mi></mml:mrow><mml:mn>5</mml:mn></mml:msub></mml:mstyle></mml:mrow></mml:mstyle></mml:math></inline-formula></p><p>where each subobjective is defined as follows:</p><list list-type="order"><list-item><p>f&#x2081; (Workload equity): CV of monthly shift assignments across all nurses; minimized to promote equitable workload distribution.</p></list-item><list-item><p>f&#x2082; (Preference satisfaction): proportion of fulfilled shift-preference requests; maximized (entered as 1 &#x2212; fulfillment rate to convert to a minimization problem).</p></list-item><list-item><p>f&#x2083; (Skill-mix adequacy): deviation from target experience-level ratios per shift slot; minimized to ensure appropriate distribution of junior and senior nurses.</p></list-item><list-item><p>f&#x2084; (Regulatory compliance): count of constraint violations (consecutive-shift limits, mandatory rest periods, overtime caps); minimized to zero as a hard constraint.</p></list-item><list-item><p>f&#x2085; (Operational efficiency): sum of absolute understaffing and overstaffing events across all shifts in a scheduling cycle; minimized to maintain safe staffing levels.</p></list-item></list><p>All subobjectives are normalized to the [0, 1] range using min-max scaling derived from the historical baseline period (months 1&#x2010;6) prior to optimization. 
The default weight configuration deployed in clinical practice was established through a structured consensus process involving 4 nurse managers and 2 clinical informaticists, yielding w&#x2081;=0.30, w&#x2082;=0.25, w&#x2083;=0.20, w&#x2084;=0.15, and w&#x2085;=0.10, reflecting the institutional priority of fairness and preference satisfaction over strict operational efficiency (weight sensitivity analysis [WSA] systematically varies the normalized weights w&#x2081;-w&#x2085; &#x2208; [0,1] that govern the multiobjective trade-off, which are distinct from the penalty-scale barrier weights &#x03BB;&#x2081;=1000, &#x03BB;&#x2082;=100 etc used in the BDE fitness function). The complete formulation is available in S2.8 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p></sec><sec id="s2-5-3"><title>WSA Design</title><p>To formally assess the robustness of scheduling outcomes to variations in objective weights&#x2014;and to address the inherent subjectivity of the consensus-derived default configuration&#x2014;a prespecified WSA was conducted using a full-factorial grid design. Seven configurations were evaluated, spanning 3 clinically meaningful priority scenarios.</p><list list-type="bullet"><list-item><p>Fairness-priority (FP) configurations (FP-Low, FP-Default, FP-High) systematically vary w&#x2081; (workload equity) from 0.20 to 0.40 while proportionally redistributing the remaining weight budget across w&#x2082;-w&#x2085;, holding their relative ratios constant. This isolates the marginal impact of fairness emphasis on all outcome domains.</p></list-item><list-item><p>Preference-priority (PP) configurations (PP-Low and PP-High) vary w&#x2082; (preference satisfaction) from 0.15 to 0.35, redistributing the residual weight proportionally across w&#x2081;, w&#x2083;-w&#x2085;. 
This tests whether increasing preference responsiveness compromises workload equity.</p></list-item><list-item><p>Efficiency-priority (EP) configuration sets w&#x2085;=0.30 as the dominant weight, reducing w&#x2081; and w&#x2082; to 0.20 each, to simulate a cost-minimization context where operational staffing coverage is paramount. An Equal-Weight (EW) configuration (all weights=0.20) serves as an unweighted baseline. For each configuration, the IP+BDE optimizer was rerun on the same 6-month intervention-period scheduling instances (n=48 monthly department schedules), and results were compared by one-way repeated-measures ANOVA with Bonferroni correction; the FP-Default configuration served as the reference group for all pairwise comparisons.</p></list-item></list></sec></sec><sec id="s2-6"><title>Data Collection and Outcome Measures</title><sec id="s2-6-1"><title>Outcome Measures</title><p>Primary outcomes included scheduling time (hours/schedule), error rate (%), and user satisfaction (5-point Likert scale, validated 8-item instrument; S2.4 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Secondary outcomes included workload CV, Gini coefficient, disparate impact ratios by experience tier, preference satisfaction equity, and SHAP engagement rate (proportion of nurses viewing SHAP explanations at least once per scheduling cycle).</p></sec><sec id="s2-6-2"><title>Statistical Analysis</title><p>Continuous outcomes were analyzed using linear mixed effects models (LMMs) with time (pre/post) and month as fixed effects, and department as a random intercept, to account for clustering of nurses within departments. Count outcomes (error counts and constraint violations) were analyzed using generalized estimating equations (GEE; Poisson family with exchangeable correlation structure). 
Effect sizes were estimated using Cohen <italic>d</italic> for continuous outcomes and incidence rate ratios (IRRs) for count outcomes, with 95% CIs reported in Table S2 in S1.2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>. Three prespecified sensitivity analyses were conducted: (1) Hawthorne effect assessment comparing Months 1&#x2010;3 versus 4&#x2010;6, (2) monthly learning curve analysis, and (3) seasonal adjustment for Taiwan&#x2019;s major holiday periods. Statistical significance was set at &#x03B1;=.05 (2-tailed). All analyses were performed in R (version 4.3.0; R Core Team); full code is provided in S2.5 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p><p>For the WSA, one-way repeated-measures ANOVA was used to compare outcome metrics across the 7 weight configurations, with the FP-Default configuration as the reference. Pairwise post hoc comparisons were adjusted using the Bonferroni correction. Effect sizes were reported as partial &#x03B7;&#x00B2;. A configuration was deemed clinically noninferior to FP-Default if the 95% CI for the difference in workload equity CV was within &#x00B1;0.02 and the preference fulfillment rate differed by less than 5 percentage points.</p></sec><sec id="s2-6-3"><title>Qualitative Assessment</title><p>Semistructured interviews were conducted with a purposive sample of 24 nurses and 8 nurse managers, selected to ensure maximum variation across experience tiers (novice, midlevel, and experienced), departments (all 8 represented), and SHAP engagement levels (active users vs nonusers). Thematic saturation was achieved at interview 26, defined as no new codes emerging across 3 consecutive interviews. Interview guides addressed four domains: (1) perceived usability and system trust; (2) experience with SHAP explanations; (3) perceived fairness; and (4) barriers and facilitators to adoption. 
All 32 interviews were conducted in Mandarin Chinese, audio-recorded with written consent, and professionally transcribed verbatim (mean duration 38 min, range 28&#x2010;52 min). Thematic analysis followed the 6-phase framework of Braun and Clarke [<xref ref-type="bibr" rid="ref17">17</xref>]. Two authors (QYZ and CYL) independently coded all transcripts using NVivo 14. Interrater reliability was assessed on a randomly selected 20% subsample (&#x03BA;=0.81, indicating strong agreement). Disagreements were resolved by consensus, with a third author (SRW) serving as arbitrator. Member checking was performed with 5 participants; negative cases were actively sought to challenge emerging themes. Participant characteristics are reported in Table S3 in S1.2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p></sec></sec><sec id="s2-7"><title>Fairness Monitoring Framework</title><p>Algorithmic fairness was audited quarterly across 3 dimensions: (1) demographic parity, proportional undesirable shift distribution across experience tiers; (2) equal opportunity, preference satisfaction equity (one-way ANOVA); and (3) disparate impact, selection rate ratios against the 0.80&#x2010;1.25 threshold (&#x201C;four-fifths rule&#x201D;) [<xref ref-type="bibr" rid="ref11">11</xref>]. Gini coefficients provided complementary inequality measurement. 
Automated alerts upon threshold violations were reviewed monthly by the AI Scheduling Oversight Committee (ASOC), a multidisciplinary body comprising 8 nursing managers, 2 information technology staff, 1 clinical ethicist, 1 legal advisor, and 1 elected nurse representative (S2.6 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref> and dashboard: Figure S2 in S1.2 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>).</p></sec><sec id="s2-8"><title>Governance and Data Privacy</title><p>System integrity was maintained through weekly automated model drift detection and quarterly retraining (threshold: <italic>R</italic>&#x00B2; drop &#x003E;0.03 from baseline). SHAP explanations were scoped to individual nurse data only, preventing disclosure of colleagues&#x2019; performance metrics. All 156 nurses completed a 1-hour domain-specific training session covering system usage and SHAP interpretation prior to deployment. All data were stored in databases encrypted using the advanced encryption standard with a 256-bit key and protected by role-based access controls, in compliance with the Taiwan Personal Data Protection Act.</p></sec><sec id="s2-9"><title>Ethical Considerations</title><p>The study was approved under an exemption waiver by the Institutional Review Board of Fu Jen Catholic University Hospital (IRB reference: FJUH-IRB-114&#x2010;459). All participating nurses and managers provided written informed consent prior to enrollment. Participation was voluntary, and participants were informed that they could withdraw from the study at any time without penalty or any effect on their employment status, work assignments, or institutional evaluation. All data were deidentified before analysis and reported only in aggregate form. 
Individual-level scheduling records, interview transcripts, SHAP engagement data, and satisfaction responses were stored in encrypted, access-controlled databases, and no personally identifiable information is disclosed in the manuscript or supplementary materials. No images or other materials containing identifiable participant information are included. No financial compensation or other incentives were provided to participants.</p></sec></sec><sec id="s3" sec-type="results"><title>Results</title><sec id="s3-1"><title>Operational Performance Improvements</title><p><xref ref-type="table" rid="table2">Table 2</xref> summarizes key operational metrics. The XAI-NSDSS reduced monthly scheduling time by 81.2% (from mean 32.0, SD 8.0 to mean 6.0, SD 2.0 h; <italic>P</italic>&#x003C;.001; Cohen <italic>d</italic>=4.33; 95% CI for difference &#x2212;29.1 to &#x2212;22.9 h), compressing a 3&#x2010;5 workday administrative burden to under 1 day. At the Emergency Department, reduction was most pronounced (45 &#x2192; 8 h; 82.2%). 
Schedule error rates decreased by 73.8% (from mean 18.3%, SD 4.3% to mean 4.8%, SD 1.2%; <italic>P</italic>&#x003C;.001; <italic>d</italic>=4.12), with reductions in rest period violations (91.7% reduction, from 8.4 to 0.7 violations per schedule), hard constraint violations (86.9%), and skill mismatches (78.4%).</p><table-wrap id="t2" position="float"><label>Table 2.</label><caption><p>Operational performance metrics: pre- versus postimplementation (n=156 nurses; 8 departments).</p></caption><table id="table2" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Metric</td><td align="left" valign="bottom">Preimplementation, mean (SD)</td><td align="left" valign="bottom">Postimplementation, mean (SD)</td><td align="left" valign="bottom">Change (%)</td><td align="left" valign="bottom">Cohen <italic>d</italic></td><td align="left" valign="bottom"><italic>P</italic> value</td></tr></thead><tbody><tr><td align="left" valign="top">Scheduling time (hours/month)</td><td align="left" valign="top">32.0 (8.0)</td><td align="left" valign="top">6.0 (2.0)</td><td align="left" valign="top">&#x2013;81.2</td><td align="left" valign="top">4.33</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Error rate (%)</td><td align="left" valign="top">18.3 (4.3)</td><td align="left" valign="top">4.8 (1.2)</td><td align="left" valign="top">&#x2013;73.8</td><td align="left" valign="top">4.12</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Constraint violations (per schedule)</td><td align="left" valign="top">12.7 (2.8)</td><td align="left" valign="top">1.3 (0.6)</td><td align="left" valign="top">&#x2013;89.8</td><td align="left" valign="top">5.42</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Preference satisfaction (%)</td><td align="left" valign="top">72.4 (5.1)</td><td align="left" valign="top">88.1 (2.8)</td><td align="left" valign="top">+21.7</td><td 
align="left" valign="top">3.87</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Workload CV<sup><xref ref-type="table-fn" rid="table2fn1">a</xref></sup></td><td align="left" valign="top">0.18 (0.03)</td><td align="left" valign="top">0.09 (0.02)</td><td align="left" valign="top">&#x2013;50.0</td><td align="left" valign="top">3.74</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Nurse satisfaction (1-5)</td><td align="left" valign="top">3.2 (0.8)</td><td align="left" valign="top">4.4 (0.6)</td><td align="left" valign="top">+37.5</td><td align="left" valign="top">1.71</td><td align="left" valign="top">&#x003C;.001</td></tr><tr><td align="left" valign="top">Manager satisfaction (1-5)</td><td align="left" valign="top">3.5 (0.7)</td><td align="left" valign="top">4.7 (0.4)</td><td align="left" valign="top">+34.3</td><td align="left" valign="top">2.08</td><td align="left" valign="top">&#x003C;.001</td></tr></tbody></table><table-wrap-foot><fn id="table2fn1"><p><sup>a</sup>CV: coefficient of variation.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-2"><title>User Satisfaction and System Adoption</title><p>System adoption reached 148 out of 156 nurses (94.9%) by Month 3, with subsequent stability through Month 6 (<xref ref-type="fig" rid="figure2">Figure 2A-2D</xref>). The largest pre-to-post satisfaction gains were in transparency/explainability (from mean 2.6, SD 1.0 to mean 4.3, SD 0.6; <italic>P</italic>&#x003C;.001; <italic>d</italic>=2.08) and fairness perception (from mean 2.9, SD 1.0 to mean 4.2, SD 0.7; <italic>P</italic>&#x003C;.001; <italic>d</italic>=1.50). Trust in AI recommendations improved from a mean of 2.8 (SD 0.9) to a mean of 4.1 (SD 0.7; <italic>P</italic>&#x003C;.001; <italic>d</italic>=1.62). 
Of 156 nurses, 82 (52.6%) regularly engaged with SHAP explanations, with a significant positive association between engagement frequency and overall satisfaction (Pearson <italic>r</italic>=0.456; <italic>P</italic>&#x003C;.001; Figure S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>). Full satisfaction subscale results are reported in Table S4 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p><fig position="float" id="figure2"><label>Figure 2.</label><caption><p>Monthly trend analysis: postimplementation performance (July-December 2023). (A) Scheduling time showing rapid decline from an initial 8.2 h to a stable 6.0 h, with preimplementation baseline (32.0 h) as dashed reference. (B) Error rate declining from 7.8% (Month 1) to stable 4.8%. (C) Nurse satisfaction improvement with system adoption reaching 94% by Month 3. (D) Workload CV sustained below the 0.12 target throughout, with preimplementation baseline (0.18) as reference.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="nursing_v9i1e94450_fig02.png"/></fig></sec><sec id="s3-3"><title>SHAP Explainability Insights</title><p>Global SHAP analysis identified cumulative fatigue score (mean |SHAP|=0.42), years of experience (0.38), and recent overtime hours (0.35) as the 3 most influential scheduling determinants (<xref ref-type="fig" rid="figure3">Figure 3</xref>). Survey responses confirmed that SHAP explanations helped 122 out of 156 (78.2%) nurses understand shift assignments, increased trust for 111 out of 156 (71.2%) nurses, and identified actionable strategies to improve scheduling priority for 100 out of 156 (64.1%) nurses.</p><fig position="float" id="figure3"><label>Figure 3.</label><caption><p>Global feature importance: mean absolute Shapley Additive Explanations (SHAP) values for the random forest workload capacity model (n=18 features). 
Bars colored by impact magnitude: high (red, |SHAP|&#x003E;0.30), medium (amber, 0.20&#x2010;0.30), lower (blue, &#x003C;0.20). SHAP: Shapley Additive Explanations.</p></caption><graphic alt-version="no" mimetype="image" position="float" xlink:type="simple" xlink:href="nursing_v9i1e94450_fig03.png"/></fig></sec><sec id="s3-4"><title>Algorithm Performance Comparison</title><p>The hybrid IP+BDE approach significantly outperformed either component in isolation (<xref ref-type="table" rid="table3">Table 3</xref>). BDE-only achieved only 95.2% hard constraint compliance versus IP&#x2019;s guaranteed 100%. IP-only achieved only 78.3% preference satisfaction versus the hybrid&#x2019;s 88.1%. Computation time averaged 12.7 minutes per monthly schedule versus 32.0 hours for manual scheduling (99.3% reduction). Emergency rescheduling resolved within 5&#x2010;8 minutes.</p><table-wrap id="t3" position="float"><label>Table 3.</label><caption><p>Algorithm performance comparison. Results are based on a 6-month postimplementation period (n=48 schedules).</p></caption><table id="table3" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Method</td><td align="left" valign="bottom">Hard constraint compliance (%)</td><td align="left" valign="bottom">Preference satisfaction (%)</td><td align="left" valign="bottom">Workload CV<sup><xref ref-type="table-fn" rid="table3fn1">a</xref></sup></td><td align="left" valign="bottom">Computation time</td></tr></thead><tbody><tr><td align="left" valign="top">Manual scheduling (baseline)</td><td align="left" valign="top">81.7</td><td align="left" valign="top">72.4</td><td align="left" valign="top">0.18</td><td align="left" valign="top">32.0 h</td></tr><tr><td align="left" valign="top">&#x2003;IP<sup><xref ref-type="table-fn" rid="table3fn2">b</xref></sup> only</td><td align="left" valign="top">100</td><td align="left" valign="top">78.3</td><td align="left" valign="top">0.14</td><td align="left" valign="top">8.2 
min</td></tr><tr><td align="left" valign="top">&#x2003;BDE<sup><xref ref-type="table-fn" rid="table3fn3">c</xref></sup> only</td><td align="left" valign="top">95.2</td><td align="left" valign="top">85.6</td><td align="left" valign="top">0.11</td><td align="left" valign="top">15.4 min</td></tr><tr><td align="left" valign="top">&#x2003;Hybrid IP+BDE (proposed)</td><td align="left" valign="top">100</td><td align="left" valign="top">88.1</td><td align="left" valign="top">0.09</td><td align="left" valign="top">12.7 min</td></tr></tbody></table><table-wrap-foot><fn id="table3fn1"><p><sup>a</sup>CV: coefficient of variation.</p></fn><fn id="table3fn2"><p><sup>b</sup>IP: integer programming.</p></fn><fn id="table3fn3"><p><sup>c</sup>BDE: binary differential evolution.</p></fn></table-wrap-foot></table-wrap></sec><sec id="s3-5"><title>Fairness and Equity Analysis</title><sec id="s3-5-1"><title>Workload Distribution Equity</title><p>Postimplementation workload equity improved substantially. Hospital-wide CV decreased 50.0% (from mean 0.18, SD 0.03 to mean 0.09, SD 0.02; <italic>P</italic>&#x003C;.001; <italic>d</italic>=3.74; 95% CI for mean difference: &#x2212;0.10 to &#x2212;0.08). The Gini coefficient improved 45.8% (from 0.24 to 0.13), corroborating CV findings. Postimplementation, experience level no longer predicted workload variability (<italic>F</italic><sub>2,153</sub>=1.42; <italic>P</italic>=.24), and improvements were uniform across all 8 departments (<italic>F</italic><sub>7,148</sub>=0.89; <italic>P</italic>=.51). 
Monthly workload CV trend data are shown in <xref ref-type="fig" rid="figure2">Figure 2D</xref>.</p></sec><sec id="s3-5-2"><title>Elimination of Systematic Bias in Undesirable Shift Allocation</title><p>As shown in <xref ref-type="table" rid="table1">Table 1</xref>, novice nurses were overrepresented in all 4 undesirable shift categories before implementation, accounting for 42.1% (69/164) of night shift assignments, 38.5% (69/179) of weekend shift assignments, 37.1% (69/186) of overtime shift assignments, and 36.3% (69/190) of consecutive-night events, despite representing 26.9% (42/156) of the nursing workforce. Postimplementation, these proportions decreased to 27.4% (49/179), 28.0% (49/175), 27.4% (49/179), and 27.2% (49/180), respectively, with disparate impact ratios normalized from 1.35-1.56 to 1.01-1.04. This represents a measurable, auditable transition from an algorithmically biased manual system to a provably equitable AI-assisted system.</p></sec></sec><sec id="s3-6"><title>Preference Satisfaction Equity</title><p>Preimplementation, experienced nurses received significantly higher preference satisfaction than novice nurses (76.2% vs 68.4%; gap=7.8 percentage points; <italic>P</italic>=.009). Postimplementation, this disparity was eliminated (ANOVA <italic>P</italic>=.38; all pairwise comparisons <italic>P</italic>&#x003E;.30), with all 3 experience tiers achieving satisfaction rates &#x2265;87%. 
Equity was achieved through a &#x201C;leveling up&#x201D; strategy&#x2014;absolute gains &#x003E;13 percentage points for all groups (<italic>P</italic>&#x003C;.001)&#x2014;rather than redistributing the burden from experienced to novice nurses.</p></sec><sec id="s3-7"><title>Sensitivity Analyses</title><p>Hawthorne effect analysis (Months 1&#x2010;3 vs 4&#x2010;6) confirmed sustained benefits: scheduling time remained stable (mean 6.2, SD 2.1 vs mean 5.8, SD 1.9 h; <italic>P</italic>=.34); satisfaction continued its upward trend (from mean 4.2, SD 0.7 to mean 4.6, SD 0.5; <italic>P</italic>=.03). Workload CV remained below the preimplementation level across all 6 months (range 0.08&#x2010;0.10), confirming sustained improvement rather than novelty effect. Seasonal adjustment revealed no significant interaction between time and holiday period (<italic>P</italic>=.41). Detailed results are provided in Table S5 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p></sec><sec id="s3-8"><title>WSA</title><p>Beyond the prespecified sensitivity analyses reported above, a formal WSA was conducted to assess whether scheduling outcomes depended on the choice of objective-function weights. WSA was conducted across all 7 prespecified configurations (<xref ref-type="table" rid="table4">Table 4</xref>). One-way repeated-measures ANOVA revealed a significant main effect of weight configuration on workload equity CV (<italic>F</italic><sub>6,282</sub>=18.43; <italic>P</italic>&#x003C;.001; &#x03B7;&#x00B2;=0.28), preference fulfillment rate (<italic>F</italic><sub>6,282</sub>=22.17; <italic>P</italic>&#x003C;.001; &#x03B7;&#x00B2;=0.32), and composite schedule quality score (<italic>F</italic><sub>6,282</sub>=9.84; <italic>P</italic>&#x003C;.001; &#x03B7;&#x00B2;=0.17). 
No significant main effect was observed for the disparate impact ratio range (<italic>F</italic><sub>6,282</sub>=1.72; <italic>P</italic>=.12), indicating that the fairness-auditing module maintained equitable shift distribution regardless of weight settings.</p><table-wrap id="t4" position="float"><label>Table 4.</label><caption><p>Scheduling outcome metrics across weight sensitivity configurations (n=48 schedules per configuration).</p></caption><table id="table4" frame="hsides" rules="groups"><thead><tr><td align="left" valign="bottom">Configuration</td><td align="left" valign="bottom">Workload equity CV<sup><xref ref-type="table-fn" rid="table4fn1">a</xref></sup>, mean (SD)</td><td align="left" valign="bottom">Preference fulfillment (%)</td><td align="left" valign="bottom">Disparate impact ratio range</td><td align="left" valign="bottom">Composite quality score (0&#x2010;100)</td></tr></thead><tbody><tr><td align="left" valign="top">FP-Low<sup><xref ref-type="table-fn" rid="table4fn2">b</xref></sup></td><td align="left" valign="top">0.13 (0.02)</td><td align="left" valign="top">81.4 (4.1)</td><td align="left" valign="top">0.98&#x2010;1.06</td><td align="left" valign="top">74.2 (3.8)</td></tr><tr><td align="left" valign="top">FP-Default (Clinical)</td><td align="left" valign="top">0.09 (0.02)</td><td align="left" valign="top">84.6 (3.7)</td><td align="left" valign="top">1.01&#x2010;1.04</td><td align="left" valign="top">82.1 (3.2)</td></tr><tr><td align="left" valign="top">FP-High</td><td align="left" valign="top">0.07 (0.01)<sup><xref ref-type="table-fn" rid="table4fn3">c</xref></sup></td><td align="left" valign="top">79.3 (4.8)<sup><xref ref-type="table-fn" rid="table4fn3">c</xref></sup></td><td align="left" valign="top">1.00&#x2010;1.03</td><td align="left" valign="top">79.8 (4.1)</td></tr><tr><td align="left" valign="top">PP-Low<sup><xref ref-type="table-fn" rid="table4fn4">d</xref></sup></td><td align="left" valign="top">0.11 
(0.02)<sup><xref ref-type="table-fn" rid="table4fn3">c</xref></sup></td><td align="left" valign="top">76.2 (5.2)<sup><xref ref-type="table-fn" rid="table4fn3">c</xref></sup></td><td align="left" valign="top">1.01&#x2010;1.05</td><td align="left" valign="top">76.4 (4.5)<sup><xref ref-type="table-fn" rid="table4fn3">c</xref></sup></td></tr><tr><td align="left" valign="top">PP-High</td><td align="left" valign="top">0.12 (0.03)<sup><xref ref-type="table-fn" rid="table4fn3">c</xref></sup></td><td align="left" valign="top">89.1 (3.2)<sup><xref ref-type="table-fn" rid="table4fn3">c</xref></sup></td><td align="left" valign="top">1.02&#x2010;1.07</td><td align="left" valign="top">78.3 (3.9)<sup><xref ref-type="table-fn" rid="table4fn3">c</xref></sup></td></tr><tr><td align="left" valign="top">EP<sup><xref ref-type="table-fn" rid="table4fn5">e</xref></sup></td><td align="left" valign="top">0.15 (0.03)<sup><xref ref-type="table-fn" rid="table4fn3">c</xref></sup></td><td align="left" valign="top">74.8 (5.6)<sup><xref ref-type="table-fn" rid="table4fn3">c</xref></sup></td><td align="left" valign="top">1.03&#x2010;1.09</td><td align="left" valign="top">71.6 (4.7)<sup><xref ref-type="table-fn" rid="table4fn3">c</xref></sup></td></tr><tr><td align="left" valign="top">EW<sup><xref ref-type="table-fn" rid="table4fn6">f</xref></sup></td><td align="left" valign="top">0.11 (0.02)<sup><xref ref-type="table-fn" rid="table4fn3">c</xref></sup></td><td align="left" valign="top">80.7 (4.3)<sup><xref ref-type="table-fn" rid="table4fn3">c</xref></sup></td><td align="left" valign="top">1.00&#x2010;1.06</td><td align="left" valign="top">77.5 (3.6)<sup><xref ref-type="table-fn" rid="table4fn3">c</xref></sup></td></tr></tbody></table><table-wrap-foot><fn id="table4fn1"><p><sup>a</sup>CV: coefficient of variation.</p></fn><fn id="table4fn2"><p><sup>b</sup>FP: fairness-priority.</p></fn><fn id="table4fn3"><p><sup>c</sup>Significantly different from FP-Default (Bonferroni-corrected 
<italic>P</italic>&#x003C;.05).</p></fn><fn id="table4fn4"><p><sup>d</sup>PP: preference-priority.</p></fn><fn id="table4fn5"><p><sup>e</sup>EP: efficiency-priority.</p></fn><fn id="table4fn6"><p><sup>f</sup>EW: equal-weight.</p></fn></table-wrap-foot></table-wrap><sec id="s3-8-1"><title>Workload Equity</title><p>The FP-Default configuration achieved the best balance between equity (CV=0.09&#x00B1;0.02) and overall quality. FP-High yielded marginally lower CV (0.07&#x00B1;0.01; mean difference &#x2212;0.02, 95% CI &#x2212;0.03 to &#x2212;0.01; <italic>P</italic>=.008), but at the cost of a significant reduction in preference fulfillment (79.3% vs 84.6%; mean difference &#x2212;5.3 percentage points, 95% CI &#x2212;7.8 to &#x2212;2.8; <italic>P</italic>&#x003C;.001). The EP configuration produced the highest CV (0.15&#x00B1;0.03; mean difference 0.06; 95% CI 0.04-0.08; <italic>P</italic>&#x003C;.001), confirming that deprioritizing workload equity substantially degraded fairness outcomes.</p></sec><sec id="s3-8-2"><title>Preference Satisfaction</title><p>PP-High maximized preference fulfillment (mean 89.1, SD 3.2%), exceeding FP-Default by mean difference 4.5 percentage points (95% CI 2.1&#x2010;6.9; <italic>P</italic>=.001). However, this gain was accompanied by deterioration in workload equity (CV=0.12&#x00B1;0.03 vs 0.09&#x00B1;0.02; <italic>P</italic>=.003) and a reduction in composite quality score (78.3 vs 82.1; <italic>P</italic>=.01). 
Conversely, PP-Low reduced preference fulfillment to 76.2% (mean difference=&#x2212;8.4 percentage points; <italic>P</italic>&#x003C;.001) while offering no significant improvement in any other outcome domain, suggesting w&#x2082;=0.15 is below the minimum threshold for acceptable preference responsiveness in this institutional context.</p></sec><sec id="s3-8-3"><title>Disparate Impact Ratios</title><p>Critically, all 7 weight configurations maintained disparate impact ratios within the 0.80&#x2010;1.25 fairness threshold (range across all configurations: 0.98&#x2010;1.09), and the ANOVA revealed no significant between-configuration differences (<italic>P</italic>=.12). This finding demonstrates that the fairness-auditing module provides a structural guarantee against experience-based bias that is robust to changes in optimization priorities.</p></sec><sec id="s3-8-4"><title>Composite Schedule Quality</title><p>FP-Default achieved the highest composite quality score (mean 82.1, SD 3.2), significantly outperforming all alternative configurations (all Bonferroni-corrected <italic>P</italic>&#x003C;.05) except FP-High (mean 79.8, SD 4.1; mean difference=&#x2212;2.3, 95% CI &#x2212;4.8 to +0.2; <italic>P</italic>=.07). Applying the prespecified noninferiority criteria (CV within &#x00B1;0.02 and preference fulfillment within &#x00B1;5 percentage points), only FP-High met both criteria simultaneously. All other configurations failed at least one criterion, supporting the robustness of the FP-Default configuration as the clinically optimal choice for this institution.</p></sec></sec><sec id="s3-9"><title>Monthly Trend Analysis</title><p><xref ref-type="fig" rid="figure2">Figure 2</xref> presents monthly trend data across all 4 primary performance domains during the postimplementation period. 
The 2-month adaptation period followed by sustained stability aligns with the &#x201C;implementation cliff&#x201D; described in implementation science literature [<xref ref-type="bibr" rid="ref18">18</xref>] and supports the recommendation of a 3-month intensive support period for similar deployments. Detailed monthly data are provided in Table S6 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p></sec><sec id="s3-10"><title>Qualitative Findings</title><p>Semistructured interviews (n=24 nurses; n=8 managers; mean duration 38 min) yielded 5 major themes. A full participant characteristics table is provided in Table S3 in <xref ref-type="supplementary-material" rid="app1">Multimedia Appendix 1</xref>.</p><sec id="s3-10-1"><title>Transparency as a Conflict-Resolution Mechanism (21 of 24 Nurses; 8 of 8 Managers)</title><p>SHAP-derived rationale for unfavorable assignments substantially reduced grievance escalations. One nursing manager stated, &#x201C;There are fewer complaints about unfair schedules. When someone questions an assignment, I can show them the SHAP explanation.&#x201D;</p></sec><sec id="s3-10-2"><title>Fairness as a Structural Achievement (18 of 24 Nurses; 7 of 8 Managers)</title><p>Nurses attributed equity improvements to objective system design rather than managerial goodwill, increasing systemic trust.</p></sec><sec id="s3-10-3"><title>Administrative Burden Relief Enabling Clinical Refocus (8 of 8 Managers)</title><p>All managers described time savings as professionally transformative. An emergency department manager said, &#x201C;I used to spend an entire week every month on scheduling. Now it&#x2019;s done in a day.&#x201D;</p></sec><sec id="s3-10-4"><title>Learning-to-Trust Trajectory (19 of 24 Nurses)</title><p>Initial resistance in Months 1&#x2010;2 diminished substantially by Month 3. 
A nurse with 7 years of experience stated, &#x201C;At first I was skeptical, but once I learned how to input my preferences properly, it worked really well.&#x201D;</p></sec><sec id="s3-10-5"><title>Residual Tensions: Preference Override Acceptance (11 of 24 Nurses)</title><p>Explainability reduces but does not eliminate individual dissatisfaction when equity constraints conflict with strong personal preferences.</p></sec></sec></sec><sec id="s4" sec-type="discussion"><title>Discussion</title><sec id="s4-1"><title>Principal Findings</title><p>This study demonstrates that a fairness-audited, XAI scheduling system can simultaneously reduce administrative burden by 81.2%, eliminate preexisting experience-based algorithmic bias, and achieve 94.9% (148/156 nurses) system adoption in a real-world hospital setting. Three findings warrant particular emphasis: (1) preexisting experience-based bias was formally documented and completely eliminated; (2) SHAP engagement was significantly associated with user satisfaction; and (3) sustained improvements confirmed by sensitivity analyses ruled out novelty effects.</p></sec><sec id="s4-2"><title>Algorithmic Fairness as a Primary Clinical Contribution</title><p>The most significant finding is the systematic identification and complete elimination of preexisting experience-based bias. Preimplementation, novice nurses (42/156, 26.9% of the workforce) were overrepresented in all 4 undesirable shift categories by 26%&#x2010;46% (disparate impact ratios 1.35&#x2010;1.56), exceeding the established four-fifths rule threshold for systemic discrimination [<xref ref-type="bibr" rid="ref11">11</xref>]. 
This trend aligns with documented informal seniority hierarchies in nursing workplaces [<xref ref-type="bibr" rid="ref19">19</xref>] but had not previously been quantified with formal fairness metrics in the AI scheduling literature.</p><p>The complete normalization of all disparate impact ratios postimplementation (1.01&#x2010;1.04) demonstrates that embedding W_imbalance and F_total into the objective function can mitigate institutionalized bias. The W_imbalance term minimizes variance in shift allocation across all nurses, and post hoc disparate impact analysis confirmed this proxy effectively eliminated experience-based disparities, validating the chosen surrogate metric. The Gini coefficient improvement (from 0.24 to 0.13) further confirms equity advancements. Future implementations should treat preexisting bias characterization as a mandatory predeployment audit step.</p></sec><sec id="s4-3"><title>SHAP Explainability as a Functional Trust Mechanism</title><p>A central hypothesis was that SHAP-based explainability would serve as an active trust-building mechanism. Our data show a significant positive association between SHAP engagement and satisfaction (<italic>r</italic>=0.456; <italic>P</italic>&#x003C;.001). While causality cannot be established from this observational correlation&#x2014;satisfied nurses may be more inclined to engage with explanations&#x2014;the qualitative data consistently suggest that explanations functionally mitigate organizational conflict when used, consistent with a bidirectional reinforcing relationship. This extends work by Liu et al [<xref ref-type="bibr" rid="ref20">20</xref>] on &#x201C;integrability&#x201D; as a determinant of AI acceptance, demonstrating that explanations must be actively used&#x2014;not merely available&#x2014;to generate trust benefits.</p><p>Critically, while 82 out of 156 nurses (52.6%) regularly viewed SHAP explanations, this study measured engagement frequency rather than comprehension accuracy. 
A formal assessment of whether nurses correctly interpreted feature importance rankings was not conducted, leaving a &#x201C;comprehension gap&#x201D; unquantified. Future research should use validated XAI literacy instruments to assess whether engagement translates to understanding.</p><p>The 52.6% rate of voluntary SHAP engagement surpasses engagement rates reported for passive transparency features in health care AI [<xref ref-type="bibr" rid="ref21">21</xref>]. The 1-hour domain-specific training investment appears to be an effective and scalable strategy for facilitating XAI adoption.</p></sec><sec id="s4-4"><title>Contextualizing Performance Against Prior Literature</title><p>Our 73.8% error rate reduction exceeds the 40%&#x2010;60% range reported in comparable scheduling optimization studies [<xref ref-type="bibr" rid="ref22">22</xref>,<xref ref-type="bibr" rid="ref23">23</xref>], attributable primarily to the human-in-the-loop verification enabled by SHAP transparency. The hybrid IP+BDE approach outperformed both single-method alternatives, consistent with the demonstration by Ben Said et al [<xref ref-type="bibr" rid="ref24">24</xref>] that hybrid constraint-learning pipelines outperform single-method approaches in health care scheduling. Regarding the role of XAI versus IP optimization, XAI in this system is not merely a technical overlay but a functional organizational mechanism. Without SHAP explanations, the system would generate algorithmically optimal schedules that clinicians cannot audit, verify, or trust, making sustained adoption unlikely regardless of algorithmic performance. 
The 94.9% adoption rate at Month 3 versus typical rates for opaque AI systems substantiates this claim [<xref ref-type="bibr" rid="ref9">9</xref>,<xref ref-type="bibr" rid="ref10">10</xref>].</p></sec><sec id="s4-5"><title>Weight Sensitivity and Optimization Robustness</title><p>The WSA addresses a fundamental challenge in multiobjective optimization for health care applications: the selection of objective weights is inherently value-laden and context-dependent, yet the robustness of outcomes to weight perturbations has rarely been formally evaluated in prior nurse scheduling studies. Our findings contribute 3 key insights to this literature.</p><p>First, the consensus-derived FP-Default configuration (w&#x2081;=0.30; w&#x2082;=0.25) achieved the highest composite schedule quality score and was the only configuration meeting prespecified noninferiority criteria on both workload equity and preference fulfillment simultaneously. This validates the stakeholder co-design process as an effective method for identifying near-optimal weight configurations in institutional contexts, consistent with findings from participatory AI scheduling design studies [<xref ref-type="bibr" rid="ref10">10</xref>,<xref ref-type="bibr" rid="ref19">19</xref>].</p><p>Second, the analysis revealed an inherent trade-off between workload equity and preference satisfaction that cannot be eliminated through algorithmic design alone. Increasing w&#x2081; beyond 0.30 (FP-High) improved equity marginally but reduced preference fulfillment by 5.3 percentage points&#x2014;a clinically meaningful reduction given that preference accommodation is a primary driver of nurse satisfaction and retention [<xref ref-type="bibr" rid="ref5">5</xref>,<xref ref-type="bibr" rid="ref22">22</xref>]. Conversely, maximizing preference satisfaction (PP-High) degraded workload equity, potentially reintroducing the experience-based disparities that the system was designed to eliminate. 
This trade-off surface highlights the irreducible nature of the fairness&#x2013;preference tension and underscores the importance of transparent weight disclosure to affected stakeholders.</p><p>Third, and most critically for regulatory compliance, the disparate impact ratios remained within the 0.80&#x2010;1.25 fairness threshold across all 7 weight configurations (<italic>P</italic>=.12 for between-configuration differences). This structural invariance demonstrates that the fairness-auditing module provides a hard constraint on algorithmic bias that operates independently of optimization priorities, a design principle with direct implications for responsible AI deployment in health care workforce governance [<xref ref-type="bibr" rid="ref11">11</xref>,<xref ref-type="bibr" rid="ref25">25</xref>]. Institutions adopting the XAI-NSDSS framework can therefore customize weight configurations to reflect local priorities without compromising the fairness guarantees central to equitable workforce governance.</p><p>The differential engagement patterns across experience levels suggest that explainability features are particularly valuable for less-experienced staff who may have less institutional power to challenge unfair scheduling decisions. This finding aligns with qualitative research by Gerlach et al [<xref ref-type="bibr" rid="ref19">19</xref>] identifying transparency as a critical adoption factor for junior nurses, and extends it by quantifying the relationship between explanation engagement and satisfaction outcomes.</p></sec><sec id="s4-6"><title>Implementation Science Perspective</title><p>The initial satisfaction dip (Month 1) followed by sustained improvement (Months 3&#x2010;6) is consistent with the &#x201C;implementation cliff&#x201D; [<xref ref-type="bibr" rid="ref18">18</xref>]. Our data suggest a 2&#x2010;3 month stabilization window as the critical support period. 
The ASOC governance structure&#x2014;with monthly fairness dashboard reviews and multidisciplinary oversight&#x2014;addresses the requirements for organizational accountability in AI deployment reported by Saeed et al [<xref ref-type="bibr" rid="ref25">25</xref>], distinguishing this implementation from most published systems that lack ongoing governance postlaunch.</p></sec><sec id="s4-7"><title>Limitations</title><p>Single-site implementation in Taiwan limits generalizability to other health care systems, labor regulations, and cultural contexts; multisite validation is needed before broad adoption recommendations can be made. The 6-month postimplementation period does not address long-term system drift or multiyear organizational embedding. The quasiexperimental before-after design inherently limits causal inference: despite large effect sizes (Cohen <italic>d</italic>&#x003E;3.7 across all primary outcomes), secular trends, regression to the mean, or co-occurring organizational changes cannot be fully excluded. SHAP comprehension accuracy was not formally assessed&#x2014;only viewing frequency&#x2014;leaving a &#x201C;comprehension gap&#x201D; unquantified. Patient care outcomes (eg, medication error rates and fall incidence) were not measured; connecting scheduling equity to downstream clinical outcomes remains an important research direction. The SHAP-satisfaction correlation is observational, and directional causality cannot be established without experimental manipulation.</p><p>The WSA was conducted within a single institutional context; the consensus-derived FP-Default weight configuration (w&#x2081;=0.30, w&#x2082;=0.25) reflects this institution&#x2019;s scheduling culture, labor regulations, and workforce demographics. While the structural robustness of fairness metrics across all 7 configurations is likely to generalize, the absolute weight values may require site-specific calibration in institutions with different operational priorities. 
Future multisite replications should include systematic WSA to determine whether FP-Default represents a transferable standard or an institution-specific optimum.</p></sec><sec id="s4-8"><title>Future Research Directions</title><p>Priority directions include (1) multisite validation across diverse health care systems, (2) randomized trials comparing explainable versus nonexplainable scheduling systems to establish the causal impact of XAI on trust and adoption, (3) integration with real-time patient acuity data, and (4) federated learning for privacy-preserving multi-institutional model development [<xref ref-type="bibr" rid="ref26">26</xref>].</p><p>Regarding optimization robustness, adaptive weight optimization methods&#x2014;such as Bayesian preference elicitation or reinforcement learning from stakeholder feedback&#x2014;could automate the weight configuration process and reduce reliance on expert consensus, potentially improving outcomes in institutions lacking access to multidisciplinary co-design teams. The WSA framework developed in this study should be replicated in multisite contexts to determine whether the FP-Default weight configuration generalizes across institutions with different staffing cultures and regulatory environments or whether site-specific calibration is required.</p></sec><sec id="s4-9"><title>Conclusions</title><p>This study presents a prospectively validated, fairness-audited XAI implementation framework for nurse scheduling delivering measurable operational improvements while maintaining interpretability and human oversight. 
Three key findings are noteworthy:</p><list list-type="order"><list-item><p>The formal documentation and complete elimination of preexisting experience-based algorithmic bias&#x2014;disparate impact ratios normalized from 1.35&#x2010;1.56 to 1.01&#x2010;1.04&#x2014;establishes a replicable methodology for fairness auditing in health care workforce AI.</p></list-item><list-item><p>The positive association between SHAP engagement and satisfaction (<italic>r</italic>=0.456), combined with qualitative evidence of explanations as conflict mediators, is consistent with explainability functioning as an organizational intervention, though directionality cannot be confirmed from observational data alone.</p></list-item><list-item><p>The complete implementation science documentation&#x2014;governance structure, phased rollout, learning curve data, and sensitivity analyses&#x2014;provides a practical guide for responsible AI adoption in health care workforce management. WSA across 7 objective-weight configurations confirmed that fairness guarantees remain intact regardless of optimization priority settings (disparate impact ratio <italic>P</italic>=.12 across all configurations), validating the framework for diverse institutional deployment contexts.</p></list-item></list><p>The XAI-NSDSS framework demonstrates that algorithmic decision support can simultaneously achieve efficiency, equity, and transparency. The framework is replicable, scalable, and aligned with emerging standards for responsible AI governance in clinical settings.</p></sec></sec></body><back><ack><p>The authors gratefully acknowledge the participating nurses and nurse managers at Fu Jen Catholic University Hospital for their dedication to this study. We thank the hospital administration for supporting this research and providing access to scheduling data and operational resources. We also acknowledge the contributions of the hospital's Information Technology Department for technical infrastructure support. 
Generative artificial intelligence (AI) tools were used to assist with drafting and editing selected sections (eg, phrasing and structure). All scientific content, analyses, interpretations, and references were verified by the authors, who take full responsibility for the manuscript.</p></ack><notes><sec><title>Funding</title><p>This research was supported by the National Science and Technology Council, Taiwan (Grant Number: NSTC 114-2622-8-030-002-TD2). The funding agency had no role in study design, data collection, analysis, interpretation, or manuscript preparation.</p></sec><sec><title>Data Availability</title><p>The datasets generated or analyzed during this study are not publicly available due to institutional privacy policies protecting employee data but are available from the corresponding author on reasonable request and with appropriate data use agreements. The explainable AI&#x2013;enabled nurse scheduling decision support system (XAI-NSDSS) source code is available from the corresponding author on reasonable request for noncommercial research purposes, subject to institutional approval.</p></sec></notes><fn-group><fn fn-type="con"><p>Conceptualization: BCS, SRW</p><p>Data curation: SMP</p><p>Formal analysis: BCS, QYZ</p><p>Funding acquisition: SRW</p><p>Investigation: QYZ, CYL</p><p>Methodology: BCS, SRW</p><p>Project administration: BCS</p><p>Resources: CYL</p><p>Software: BCS, SMP</p><p>Supervision: SRW</p><p>Validation: SMP</p><p>Visualization: SMP</p><p>Writing &#x2013; original draft: BCS</p><p>Writing &#x2013; review &#x0026; editing: QYZ, CYL, SRW</p><p>All authors read and approved the final manuscript.</p></fn><fn fn-type="conflict"><p>The authors declare no conflicts of interest. No author has financial relationships with commercial scheduling software companies or other entities that could inappropriately influence this work. 
The XAI-NSDSS system is not commercially available, and the authors have no plans for commercialization.</p></fn></fn-group><glossary><title>Abbreviations</title><def-list><def-item><term id="abb1">AI</term><def><p>artificial intelligence</p></def></def-item><def-item><term id="abb2">ASOC</term><def><p>AI Scheduling Oversight Committee</p></def></def-item><def-item><term id="abb3">BDE</term><def><p>binary differential evolution</p></def></def-item><def-item><term id="abb4">CV</term><def><p>coefficient of variation</p></def></def-item><def-item><term id="abb5">EP</term><def><p>efficiency-priority</p></def></def-item><def-item><term id="abb6">EW</term><def><p>equal-weight</p></def></def-item><def-item><term id="abb7">FP</term><def><p>fairness-priority</p></def></def-item><def-item><term id="abb8">GEE</term><def><p>generalized estimating equations</p></def></def-item><def-item><term id="abb9">IP</term><def><p>integer programming</p></def></def-item><def-item><term id="abb10">IRR</term><def><p>incidence rate ratio</p></def></def-item><def-item><term id="abb11">LMM</term><def><p>linear mixed effects models</p></def></def-item><def-item><term id="abb12">MAE</term><def><p>mean absolute error</p></def></def-item><def-item><term id="abb13">PP</term><def><p>preference-priority</p></def></def-item><def-item><term id="abb14">RMSE</term><def><p>root-mean-square error</p></def></def-item><def-item><term id="abb15">SHAP</term><def><p>Shapley Additive Explanations</p></def></def-item><def-item><term id="abb16">SQUIRE</term><def><p>Standards for Quality Improvement Reporting Excellence</p></def></def-item><def-item><term id="abb17">WHO</term><def><p>World Health Organization</p></def></def-item><def-item><term id="abb18">WSA</term><def><p>weight sensitivity analysis</p></def></def-item><def-item><term id="abb19">XAI</term><def><p>explainable artificial intelligence</p></def></def-item><def-item><term id="abb20">XAI-NSDSS</term><def><p>explainable AI&#x2013;enabled nurse 
scheduling decision support system</p></def></def-item></def-list></glossary><ref-list><title>References</title><ref id="ref1"><label>1</label><nlm-citation citation-type="web"><article-title>State of the world&#x2019;s nursing 2020: investing in education, jobs and leadership</article-title><source>World Health Organization</source><year>2020</year><access-date>2026-05-19</access-date><comment><ext-link ext-link-type="uri" xlink:href="https://www.who.int/publications/i/item/9789240003279">https://www.who.int/publications/i/item/9789240003279</ext-link></comment></nlm-citation></ref><ref id="ref2"><label>2</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Aiken</surname><given-names>LH</given-names> </name><name name-style="western"><surname>Clarke</surname><given-names>SP</given-names> </name><name name-style="western"><surname>Sloane</surname><given-names>DM</given-names> </name><name name-style="western"><surname>Sochalski</surname><given-names>J</given-names> </name><name name-style="western"><surname>Silber</surname><given-names>JH</given-names> </name></person-group><article-title>Hospital nurse staffing and patient mortality, nurse burnout, and job dissatisfaction</article-title><source>JAMA</source><year>2002</year><volume>288</volume><issue>16</issue><fpage>1987</fpage><lpage>1993</lpage><pub-id pub-id-type="doi">10.1001/jama.288.16.1987</pub-id><pub-id pub-id-type="medline">12387650</pub-id></nlm-citation></ref><ref id="ref3"><label>3</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Dall&#x2019;Ora</surname><given-names>C</given-names> </name><name name-style="western"><surname>Ball</surname><given-names>J</given-names> </name><name name-style="western"><surname>Reinius</surname><given-names>M</given-names> </name><name name-style="western"><surname>Griffiths</surname><given-names>P</given-names> 
</name></person-group><article-title>Burnout in nursing: a theoretical review</article-title><source>Hum Resour Health</source><year>2020</year><month>06</month><day>5</day><volume>18</volume><issue>1</issue><fpage>41</fpage><pub-id pub-id-type="doi">10.1186/s12960-020-00469-9</pub-id><pub-id pub-id-type="medline">32503559</pub-id></nlm-citation></ref><ref id="ref4"><label>4</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Burke</surname><given-names>EK</given-names> </name><name name-style="western"><surname>De Causmaecker</surname><given-names>P</given-names> </name><name name-style="western"><surname>Berghe</surname><given-names>GV</given-names> </name><name name-style="western"><surname>Van Landeghem</surname><given-names>H</given-names> </name></person-group><article-title>The state of the art of nurse rostering</article-title><source>J Sched</source><year>2004</year><month>11</month><volume>7</volume><issue>6</issue><fpage>441</fpage><lpage>499</lpage><pub-id pub-id-type="doi">10.1023/B:JOSH.0000046076.75950.0b</pub-id></nlm-citation></ref><ref id="ref5"><label>5</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Barker</surname><given-names>HR</given-names> </name><name name-style="western"><surname>Griffiths</surname><given-names>P</given-names> </name><name name-style="western"><surname>Dall&#x2019;Ora</surname><given-names>C</given-names> </name></person-group><article-title>&#x201C;I don&#x2019;t think there&#x2019;s necessarily a one size fits all&#x201D; negotiating competing priorities in nurse shift scheduling: a qualitative study</article-title><source>BMC Nurs</source><year>2025</year><month>08</month><day>11</day><volume>24</volume><issue>1</issue><fpage>1048</fpage><pub-id pub-id-type="doi">10.1186/s12912-025-03705-6</pub-id><pub-id pub-id-type="medline">40790199</pub-id></nlm-citation></ref><ref 
id="ref6"><label>6</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Turhan</surname><given-names>AM</given-names> </name><name name-style="western"><surname>Bilgen</surname><given-names>B</given-names> </name></person-group><article-title>A hybrid fix-and-optimize and simulated annealing approaches for nurse rostering problem</article-title><source>Comput Ind Eng</source><year>2020</year><month>07</month><volume>145</volume><fpage>106531</fpage><pub-id pub-id-type="doi">10.1016/j.cie.2020.106531</pub-id><pub-id pub-id-type="medline">33868622</pub-id></nlm-citation></ref><ref id="ref7"><label>7</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Aickelin</surname><given-names>U</given-names> </name><name name-style="western"><surname>Dowsland</surname><given-names>KA</given-names> </name></person-group><article-title>An indirect genetic algorithm for a nurse-scheduling problem</article-title><source>Comput Oper Res</source><year>2004</year><month>04</month><volume>31</volume><issue>5</issue><fpage>761</fpage><lpage>778</lpage><pub-id pub-id-type="doi">10.1016/S0305-0548(03)00034-0</pub-id></nlm-citation></ref><ref id="ref8"><label>8</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Eshghali</surname><given-names>M</given-names> </name><name name-style="western"><surname>Kannan</surname><given-names>D</given-names> </name><name name-style="western"><surname>Salmanzadeh-Meydani</surname><given-names>N</given-names> </name><name name-style="western"><surname>Esmaieeli Sikaroudi</surname><given-names>AM</given-names> </name></person-group><article-title>Machine learning based integrated scheduling and rescheduling for elective and emergency patients in the operating theatre</article-title><source>Ann Oper 
Res</source><year>2023</year><month>01</month><day>19</day><volume>332</volume><issue>1-3</issue><fpage>1</fpage><lpage>24</lpage><pub-id pub-id-type="doi">10.1007/s10479-023-05168-x</pub-id><pub-id pub-id-type="medline">36694896</pub-id></nlm-citation></ref><ref id="ref9"><label>9</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Knight</surname><given-names>DRT</given-names> </name><name name-style="western"><surname>Aakre</surname><given-names>CA</given-names> </name><name name-style="western"><surname>Anstine</surname><given-names>CV</given-names> </name><etal/></person-group><article-title>Artificial intelligence for patient scheduling in the real-world health care setting: a metanarrative review</article-title><source>Health Policy Technol</source><year>2023</year><month>12</month><volume>12</volume><issue>4</issue><fpage>100824</fpage><pub-id pub-id-type="doi">10.1016/j.hlpt.2023.100824</pub-id></nlm-citation></ref><ref id="ref10"><label>10</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Renggli</surname><given-names>FJ</given-names> </name><name name-style="western"><surname>Gerlach</surname><given-names>M</given-names> </name><name name-style="western"><surname>Bieri</surname><given-names>JS</given-names> </name><name name-style="western"><surname>Golz</surname><given-names>C</given-names> </name><name name-style="western"><surname>Sariyar</surname><given-names>M</given-names> </name></person-group><article-title>Integrating nurse preferences into AI-based scheduling systems: qualitative study</article-title><source>JMIR Form Res</source><year>2025</year><month>06</month><day>4</day><volume>9</volume><fpage>e67747</fpage><pub-id pub-id-type="doi">10.2196/67747</pub-id><pub-id pub-id-type="medline">40466089</pub-id></nlm-citation></ref><ref id="ref11"><label>11</label><nlm-citation 
citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Char</surname><given-names>DS</given-names> </name><name name-style="western"><surname>Shah</surname><given-names>NH</given-names> </name><name name-style="western"><surname>Magnus</surname><given-names>D</given-names> </name></person-group><article-title>Implementing machine learning in health care - addressing ethical challenges</article-title><source>N Engl J Med</source><year>2018</year><month>03</month><day>15</day><volume>378</volume><issue>11</issue><fpage>981</fpage><lpage>983</lpage><pub-id pub-id-type="doi">10.1056/NEJMp1714229</pub-id><pub-id pub-id-type="medline">29539284</pub-id></nlm-citation></ref><ref id="ref12"><label>12</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tun</surname><given-names>HM</given-names> </name><name name-style="western"><surname>Rahman</surname><given-names>HA</given-names> </name><name name-style="western"><surname>Naing</surname><given-names>L</given-names> </name><name name-style="western"><surname>Malik</surname><given-names>OA</given-names> </name></person-group><article-title>Trust in artificial intelligence-based clinical decision support systems among health care workers: systematic review</article-title><source>J Med Internet Res</source><year>2025</year><month>07</month><day>29</day><volume>27</volume><fpage>e69678</fpage><pub-id pub-id-type="doi">10.2196/69678</pub-id><pub-id pub-id-type="medline">40772775</pub-id></nlm-citation></ref><ref id="ref13"><label>13</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Tjoa</surname><given-names>E</given-names> </name><name name-style="western"><surname>Guan</surname><given-names>C</given-names> </name></person-group><article-title>A survey on explainable artificial intelligence (XAI): toward medical XAI</article-title><source>IEEE 
Trans Neural Netw Learn Syst</source><year>2021</year><month>11</month><volume>32</volume><issue>11</issue><fpage>4793</fpage><lpage>4813</lpage><pub-id pub-id-type="doi">10.1109/TNNLS.2020.3027314</pub-id><pub-id pub-id-type="medline">33079674</pub-id></nlm-citation></ref><ref id="ref14"><label>14</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Linardatos</surname><given-names>P</given-names> </name><name name-style="western"><surname>Papastefanopoulos</surname><given-names>V</given-names> </name><name name-style="western"><surname>Kotsiantis</surname><given-names>S</given-names> </name></person-group><article-title>Explainable AI: a review of machine learning interpretability methods</article-title><source>Entropy (Basel)</source><year>2020</year><month>12</month><day>25</day><volume>23</volume><issue>1</issue><fpage>18</fpage><pub-id pub-id-type="doi">10.3390/e23010018</pub-id><pub-id pub-id-type="medline">33375658</pub-id></nlm-citation></ref><ref id="ref15"><label>15</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Adadi</surname><given-names>A</given-names> </name><name name-style="western"><surname>Berrada</surname><given-names>M</given-names> </name></person-group><article-title>Peeking inside the black-box: a survey on explainable artificial intelligence (XAI)</article-title><source>IEEE Access</source><year>2018</year><volume>6</volume><fpage>52138</fpage><lpage>52160</lpage><pub-id pub-id-type="doi">10.1109/ACCESS.2018.2870052</pub-id></nlm-citation></ref><ref id="ref16"><label>16</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Oh</surname><given-names>MY</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>HS</given-names> </name><name 
name-style="western"><surname>Jung</surname><given-names>YM</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>HC</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>SB</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>SM</given-names> </name></person-group><article-title>Machine learning-based explainable automated nonlinear computation scoring system for health score and an application for prediction of perioperative stroke: retrospective study</article-title><source>J Med Internet Res</source><year>2025</year><month>03</month><day>19</day><volume>27</volume><fpage>e58021</fpage><pub-id pub-id-type="doi">10.2196/58021</pub-id><pub-id pub-id-type="medline">40106818</pub-id></nlm-citation></ref><ref id="ref17"><label>17</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Braun</surname><given-names>V</given-names> </name><name name-style="western"><surname>Clarke</surname><given-names>V</given-names> </name></person-group><article-title>Using thematic analysis in psychology</article-title><source>Qual Res Psychol</source><year>2006</year><month>01</month><volume>3</volume><issue>2</issue><fpage>77</fpage><lpage>101</lpage><pub-id pub-id-type="doi">10.1191/1478088706qp063oa</pub-id></nlm-citation></ref><ref id="ref18"><label>18</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Chang</surname><given-names>SJ</given-names> </name><name name-style="western"><surname>Lee</surname><given-names>YW</given-names> </name><name name-style="western"><surname>Chou</surname><given-names>WJ</given-names> </name></person-group><article-title>Self-scheduling: a win-win for nurses and organizations</article-title><source>Hu Li Za 
Zhi</source><year>2025</year><month>10</month><volume>72</volume><issue>5</issue><fpage>12</fpage><lpage>18</lpage><pub-id pub-id-type="doi">10.6224/JN.202510_72(5).03</pub-id><pub-id pub-id-type="medline">41034164</pub-id></nlm-citation></ref><ref id="ref19"><label>19</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Gerlach</surname><given-names>M</given-names> </name><name name-style="western"><surname>Renggli</surname><given-names>FJ</given-names> </name><name name-style="western"><surname>Bieri</surname><given-names>JS</given-names> </name><name name-style="western"><surname>Sariyar</surname><given-names>M</given-names> </name><name name-style="western"><surname>Golz</surname><given-names>C</given-names> </name></person-group><article-title>Exploring nurse perspectives on AI-based shift scheduling for fairness, transparency, and work-life balance</article-title><source>BMC Nurs</source><year>2025</year><month>09</month><day>2</day><volume>24</volume><issue>1</issue><fpage>1161</fpage><pub-id pub-id-type="doi">10.1186/s12912-025-03808-0</pub-id><pub-id pub-id-type="medline">40898192</pub-id></nlm-citation></ref><ref id="ref20"><label>20</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Liu</surname><given-names>Y</given-names> </name><name name-style="western"><surname>Liu</surname><given-names>C</given-names> </name><name name-style="western"><surname>Zheng</surname><given-names>J</given-names> </name><name name-style="western"><surname>Xu</surname><given-names>C</given-names> </name><name name-style="western"><surname>Wang</surname><given-names>D</given-names> </name></person-group><article-title>Improving explainability and integrability of medical AI to promote health care professional acceptance and use: mixed systematic review</article-title><source>J Med Internet 
Res</source><year>2025</year><month>08</month><day>7</day><volume>27</volume><fpage>e73374</fpage><pub-id pub-id-type="doi">10.2196/73374</pub-id><pub-id pub-id-type="medline">40773743</pub-id></nlm-citation></ref><ref id="ref21"><label>21</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Cutillo</surname><given-names>CM</given-names> </name><name name-style="western"><surname>Sharma</surname><given-names>KR</given-names> </name><name name-style="western"><surname>Foschini</surname><given-names>L</given-names> </name><etal/></person-group><article-title>Machine intelligence in healthcare&#x2014;perspectives on trustworthiness, explainability, usability, and transparency</article-title><source>NPJ Digit Med</source><year>2020</year><volume>3</volume><fpage>47</fpage><pub-id pub-id-type="doi">10.1038/s41746-020-0254-2</pub-id><pub-id pub-id-type="medline">32258429</pub-id></nlm-citation></ref><ref id="ref22"><label>22</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Kang</surname><given-names>HW</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>J</given-names> </name><name name-style="western"><surname>Kim</surname><given-names>KJ</given-names> </name><etal/></person-group><article-title>Shift nurses&#x2019; work quality and job satisfaction after implementing the Inha University hospital nursing AI scheduling system (IH-NASS)</article-title><source>BMC Nurs</source><year>2025</year><month>07</month><day>1</day><volume>24</volume><issue>1</issue><fpage>792</fpage><pub-id pub-id-type="doi">10.1186/s12912-025-03470-6</pub-id><pub-id pub-id-type="medline">40597282</pub-id></nlm-citation></ref><ref id="ref23"><label>23</label><nlm-citation citation-type="other"><person-group person-group-type="author"><name name-style="western"><surname>Patel</surname><given-names>V</given-names> </name><name 
name-style="western"><surname>Deodhar</surname><given-names>A</given-names> </name><name name-style="western"><surname>Birru</surname><given-names>D</given-names> </name></person-group><article-title>A multi-objective genetic algorithm for healthcare workforce scheduling</article-title><source>arXiv</source><comment>Preprint posted online on Aug 28, 2025</comment><pub-id pub-id-type="doi">10.48550/arxiv.2508.20953</pub-id></nlm-citation></ref><ref id="ref24"><label>24</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Ben Said</surname><given-names>A</given-names> </name><name name-style="western"><surname>Mouhoub</surname><given-names>M</given-names> </name></person-group><article-title>Machine learning and constraint programming for efficient healthcare scheduling</article-title><source>Int J Soft Eng Knowl Eng</source><year>2026</year><month>06</month><day>30</day><volume>36</volume><issue>8</issue><fpage>1089</fpage><lpage>1120</lpage><pub-id pub-id-type="doi">10.1142/S0218194025501025</pub-id></nlm-citation></ref><ref id="ref25"><label>25</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name name-style="western"><surname>Saeed</surname><given-names>M</given-names> </name><name name-style="western"><surname>Jalil</surname><given-names>MS</given-names> </name><name name-style="western"><surname>Dahwal</surname><given-names>FM</given-names> </name><etal/></person-group><article-title>The impact of AI on healthcare workforce management: business strategies for talent optimization and IT integration</article-title><source>The American Journal of Medical Sciences and Pharmaceutical Research</source><year>2025</year><volume>7</volume><issue>3</issue><fpage>136</fpage><lpage>156</lpage><pub-id pub-id-type="doi">10.37547/tajmspr/Volume07Issue03-15</pub-id></nlm-citation></ref><ref id="ref26"><label>26</label><nlm-citation citation-type="journal"><person-group person-group-type="author"><name 
name-style="western"><surname>Rieke</surname><given-names>N</given-names> </name><name name-style="western"><surname>Hancox</surname><given-names>J</given-names> </name><name name-style="western"><surname>Li</surname><given-names>W</given-names> </name><etal/></person-group><article-title>The future of digital health with federated learning</article-title><source>NPJ Digit Med</source><year>2020</year><volume>3</volume><fpage>119</fpage><pub-id pub-id-type="doi">10.1038/s41746-020-00323-1</pub-id><pub-id pub-id-type="medline">33015372</pub-id></nlm-citation></ref></ref-list><app-group><supplementary-material id="app1"><label>Multimedia Appendix 1</label><p>Additional figures, tables, extended methods, additional results, and implementation details for the explainable artificial intelligence&#x2013;enabled nurse scheduling decision support system.</p><media xlink:href="nursing_v9i1e94450_app1.docx" xlink:title="DOCX File, 1068 KB"/></supplementary-material></app-group></back></article>