Full text
59,186 characters
· extracted from
preprint-html
· click to expand
A minimal set of prompts to surface reasoning in digital health | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search A minimal set of prompts to surface reasoning in digital health View ORCID Profile Ilona Kulikosvkikh , Tarzan Legović , Sergey Konovalov , Alexander Kolsanov , Tomislav Šmuc doi: https://doi.org/10.1101/2025.09.22.25336413 Ilona Kulikosvkikh 1 Laboratory for Machine Learning and Knowledge Representation, Ruder Boskovic Institute , Zagreb, Croatia Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Ilona Kulikosvkikh For correspondence: ilona{at}irb.hr Tarzan Legović 1 Laboratory for Machine Learning and Knowledge Representation, Ruder Boskovic Institute , Zagreb, Croatia 2 Libertas University , Zagreb, Croatia Find this author on Google Scholar Find this author on PubMed Search for this author on this site Sergey Konovalov 3 Department of Urology, Pirogov First City Clinical Hospital , Samara, Russia Find this author on Google Scholar Find this author on PubMed Search for this author on this site Alexander Kolsanov 4 Department of Operative Surgery and Topographic Anatomy, Samara State Medical University , Samara, Russia Find this author on Google Scholar Find this author on PubMed Search for this author on this site Tomislav Šmuc 1 Laboratory for Machine Learning and Knowledge Representation, Ruder Boskovic Institute , Zagreb, Croatia Find this author on Google Scholar Find this author on PubMed Search for this author on this site Abstract Full Text Info/History Metrics Data/Code Preview PDF Abstract Digital health technologies can reduce workloads, enhance information retention, and minimize errors. However, when poorly integrated or misaligned with clinical practice, they often introduce new risks and allow unprocessed information to accumulate, amplifying existing challenges. The core problem is that reasoning often stays implicit and unstructured when translating needs into digital solutions. Without a shared way to make it explicit, critical inputs are missed, unprocessed information builds up, and reasoning faults spread through the system. We present a minimal, non-redundant set of eight plain-language prompts that spans the full reasoning process, guards against common reasoning faults, and provides a shared structure for aligning perspectives across stakeholders. We tested the set in a clinical case study on the initial management of septic shock, where the prompts helped to turn unstructured clinical reasoning into clear inputs for system design and workflow adjustments. To interpret its impact, we built a mathematical model that captures how unprocessed information changes over time. Compared with standard practice, the prompts reduced peak backlog by 20.3%, cumulative backlog by 22.2%, and improved recovery time from not reached to five time steps. We share an open-source code to model backlog dynamics, enabling easy adaptation to other clinical settings through parameter calibration. Author summary In digital health, the biggest challenge is not the technology but translation. What clinicians need and what developers create often do not align, resulting in tools that fail to meet the demands of real-world care. One key reason is that clinicians, developers, and administrators approach the same problem from different perspectives, and their reasoning is rarely made explicit or shared in a structured way. Our solution is a minimal yet complete set of plain-language prompts. These prompts make reasoning clear, bring experts onto the same page, and help to avoid common thinking traps like missing critical details, focusing too narrowly, or hesitating to act. In a clinical case of septic shock management, the prompts kept essential information visible, helped to set priorities in real time, and produced inputs directly relevant to patient care. By making critical details more visible, the prompt set enabled faster responses and led to fewer delays in treatment, while maintaining reliability. This set is compact enough for quick adoption and effective enough to bring together the perspectives of diverse expert groups, making it useful not only in hospitals but also in public health and other complex care settings. Introduction A neonate is admitted to a Denver hospital. Born to a mother with a history of syphilis, the indication for treatment remains unclear due to language barriers and incomplete records. After consulting with infectious disease specialists, the physician prescribes benzathine penicillin G. The pharmacist, unfamiliar with neonatal dosing, misreads the standard dose as 500,000 units/kg instead of 50,000 units/kg. The handwritten “150,000U” order adds to the confusion. The “U” for units appears as an extra zero, resulting in a tenfold overdose. When the medication reaches the nurses, they hesitate, questioning the pain of five intramuscular injections for a newborn. Seeking an alternative, they check a drug reference book that does not explicitly warn against intravenous use. The nurses see “Benzathine” capitalized and placed on a separate line from “penicillin G . ” They assume it is a brand name rather than a distinct formulation. The warning on the syringe “for intramuscular use only” is too small to read and goes unnoticed. The nurses know that only clear liquids are typically safe for intravenous use but believe some milky medications, like lipid-based drug products, can also be given intravenously. They proceed. After 1 . 8 ml is given, the baby becomes unresponsive and dies from a pulmonary embolism. An autopsy confirms the baby never had congenital syphilis. Three nurses are indicted, but expert testimony reveals over fifty system failures – misread orders, unclear references, and unchecked assumptions – turning small gaps into a fatal mistake. The public sees a clear-cut story of human error: they gave the wrong drug in the wrong way . – The Denver medication error/criminal negligence case, 1998 [ 1 ] Since that tragedy healthcare has undergone significant changes through digital transformation, yet similar incidents continue to occur [ 2 ]. Across the world, national and institutional reporting systems [ 3 ], designed to capture clinical near misses and incidents [ 4 – 6 ], have documented countless recurring patterns. These events are rarely the result of a single error [ 7 ]. Instead, they typically arise from information gaps that result from shortcomings in how health systems are designed [ 8 – 10 ]. In an ideal world, healthcare practitioners would have immediate access to all the data needed to make informed decisions. In reality, the information they see – and what they notice within it – depends on their role, experience, current circumstances, and how their workflow is organized. Strict regulations meant to standardize how data is recorded and shared can limit flexibility, and existing infrastructure further shapes how healthcare systems function. But, system limitations are not the only issue. Human cognition narrows the flow of information even more. Our sensory memory briefly captures a wide range of inputs for only a fraction of a second. From there, only some of these inputs move into short-term memory, which typically retains them for less than half a minute. During that time, working memory manipulates this data before a portion of it is encoded into long-term memory, which can last from days to years. These internal processes shape how we perceive events and handle incomplete information. When crucial details are lost, whether due to system constraints or human limitations [ 11 – 13 ], the result can be the very gaps illustrated in the opening Denver incident. Human cognition, molded by evolutionary pressures, is not optimized for instantly handling large volumes of data. Instead, it simplifies, filters, and interprets information based on the inputs available at the moment [ 12 , 14 ]. When information is scarce, the mind fills gaps with plausible but sometimes inaccurate assumptions [ 15 – 17 ]. When information is excessive, the limits of working memory [ 18 – 21 ] can cause cognitive overload [ 22 – 24 ]. In both cases, critical inputs remain unaddressed, creating a backlog of unprocessed information. Different reasoning faults contribute to this backlog in distinct ways. Omission prevents key data from entering the reasoning process [ 25 ], tunnel vision allows other relevant inputs to accumulate unresolved [ 26 – 29 ], clutter overwhelms limited processing capacity [ 30 ], and overconfidence lets incomplete or inaccurate information circulate unchecked [ 31 ]. This growing backlog not only slows reasoning and increases the risk of errors but also highlights the need for solutions specifically designed to reduce it. Digital health tools, by design, aim to support this need by reducing the cognitive burden of managing complex information. When well integrated, they can ease workload [ 32 , 33 ], help clinicians retain critical information [ 34 – 36 ], and reduce the risk of serious oversights [ 37 , 38 ]. However, when poorly aligned with real-world workflows [ 39 , 40 ], they may introduce new vulnerabilities [ 41 , 42 ] and, in some cases, worsen the very problems they were intended to solve [ 43 , 44 ]. Existing approaches to digital health design have focused on measuring cognitive burden [ 45 – 50 ] and recognizing fundamental differences between human and digital information processing [ 14 , 36 , 37 ]. Others have emphasized the importance of aligning how information is represented and understood across stakeholders [ 51 – 54 ]. However, gaps remain. Domain experts often struggle to fully articulate their reasoning, or they assume their needs have been clearly communicated when others have understood something entirely different. Without a structured way to externalize reasoning, each stakeholder brings a different frame of reference: clinicians focus on symptoms, risks, and urgency; developers on data models and workflow triggers; and administrators on efficiency and reporting metrics. As a result, the system fails to capture critical inputs in a consistent way, allowing a backlog of unprocessed information to accumulate and amplifying reasoning faults across the system. This study presents a non-redundant, complete set of eight plain-language prompts. The prompts mitigate common reasoning faults in time-critical clinical situations and provide a shared framework for making reasoning explicit. We tested this approach in a clinical case study, using the prompts to generate clear inputs ready for translation into technical requirements or workflow improvements. We also developed a mathematical model that interprets how these prompts influenced the backlog of unprocessed information in the case study, making their impact easier to evaluate. This study includes three main elements: the design of the minimal prompt set, a clinical case study demonstrating its practical application, and an interpretation of its effects on the accumulation of unprocessed information, highlighting reasoning bottlenecks. Figure 1 provides an overview of the full process, showing the underlying problems (left), the study design (center), and the impact (right). Download figure Open in new tab Fig 1. Overview of the study. The figure outlines the full process, starting with the underlying problems (left), moving through the study design (center), and ending with the expected impact (right). The approach targets system-level gaps, reasoning faults, and backlogs of unprocessed information by introducing a minimal eight-prompt set, testing it in a clinical case study, and interpreting its effects with a mathematical model. The resulting impact includes clearer inputs for design and operations, reduced backlog, better communication, and faster clinical responses without losing reliability. Results Prompt set The prompt set is a compact collection of plain-language questions that guide the full reasoning process across four stages: Search, Shape, Check, and Act. Whereas condition-specific checklists in clinical practice are typically applied once a diagnosis has been established and treatment is underway, the prompts support reasoning in situations where information is still incomplete and uncertainty is high. Each prompt targets one of eight common reasoning faults – omission, tunnel vision, conflation, fragmentation, clutter, misprioritization, overconfidence, and paralysis – and the types of unprocessed information they create. This design makes reasoning gaps visible in real time and helps reduce the backlog of unprocessed information that slows responses and introduces delays. Table 1 serves as a practical reference. For each prompt, it lists the guiding question, short instructions, and the type of backlog issue it helps resolve. Collectively, these components establish a structured way to make reasoning explicit. The underlying principles guiding the design of the prompt set are described in the Materials and methods section. View this table: View inline View popup Download powerpoint Table 1. Prompt reference. Each prompt includes a guiding question, practical steps, and the backlog issue it addresses. By connecting reasoning faults to backlog issues, the prompts provide a systematic way to uncover system-level gaps. We next demonstrate their use in a clinical case study on septic shock management, showing how they helped identify these gaps and how structured reasoning can be translated into clear technical requirements and targeted workflow improvements. Clinical case study Context We tested the prompt set in a clinical case study of septic shock, chosen because of its rapid progression, high mortality, and the frequent need to manage incomplete or conflicting information. The patient profile reflects an initial assessment on arrival commonly encountered in clinical practice: a male, aged 60–70 years, with impaired consciousness, diabetes mellitus, and cardiac arrhythmia, admitted to the emergency department with signs of septic shock. In addition to confirming sepsis and identifying its source, the clinical team needed to rule out both diabetic coma and acute cardiac pathology. The case was structured around established sepsis criteria, with team involvement and documentation procedures described in the Materials and methods. Application Across five observation points, a team of clinicians involved in the case study applied the prompts to structure reasoning in real time. This process exposed system-level issues or recurring gaps that disrupted information flow and clinical judgment. At each step, clinicians first defined the clinical context in terms of the findings available at that moment, and then identified the recurring issues where missing or delayed information slowed responses. A complete account of the case, including clinical findings, prompt responses, and issues identified at each step, together with clinician-documented scenarios showing how these issues arise in routine practice, is provided in Supplementary Information ( S1 Table , S2 Table ). The Sankey diagram ( Fig. 2 ) provides a visual summary of the case study, showing how prompts linked to issues across the five time steps. View this table: View inline View popup S1 Table. Prompt set in the initial management of septic shock. Structured case study showing how prompts were applied to identify system-level issues affecting information flow and clinical judgment. Prompts not applicable at a given step were skipped. View this table: View inline View popup Download powerpoint S2 Table. Clinician-reported scenarios illustrating system-level issues. Scenarios from routine clinical practice showing how each issue may arise in real-world settings. Download figure Open in new tab Fig 2. Application of the prompt set in a clinical case study on septic shock management. The Sankey diagram linking time steps (left), applied prompts (center), and identified system-level issues (right). At each time step, clinicians applied a subset of prompts to structure reasoning around available findings. This process revealed recurring system-level issues. The colors highlight distinct issue categories. It indicates that at each step clinicians applied a subset of prompts, and across the complete sequence every prompt was used at least once. Distinct issue categories are highlighted by color. Early in the process, What is missing? and Where else can I look? accounted for most issues (Steps 1–3), especially, delayed lab data, incomplete transfer of prior information, and poor coordination between related protocols. From Step 3 onward, What matters most? became dominant, surfacing multiple simultaneous critical abnormalities and showing how risks compound once partial data begins to arrive. The prompt How do I know this is right? repeatedly surfaced undefined minimal criteria, pointing to unclear confirmation rules across labs, imaging, and monitoring. What should I do first? was linked to conflicting multidisciplinary decisions at Steps 4–5, exposing friction within the team when urgent action was needed. Prompts that did not reveal new issues instead clarified available information, reducing ambiguity and keeping reasoning structured. To show how structured reasoning translates into clear inputs for system design and workflow improvements, we highlight an excerpt from the case study focusing on Steps 3–5 ( Table 2 ), where recurring issues converge and intensify. These steps illustrate how clinical data accumulate over time, while the prompts expose system-level issues by structuring reasoning and reducing unprocessed information. View this table: View inline View popup Download powerpoint Table 2. Excerpt from the septic shock case study. Each step shows the clinical findings available at that moment, the prompts used, and the system-level issues they revealed. The complete case study is provided in S1 Table . Translation The issues identified in Steps 3–5 were translated into four event-driven and state-driven requirements, summarized in the blocks below: keeping missing data visible until resolved, summarizing critical abnormalities by organ system, maintaining a shared record of urgent priorities across teams, and making diagnostic uncertainty explicit until standardized criteria are available. Requirement 1 (Event-driven) When results or history are missing, the system shall show them clearly and mark decisions as temporary. This prevents premature decisions from being treated as final . System-level issue addressed Delayed essential lab data; incomplete transfer of prior clinical information. Requirement 2 (Event-driven) When new critical findings appear, the system shall summarize them by organ system to show combined risk. This supports recognition of compounding risks . System-level issue addressed Multiple simultaneous critical abnormalities. Requirement 3 (State-driven) While urgent priorities are being managed, the system shall keep a shared, updated list across teams. This ensures all teams act on the same priorities . System-level issue addressed Conflicting multidisciplinary decisions. Requirement 4 (State-driven) When diagnostic criteria are unclear, the system shall highlight the uncertainty and align with standardized rules once available. This makes uncertainty explicit until clear rules are applicable . System-level issue addressed Undefined minimal criteria. These requirements illustrate how the prompts made critical gaps and risks more visible. In the next section, we model how the prompts affects the backlog of unprocessed information. Backlog dynamics Mathematical model Most existing models in healthcare focus on patient flow, task queues, or staff capacity. Our model instead captures the backlog of unprocessed information and how reasoning prompts shape it. By design, the prompt set aims to reduce the likelihood that crucial information will remain unprocessed. Building on this rationale, we developed a mathematical model to quantify how the prompts impact the backlog in clinical settings. Let t = 0, 1, …, n denote the discrete observation steps, where n is the final step in the observation period. The interval between two consecutive steps is given by Δ t . These intervals do not need to be evenly spaced, so their length may vary throughout the observation period. Let I t be the quantity of unprocessed information at time t . The discrete-time dynamics are given by where is the new information arriving in the interval from t to t + 1, with f > 0 a scaling parameter and P t ( λ ) the Poisson probability mass function with mean λ ; is the noise term, with w ≥ 0 quantifying the intensity of additive noise proportional to the current backlog (that is, the unprocessed information at time t ). The parameter w may vary over time due to organizational factors such as infrastructure and information flow within a medical facility, but is treated as constant to clarify the analysis of prompt effects; is the amount of information processed by the clinical team during the interval Δ t , where a > 0 denotes the intrinsic processing rate. The parameter a may, in general, be time dependent, reflecting factors such as fatigue, staffing, or patient load, but is held constant here to isolate the effects of the prompts; represents the combined impact of all selected prompts on the backlog at step t . Here, j = 1, …, k indexes the set of available prompts, where b j,t ∈ 0, 1 indicates whether the j -th prompt is applied at time t (1 if applied, 0 otherwise), and c j,t describes the immediate fractional effect of the j -th prompt on the backlog. A positive value c j,t > 0 indicates a reduction in unprocessed information, while c j,t < 0 reflects an increase. This behavior describes the expected impact of prompts. For example, What is missing? often uncovers gaps (e.g., pending labs, no history available). Making these gaps explicit temporarily enlarges the backlog ( c j,t < 0). However, this effect is constructive, since without the prompt the gaps would remain hidden, leaving the system unreliable. The prompts therefore do not always shrink the backlog immediately. Instead, they reshape it by exposing hidden issues that can then be addressed. In addition, the prompts interact dynamically. Resolving one issue may give rise to another. This transformation of issues is represented in the model by the time-varying values of c j,t . Steady-state behavior Steady-state analysis determines whether unprocessed information is eventually eliminated or persists in the system. Expanding Eq (1) with the definitions in Eq (2) – Eq (5) gives To find the equilibrium, set I t +1 = I t = I * , where I * is the steady-state value. Substituting this into Eq (6) above yields As t → ∞, the arrival rate of new information P t ( λ ) approaches zero, so I * = 0. Thus, the unique equilibrium corresponds to complete elimination of unprocessed information. Stability analysis Stability analysis is crucial for understanding whether the system returns to equilibrium after small disturbances. Consider a small perturbation δI t from equilibrium. For large t , the f P t ( λ ) term can be omitted, since it vanishes as the process concludes. The linearized update Eq (6) for the perturbation becomes Stability holds when the absolute value of the multiplier is less than one, as this guarantees that small deviations from the equilibrium decay with each time step: which makes all perturbations decay over time. For small enough time steps Δ t , Eq (7) reduces to thereby ensuring I * = 0 is a stable equilibrium. Minimum and maximum values The minimum and maximum values of I t ( Eq (6) ) provide additional insight into the system behavior, as these extremes indicate the potential range of unprocessed information during the observation period. Understanding these values is crucial for optimizing resource allocation: if the maximum value of I t is too high, it may indicate periods when the team is overloaded and additional personnel or capacity are required to process the incoming information effectively. The minimum is I t = 0, since a negative backlog is not possible. The maximum depends on the initial value, the time dependence of P t ( λ ), and the specific values of a, w , as well as the selection of b j,t and c j,t . Typically, I t increases as new information arrives, reaches a maximum near the peak of P t ( λ ), and decreases as arrivals decline and processing dominates. The time step t * at which I t attains its maximum can be found by setting I t +1 − I t = 0 in Eq (6) : where t * typically coincides with or near the peak of . By selecting parameter values a, w, b j,t , and c j,t appropriate to the clinical context, the discrete-time model presented here can be used to assess how effectively the prompt set impacts unprocessed information. Details on related models, model design, and the selection of parameters ( c, a, λ ) are provided in the Materials and methods section. Interpretation We applied the model to the septic shock case study to interpret the impact of the prompt set on the backlog of unprocessed information. The parameters were taken directly from the case study, reflecting the hospital setting, clinical team, infrastructure, and workflow. Figure 3 shows the simulated backlog I t ( Eq. 1 ) across time steps for two scenarios: the red dashed line represents performance without prompts, and the blue solid line shows performance with the prompt set. With prompts, the backlog reached a lower maximum and declined faster than in the baseline. The simulation indicates that the maximum backlog, the peak backlog, was reduced by 20.3% with prompts. The total backlog accumulated across all steps, the cumulative backlog, was reduced by 22.2%. The recovery, defined as the first step when the backlog fell to one unit or less, occurred at step five with prompts but was not reached under the baseline scenario. Details of parameter selection and metric definitions are provided in Materials and methods. The implementation of the backlog model, along with parameter estimates and key metrics, is provided in S1 File. Download figure Open in new tab Fig 3. Impact of prompts on the backlog of unprocessed information. The simulated backlog I t ( Eq. (1) ) for scenarios with and without prompts. With prompts, the peak backlog was 7.12 at t = 1; without prompts, 8.93 at t = 2 (20.3% reduction). With prompts, the cumulative backlog over the observation period was 22.2% lower, and recovery, defined as the first time the backlog falls to 1 unit or less, occurred at t = 5; without prompts, recovery was not reached. These improvements have direct practical implications. Lower peak backlog reduced the risk of overlooking critical findings during high information load. Reduced cumulative backlog meant more data were processed in time, with essential information integrated rather than left unresolved. Faster recovery helped the team regain situational clarity earlier, supporting clearer inputs for system design, better communication across the team, and quicker, more reliable responses with fewer delays in treatment. Discussion Lessons learned This study offers several practical insights and lessons learned. A key one was the value of plain-language prompts for structuring reasoning. Clinicians found that the prompts acted like ad-hoc checklists in situations of high uncertainty and limited time. Unlike fixed checklists, which assume the right pathway is already known, the prompts enriched the available information so that clinicians could decide which checklist or framework to apply. By breaking reasoning into simple steps, the prompts reduced ambiguity, surfaced overlooked issues, and kept critical information visible without adding cognitive burden. Another lesson is that the prompts helped make system-level gaps visible. By tracing where information was missing, delayed, or poorly shared, clinicians could see patterns that pointed to workflow problems rather than individual oversights. This shifted attention from personal error to structural issues, providing clearer input for improving communication and digital support systems. Limitations Several limitations should also be noted. The case study focused on a single condition, sepsis, in one hospital setting, which may limit direct generalizability. Second, the mathematical model was deliberately simplified to isolate the impact of prompts, and therefore does not capture the full complexity of team behavior, uncertainty, or evolving patient conditions. Third, the estimates for the key model parameters ( c, a, λ ) relied on clinician judgment, introducing subjectivity. Future directions This work points to several directions for further development. The prompt set can be extended beyond point-of-care use by linking it to low-code and AI-assisted development, where clear requirements are essential for building responsible and clinically relevant digital tools. Prompt mapping also has potential as an audit method. By comparing how prompts are used across cases, departments, or before and after digital interventions, hospitals could track shifts in workflow, identify which gaps are resolved, and detect new vulnerabilities. This could be particularly valuable in regulatory contexts, where evidence is needed to demonstrate that critical safety checks remain visible and no decision points are overlooked. Such audits could strengthen compliance reviews, target improvements, and reduce risks before widespread deployment. Further testing is needed to evaluate generalizability. Future studies should extend the approach to other acute conditions such as trauma, stroke, and cardiac arrest, and validate the backlog model with real-time data across multiple hospitals. Beyond backlog dynamics, research should also assess how prompts influence teamwork, diagnostic accuracy, and patient outcomes. Finally, adaptive prompt delivery, such as context-sensitive suggestions integrated into electronic health records or dashboards, could further reduce cognitive load while preserving clarity. Materials and methods Prompt set design The prompt set was designed to be minimal yet complete, covering the full reasoning process without redundancy. The design followed three principles: (1) each stage of reasoning is represented, (2) every prompt addresses a distinct reasoning fault documented in the literature [ 25 – 31 ], and (3) each fault is linked to a type of unprocessed information that slows clinical responses. The reasoning process was structured into four stages: Search, Shape, Check, and Act. These reflect common patterns in clinical reasoning, moving from gathering inputs to organizing them, checking priorities and assumptions, and deciding on actions. Each stage was linked to specific reasoning faults and the types of unprocessed information ( Table 3 ). View this table: View inline View popup Download powerpoint Table 3. Prompt design across reasoning stages. Each stage connects guiding questions with reasoning faults and types of unprocessed information. Each stage–fault link was expressed as a plain-language guiding question, paired with three to four short steps to make it usable in practice. The steps drew on clinical practice, where clinicians described how they reason under pressure, such as checking another source or asking for a second opinion. They were also informed by literature on cognitive strategies, aligning with heuristics like listing, grouping, or cross-checking to address reasoning faults. Finally, they were written in plain, action-oriented language so they could be applied in real clinical settings. To keep the set both minimal and complete, prompts were mapped onto a stage–fault matrix to ensure that each reasoning fault was addressed in the right stage. We then tested the set by removing prompts one by one. If removing a prompt left a fault uncovered or made another prompt carry overlapping functions, the prompt was kept. This process confirmed that all eight prompts were necessary to ensure complete coverage without overlap. The resulting set balances completeness with conciseness, aligning with Miller’s 7 ± 2 principle on limitation of working memory [ 18 ] to remain practical under time pressure. Case study setup The case study was structured around the qSOFA criteria [ 55 ] to ensure clinical relevance and alignment with established diagnostic frameworks. A team of clinicians experienced in emergency care and sepsis management estimated that the course of events from initial assessment on arrival to achieving a sufficient clinical picture for diagnosis corresponded to approximately five time points and 30 minutes in real practice. At each time point, the clinicians documented the findings available at that moment and worked through the prompts in the order provided in the prompt reference ( Table 1 ), skipping those not applicable. This structured reasoning process highlighted repeating prompts, which were grouped according to problems in the information flow. From these patterns, the clinicians identified recurring issues that reflected system-level gaps within the medical facility. For each issue, they also provided clinical scenarios from their routine practice where such problems typically arise. Clinicians organized their work using a structured layout that matched their reasoning process and made the case easier to document (S2 File). Each time point was placed at the top of a column, followed by the clinical findings available at that stage. Beneath, clinicians recorded their responses to the prompts, highlighting each stage of reasoning with a distinct color: white for finding missing information, blue for organizing and simplifying what is known, black for checking priorities and assumptions, and red for deciding what to do first. At the bottom, they reserved a separate space to list the system-level issues that surfaced during the process and show which prompt had triggered them. This layout allowed the team to track how information accumulated, how reasoning evolved, and how recurring issues emerged across steps. The identified issues were reviewed with hospital administrators, who assessed their relevance to existing workflows and potential digital interventions. Developers then formalized the prompt responses and issues into structured software requirements using the Easy Approach to Requirements Syntax (EARS) [ 56 , 57 ], ensuring consistency and reducing ambiguity, omission, and complexity. Model parameters and metrics The backlog model parameters were derived directly from the septic shock case study described above. This case, conducted in a hospital setting, reflected the characteristics of its clinical team, infrastructure, and workflow. Each parameter was selected to mirror this setting, ensuring that the model captured both the pace of new clinical inputs and the team’s capacity to process them ( Table 4 ). View this table: View inline View popup Download powerpoint Table 4. Scalar parameters. Model parameters of the backlog model derived from the septic shock case study. The arrival of new information was modeled as a Poisson process. The rate parameter λ was set to 1.2 to reflect the average number of new findings observed during the early phase of the case, when laboratory and monitoring results began to accumulate. The scale factor f was set to 15 to match the typical volume of information arriving per step. The initial backlog I 0 was set to 5, corresponding to the number of patient parameters documented at admission before additional findings began to accumulate. The team’s capacity to handle information was described by the processing rate coefficient a , set to 0.5 to represent the ability to resolve about half of the backlog per step. Since one step corresponded to 5–6 minutes (five steps over 30 minutes), this rate reflects a realistic pace for emergency care. The noise coefficient w was fixed at 0.15, representing the effect of unpredictable disturbances such as delayed lab results or communication bottlenecks. Prompt use was represented by a schedule b j,t ( Table 5 ) and effect values c j,t ( Table 6 ). These inputs captured when prompts were applied in practice and how they impacted backlog dynamics. View this table: View inline View popup Download powerpoint Table 5. Prompt schedule. Schedule showing which prompts were applied at each observation step. View this table: View inline View popup Download powerpoint Table 6. Prompt effects. Estimated impact of each prompt on the backlog of unprocessed information at each observation step. Using this parameterization, we simulated backlog dynamics for two scenarios: with prompts and without prompts. To interpret the impact of the prompt set, model performance was assessed with three complementary metrics, each capturing a different aspect of backlog behavior: The peak backlog, defined as the highest backlog observed across the observation period, the total backlog accumulated across all steps, and the recovery time, defined as the first step when the backlog falls to one unit or less: These metrics enabled comparison of the scenarios with and without prompts by capturing backlog intensity, total accumulation, and recovery time. Data Availability All relevant data are within the manuscript and its Supporting Information files. Supporting information S1 Table. Prompt set in the initial management of septic shock . A documented case study illustrates how prompts were applied to identify system-level issues affecting information flow and clinical judgment. Prompts not applicable at a given step were skipped. S2 Table. Clinician-reported scenarios illustrating system-level issues . Documented scenarios from routine clinical practice show how each issue can arise in real-world settings. S1 File. Backlog dynamics notebook . A Jupyter notebook provides parameter estimates from the case study, model implementation, and key metrics to compare system performance with and without prompts. S2 File. Structured case study documentation . A clinician-documented case study shows how prompts were applied across time points, with clinical findings, responses, and system-level issues recorded in an intuitive layout. Reasoning stages are highlighted in color, and issues are linked directly to the prompts that revealed them. Structured case study documentation Download figure Open in new tab Acknowledgments We thank all participants for sharing their perspectives during the pilot program, which contributed to refining the prompt set. We are also grateful to Dr. Mate Lerga from the Clinical Hospital Center, Rijeka, Croatia for his assistance in developing the clinician-reported scenarios used in the case study. References 1. ↵ Smetzer JL , Cohen MR . Lessons from the Denver medication error/criminal negligence case: Look beyond blaming individuals . Hospital Pharmacy . 1998 ; 33 ( 6 ): 640 – 657 . doi: 10.17226/11623 . OpenUrl CrossRef 2. ↵ Salber P. Wachter’s Digital Doctor explores the dark side of health IT . Mhealth . 2015 ; 1 ( 18 ). doi: 10.3978/j.issn.2306-9740.2015.09.01 . OpenUrl CrossRef 3. ↵ World Health Organization . Patient safety incident reporting and learning systems: technical report and guidance ; 2020 . Available from: https://www.who.int/publications/i/item/9789240032705 . 4. ↵ Agency for Healthcare Research and Quality . Data Reporting Tools ; 2021 . Available from: https://www.ahrq.gov/npsd/data/index.html . 5. The Japan Council for Quality Health Care . Project to collect medical near-miss/adverse event information ; 2022 . Available from: https://www.med-safe.jp/contents/english/index.html . 6. ↵ NHS England . Data on patient safety events ; 2023 . Available from: https://www.england.nhs.uk/patient-safety/patient-safety-insight/learning-from-patient-safety-events/data-on-patient-safety-events/ . 7. ↵ Aspden P , Wolcott J , Bootman JL , Cronenwett LR , editors Institute of Medicine Committee on Identifying and Preventing Medication Errors . Preventing Medication Errors . Aspden P , Wolcott J , Bootman JL , Cronenwett LR , editors. Washington, DC : The National Academies Press ; 2007 . 8. ↵ Kohn LT , Corrigan JM , Donaldson MS , editors Institute of Medicine Committee on Quality of Health Care in America . To err is human: Building a safer health system . Kohn LT , Corrigan JM , Donaldson MS , editors. DC : The National Academies Press ; 2000 . 9. Cook R , Rasmussen J. “Going solid”: a model of system dynamics and consequences for patient safety . BMJ Quality & Safety . 2005 ; 14 ( 2 ): 130 – 134 . doi: 10.1136/qshc.2003.009530 . OpenUrl Abstract / FREE Full Text 10. ↵ Hooftman J , Dijkstra AC , Suurmeijer I , van der Bij A , Paap E , Zwaan L. Common contributing factors of diagnostic error: A retrospective analysis of 109 serious adverse event reports from Dutch hospitals . BMJ Quality & Safety . 2024 ; 33 ( 10 ): 642 – 651 . doi: 10.1136/bmjqs-2022-015876 . OpenUrl Abstract / FREE Full Text 11. ↵ Rasmussen J , Lind M. In: Coping with complexity . Risø National Laboratory. Risø-M No . 2293 ; 1981 . 12. ↵ Nemeth C , O’connor M , Klock PA. R C. Mapping cognitive work: the way out of healthcare IT system failures . AMIA Annu Symp Proc . 2005 ; 2005 : 560 – 564 . doi: 10.1186/s12911-018-0584-z . OpenUrl CrossRef PubMed 13. ↵ Griffiths TL . Understanding human intelligence through human limitations . Trends in Cognitive Sciences . 2020 ; 24 ( 11 ): 873 – 883 . doi: 10.1016/j.tics.2020.09.001 . OpenUrl CrossRef PubMed 14. ↵ Tikhomirov L , Semmler C , McCradden M , Searston R , Ghassemi M , Oakden-Rayner L. Medical artificial intelligence for clinicians: the lost cognitive perspective . The Lancet Digital Health . 2024 ; 6 ( 8 ): e589 – e594 . doi: 10.1016/S2589-7500(24)00095-5 . OpenUrl CrossRef 15. ↵ Whelehan DF , Conlon KC , Ridgway PF . Medicine and heuristics: cognitive biases and medical decision-making . Irish journal of medical science . 2020 ; 189 ( 4 ): 1477 – 1484 . doi: 10.1007/s11845-020-02235-1 . OpenUrl CrossRef PubMed 16. Küper A , Lodde G , Livingstone E , Schadendorf D , Krämer N. Mitigating cognitive bias with clinical decision support systems: an experimental study . Journal of Decision Systems . 2024 ; 33 ( 3 ): 439 – 458 . doi: 10.1080/12460125.2023.2245215 . OpenUrl CrossRef 17. ↵ Ainge LE , Edgar AK , Kirkman JM , Armitage JA . Developing clinical reasoning along the cognitive continuum: A mixed methods evaluation of a novel Clinical Diagnosis Assessment . BMC Medical Education . 2025 ; 25 ( 1 ): 31 . doi: 10.1186/s12909-024-06613-6 . OpenUrl CrossRef PubMed 18. ↵ Miller GA . The magical number seven, plus or minus two: Some limits on our capacity for processing information . Psychological Review . 1956 ; 63 ( 2 ): 81 – 97 . doi: 10.1037/h0043158 . OpenUrl CrossRef PubMed Web of Science 19. Cowan N. The magical number 4 in short-term memory: a reconsideration of mental storage capacity . The Behavioral and brain sciences . 2001 ; 24 ( 1 ): 87 – 114 . doi: 10.1017/s0140525×01003922 . OpenUrl CrossRef PubMed Web of Science 20. Gobet F , Clarkson G. Chunks in expert memory: evidence for the magical number four … or is it two? Memory . 2004 ; 12 ( 6 ): 732 – 747 . doi: 10.1080/09658210344000530 . OpenUrl CrossRef PubMed Web of Science 21. ↵ Thalmann M , Souza AS , Oberauer K. How does chunking help working memory? Journal of Experimental Psychology Learning, Memory, and Cognition . 2019 ; 45 ( 1 ): 37 – 55 . doi: 10.1037/xlm0000578 . OpenUrl CrossRef PubMed 22. ↵ Lyell D , Magrabi F , Coiera E. The effect of cognitive load and task complexity on automation bias in electronic prescribing . Human factors . 2018 ; 60 ( 7 ): 1008 – 1021 . doi: 10.1177/0018720818781224 . OpenUrl CrossRef PubMed 23. Coiera E , Kocaballi B , Halamka J , & Laranjo L. The digital scribe . npj Digital Medicine . 2018 ; 1 ( 58 ): e2448714 – e2448714 . doi: 10.1038/s41746-018-0066-9 . OpenUrl CrossRef 24. ↵ Andersson U , Maurin Söderholm H , Wireklint Sundström B , Andersson Hagiwara M , Andersson H. Clinical reasoning in the emergency medical services: an integrative review . Scandinavian Journal of Trauma, Resuscitation and Emergency Medicine . 2019 ; 27 ( 1 ): 76 . doi: 10.1186/s13049-019-0646-y . OpenUrl CrossRef 25. ↵ Ng M , Wong E , Sim GG , Heng PJ , Terry G , Yann FY . Dropping the baton: Cognitive biases in emergency physicians . PLOS ONE . 2025 ; 20 ( 1 ): 1 – 15 . doi: 10.1371/journal.pone.0316361 . OpenUrl CrossRef 26. ↵ Ogdie A , Reilly J , Pang W , Keddem S , Barg F , Von Feldt J , et al. Seen through their eyes: residents’ reflections on the cognitive and contextual components of diagnostic errors in medicine . Acad Med . 2012 ; 87 ( 10 ): 1361 – 1367 . doi: 10.1097/ACM.0b013e31826742c9 . OpenUrl CrossRef PubMed Web of Science 27. Newman-Toker DE . From Possible to Probable to Sure to Wrong—Premature Closure and Anchoring in a Complicated Case . PSNet [internet] . 2013 ;. 28. Green B , Parry D , Oeppen R , Plint S , Dale T , Brennan P. Situational awareness - what it means for clinicians, its recognition and importance in patient safety . Oral Dis . 2017 ; 23 ( 6 ): 721 – 725 . doi: 10.1111/odi.12547 . OpenUrl CrossRef PubMed 29. ↵ Redelmeier D. E S. The Fallacy of a Single Diagnosis . Med Decis Making . 2023 ; 43 ( 2 ): 183 – 190 . doi: 10.1177/0272989X231185372 . OpenUrl CrossRef PubMed 30. ↵ Moacdieh N , Ganje T , Sarter N. Electronic health records: effects of clutter and stress on physicians’ information search and noticing performance . Proceedings of the Human Factors and Ergonomics Society Annual Meeting . 2014 ; 58 ( 1 ): 718 – 722 . doi: 10.1177/1541931214581167 . OpenUrl CrossRef 31. ↵ Kunitomo K , Harada T , Watari T. Cognitive biases encountered by physicians in the emergency room . BMC Emergency Medicine . 2022 ; 22 ( 1 ): 148 . doi: 10.1186/s12873-022-00708-3 . OpenUrl CrossRef PubMed 32. ↵ Chen M , Wang Y , Wang Q , Shi J , Wang H , Ye Z , et al. Impact of human and artificial intelligence collaboration on workload reduction in medical image interpretation . npj Digital Medicine . 2024 ; 7 ( 1 ): 349 . doi: 10.1038/s41746-024-01328-w . OpenUrl CrossRef PubMed 33. ↵ Kim J , Chen ML , Rezaei SJ , Liang AS , Seav SM , Onyeka S , et al. Perspectives on Artificial Intelligence–generated responses to patient messages . JAMA Network Open . 2024 ; 7 ( 10 ): e2438535 – e2438535 . doi: 10.1001/jamanetworkopen.2024.38535 . OpenUrl CrossRef PubMed 34. ↵ Ghassemi M. Presentation matters for AI-generated clinical advice . Nature Human Behaviour . 2023 ; 7 ( 11 ): 1833 – 1835 . doi: 10.1038/s41562-023-01721-7 . OpenUrl CrossRef PubMed 35. Ali R , Connolly ID , Tang OY , Mirza FN , Johnston B , Abdulrazeq HF , et al. Bridging the literacy gap for surgical consents: an AI-human expert collaborative approach . npj Digital Medicine . 2024 ; 7 ( 1 ): 63 . doi: 10.1038/s41746-024-01039-2 . OpenUrl CrossRef PubMed 36. ↵ Pavuluri S , Sangal R , Sather J , Taylor RA . Balancing act: the complex role of artificial intelligence in addressing burnout and healthcare workforce dynamics . BMJ Health & Care Informatics . 2024 ; 31 ( 1 ): e101120 . doi: 10.1136/bmjhci-2024-101120 . OpenUrl Abstract / FREE Full Text 37. ↵ Liu X , Glocker B , McCradden MM , Ghassemi M , Denniston AK , Oakden-Rayner L. The medical algorithmic audit . The Lancet Digital Health . 2022 ; 4 ( 5 ): e384 – e397 . doi: 10.1016/S2589-7500(22)00003-6 . OpenUrl CrossRef PubMed 38. ↵ Cross JL , Choma MA , Onofrey JA . Bias in medical AI: Implications for clinical decision-making . PLOS Digital Health . 2024 ; 3 ( 11 ): 1 – 19 . doi: 10.1371/journal.pdig.0000651 . OpenUrl CrossRef 39. ↵ Aristidou A , Jena R , Topol EJ . Bridging the chasm between AI and clinical implementation . The Lancet . 2022 ; 399 ( 10325 ): 620 . doi: 10.1016/S0140-6736(22)00235-5 . OpenUrl CrossRef 40. ↵ Jongsma KR , Sand M , Milota M. Why we should not mistake accuracy of medical AI for efficiency . npj Digital Medicine . 2024 ; 7 ( 1 ): 57 . doi: 10.1038/s41746-024-01047-2 . OpenUrl CrossRef PubMed 41. ↵ Quiroz JC , Laranjo L , Kocaballi AB , Berkovsky S , Rezazadegan D , Coiera E. Challenges of developing a digital scribe to reduce clinical documentation burden . npj Digital Medicine . 2019 ; 2 ( 114 ): e101120 . doi: 10.1038/s41746-019-0190-1 . OpenUrl CrossRef 42. ↵ Wosny M , Strasser LM , Hastings J. The paradoxes of digital tools in hospitals: Qualitative interview study . J Med Internet Res . 2024 ; 26 : e56095 . doi: 10.2196/56095 . OpenUrl CrossRef PubMed 43. ↵ Liu H , Ding N , Li X , Chen Y , Sun H , Huang Y , et al. Artificial Intelligence and radiologist burnout . JAMA Network Open . 2024 ; 7 ( 11 ): e2448714 – e2448714 . doi: 10.1001/jamanetworkopen.2024.48714 . OpenUrl CrossRef 44. ↵ Ball SL , Rucci JM , Molloy-Paolillo BK , Cutrona SL , Brunner J , Mohr DC , et al. “For the first time … I am seriously fighting burnout”: clinician experiences with a challenging electronic health record transition . JAMIA Open . 2024 ; 7 ( 3 ): ooae067 . doi: 10.1093/jamiaopen/ooae067 . OpenUrl CrossRef 45. ↵ Lintern G , Motavalli A. Healthcare information systems: the cognitive challenge . BMC Medical Informatics and Decision Making . 2018 ; 18 ( 1 ): 3 . doi: 10.1186/s12911-018-0584-z . OpenUrl CrossRef 46. Kannampallil T , Adler-Milstein J. Using electronic health record audit log data for research: insights from early efforts . J Am Med Inform Assoc . 2022 ; 30 ( 1 ): 167 – 171 . doi: 10.1093/jamia/ocac173 . OpenUrl CrossRef PubMed 47. Ehrmann DE , Gallant SN , Nagaraj S , Goodfellow SD , Eytan D , Goldenberg A , et al. Evaluating and reducing cognitive load should be a priority for machine learning in healthcare . Nature Medicine . 2022 ; 28 ( 7 ): 1331 – 1333 . doi: 10.1038/s41591-022-01833-z . OpenUrl CrossRef PubMed 48. Scott IA . Using information technology to reduce diagnostic error: still a bridge too far? Internal Medicine Journal . 2022 ; 52 ( 6 ): 908 – 911 . doi: 10.1111/imj.15804 . OpenUrl CrossRef PubMed 49. Sheahan M. Ghosts in the machine . Journal of Vascular Surgery . 2023 ; 77 ( 6 ): 1803 . doi: 10.1016/j.jvs.2023.01.199 . OpenUrl CrossRef PubMed 50. ↵ Asgari E , Kaur J , Nuredini G , Balloch J , Taylor AM , Sebire N , et al. Impact of electronic health record use on cognitive load and burnout among clinicians: Narrative review . JMIR Med Inform . 2024 ; 12 : e55499 . doi: 10.2196/55499 . OpenUrl CrossRef PubMed 51. ↵ Landers C , Vayena E , Amann J , Blasimme A. Stuck in translation: Stakeholder perspectives on impediments to responsible digital health . Front Digit Health . 2023 ; 5 : 1069410 . doi: 10.3389/fdgth.2023.1069410 . OpenUrl CrossRef PubMed 52. Boag W , Hasan A , Kim JY , Revoir M , Nichols M , Ratliff W , et al. The algorithm journey map: A tangible approach to implementing AI solutions in healthcare . npj Digital Medicine . 2024 ; 7 ( 1 ): 87 . doi: 10.1038/s41746-024-01061-4 . OpenUrl CrossRef PubMed 53. Akello CK , Nabukenya J. Users involvement in the electronic health information systems development process in Uganda: what is missing in relation to requirements gathering and analysis . Oxford Open Digital Health . 2024 ; 2 : oqae020 . doi: 10.1093/oodh/oqae020 . OpenUrl CrossRef 54. ↵ Tennant R , Graham J , Kern J , Mercer K , Ansermino JM , Burns CM . A scoping review on pediatric sepsis prediction technologies in healthcare . npj Digital Medicine . 2024 ; 7 ( 1 ): 353 . doi: 10.1038/s41746-024-01361-9 . OpenUrl CrossRef PubMed 55. ↵ Society of Critical Care Medicine . Surviving Sepsis Campaign Guidelines ; 2021 . Available from: https://www.sccm.org/clinical-resources/guidelines/guidelines/surviving-sepsis-guidelines-2021 . 56. ↵ Mavin A , Wilkinson P , Harwood A , Novak M. Easy Approach to Requirements Syntax (EARS) . In: 2009 17th IEEE International Requirements Engineering Conference ; 2009 . p. 317 – 322 . 57. ↵ AWS . Kiro: The AI IDE for prototype to production ; 2025 . Available from: https://kiro.dev/ . View the discussion thread. Back to top Previous Next Posted September 24, 2025. Download PDF Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following A minimal set of prompts to surface reasoning in digital health Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share A minimal set of prompts to surface reasoning in digital health Ilona Kulikosvkikh , Tarzan Legović , Sergey Konovalov , Alexander Kolsanov , Tomislav Šmuc medRxiv 2025.09.22.25336413; doi: https://doi.org/10.1101/2025.09.22.25336413 Share This Article: Copy Citation Tools A minimal set of prompts to surface reasoning in digital health Ilona Kulikosvkikh , Tarzan Legović , Sergey Konovalov , Alexander Kolsanov , Tomislav Šmuc medRxiv 2025.09.22.25336413; doi: https://doi.org/10.1101/2025.09.22.25336413 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Health Informatics Subject Areas All Articles Addiction Medicine (568) Allergy and Immunology (863) Anesthesia (297) Cardiovascular Medicine (4421) Dentistry and Oral Medicine (443) Dermatology (382) Emergency Medicine (606) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1507) Epidemiology (15212) Forensic Medicine (30) Gastroenterology (1121) Genetic and Genomic Medicine (6581) Geriatric Medicine (667) Health Economics (996) Health Informatics (4520) Health Policy (1366) Health Systems and Quality Improvement (1611) Hematology (539) HIV/AIDS (1264) Infectious Diseases (except HIV/AIDS) (15906) Intensive Care and Critical Care Medicine (1103) Medical Education (620) Medical Ethics (144) Nephrology (667) Neurology (6580) Nursing (345) Nutrition (998) Obstetrics and Gynecology (1141) Occupational and Environmental Health (956) Oncology (3324) Ophthalmology (970) Orthopedics (369) Otolaryngology (420) Pain Medicine (435) Palliative Medicine (129) Pathology (663) Pediatrics (1689) Pharmacology and Therapeutics (691) Primary Care Research (710) Psychiatry and Clinical Psychology (5432) Public and Global Health (9212) Radiology and Imaging (2193) Rehabilitation Medicine and Physical Therapy (1368) Respiratory Medicine (1194) Rheumatology (593) Sexual and Reproductive Health (709) Sports Medicine (529) Surgery (709) Toxicology (99) Transplantation (288) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'9ff4c6343d130db4',t:'MTc3OTM3OTAxOA=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();
Text is read by the "Ask this paper" AI Q&A widget below.
Extraction quality varies by source — PMC NXML preserves structure
cleanly, OA-HTML may include some navigation residue, and OA-PDF can
have broken hyphenation. The publisher copy
(via DOI)
is the canonical version.