Multimodal Machine Learning Approach for Diagnosing... | F1000Research "use strict";function _typeof(t){return(_typeof="function"==typeof Symbol&&"symbol"==typeof Symbol.iterator?function(t){return typeof t}:function(t){return t&&"function"==typeof Symbol&&t.constructor===Symbol&&t!==Symbol.prototype?"symbol":typeof t})(t)}!function(){var t=function(){var t,e,o=[],n=window,r=n;for(;r;){try{if(r.frames.__tcfapiLocator){t=r;break}}catch(t){}if(r===n.top)break;r=r.parent}t||(!function t(){var e=n.document,o=!!n.frames.__tcfapiLocator;if(!o)if(e.body){var r=e.createElement("iframe");r.style.cssText="display:none",r.name="__tcfapiLocator",e.body.appendChild(r)}else setTimeout(t,5);return!o}(),n.__tcfapi=function(){for(var t=arguments.length,n=new Array(t),r=0;r 3&&2===parseInt(n[1],10)&&"boolean"==typeof n[3]&&(e=n[3],"function"==typeof n[2]&&n[2]("set",!0)):"ping"===n[0]?"function"==typeof n[2]&&n[2]({gdprApplies:e,cmpLoaded:!1,cmpStatus:"stub"}):o.push(n)},n.addEventListener("message",(function(t){var e="string"==typeof t.data,o={};if(e)try{o=JSON.parse(t.data)}catch(t){}else o=t.data;var n="object"===_typeof(o)&&null!==o?o.__tcfapiCall:null;n&&window.__tcfapi(n.command,n.version,(function(o,r){var a={__tcfapiReturn:{returnValue:o,success:r,callId:n.callId}};t&&t.source&&t.source.postMessage&&t.source.postMessage(e?JSON.stringify(a):a,"*")}),n.parameter)}),!1))};"undefined"!=typeof module?module.exports=t:t()}(); dataLayer = dataLayer || []; // Standard GTM initialization - Google Consent Mode handles consent automatically (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start': new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0], j=d.createElement(s),dl=l!='dataLayer'?'&l='+l:'';j.async=true;j.src= 'https://www.googletagmanager.com/gtm.js?id='+i+dl+ '>m_auth=hzk0Vc3qFsQYhCrIoHz68A>m_preview=env-1>m_cookies_win=x';f.parentNode.insertBefore(j,f); })(window,document,'script','dataLayer','GTM-MWFK8L5J'); ;window.NREUM||(NREUM={});NREUM.init={distributed_tracing:{enabled:true},privacy:{cookies_enabled:true},ajax:{deny_list:["bam.nr-data.net"]}}; ;NREUM.loader_config={accountID:"438030",trustKey:"438030",agentID:"772317073",licenseKey:"97f8f67f26",applicationID:"772317073"} ;NREUM.info={beacon:"bam.nr-data.net",errorBeacon:"bam.nr-data.net",licenseKey:"97f8f67f26",applicationID:"772317073",sa:1} ;/*! For license information please see nr-loader-spa-1.236.0.min.js.LICENSE.txt */ (()=>{"use strict";var e,t,r={5763:(e,t,r)=>{r.d(t,{P_:()=>l,Mt:()=>g,C5:()=>s,DL:()=>v,OP:()=>T,lF:()=>D,Yu:()=>y,Dg:()=>h,CX:()=>c,GE:()=>b,sU:()=>_});var n=r(8632),i=r(9567);const o={beacon:n.ce.beacon,errorBeacon:n.ce.errorBeacon,licenseKey:void 0,applicationID:void 0,sa:void 0,queueTime:void 0,applicationTime:void 0,ttGuid:void 0,user:void 0,account:void 0,product:void 0,extra:void 0,jsAttributes:{},userAttributes:void 0,atts:void 0,transactionName:void 0,tNamePlain:void 0},a={};function s(e){if(!e)throw new Error("All info objects require an agent identifier!");if(!a[e])throw new Error("Info for ".concat(e," was never set"));return a[e]}function c(e,t){if(!e)throw new Error("All info objects require an agent identifier!");a[e]=(0,i.D)(t,o),(0,n.Qy)(e,a[e],"info")}var u=r(7056);const d=()=>{const e={blockSelector:"[data-nr-block]",maskInputOptions:{password:!0}};return{allow_bfcache:!0,privacy:{cookies_enabled:!0},ajax:{deny_list:void 0,enabled:!0,harvestTimeSeconds:10},distributed_tracing:{enabled:void 0,exclude_newrelic_header:void 0,cors_use_newrelic_header:void 0,cors_use_tracecontext_headers:void 0,allowed_origins:void 0},session:{domain:void 0,expiresMs:u.oD,inactiveMs:u.Hb},ssl:void 0,obfuscate:void 0,jserrors:{enabled:!0,harvestTimeSeconds:10},metrics:{enabled:!0},page_action:{enabled:!0,harvestTimeSeconds:30},page_view_event:{enabled:!0},page_view_timing:{enabled:!0,harvestTimeSeconds:30,long_task:!1},session_trace:{enabled:!0,harvestTimeSeconds:10},harvest:{tooManyRequestsDelay:60},session_replay:{enabled:!1,harvestTimeSeconds:60,sampleRate:.1,errorSampleRate:.1,maskTextSelector:"*",maskAllInputs:!0,get blockClass(){return"nr-block"},get ignoreClass(){return"nr-ignore"},get maskTextClass(){return"nr-mask"},get blockSelector(){return e.blockSelector},set blockSelector(t){e.blockSelector+=",".concat(t)},get maskInputOptions(){return e.maskInputOptions},set maskInputOptions(t){e.maskInputOptions={...t,password:!0}}},spa:{enabled:!0,harvestTimeSeconds:10}}},f={};function l(e){if(!e)throw new Error("All configuration objects require an agent identifier!");if(!f[e])throw new Error("Configuration for ".concat(e," was never set"));return f[e]}function h(e,t){if(!e)throw new Error("All configuration objects require an agent identifier!");f[e]=(0,i.D)(t,d()),(0,n.Qy)(e,f[e],"config")}function g(e,t){if(!e)throw new Error("All configuration objects require an agent identifier!");var r=l(e);if(r){for(var n=t.split("."),i=0;i {r.d(t,{D:()=>i});var n=r(50);function i(e,t){try{if(!e||"object"!=typeof e)return(0,n.Z)("Setting a Configurable requires an object as input");if(!t||"object"!=typeof t)return(0,n.Z)("Setting a Configurable requires a model to set its initial properties");const r=Object.create(Object.getPrototypeOf(t),Object.getOwnPropertyDescriptors(t)),o=0===Object.keys(r).length?e:r;for(let a in o)if(void 0!==e[a])try{"object"==typeof e[a]&&"object"==typeof t[a]?r[a]=i(e[a],t[a]):r[a]=e[a]}catch(e){(0,n.Z)("An error occurred while setting a property of a Configurable",e)}return r}catch(e){(0,n.Z)("An error occured while setting a Configurable",e)}}},6818:(e,t,r)=>{r.d(t,{Re:()=>i,gF:()=>o,q4:()=>n});const n="1.236.0",i="PROD",o="CDN"},385:(e,t,r)=>{r.d(t,{FN:()=>a,IF:()=>u,Nk:()=>f,Tt:()=>s,_A:()=>o,il:()=>n,pL:()=>c,v6:()=>i,w1:()=>d});const n="undefined"!=typeof window&&!!window.document,i="undefined"!=typeof WorkerGlobalScope&&("undefined"!=typeof self&&self instanceof WorkerGlobalScope&&self.navigator instanceof WorkerNavigator||"undefined"!=typeof globalThis&&globalThis instanceof WorkerGlobalScope&&globalThis.navigator instanceof WorkerNavigator),o=n?window:"undefined"!=typeof WorkerGlobalScope&&("undefined"!=typeof self&&self instanceof WorkerGlobalScope&&self||"undefined"!=typeof globalThis&&globalThis instanceof WorkerGlobalScope&&globalThis),a=""+o?.location,s=/iPad|iPhone|iPod/.test(navigator.userAgent),c=s&&"undefined"==typeof SharedWorker,u=(()=>{const e=navigator.userAgent.match(/Firefox[/\s](\d+\.\d+)/);return Array.isArray(e)&&e.length>=2?+e[1]:0})(),d=Boolean(n&&window.document.documentMode),f=!!navigator.sendBeacon},1117:(e,t,r)=>{r.d(t,{w:()=>o});var n=r(50);const i={agentIdentifier:"",ee:void 0};class o{constructor(e){try{if("object"!=typeof e)return(0,n.Z)("shared context requires an object as input");this.sharedContext={},Object.assign(this.sharedContext,i),Object.entries(e).forEach((e=>{let[t,r]=e;Object.keys(i).includes(t)&&(this.sharedContext[t]=r)}))}catch(e){(0,n.Z)("An error occured while setting SharedContext",e)}}}},8e3:(e,t,r)=>{r.d(t,{L:()=>d,R:()=>c});var n=r(2177),i=r(1284),o=r(4322),a=r(3325);const s={};function c(e,t){const r={staged:!1,priority:a.p[t]||0};u(e),s[e].get(t)||s[e].set(t,r)}function u(e){e&&(s[e]||(s[e]=new Map))}function d(){let e=arguments.length>0&&void 0!==arguments[0]?arguments[0]:"",t=arguments.length>1&&void 0!==arguments[1]?arguments[1]:"feature";if(u(e),!e||!s[e].get(t))return a(t);s[e].get(t).staged=!0;const r=[...s[e]];function a(t){const r=e?n.ee.get(e):n.ee,a=o.X.handlers;if(r.backlog&&a){var s=r.backlog[t],c=a[t];if(c){for(var u=0;s&&u {let[t,r]=e;return r.staged}))&&(r.sort(((e,t)=>e[1].priority-t[1].priority)),r.forEach((e=>{let[t]=e;a(t)})))}function f(e,t){var r=e[1];(0,i.D)(t[r],(function(t,r){var n=e[0];if(r[0]===n){var i=r[1],o=e[3],a=e[2];i.apply(o,a)}}))}},2177:(e,t,r)=>{r.d(t,{c:()=>f,ee:()=>u});var n=r(8632),i=r(2210),o=r(1284),a=r(5763),s="nr@context";let c=(0,n.fP)();var u;function d(){}function f(e){return(0,i.X)(e,s,l)}function l(){return new d}function h(){u.aborted=!0,u.backlog={}}c.ee?u=c.ee:(u=function e(t,r){var n={},c={},f={},g=!1;try{g=16===r.length&&(0,a.OP)(r).isolatedBacklog}catch(e){}var p={on:b,addEventListener:b,removeEventListener:y,emit:v,get:x,listeners:w,context:m,buffer:A,abort:h,aborted:!1,isBuffering:E,debugId:r,backlog:g?{}:t&&"object"==typeof t.backlog?t.backlog:{}};return p;function m(e){return e&&e instanceof d?e:e?(0,i.X)(e,s,l):l()}function v(e,r,n,i,o){if(!1!==o&&(o=!0),!u.aborted||i){t&&o&&t.emit(e,r,n);for(var a=m(n),s=w(e),d=s.length,f=0;fn,p:()=>i});var n=r(2177).ee.get("handle");function i(e,t,r,i,o){o?(o.buffer([e],i),o.emit(e,t,r)):(n.buffer([e],i),n.emit(e,t,r))}},4322:(e,t,r)=>{r.d(t,{X:()=>o});var n=r(5546);o.on=a;var i=o.handlers={};function o(e,t,r,o){a(o||n.E,i,e,t,r)}function a(e,t,r,i,o){o||(o="feature"),e||(e=n.E);var a=t[o]=t[o]||{};(a[r]=a[r]||[]).push([e,i])}},3239:(e,t,r)=>{r.d(t,{bP:()=>s,iz:()=>c,m$:()=>a});var n=r(385);let i=!1,o=!1;try{const e={get passive(){return i=!0,!1},get signal(){return o=!0,!1}};n._A.addEventListener("test",null,e),n._A.removeEventListener("test",null,e)}catch(e){}function a(e,t){return i||o?{capture:!!e,passive:i,signal:t}:!!e}function s(e,t){let r=arguments.length>2&&void 0!==arguments[2]&&arguments[2],n=arguments.length>3?arguments[3]:void 0;window.addEventListener(e,t,a(r,n))}function c(e,t){let r=arguments.length>2&&void 0!==arguments[2]&&arguments[2],n=arguments.length>3?arguments[3]:void 0;document.addEventListener(e,t,a(r,n))}},4402:(e,t,r)=>{r.d(t,{Ht:()=>u,M:()=>c,Rl:()=>a,ky:()=>s});var n=r(385);const i="xxxxxxxx-xxxx-4xxx-yxxx-xxxxxxxxxxxx";function o(e,t){return e?15&e[t]:16*Math.random()|0}function a(){const e=n._A?.crypto||n._A?.msCrypto;let t,r=0;return e&&e.getRandomValues&&(t=e.getRandomValues(new Uint8Array(31))),i.split("").map((e=>"x"===e?o(t,++r).toString(16):"y"===e?(3&o()|8).toString(16):e)).join("")}function s(e){const t=n._A?.crypto||n._A?.msCrypto;let r,i=0;t&&t.getRandomValues&&(r=t.getRandomValues(new Uint8Array(31)));const a=[];for(var s=0;s {r.d(t,{Bq:()=>n,Hb:()=>o,oD:()=>i});const n="NRBA",i=144e5,o=18e5},7894:(e,t,r)=>{function n(){return Math.round(performance.now())}r.d(t,{z:()=>n})},7243:(e,t,r)=>{r.d(t,{e:()=>o});var n=r(385),i={};function o(e){if(e in i)return i[e];if(0===(e||"").indexOf("data:"))return{protocol:"data"};let t;var r=n._A?.location,o={};if(n.il)t=document.createElement("a"),t.href=e;else try{t=new URL(e,r.href)}catch(e){return o}o.port=t.port;var a=t.href.split("://");!o.port&&a[1]&&(o.port=a[1].split("/")[0].split("@").pop().split(":")[1]),o.port&&"0"!==o.port||(o.port="https"===a[0]?"443":"80"),o.hostname=t.hostname||r.hostname,o.pathname=t.pathname,o.protocol=a[0],"/"!==o.pathname.charAt(0)&&(o.pathname="/"+o.pathname);var s=!t.protocol||":"===t.protocol||t.protocol===r.protocol,c=t.hostname===r.hostname&&t.port===r.port;return o.sameOrigin=s&&(!t.hostname||c),"/"===o.pathname&&(i[e]=o),o}},50:(e,t,r)=>{function n(e,t){"function"==typeof console.warn&&(console.warn("New Relic: ".concat(e)),t&&console.warn(t))}r.d(t,{Z:()=>n})},2587:(e,t,r)=>{r.d(t,{N:()=>c,T:()=>u});var n=r(2177),i=r(5546),o=r(8e3),a=r(3325);const s={stn:[a.D.sessionTrace],err:[a.D.jserrors,a.D.metrics],ins:[a.D.pageAction],spa:[a.D.spa],sr:[a.D.sessionReplay,a.D.sessionTrace]};function c(e,t){const r=n.ee.get(t);e&&"object"==typeof e&&(Object.entries(e).forEach((e=>{let[t,n]=e;void 0===u[t]&&(s[t]?s[t].forEach((e=>{n?(0,i.p)("feat-"+t,[],void 0,e,r):(0,i.p)("block-"+t,[],void 0,e,r),(0,i.p)("rumresp-"+t,[Boolean(n)],void 0,e,r)})):n&&(0,i.p)("feat-"+t,[],void 0,void 0,r),u[t]=Boolean(n))})),Object.keys(s).forEach((e=>{void 0===u[e]&&(s[e]?.forEach((t=>(0,i.p)("rumresp-"+e,[!1],void 0,t,r))),u[e]=!1)})),(0,o.L)(t,a.D.pageViewEvent))}const u={}},2210:(e,t,r)=>{r.d(t,{X:()=>i});var n=Object.prototype.hasOwnProperty;function i(e,t,r){if(n.call(e,t))return e[t];var i=r();if(Object.defineProperty&&Object.keys)try{return Object.defineProperty(e,t,{value:i,writable:!0,enumerable:!1}),i}catch(e){}return e[t]=i,i}},1284:(e,t,r)=>{r.d(t,{D:()=>n});const n=(e,t)=>Object.entries(e||{}).map((e=>{let[r,n]=e;return t(r,n)}))},4351:(e,t,r)=>{r.d(t,{P:()=>o});var n=r(2177);const i=()=>{const e=new WeakSet;return(t,r)=>{if("object"==typeof r&&null!==r){if(e.has(r))return;e.add(r)}return r}};function o(e){try{return JSON.stringify(e,i())}catch(e){try{n.ee.emit("internal-error",[e])}catch(e){}}}},3960:(e,t,r)=>{r.d(t,{K:()=>a,b:()=>o});var n=r(3239);function i(){return"undefined"==typeof document||"complete"===document.readyState}function o(e,t){if(i())return e();(0,n.bP)("load",e,t)}function a(e){if(i())return e();(0,n.iz)("DOMContentLoaded",e)}},8632:(e,t,r)=>{r.d(t,{EZ:()=>u,Qy:()=>c,ce:()=>o,fP:()=>a,gG:()=>d,mF:()=>s});var n=r(7894),i=r(385);const o={beacon:"bam.nr-data.net",errorBeacon:"bam.nr-data.net"};function a(){return i._A.NREUM||(i._A.NREUM={}),void 0===i._A.newrelic&&(i._A.newrelic=i._A.NREUM),i._A.NREUM}function s(){let e=a();return e.o||(e.o={ST:i._A.setTimeout,SI:i._A.setImmediate,CT:i._A.clearTimeout,XHR:i._A.XMLHttpRequest,REQ:i._A.Request,EV:i._A.Event,PR:i._A.Promise,MO:i._A.MutationObserver,FETCH:i._A.fetch}),e}function c(e,t,r){let i=a();const o=i.initializedAgents||{},s=o[e]||{};return Object.keys(s).length||(s.initializedAt={ms:(0,n.z)(),date:new Date}),i.initializedAgents={...o,[e]:{...s,[r]:t}},i}function u(e,t){a()[e]=t}function d(){return function(){let e=a();const t=e.info||{};e.info={beacon:o.beacon,errorBeacon:o.errorBeacon,...t}}(),function(){let e=a();const t=e.init||{};e.init={...t}}(),s(),function(){let e=a();const t=e.loader_config||{};e.loader_config={...t}}(),a()}},7956:(e,t,r)=>{r.d(t,{N:()=>i});var n=r(3239);function i(e){let t=arguments.length>1&&void 0!==arguments[1]&&arguments[1],r=arguments.length>2?arguments[2]:void 0,i=arguments.length>3?arguments[3]:void 0;return void(0,n.iz)("visibilitychange",(function(){if(t)return void("hidden"==document.visibilityState&&e());e(document.visibilityState)}),r,i)}},1214:(e,t,r)=>{r.d(t,{em:()=>v,u5:()=>N,QU:()=>S,_L:()=>I,Gm:()=>L,Lg:()=>M,gy:()=>U,BV:()=>Q,Kf:()=>ee});var n=r(2177);const i="nr@original";var o=Object.prototype.hasOwnProperty,a=!1;function s(e,t){return e||(e=n.ee),r.inPlace=function(e,t,n,i,o){n||(n="");var a,s,c,u="-"===n.charAt(0);for(c=0;c 2?n-2:0),o=2;o {r(A[T],e,w),r(E[T],e,w)})),r(l._A,"fetch",y),t.on(y+"end",(function(e,r){var n=this;if(r){var i=r.headers.get("content-length");null!==i&&(n.rxSize=i),t.emit(y+"done",[null,r],n)}else t.emit(y+"done",[e],n)})),t}const O={},j=["pushState","replaceState"];function S(e){const t=function(e){return(e||n.ee).get("history")}(e);return!l.il||O[t.debugId]++||(O[t.debugId]=1,s(t).inPlace(window.history,j,"-")),t}var P=r(3239);const C={},R=["appendChild","insertBefore","replaceChild"];function I(e){const t=function(e){return(e||n.ee).get("jsonp")}(e);if(!l.il||C[t.debugId])return t;C[t.debugId]=!0;var r=s(t),i=/[?&](?:callback|cb)=([^&#]+)/,o=/(.*)\.([^.]+)/,a=/^(\w+)(\.|$)(.*)$/;function c(e,t){var r=e.match(a),n=r[1],i=r[3];return i?c(i,t[n]):t[n]}return r.inPlace(Node.prototype,R,"dom-"),t.on("dom-start",(function(e){!function(e){if(!e||"string"!=typeof e.nodeName||"script"!==e.nodeName.toLowerCase())return;if("function"!=typeof e.addEventListener)return;var n=(a=e.src,s=a.match(i),s?s[1]:null);var a,s;if(!n)return;var u=function(e){var t=e.match(o);if(t&&t.length>=3)return{key:t[2],parent:c(t[1],window)};return{key:e,parent:window}}(n);if("function"!=typeof u.parent[u.key])return;var d={};function f(){t.emit("jsonp-end",[],d),e.removeEventListener("load",f,(0,P.m$)(!1)),e.removeEventListener("error",l,(0,P.m$)(!1))}function l(){t.emit("jsonp-error",[],d),t.emit("jsonp-end",[],d),e.removeEventListener("load",f,(0,P.m$)(!1)),e.removeEventListener("error",l,(0,P.m$)(!1))}r.inPlace(u.parent,[u.key],"cb-",d),e.addEventListener("load",f,(0,P.m$)(!1)),e.addEventListener("error",l,(0,P.m$)(!1)),t.emit("new-jsonp",[e.src],d)}(e[0])})),t}var k=r(5763);const H={};function L(e){const t=function(e){return(e||n.ee).get("mutation")}(e);if(!l.il||H[t.debugId])return t;H[t.debugId]=!0;var r=s(t),i=k.Yu.MO;return i&&(window.MutationObserver=function(e){return this instanceof i?new i(r(e,"fn-")):i.apply(this,arguments)},MutationObserver.prototype=i.prototype),t}const z={};function M(e){const t=function(e){return(e||n.ee).get("promise")}(e);if(z[t.debugId])return t;z[t.debugId]=!0;var r=n.c,o=s(t),a=k.Yu.PR;return a&&function(){function e(r){var n=t.context(),i=o(r,"executor-",n,null,!1);const s=Reflect.construct(a,[i],e);return t.context(s).getCtx=function(){return n},s}l._A.Promise=e,Object.defineProperty(e,"name",{value:"Promise"}),e.toString=function(){return a.toString()},Object.setPrototypeOf(e,a),["all","race"].forEach((function(r){const n=a[r];e[r]=function(e){let i=!1;[...e||[]].forEach((e=>{this.resolve(e).then(a("all"===r),a(!1))}));const o=n.apply(this,arguments);return o;function a(e){return function(){t.emit("propagate",[null,!i],o,!1,!1),i=i||!e}}}})),["resolve","reject"].forEach((function(r){const n=a[r];e[r]=function(e){const r=n.apply(this,arguments);return e!==r&&t.emit("propagate",[e,!0],r,!1,!1),r}})),e.prototype=a.prototype;const n=a.prototype.then;a.prototype.then=function(){var e=this,i=r(e);i.promise=e;for(var a=arguments.length,s=new Array(a),c=0;c e())),t};function m(e,t){i.inPlace(t,["onreadystatechange"],"fn-",E)}function b(){var e=this,t=r.context(e);e.readyState>3&&!t.resolved&&(t.resolved=!0,r.emit("xhr-resolved",[],e)),i.inPlace(e,f,"fn-",E)}if(function(e,t){for(var r in e)t[r]=e[r]}(o,p),p.prototype=o.prototype,i.inPlace(p.prototype,J,"-xhr-",E),r.on("send-xhr-start",(function(e,t){m(e,t),function(e){h.push(e),a&&(y?y.then(A):u?u(A):(w=-w,x.data=w))}(t)})),r.on("open-xhr-start",m),a){var y=c&&c.resolve();if(!u&&!c){var w=1,x=document.createTextNode(w);new a(A).observe(x,{characterData:!0})}}else t.on("fn-end",(function(e){e[0]&&e[0].type===d||A()}));function A(){for(var e=0;e {r.d(t,{t:()=>n});const n=r(3325).D.ajax},6660:(e,t,r)=>{r.d(t,{A:()=>i,t:()=>n});const n=r(3325).D.jserrors,i="nr@seenError"},3081:(e,t,r)=>{r.d(t,{gF:()=>o,mY:()=>i,t9:()=>n,vz:()=>s,xS:()=>a});const n=r(3325).D.metrics,i="sm",o="cm",a="storeSupportabilityMetrics",s="storeEventMetrics"},4649:(e,t,r)=>{r.d(t,{t:()=>n});const n=r(3325).D.pageAction},7633:(e,t,r)=>{r.d(t,{Dz:()=>i,OJ:()=>a,qw:()=>o,t9:()=>n});const n=r(3325).D.pageViewEvent,i="firstbyte",o="domcontent",a="windowload"},9251:(e,t,r)=>{r.d(t,{t:()=>n});const n=r(3325).D.pageViewTiming},3614:(e,t,r)=>{r.d(t,{BST_RESOURCE:()=>i,END:()=>s,FEATURE_NAME:()=>n,FN_END:()=>u,FN_START:()=>c,PUSH_STATE:()=>d,RESOURCE:()=>o,START:()=>a});const n=r(3325).D.sessionTrace,i="bstResource",o="resource",a="-start",s="-end",c="fn"+a,u="fn"+s,d="pushState"},7836:(e,t,r)=>{r.d(t,{BODY:()=>A,CB_END:()=>E,CB_START:()=>u,END:()=>x,FEATURE_NAME:()=>i,FETCH:()=>_,FETCH_BODY:()=>v,FETCH_DONE:()=>m,FETCH_START:()=>p,FN_END:()=>c,FN_START:()=>s,INTERACTION:()=>l,INTERACTION_API:()=>d,INTERACTION_EVENTS:()=>o,JSONP_END:()=>b,JSONP_NODE:()=>g,JS_TIME:()=>T,MAX_TIMER_BUDGET:()=>a,REMAINING:()=>f,SPA_NODE:()=>h,START:()=>w,originalSetTimeout:()=>y});var n=r(5763);const i=r(3325).D.spa,o=["click","submit","keypress","keydown","keyup","change"],a=999,s="fn-start",c="fn-end",u="cb-start",d="api-ixn-",f="remaining",l="interaction",h="spaNode",g="jsonpNode",p="fetch-start",m="fetch-done",v="fetch-body-",b="jsonp-end",y=n.Yu.ST,w="-start",x="-end",A="-body",E="cb"+x,T="jsTime",_="fetch"},5938:(e,t,r)=>{r.d(t,{W:()=>o});var n=r(5763),i=r(2177);class o{constructor(e,t,r){this.agentIdentifier=e,this.aggregator=t,this.ee=i.ee.get(e,(0,n.OP)(this.agentIdentifier).isolatedBacklog),this.featureName=r,this.blocked=!1}}},9144:(e,t,r)=>{r.d(t,{j:()=>m});var n=r(3325),i=r(5763),o=r(5546),a=r(2177),s=r(7894),c=r(8e3),u=r(3960),d=r(385),f=r(50),l=r(3081),h=r(8632);function g(){const e=(0,h.gG)();["setErrorHandler","finished","addToTrace","inlineHit","addRelease","addPageAction","setCurrentRouteName","setPageViewName","setCustomAttribute","interaction","noticeError","setUserId"].forEach((t=>{e[t]=function(){for(var r=arguments.length,n=new Array(r),i=0;i 1?r-1:0),i=1;i {e.exposed&&e.api[t]&&o.push(e.api[t](...n))})),o.length>1?o:o[0]}(t,...n)}}))}var p=r(2587);function m(e){let t=arguments.length>1&&void 0!==arguments[1]?arguments[1]:{},m=arguments.length>2?arguments[2]:void 0,v=arguments.length>3?arguments[3]:void 0,{init:b,info:y,loader_config:w,runtime:x={loaderType:m},exposed:A=!0}=t;const E=(0,h.gG)();y||(b=E.init,y=E.info,w=E.loader_config),(0,i.Dg)(e,b||{}),(0,i.GE)(e,w||{}),(0,i.sU)(e,x),y.jsAttributes??={},d.v6&&(y.jsAttributes.isWorker=!0),(0,i.CX)(e,y),g();const T=function(e,t){t||(0,c.R)(e,"api");const h={};var g=a.ee.get(e),p=g.get("tracer"),m="api-",v=m+"ixn-";function b(t,r,n,o){const a=(0,i.C5)(e);return null===r?delete a.jsAttributes[t]:(0,i.CX)(e,{...a,jsAttributes:{...a.jsAttributes,[t]:r}}),x(m,n,!0,o||null===r?"session":void 0)(t,r)}function y(){}["setErrorHandler","finished","addToTrace","inlineHit","addRelease"].forEach((e=>h[e]=x(m,e,!0,"api"))),h.addPageAction=x(m,"addPageAction",!0,n.D.pageAction),h.setCurrentRouteName=x(m,"routeName",!0,n.D.spa),h.setPageViewName=function(t,r){if("string"==typeof t)return"/"!==t.charAt(0)&&(t="/"+t),(0,i.OP)(e).customTransaction=(r||"http://custom.transaction")+t,x(m,"setPageViewName",!0)()},h.setCustomAttribute=function(e,t){let r=arguments.length>2&&void 0!==arguments[2]&&arguments[2];if("string"==typeof e){if(["string","number"].includes(typeof t)||null===t)return b(e,t,"setCustomAttribute",r);(0,f.Z)("Failed to execute setCustomAttribute.\nNon-null value must be a string or number type, but a type of was provided."))}else(0,f.Z)("Failed to execute setCustomAttribute.\nName must be a string type, but a type of was provided."))},h.setUserId=function(e){if("string"==typeof e||null===e)return b("enduser.id",e,"setUserId",!0);(0,f.Z)("Failed to execute setUserId.\nNon-null value must be a string type, but a type of was provided."))},h.interaction=function(){return(new y).get()};var w=y.prototype={createTracer:function(e,t){var r={},i=this,a="function"==typeof t;return(0,o.p)(v+"tracer",[(0,s.z)(),e,r],i,n.D.spa,g),function(){if(p.emit((a?"":"no-")+"fn-start",[(0,s.z)(),i,a],r),a)try{return t.apply(this,arguments)}catch(e){throw p.emit("fn-err",[arguments,this,"string"==typeof e?new Error(e):e],r),e}finally{p.emit("fn-end",[(0,s.z)()],r)}}}};function x(e,t,r,i){return function(){return(0,o.p)(l.xS,["API/"+t+"/called"],void 0,n.D.metrics,g),i&&(0,o.p)(e+t,[(0,s.z)(),...arguments],r?null:this,i,g),r?void 0:this}}function A(){r.e(439).then(r.bind(r,7438)).then((t=>{let{setAPI:r}=t;r(e),(0,c.L)(e,"api")})).catch((()=>(0,f.Z)("Downloading runtime APIs failed...")))}return["actionText","setName","setAttribute","save","ignore","onEnd","getContext","end","get"].forEach((e=>{w[e]=x(v,e,void 0,n.D.spa)})),h.noticeError=function(e,t){"string"==typeof e&&(e=new Error(e)),(0,o.p)(l.xS,["API/noticeError/called"],void 0,n.D.metrics,g),(0,o.p)("err",[e,(0,s.z)(),!1,t],void 0,n.D.jserrors,g)},d.il?(0,u.b)((()=>A()),!0):A(),h}(e,v);return(0,h.Qy)(e,T,"api"),(0,h.Qy)(e,A,"exposed"),(0,h.EZ)("activatedFeatures",p.T),T}},3325:(e,t,r)=>{r.d(t,{D:()=>n,p:()=>i});const n={ajax:"ajax",jserrors:"jserrors",metrics:"metrics",pageAction:"page_action",pageViewEvent:"page_view_event",pageViewTiming:"page_view_timing",sessionReplay:"session_replay",sessionTrace:"session_trace",spa:"spa"},i={[n.pageViewEvent]:1,[n.pageViewTiming]:2,[n.metrics]:3,[n.jserrors]:4,[n.ajax]:5,[n.sessionTrace]:6,[n.pageAction]:7,[n.spa]:8,[n.sessionReplay]:9}}},n={};function i(e){var t=n[e];if(void 0!==t)return t.exports;var o=n[e]={exports:{}};return r[e](o,o.exports,i),o.exports}i.m=r,i.d=(e,t)=>{for(var r in t)i.o(t,r)&&!i.o(e,r)&&Object.defineProperty(e,r,{enumerable:!0,get:t[r]})},i.f={},i.e=e=>Promise.all(Object.keys(i.f).reduce(((t,r)=>(i.f[r](e,t),t)),[])),i.u=e=>(({78:"page_action-aggregate",147:"metrics-aggregate",242:"session-manager",317:"jserrors-aggregate",348:"page_view_timing-aggregate",412:"lazy-feature-loader",439:"async-api",538:"recorder",590:"session_replay-aggregate",675:"compressor",733:"session_trace-aggregate",786:"page_view_event-aggregate",873:"spa-aggregate",898:"ajax-aggregate"}[e]||e)+"."+{78:"ac76d497",147:"3dc53903",148:"1a20d5fe",242:"2a64278a",317:"49e41428",348:"bd6de33a",412:"2f55ce66",439:"30bd804e",538:"1b18459f",590:"cf0efb30",675:"ae9f91a8",733:"83105561",786:"06482edd",860:"03a8b7a5",873:"e6b09d52",898:"998ef92b"}[e]+"-1.236.0.min.js"),i.o=(e,t)=>Object.prototype.hasOwnProperty.call(e,t),e={},t="NRBA:",i.l=(r,n,o,a)=>{if(e[r])e[r].push(n);else{var s,c;if(void 0!==o)for(var u=document.getElementsByTagName("script"),d=0;d {s.onerror=s.onload=null,clearTimeout(h);var i=e[r];if(delete e[r],s.parentNode&&s.parentNode.removeChild(s),i&&i.forEach((e=>e(n))),t)return t(n)},h=setTimeout(l.bind(null,void 0,{type:"timeout",target:s}),12e4);s.onerror=l.bind(null,s.onerror),s.onload=l.bind(null,s.onload),c&&document.head.appendChild(s)}},i.r=e=>{"undefined"!=typeof Symbol&&Symbol.toStringTag&&Object.defineProperty(e,Symbol.toStringTag,{value:"Module"}),Object.defineProperty(e,"__esModule",{value:!0})},i.j=364,i.p="https://js-agent.newrelic.com/",(()=>{var e={364:0,953:0};i.f.j=(t,r)=>{var n=i.o(e,t)?e[t]:void 0;if(0!==n)if(n)r.push(n[2]);else{var o=new Promise(((r,i)=>n=e[t]=[r,i]));r.push(n[2]=o);var a=i.p+i.u(t),s=new Error;i.l(a,(r=>{if(i.o(e,t)&&(0!==(n=e[t])&&(e[t]=void 0),n)){var o=r&&("load"===r.type?"missing":r.type),a=r&&r.target&&r.target.src;s.message="Loading chunk "+t+" failed.\n("+o+": "+a+")",s.name="ChunkLoadError",s.type=o,s.request=a,n[1](s)}}),"chunk-"+t,t)}};var t=(t,r)=>{var n,o,[a,s,c]=r,u=0;if(a.some((t=>0!==e[t]))){for(n in s)i.o(s,n)&&(i.m[n]=s[n]);if(c)c(i)}for(t&&t(r);u {i.r(o);var e=i(3325),t=i(5763);const r=Object.values(e.D);function n(e){const n={};return r.forEach((r=>{n[r]=function(e,r){return!1!==(0,t.Mt)(r,"".concat(e,".enabled"))}(r,e)})),n}var a=i(9144);var s=i(5546),c=i(385),u=i(8e3),d=i(5938),f=i(3960),l=i(50);class h extends d.W{constructor(e,t,r){let n=!(arguments.length>3&&void 0!==arguments[3])||arguments[3];super(e,t,r),this.auto=n,this.abortHandler,this.featAggregate,this.onAggregateImported,n&&(0,u.R)(e,r)}importAggregator(){let e=arguments.length>0&&void 0!==arguments[0]?arguments[0]:{};if(this.featAggregate||!this.auto)return;const r=c.il&&!0===(0,t.Mt)(this.agentIdentifier,"privacy.cookies_enabled");let n;this.onAggregateImported=new Promise((e=>{n=e}));const o=async()=>{let t;try{if(r){const{setupAgentSession:e}=await Promise.all([i.e(860),i.e(242)]).then(i.bind(i,3228));t=e(this.agentIdentifier)}}catch(e){(0,l.Z)("A problem occurred when starting up session manager. This page will not start or extend any session.",e)}try{if(!this.shouldImportAgg(this.featureName,t))return void(0,u.L)(this.agentIdentifier,this.featureName);const{lazyFeatureLoader:r}=await i.e(412).then(i.bind(i,8582)),{Aggregate:o}=await r(this.featureName,"aggregate");this.featAggregate=new o(this.agentIdentifier,this.aggregator,e),n(!0)}catch(e){(0,l.Z)("Downloading and initializing ".concat(this.featureName," failed..."),e),this.abortHandler?.(),n(!1)}};c.il?(0,f.b)((()=>o()),!0):o()}shouldImportAgg(r,n){return r!==e.D.sessionReplay||!1!==(0,t.Mt)(this.agentIdentifier,"session_trace.enabled")&&(!!n?.isNew||!!n?.state.sessionReplay)}}var g=i(7633),p=i(7894);class m extends h{static featureName=g.t9;constructor(r,n){let i=!(arguments.length>2&&void 0!==arguments[2])||arguments[2];if(super(r,n,g.t9,i),("undefined"==typeof PerformanceNavigationTiming||c.Tt)&&"undefined"!=typeof PerformanceTiming){const n=(0,t.OP)(r);n[g.Dz]=Math.max(Date.now()-n.offset,0),(0,f.K)((()=>n[g.qw]=Math.max((0,p.z)()-n[g.Dz],0))),(0,f.b)((()=>{const t=(0,p.z)();n[g.OJ]=Math.max(t-n[g.Dz],0),(0,s.p)("timing",["load",t],void 0,e.D.pageViewTiming,this.ee)}))}this.importAggregator()}}var v=i(1117),b=i(1284);class y extends v.w{constructor(e){super(e),this.aggregatedData={}}store(e,t,r,n,i){var o=this.getBucket(e,t,r,i);return o.metrics=function(e,t){t||(t={count:0});return t.count+=1,(0,b.D)(e,(function(e,r){t[e]=w(r,t[e])})),t}(n,o.metrics),o}merge(e,t,r,n,i){var o=this.getBucket(e,t,n,i);if(o.metrics){var a=o.metrics;a.count+=r.count,(0,b.D)(r,(function(e,t){if("count"!==e){var n=a[e],i=r[e];i&&!i.c?a[e]=w(i.t,n):a[e]=function(e,t){if(!t)return e;t.c||(t=x(t.t));return t.min=Math.min(e.min,t.min),t.max=Math.max(e.max,t.max),t.t+=e.t,t.sos+=e.sos,t.c+=e.c,t}(i,a[e])}}))}else o.metrics=r}storeMetric(e,t,r,n){var i=this.getBucket(e,t,r);return i.stats=w(n,i.stats),i}getBucket(e,t,r,n){this.aggregatedData[e]||(this.aggregatedData[e]={});var i=this.aggregatedData[e][t];return i||(i=this.aggregatedData[e][t]={params:r||{}},n&&(i.custom=n)),i}get(e,t){return t?this.aggregatedData[e]&&this.aggregatedData[e][t]:this.aggregatedData[e]}take(e){for(var t={},r="",n=!1,i=0;i t.max&&(t.max=e),e 2&&void 0!==arguments[2])||arguments[2];super(e,r,j.t,n),c.il&&((0,t.OP)(e).initHidden=Boolean("hidden"===document.visibilityState),(0,N.N)((()=>(0,s.p)("docHidden",[(0,p.z)()],void 0,j.t,this.ee)),!0),(0,O.bP)("pagehide",(()=>(0,s.p)("winPagehide",[(0,p.z)()],void 0,j.t,this.ee))),this.importAggregator())}}var P=i(3081);class C extends h{static featureName=P.t9;constructor(e,t){let r=!(arguments.length>2&&void 0!==arguments[2])||arguments[2];super(e,t,P.t9,r),this.importAggregator()}}var R,I=i(2210),k=i(1214),H=i(2177),L={};try{R=localStorage.getItem("__nr_flags").split(","),console&&"function"==typeof console.log&&(L.console=!0,-1!==R.indexOf("dev")&&(L.dev=!0),-1!==R.indexOf("nr_dev")&&(L.nrDev=!0))}catch(e){}function z(e){try{L.console&&z(e)}catch(e){}}L.nrDev&&H.ee.on("internal-error",(function(e){z(e.stack)})),L.dev&&H.ee.on("fn-err",(function(e,t,r){z(r.stack)})),L.dev&&(z("NR AGENT IN DEVELOPMENT MODE"),z("flags: "+(0,b.D)(L,(function(e,t){return e})).join(", ")));var M=i(6660);class B extends h{static featureName=M.t;constructor(r,n){let i=!(arguments.length>2&&void 0!==arguments[2])||arguments[2];super(r,n,M.t,i),this.skipNext=0;try{this.removeOnAbort=new AbortController}catch(e){}const o=this;o.ee.on("fn-start",(function(e,t,r){o.abortHandler&&(o.skipNext+=1)})),o.ee.on("fn-err",(function(t,r,n){o.abortHandler&&!n[M.A]&&((0,I.X)(n,M.A,(function(){return!0})),this.thrown=!0,(0,s.p)("err",[n,(0,p.z)()],void 0,e.D.jserrors,o.ee))})),o.ee.on("fn-end",(function(){o.abortHandler&&!this.thrown&&o.skipNext>0&&(o.skipNext-=1)})),o.ee.on("internal-error",(function(t){(0,s.p)("ierr",[t,(0,p.z)(),!0],void 0,e.D.jserrors,o.ee)})),this.origOnerror=c._A.onerror,c._A.onerror=this.onerrorHandler.bind(this),c._A.addEventListener("unhandledrejection",(t=>{const r=function(e){let t="Unhandled Promise Rejection: ";if(e instanceof Error)try{return e.message=t+e.message,e}catch(t){return e}if(void 0===e)return new Error(t);try{return new Error(t+(0,D.P)(e))}catch(e){return new Error(t)}}(t.reason);(0,s.p)("err",[r,(0,p.z)(),!1,{unhandledPromiseRejection:1}],void 0,e.D.jserrors,this.ee)}),(0,O.m$)(!1,this.removeOnAbort?.signal)),(0,k.gy)(this.ee),(0,k.BV)(this.ee),(0,k.em)(this.ee),(0,t.OP)(r).xhrWrappable&&(0,k.Kf)(this.ee),this.abortHandler=this.#e,this.importAggregator()}#e(){this.removeOnAbort?.abort(),this.abortHandler=void 0}onerrorHandler(t,r,n,i,o){"function"==typeof this.origOnerror&&this.origOnerror(...arguments);try{this.skipNext?this.skipNext-=1:(0,s.p)("err",[o||new F(t,r,n),(0,p.z)()],void 0,e.D.jserrors,this.ee)}catch(t){try{(0,s.p)("ierr",[t,(0,p.z)(),!0],void 0,e.D.jserrors,this.ee)}catch(e){}}return!1}}function F(e,t,r){this.message=e||"Uncaught error with no additional information",this.sourceURL=t,this.line=r}let U=1;const q="nr@id";function G(e){const t=typeof e;return!e||"object"!==t&&"function"!==t?-1:e===c._A?0:(0,I.X)(e,q,(function(){return U++}))}function V(e){if("string"==typeof e&&e.length)return e.length;if("object"==typeof e){if("undefined"!=typeof ArrayBuffer&&e instanceof ArrayBuffer&&e.byteLength)return e.byteLength;if("undefined"!=typeof Blob&&e instanceof Blob&&e.size)return e.size;if(!("undefined"!=typeof FormData&&e instanceof FormData))try{return(0,D.P)(e).length}catch(e){return}}}var X=i(7243);class W{constructor(e){this.agentIdentifier=e,this.generateTracePayload=this.generateTracePayload.bind(this),this.shouldGenerateTrace=this.shouldGenerateTrace.bind(this)}generateTracePayload(e){if(!this.shouldGenerateTrace(e))return null;var r=(0,t.DL)(this.agentIdentifier);if(!r)return null;var n=(r.accountID||"").toString()||null,i=(r.agentID||"").toString()||null,o=(r.trustKey||"").toString()||null;if(!n||!i)return null;var a=(0,_.M)(),s=(0,_.Ht)(),c=Date.now(),u={spanId:a,traceId:s,timestamp:c};return(e.sameOrigin||this.isAllowedOrigin(e)&&this.useTraceContextHeadersForCors())&&(u.traceContextParentHeader=this.generateTraceContextParentHeader(a,s),u.traceContextStateHeader=this.generateTraceContextStateHeader(a,c,n,i,o)),(e.sameOrigin&&!this.excludeNewrelicHeader()||!e.sameOrigin&&this.isAllowedOrigin(e)&&this.useNewrelicHeaderForCors())&&(u.newrelicHeader=this.generateTraceHeader(a,s,c,n,i,o)),u}generateTraceContextParentHeader(e,t){return"00-"+t+"-"+e+"-01"}generateTraceContextStateHeader(e,t,r,n,i){return i+"@nr=0-1-"+r+"-"+n+"-"+e+"----"+t}generateTraceHeader(e,t,r,n,i,o){if(!("function"==typeof c._A?.btoa))return null;var a={v:[0,1],d:{ty:"Browser",ac:n,ap:i,id:e,tr:t,ti:r}};return o&&n!==o&&(a.d.tk=o),btoa((0,D.P)(a))}shouldGenerateTrace(e){return this.isDtEnabled()&&this.isAllowedOrigin(e)}isAllowedOrigin(e){var r=!1,n={};if((0,t.Mt)(this.agentIdentifier,"distributed_tracing")&&(n=(0,t.P_)(this.agentIdentifier).distributed_tracing),e.sameOrigin)r=!0;else if(n.allowed_origins instanceof Array)for(var i=0;i 2&&void 0!==arguments[2])||arguments[2];super(r,n,Z.t,i),(0,t.OP)(r).xhrWrappable&&(this.dt=new W(r),this.handler=(e,t,r,n)=>(0,s.p)(e,t,r,n,this.ee),(0,k.u5)(this.ee),(0,k.Kf)(this.ee),function(r,n,i,o){function a(e){var t=this;t.totalCbs=0,t.called=0,t.cbTime=0,t.end=E,t.ended=!1,t.xhrGuids={},t.lastSize=null,t.loadCaptureCalled=!1,t.params=this.params||{},t.metrics=this.metrics||{},e.addEventListener("load",(function(r){_(t,e)}),(0,O.m$)(!1)),c.IF||e.addEventListener("progress",(function(e){t.lastSize=e.loaded}),(0,O.m$)(!1))}function s(e){this.params={method:e[0]},T(this,e[1]),this.metrics={}}function u(e,n){var i=(0,t.DL)(r);i.xpid&&this.sameOrigin&&n.setRequestHeader("X-NewRelic-ID",i.xpid);var a=o.generateTracePayload(this.parsedOrigin);if(a){var s=!1;a.newrelicHeader&&(n.setRequestHeader("newrelic",a.newrelicHeader),s=!0),a.traceContextParentHeader&&(n.setRequestHeader("traceparent",a.traceContextParentHeader),a.traceContextStateHeader&&n.setRequestHeader("tracestate",a.traceContextStateHeader),s=!0),s&&(this.dt=a)}}function d(e,t){var r=this.metrics,i=e[0],o=this;if(r&&i){var a=V(i);a&&(r.txSize=a)}this.startTime=(0,p.z)(),this.listener=function(e){try{"abort"!==e.type||o.loadCaptureCalled||(o.params.aborted=!0),("load"!==e.type||o.called===o.totalCbs&&(o.onloadCalled||"function"!=typeof t.onload)&&"function"==typeof o.end)&&o.end(t)}catch(e){try{n.emit("internal-error",[e])}catch(e){}}};for(var s=0;s 1?e[1]=i:e.push(i)}else e[0]&&e[0].headers&&s(e[0].headers,n)&&(this.dt=n);function s(e,t){var r=!1;return t.newrelicHeader&&(e.set("newrelic",t.newrelicHeader),r=!0),t.traceContextParentHeader&&(e.set("traceparent",t.traceContextParentHeader),t.traceContextStateHeader&&e.set("tracestate",t.traceContextStateHeader),r=!0),r}}function x(e,t){this.params={},this.metrics={},this.startTime=(0,p.z)(),this.dt=t,e.length>=1&&(this.target=e[0]),e.length>=2&&(this.opts=e[1]);var r,n=this.opts||{},i=this.target;"string"==typeof i?r=i:"object"==typeof i&&i instanceof Y?r=i.url:c._A?.URL&&"object"==typeof i&&i instanceof URL&&(r=i.href),T(this,r);var o=(""+(i&&i instanceof Y&&i.method||n.method||"GET")).toUpperCase();this.params.method=o,this.txSize=V(n.body)||0}function A(t,r){var n;this.endTime=(0,p.z)(),this.params||(this.params={}),this.params.status=r?r.status:0,"string"==typeof this.rxSize&&this.rxSize.length>0&&(n=+this.rxSize);var o={txSize:this.txSize,rxSize:n,duration:(0,p.z)()-this.startTime};i("xhr",[this.params,o,this.startTime,this.endTime,"fetch"],this,e.D.ajax)}function E(t){var r=this.params,n=this.metrics;if(!this.ended){this.ended=!0;for(var o=0;o 2&&void 0!==arguments[2])||arguments[2];super(e,t,we.t,r),this.importAggregator()}}new class{constructor(e){let t=arguments.length>1&&void 0!==arguments[1]?arguments[1]:(0,_.ky)(16);c._A?(this.agentIdentifier=t,this.sharedAggregator=new y({agentIdentifier:this.agentIdentifier}),this.features={},this.desiredFeatures=new Set(e.features||[]),this.desiredFeatures.add(m),Object.assign(this,(0,a.j)(this.agentIdentifier,e,e.loaderType||"agent")),this.start()):(0,l.Z)("Failed to initial the agent. Could not determine the runtime environment.")}get config(){return{info:(0,t.C5)(this.agentIdentifier),init:(0,t.P_)(this.agentIdentifier),loader_config:(0,t.DL)(this.agentIdentifier),runtime:(0,t.OP)(this.agentIdentifier)}}start(){const t="features";try{const r=n(this.agentIdentifier),i=[...this.desiredFeatures];i.sort(((t,r)=>e.p[t.featureName]-e.p[r.featureName])),i.forEach((t=>{if(r[t.featureName]||t.featureName===e.D.pageViewEvent){const n=function(t){switch(t){case e.D.ajax:return[e.D.jserrors];case e.D.sessionTrace:return[e.D.ajax,e.D.pageViewEvent];case e.D.sessionReplay:return[e.D.sessionTrace];case e.D.pageViewTiming:return[e.D.pageViewEvent];default:return[]}}(t.featureName);n.every((e=>r[e]))||(0,l.Z)("".concat(t.featureName," is enabled but one or more dependent features has been disabled (").concat((0,D.P)(n),"). This may cause unintended consequences or missing data...")),this.features[t.featureName]=new t(this.agentIdentifier,this.sharedAggregator)}})),(0,T.Qy)(this.agentIdentifier,this.features,t)}catch(e){(0,l.Z)("Failed to initialize all enabled instrument classes (agent aborted) -",e);for(const e in this.features)this.features[e].abortHandler?.();const r=(0,T.fP)();return delete r.initializedAgents[this.agentIdentifier]?.api,delete r.initializedAgents[this.agentIdentifier]?.[t],delete this.sharedAggregator,r.ee?.abort(),delete r.ee?.get(this.agentIdentifier),!1}}}({features:[J,m,S,class extends h{static featureName=oe;constructor(t,r){if(super(t,r,oe,!(arguments.length>2&&void 0!==arguments[2])||arguments[2]),!c.il)return;const n=this.ee;let i;(0,k.QU)(n),this.eventsEE=(0,k.em)(n),this.eventsEE.on(se,(function(e,t){this.bstStart=(0,p.z)()})),this.eventsEE.on(ae,(function(t,r){(0,s.p)("bst",[t[0],r,this.bstStart,(0,p.z)()],void 0,e.D.sessionTrace,n)})),n.on(ce+ne,(function(e){this.time=(0,p.z)(),this.startPath=location.pathname+location.hash})),n.on(ce+ie,(function(t){(0,s.p)("bstHist",[location.pathname+location.hash,this.startPath,this.time],void 0,e.D.sessionTrace,n)}));try{i=new PerformanceObserver((t=>{const r=t.getEntries();(0,s.p)(te,[r],void 0,e.D.sessionTrace,n)})),i.observe({type:re,buffered:!0})}catch(e){}this.importAggregator({resourceObserver:i})}},C,xe,B,class extends h{static featureName=de;constructor(e,r){if(super(e,r,de,!(arguments.length>2&&void 0!==arguments[2])||arguments[2]),!c.il)return;if(!(0,t.OP)(e).xhrWrappable)return;try{this.removeOnAbort=new AbortController}catch(e){}let n,i=0;const o=this.ee.get("tracer"),a=(0,k._L)(this.ee),s=(0,k.Lg)(this.ee),u=(0,k.BV)(this.ee),d=(0,k.Kf)(this.ee),f=this.ee.get("events"),l=(0,k.u5)(this.ee),h=(0,k.QU)(this.ee),g=(0,k.Gm)(this.ee);function m(e,t){h.emit("newURL",[""+window.location,t])}function v(){i++,n=window.location.hash,this[ve]=(0,p.z)()}function b(){i--,window.location.hash!==n&&m(0,!0);var e=(0,p.z)();this[pe]=~~this[pe]+e-this[ve],this[ye]=e}function y(e,t){e.on(t,(function(){this[t]=(0,p.z)()}))}this.ee.on(ve,v),s.on(be,v),a.on(be,v),this.ee.on(ye,b),s.on(ge,b),a.on(ge,b),this.ee.buffer([ve,ye,"xhr-resolved"],this.featureName),f.buffer([ve],this.featureName),u.buffer(["setTimeout"+le,"clearTimeout"+fe,ve],this.featureName),d.buffer([ve,"new-xhr","send-xhr"+fe],this.featureName),l.buffer([me+fe,me+"-done",me+he+fe,me+he+le],this.featureName),h.buffer(["newURL"],this.featureName),g.buffer([ve],this.featureName),s.buffer(["propagate",be,ge,"executor-err","resolve"+fe],this.featureName),o.buffer([ve,"no-"+ve],this.featureName),a.buffer(["new-jsonp","cb-start","jsonp-error","jsonp-end"],this.featureName),y(l,me+fe),y(l,me+"-done"),y(a,"new-jsonp"),y(a,"jsonp-end"),y(a,"cb-start"),h.on("pushState-end",m),h.on("replaceState-end",m),window.addEventListener("hashchange",m,(0,O.m$)(!0,this.removeOnAbort?.signal)),window.addEventListener("load",m,(0,O.m$)(!0,this.removeOnAbort?.signal)),window.addEventListener("popstate",(function(){m(0,i>1)}),(0,O.m$)(!0,this.removeOnAbort?.signal)),this.abortHandler=this.#e,this.importAggregator()}#e(){this.removeOnAbort?.abort(),this.abortHandler=void 0}}],loaderType:"spa"})})(),window.NRBA=o})(); window.jQuery || document.write(' ') CKEDITOR_BASEPATH='https://f1000research.com/js/vendor/ckeditor/' window.reactTheme = 'research'; window.MathJax = { CommonHTML: { linebreaks: { automatic: true } }, 'HTML-CSS': { linebreaks: { automatic: true } }, SVG: { linebreaks: { automatic: true } }, AuthorInit: function() { MathJax.Hub.Register.MessageHook('End Process', function () { let timeout = false; // holder for timeout id const delay = 250; // delay after event is "complete" to run callback const reflowMath = function() { const dispFormulas = document.querySelectorAll('.disp-formula.panel'); if (!dispFormulas) { return; } for (const dispFormula of dispFormulas) { const child = dispFormula.querySelector('.MathJax_Preview').nextSibling.firstChild; const isMultiline = MathJax.Hub.getAllJax(dispFormula)[0].root.isMultiline; if (dispFormula.offsetWidth < child.offsetWidth || isMultiline) { MathJax.Hub.Queue(['Rerender', MathJax.Hub, dispFormula]); } } }; window.addEventListener('resize', function() { clearTimeout(timeout); // clear the timeout timeout = setTimeout(reflowMath, delay); // start timing for event "completion" }); }); }, }; if (window.location.hash == '#_=_'){ window.location = window.location.href.split('#')[0] } !function(f,b,e,v,n,t,s){if(f.fbq)return;n=f.fbq=function() {n.callMethod? n.callMethod.apply(n,arguments):n.queue.push(arguments)} ;if(!f._fbq)f._fbq=n; n.push=n;n.loaded=!0;n.version='2.0';n.queue=[];t=b.createElement(e);t.async=!0; t.src=v;s=b.getElementsByTagName(e)[0];s.parentNode.insertBefore(t,s)}(window, document,'script','https://connect.facebook.net/en_US/fbevents.js'); fbq('init', '1641728616063202'); fbq('track', "PixelInitialized", {}); (function(h,o,t,j,a,r){ h.hj=h.hj||function(){(h.hj.q=h.hj.q||[]).push(arguments)}; h._hjSettings={hjid:2318163,hjsv:6}; a=o.getElementsByTagName('head')[0]; r=o.createElement('script');r.async=1; r.src=t+h._hjSettings.hjid+j+h._hjSettings.hjsv; a.appendChild(r); })(window,document,'https://static.hotjar.com/c/hotjar-','.js?sv='); search file_upload Submit your research search menu close search Browse Gateways & Collections How to Publish Submit your Research My Submissions Article Guidelines Article Guidelines (New Versions) Open Data, Software and Code Guidelines Open Data and Accessible Source Materials Guidelines (HSS) Open Data, Software and Code Guidelines (PSE) Prepublication Checks Production Process Posters and Slides Guidelines Document Guidelines Article Processing Charges Peer Review Finding Article Reviewers About How it Works For Reviewers Our Advisors Policies Glossary FAQs For Developers Newsroom Contact My Research Submissions Content and Tracking Alerts My Details Sign In file_upload Submit your research { "@context": "https://schema.org", "@type": "ScholarlyArticle", "mainEntityOfPage": { "@type": "WebPage", "@id": "https://f1000research.com/articles/14-952" }, "headline": "Multimodal Machine Learning Approach for Diagnosing Atopic Dermatitis", "datePublished": "2025-09-19T15:56:56", "dateModified": "2026-02-09T13:40:11", "author": [ { "@type": "Person", "name": "Alida Widiawaty" }, { "@type": "Person", "name": "Wresti Indriatmi" }, { "@type": "Person", "name": "Wisnu Jatmiko" }, { "@type": "Person", "name": "Endi Novianto" }, { "@type": "Person", "name": "Aria Kekalih" }, { "@type": "Person", "name": "Hendra Gunawan" }, { "@type": "Person", "name": "Pramudita Satria Palar" }, { "@type": "Person", "name": "Muhammad Febrian Rachmadi" }, { "@type": "Person", "name": "Sherly Dermawan" }, { "@type": "Person", "name": "Tengku Laras Malahayati" }, { "@type": "Person", "name": "Alif Wicaksana Ramadhan" } ], "publisher": { "@type": "Organization", "name": "F1000Research", "logo": { "@type": "ImageObject", "url": "https://f1000research.com/img/AMP/F1000Research_image.png", "height": 480, "width": 60 } }, "image": { "@type": "ImageObject", "url": "https://f1000research.com/img/AMP/F1000Research_image.png", "height": 1200, "width": 150 }, "description": " Background Atopic dermatitis (AD) is a prevalent, chronic inflammatory skin disease with diverse clinical presentations, often overlapping with other dermatoses. Its diagnosis remains largely dependent on clinical expertise, leading to variability and limited diagnostic accuracy, particularly among general practitioners. This study aimed to develop and evaluate a multimodal artificial intelligence (AI) model that integrates lesion image analysis and structured anamnesis to improve AD diagnosis. Methods This diagnostic study was conducted in two phases: Phase 1 used retrospective data from 2021–2024, and Phase 2 involved prospective external validation from multiple hospitals in 2025. Patients with AD or related skin conditions were included, with diagnoses based on AAD 2014 criteria. Multimodal fusion combined ResNet50-extracted image features and MPNet-based anamnesis text features using a late fusion model. This approach mimics clinical reasoning by integrating visual and contextual clinical information to classify cases as AD or non-AD. Results and Discussion The multimodal AI model integrating ResNet50 (image) and MPNet (anamnesis) achieved 98.28% accuracy in classifying AD vs non-AD, outperforming image-or text-only models. It offers clinical advantages by mimicking physician reasoning, improving diagnostic consistency, reducing subjectivity, and enabling mass triage. However, real-world generalizability remains a challenge due to limited training diversity, potential language constraints (Bahasa Indonesia), and narrow differential diagnoses. External validation and explainable AI (XAI) are critical for broader application. Despite limitations, the model aligns with emerging literature, showing multimodal AI can approach or surpass expert-level performance in dermatological diagnosis when rigorously validated. Conclusions The multimodal ResNet50-MPNet model shows near-perfect accuracy in diagnosing AD by mimicking clinician reasoning. It offers consistent, holistic assessment but requires external validation and improved interpretability for clinical adoption. Continued AI-clinician collaboration is vital to translating this promising technology into real-world dermatological care. " } { "@context": "http://schema.org", "@type": "BreadcrumbList", "itemListElement": [ { "@type": "ListItem", "position": "1", "item": { "@id": "https://f1000research.com/", "name": "Home" } }, { "@type": "ListItem", "position": "2", "item": { "@id": "https://f1000research.com/browse/articles", "name": "Browse" } }, { "@type": "ListItem", "position": "3", "item": { "@id": "https://f1000research.com/articles/14-952/v1", "name": "Multimodal Machine Learning Approach for Diagnosing Atopic Dermatitis" } } ] } Home Browse Multimodal Machine Learning Approach for Diagnosing Atopic Dermatitis ALL Metrics - Views Downloads Get PDF Get XML Cite How to cite this article Widiawaty A, Indriatmi W, Jatmiko W et al. Multimodal Machine Learning Approach for Diagnosing Atopic Dermatitis [version 1; peer review: 1 approved, 1 approved with reservations] . F1000Research 2025, 14 :952 ( https://doi.org/10.12688/f1000research.169102.1 ) NOTE: If applicable, it is important to ensure the information in square brackets after the title is included in all citations of this article. Close Copy Citation Details Export Export Citation Sciwheel EndNote Ref. Manager Bibtex ProCite Sente EXPORT Select a format first Track Share ▬ ✚ Research Article Multimodal Machine Learning Approach for Diagnosing Atopic Dermatitis [version 1; peer review: 1 approved, 1 approved with reservations] Alida Widiawaty https://orcid.org/0009-0002-6325-0843 1,2 , Wresti Indriatmi 2,3 , Wisnu Jatmiko 4 , [...] Endi Novianto 3 , Aria Kekalih 5 , Hendra Gunawan 6 , Pramudita Satria Palar 7 , Muhammad Febrian Rachmadi 4 , Sherly Dermawan https://orcid.org/0009-0004-8530-662X 1 , Tengku Laras Malahayati 4 , Alif Wicaksana Ramadhan 4 Alida Widiawaty https://orcid.org/0009-0002-6325-0843 1,2 , Wresti Indriatmi 2,3 , [...] Wisnu Jatmiko 4 , Endi Novianto 3 , Aria Kekalih 5 , Hendra Gunawan 6 , Pramudita Satria Palar 7 , Muhammad Febrian Rachmadi 4 , Sherly Dermawan https://orcid.org/0009-0004-8530-662X 1 , Tengku Laras Malahayati 4 , Alif Wicaksana Ramadhan 4 PUBLISHED 19 Sep 2025 Author details Author details 1 Faculty of Medicine, Universitas Riau, Pekanbaru, Riau, Indonesia 2 Medical Science, Doctoral Study Program, Universitas Indonesia, Jakarta Pusat, Jakarta, Indonesia 3 Department of Dermatology and Venereology, Universitas Indonesia, Jakarta Pusat, Jakarta, Indonesia 4 Faculty of Computer Science, Universitas Indonesia, Depok, West Java, Indonesia 5 Occupational Medicine, Universitas Indonesia, Jakarta Pusat, Jakarta, Indonesia 6 Department of Dermatology and Venereology, Universitas Padjadjaran, Bandung, West Java, Indonesia 7 Faculty of Mechanical and Aerospace Engineering, Institut Teknologi Bandung, Bandung, West Java, Indonesia Alida Widiawaty Roles: Conceptualization, Methodology, Resources, Software, Writing – Original Draft Preparation, Writing – Review & Editing Wresti Indriatmi Roles: Conceptualization, Writing – Original Draft Preparation, Writing – Review & Editing Wisnu Jatmiko Roles: Writing – Original Draft Preparation, Writing – Review & Editing Endi Novianto Roles: Resources, Writing – Original Draft Preparation, Writing – Review & Editing Aria Kekalih Roles: Methodology, Writing – Review & Editing Hendra Gunawan Roles: Writing – Review & Editing Pramudita Satria Palar Roles: Writing – Review & Editing Muhammad Febrian Rachmadi Roles: Software Sherly Dermawan Roles: Writing – Review & Editing Tengku Laras Malahayati Roles: Software Alif Wicaksana Ramadhan Roles: Software OPEN PEER REVIEW DETAILS REVIEWER STATUS This article is included in the Artificial Intelligence and Machine Learning gateway. Abstract Background Atopic dermatitis (AD) is a prevalent, chronic inflammatory skin disease with diverse clinical presentations, often overlapping with other dermatoses. Its diagnosis remains largely dependent on clinical expertise, leading to variability and limited diagnostic accuracy, particularly among general practitioners. This study aimed to develop and evaluate a multimodal artificial intelligence (AI) model that integrates lesion image analysis and structured anamnesis to improve AD diagnosis. Methods This diagnostic study was conducted in two phases: Phase 1 used retrospective data from 2021–2024, and Phase 2 involved prospective external validation from multiple hospitals in 2025. Patients with AD or related skin conditions were included, with diagnoses based on AAD 2014 criteria. Multimodal fusion combined ResNet50-extracted image features and MPNet-based anamnesis text features using a late fusion model. This approach mimics clinical reasoning by integrating visual and contextual clinical information to classify cases as AD or non-AD. Results and Discussion The multimodal AI model integrating ResNet50 (image) and MPNet (anamnesis) achieved 98.28% accuracy in classifying AD vs non-AD, outperforming image-or text-only models. It offers clinical advantages by mimicking physician reasoning, improving diagnostic consistency, reducing subjectivity, and enabling mass triage. However, real-world generalizability remains a challenge due to limited training diversity, potential language constraints (Bahasa Indonesia), and narrow differential diagnoses. External validation and explainable AI (XAI) are critical for broader application. Despite limitations, the model aligns with emerging literature, showing multimodal AI can approach or surpass expert-level performance in dermatological diagnosis when rigorously validated. Conclusions The multimodal ResNet50-MPNet model shows near-perfect accuracy in diagnosing AD by mimicking clinician reasoning. It offers consistent, holistic assessment but requires external validation and improved interpretability for clinical adoption. Continued AI-clinician collaboration is vital to translating this promising technology into real-world dermatological care. READ ALL READ LESS Keywords Atopic dermatitis, Multimodal Artificial Intelligence (AI), ResNet50, MPNet, Dermatology diagnosis, Clinical decision support, Machine learning, Explainable AI (XAI) Corresponding Author(s) Alida Widiawaty ( [email protected] ) Close Corresponding author: Alida Widiawaty Competing interests: No competing interests were disclosed. Grant information: This study was supported by the Indonesian Education Scholarship, the Center for Higher Education Funding and Assessment, and the Indonesian Endowment Fund for Education. The funders had no role in study design, data collection and analysis, decision to publish, or preparation of the manuscript. Copyright: © 2025 Widiawaty A et al . This is an open access article distributed under the terms of the Creative Commons Attribution License , which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited. How to cite: Widiawaty A, Indriatmi W, Jatmiko W et al. Multimodal Machine Learning Approach for Diagnosing Atopic Dermatitis [version 1; peer review: 1 approved, 1 approved with reservations] . F1000Research 2025, 14 :952 ( https://doi.org/10.12688/f1000research.169102.1 ) First published: 19 Sep 2025, 14 :952 ( https://doi.org/10.12688/f1000research.169102.1 ) Latest published: 09 Feb 2026, 14 :952 ( https://doi.org/10.12688/f1000research.169102.2 ) There is a newer version of this article available. Suppress this message for one day. Introduction Atopic dermatitis (AD) is a chronic and relapsing inflammatory skin disease frequently encountered in both children and adults. Its prevalence is estimated to be 15–20% in children and 10% in adults. 1 – 3 The onset typically occurs before the age of five, underscoring the importance of timely and accurate diagnosis to prevent complications and improve quality of life. 4 – 6 Clinically, AD is characterized by severe pruritus and xerosis, and is often associated with allergic comorbidities such as asthma and allergic rhinitis. 5 , 7 The complexity of its pathogenesis—encompassing genetic, immunologic, and environmental factors—along with diverse clinical presentations can hinder accurate diagnosis. 8 – 10 Morphologically, AD may mimic other dermatoses (e.g., psoriasis vulgaris, contact dermatitis, nummular dermatitis), leading to potential misdiagnosis if not thoroughly evaluated. 11 – 13 Another diagnostic challenge is the high inter-clinician variability. Diagnosis of AD currently relies on the clinician’s expertise through careful anamnesis and physical examination. This conventional approach is subjective, resulting in variable diagnostic accuracy, especially among general practitioners. Previous studies report diagnostic accuracy for skin diseases by general practitioners to range from 24% to 70%, markedly lower than that of dermatologists. 14 This variation in expertise and experience leads to diagnostic inconsistencies and may result in inappropriate or prolonged treatment. Even standardized severity scoring tools (e.g., SCORAD or EASI) show interobserver disparities due to the subjectivity in assessing certain clinical elements. This condition underscores the need for a more reliable and consistent diagnostic method for AD. 13 , 15 To address these diagnostic challenges, artificial intelligence (AI) presents a promising solution. Advances in AI, particularly deep learning (DL), offer new opportunities in dermatology to enhance diagnostic accuracy and consistency. Research on AI-based tools for diagnosing inflammatory skin diseases has demonstrated significant potential. 16 – 18 Various Convolutional Neural Network (CNN)-based algorithms have successfully recognized and classified skin lesions with high accuracy, comparable to that of dermatologists. 13 Wu et al. (2020) developed a DL model using EfficientNet-b4 to classify psoriasis and AD from lesion images, achieving accuracy, sensitivity, and specificity rates above 90%. Maron et al. (2019) showed that CNNs systematically outperformed 112 dermatologists in multi-class skin lesion classification, highlighting the potential of DL in dermatological diagnostics. 19 Dautovic et al. applied an artificial neural network (ANN) using nine clinical parameters to diagnose AD in both healthy individuals and AD patients. Yang et al. also utilized DL to recognize dermoscopic images of psoriasis and inflammatory diseases such as dermatitis, achieving a sensitivity of 73%. 20 Despite these promising results, several limitations persist—particularly the lack of clinical context. Most current models are trained on images alone, neglecting additional clinical information that could enhance diagnostic decision-making. 21 Such single-modality approaches risk overlooking important patient context that clinicians routinely consider in clinical practice. In fact, anamnesis and clinical information—such as patient age, chief complaints, history of atopy, lesion distribution, and family medical history—contain valuable insights that can aid in distinguishing AD from its differential diagnoses and provide a more comprehensive assessment of the patient’s condition. Fundamentally, physicians establish a diagnosis based on a combination of history taking and physical examination. The fact that only a few multimodal AI models are currently available in dermatology—especially for inflammatory skin diseases such as AD—reveals a significant research gap. Integrating clinical data into AI models has the potential to bridge this disparity, in line with the current medical trend of leveraging diverse patient data sources to enhance diagnostic accuracy. Multimodal AI approaches represent a highly promising avenue for achieving more comprehensive and accurate diagnoses of complex conditions such as AD (Yu et al., 2025). 13 , 22 , 23 This study aims to develop and evaluate an AI model with a multimodal approach, combining DL-based clinical image analysis with structured textual anamnesis using a transformer-based language model. Specifically, the architecture employs a 50-layer Residual Network (ResNet50) for image feature extraction and a Masked and Permuted Pre-training for Language Understanding (MPNet) for textual feature extraction. ResNet50 is a widely used CNN model with proven success in both medical and general image classification. 24 Its architecture introduces skip connections that help the network learn deep image features without losing critical information. In dermatology, ResNet50 has demonstrated high accuracy—for example, achieving 90% on the ISIC 2018 dataset and 95.8% on the PH2 dataset for skin disease detection. 25 MPNet is a transformer-based NLP model designed to produce rich contextual sentence representations. Combining the strengths of BERT and XLNet, MPNet effectively captures complex language patterns and generates high-dimensional text embeddings. In this study, MPNet processes structured anamnesis data (e.g., chief complaints, subjective symptoms, history of allergies, family medical history, and others) into numerical text features. The integration of MPNet ensures that relevant non-visual clinical information is appropriately incorporated into the model. Methods This diagnostic study was conducted in two phases. Phase 1 focused on the development of the AI model. This phase comprised several stages. The first stage involved the collection of medical data through retrospective review of hospital medical records from 2021 to 2024. Data included clinical information and skin lesion images of patients diagnosed with AD, psoriasis vulgaris (PV), chronic lichen simplex (CLS), nummular dermatitis (ND), and contact dermatitis (CD), as diagnosed by board-certified dermatologists. In the second stage, images were pre-labeled with relevant clinical information. The third stage involved training the machine learning (ML) model to identify discriminative features and characteristics that differentiate AD from non-AD ( Figure 4 ). Figure 1. ResNet50 training and validation accuracy image. Figure 2. F1 score image. Figure 3. Multimodal model algorithm flowchart. Figure 4. Research flow – Phase 1. Phase 2 was a multicenter validation study designed to evaluate the generalizability of the ML model trained in Phase 1. Clinical data and lesion images were collected from patients diagnosed with AD or non-AD skin conditions who visited board-certified dermatologists at various hospitals between January and May 2025. In this phase, dermatologists performed complete clinical interviews, and all clinical data were recorded using a structured form ( Figure 5 ). Figure 5. Research flow – Phase 2. In both Phases 1 and 2, skin lesion images were captured using mobile phones owned by the examining physicians. All participants formed a consecutive and provided written informed consent and agreed to the use and publication of their anonymized data, including medical history and lesion images. For minor participants, written consent was obtained from their legal guardians. Ethical approval was obtained from the Ethics Committee of the Faculty of Medicine, Universitas Indonesia–Cipto Mangunkusumo Hospital. The diagnosis of AD was established based on the criteria outlined in the American Academy of Dermatology (AAD) guidelines for the diagnosis and assessment of AD 2014. Two board-certified dermatologists independently annotated all images, achieving 100% agreement. The learning outcome was binary: AD or non-AD. All clinical images and patient data were archived systematically. The sample size was calculated using the formula for diagnostic studies, resulting in a minimum requirement of 346 participants for the AD group and 138 for the non-AD group. Multimodal fusion was implemented by integrating visual features from ResNet50 and textual features from MPNet prior to final prediction. A late fusion approach was used, in which feature vectors from both modalities were concatenated and passed through a classification layer to determine the diagnosis. This method leverages the strengths of both modalities: images provide morphological and distributional characteristics of lesions, while anamnesis text offers clinical context such as chronic pruritus, personal or family history of atopy, and comorbid asthma. The combined approach is expected to reach above 90% accuracy and emulate the way dermatologists diagnose—by integrating visual inspection with the patient’s clinical information. Results The characteristics of subjects with and without AD are presented in Table 1 . In Phase 1, a total of 926 AD samples and 697 non-AD samples were collected, while Phase 2 yielded 525 AD samples and 663 non-AD samples. The findings indicate that AD was most frequently observed in infants and children, accounting for 45.45% of cases in Phase 1 and 40% in Phase 2. Its prevalence declined with increasing age, with only 0.21% of cases occurring in individuals over 65 years old. These results are consistent with the known epidemiology of AD, which typically begins in childhood or adolescence. AD most commonly manifests in infancy and early childhood, with approximately 60% of cases developing before the age of one, and nearly all cases occurring before the age of five. 26 Table 1. Demographic and clinical characteristics of phase 1 and phase 2 study subjects. Characteristics Phase 1 Phase 2 AD Non-AD AD Non-AD n % n % n % n % Age Group Toddler: 0–5 years 189 20.41 0 0 69 13.14 3 0.45 Child: 5–11 years 125 13.50 4 0.57 98 18.67 32 4.83 Early adolescent: 12–16 years 107 11.56 20 2.87 43 8.19 11 1.66 Late adolescent: 17–25 years 199 21.49 60 8.61 89 16.95 86 12.97 Young adult: 26–35 years 107 11.56 192 27.54 77 14.67 128 19.31 Middle-aged adult: 36–45 years 109 11.77 115 16.50 67 12.76 84 12.67 Early elderly: 46–55 years 73 7.89 232 33.29 41 7.81 142 21.42 Late elderly: 56–65 years 15 1.61 74 10.62 12 2.29 109 16.44 Senior: > 65 years 2 0.21 0 0 29 5.52 68 10.26 Sex Male 460 49.68 256 36.73 242 46.10 313 47.21 Female 466 50.32 441 63.27 283 53.90 350 52.79 Duration of illness 1 week 31 3.35 16 2.30 18 3.43 58 8.75 2 weeks 15 1.62 0 0 38 7.24 50 7.54 3 weeks 0 0 2 0.29 0 0 0 0 4 weeks 34 3.67 53 7.60 23 4.38 14 2.11 > 4 weeks 846 91.36 626 89.81 446 84.95 541 81.6 Image The dataset used in this study consists of images of skin lesions from patients diagnosed with AD as well as patients suffering from other skin conditions whose lesions visually resemble those found in AD cases. To perform a supervised classification task, we categorized the images into two distinct classes: AD (representing AD lesions) and Non-AD (representing non-AD lesions). In order to enhance model generalization and robustness, we applied extensive data augmentation prior to training. Each original image was augmented five times using the Albumentations library to produce image sets with various transformations. These included horizontal and vertical flipping, random adjustments to brightness and contrast, rotations of up to 30 degrees, mild Gaussian blurring, and the addition of Gaussian noise. After augmentation, all images were resized to a standardized dimension of 224 × 224 pixels. Furthermore, pixel values were normalized using the ImageNet mean [0.485, 0.456, 0.406] and standard deviation [0.229, 0.224, 0.225] to match the input expectations of the pretrained models. For the classification task, we evaluated two different DL architectures: ResNet50 and Vision Transformer (ViT). Each model’s final classification layer was adapted to produce outputs corresponding to the two target classes, AD and Non-AD. Training was conducted using the PyTorch DL framework, which is widely used in the field of computer vision research due to its flexibility and high performance. Since the dataset used in this study is relatively small in scale, which is a common situation in the medical field where obtaining labeled images can be challenging, it becomes crucial to adopt an evaluation strategy that maximizes the use of available data while still providing a reliable estimate of the model performance. To address this, we employed the use of K-fold Cross Validation. Rather than splitting the dataset into a single training and testing group, the cross-validation approach divides the dataset into ten equal parts, or “folds.” In each round of training, the model is trained using nine of these folds and evaluated on the remaining one. This process is repeated ten times, with each fold taking a turn as the validation set. At the end of this procedure, the results from all ten rounds are averaged to provide a comprehensive assessment of the model’s performance. This technique reduces the risk of the evaluation being biased by the specific choice of training or testing data and is particularly important when dealing with medical datasets, where the number of samples can be limited. It offers a favorable balance between model accuracy and computational efficiency. During training, we also implemented an optimization algorithm called Adam, which automatically adjusts the learning rate during training to improve the model’s ability to learn from data. To further refine the training process, we applied a strategy called learning rate scheduling, where the learning rate was reduced gradually over time to allow the model to converge more smoothly. In addition, we implemented early stopping, a technique where the training process is halted if the model’s performance on validation data does not improve after a few consecutive training rounds. This prevents the model from overfitting, or memorizing the training data too much, and helps ensure that it learns patterns that are generalizable to unseen data. Throughout the training and evaluation process, we monitored several key metrics to assess model performance. These included accuracy, which measures how often the model’s predictions matched the correct labels; precision, which indicates how many of the predicted DA cases were actually correct; recall, which measures how many actual DA cases the model successfully identified; and F1-score, which balances precision and recall into a single number to give an overall sense of the model’s effectiveness. By considering these multiple aspects, we aimed to evaluate not just whether the model made correct predictions overall, but also whether it was good at correctly identifying cases of AD without missing too many or falsely predicting AD where there was none. After completing the full training and evaluation pipeline, ResNet50 emerged as the best-performing model among the three architectures tested, achieving an accuracy score of 0.8750, compared to 0.6013 for the ViT. ResNet50 consistently demonstrated superior performance across all key metrics, including higher accuracy, precision, recall, and F1-score when compared to the other model ( Table 2 ). In particular, ResNet50 exhibited strong stability during training and converged more rapidly. These results suggest that convolutional architectures with residual connections, such as ResNet, are particularly well-suited for medical image classification tasks such as skin lesion analysis, where fine-grained texture analysis is the highlight. Table 2. Key performance metrics of Resnet50 vs ViT. Model Accuracy Precision Recall F1-Score Resnet50 0.8750 0.8809 0.8750 0.8728 ViT 0.6013 0.5809 0.6013 0.5487 Text The dataset used in this study consists of anamnesis text of patients whose diagnosed with AD as well as patients suffering from other skin conditions whose lesions visually resemble those found in AD cases. Clinical text inputs were derived from dermatologist notes within medical records during Phase 1, and from patient anamnesis recorded in structured forms during Phase 2. The text in the dataset are written in Bahasa Indonesia. To perform a supervised classification task, we categorized the anamnesis into two classes, the AD and Non-AD. The anamnesis contains several parameters such as patient age, gender, symptoms, contact history, etc. Those parameters were then configured to follows a template as follows: Pasien dengan jenis kelamin: usia: klasifikasi usia: Keluhan utama dan onset: Riwayat kontak dengan bahan alergen atau iritan: Sumber infeksi: Faktor pencetus penyakit saat ini: Lama sakit: Lokasi lesi: Kriteria mayor: Kriteria minor: Riwayat penyakit dahulu: Riwayat penyakit keluarga: By generating text following this template, we obtained a string as the model input to be classified by the proposed method. After we obtain the full text as model input, we need to do pre-processing to the text before feeding it to the model. In this text processing task, the preprocessing part was done by using a tokenizer. A tokenizer is a tool or process used in natural language processing (NLP) to break down a text into smaller units, called tokens. These tokens can be words, subwords, or characters, depending on the tokenization method used. The purpose of tokenization is to transform raw text into a more manageable and structured form that can be analyzed or fed into ML models. In this study we used a pre-trained model, MPNet which is a state-of-the-art transformer model that was introduced as a variant of BERT (Bidirectional Encoder Representations from Transformers) and other transformer-based models like RoBERTa and ALBERT. MPNet improves upon BERT’s pretraining strategy by using a more sophisticated approach for handling masked tokens and learning better dependencies between tokens in a sequence. The tokenizer used in MPNet is based on the WordPiece tokenization method, which is also used in BERT and similar transformer models. The output of this MPNet pre-trained model is 768 sized vectors. To do classification task, we added some dense networks downstream the MPNet architecture and formed a single output classification. The model was created using PyTorch DL framework, which is widely used in the field of computer vision research due to its flexibility and high performance. For the training process, we splitted the dataset into training and validation parts with a ratio of 8:2. After the training process, the fine-tuned MPNet model obtained an accuracy of 100% in both validation and training data. Multimodal The multimodal approach in this study integrates two powerful models: ResNet50 for visual data and MPNet for textual data, to enhance classification performance by leveraging both image and text information. ResNet50, a deep CNN, is employed to process the images of skin lesions. These images are first preprocessed through augmentation, resizing, and normalization, ensuring compatibility with the input requirements of ResNet50. The model then generates a feature vector from the image, capturing the essential visual characteristics of the skin lesion, which represents the image data for subsequent processing. In parallel, MPNet, a transformer-based model, is applied to the textual data consisting of patients’ anamnesis information. MPNet tokenizes the text and generates a fixed-size vector (768-dimensional), which encodes the relationships and context between the words. This representation is essential for understanding the nuanced medical history of the patients, such as symptoms, age, and other relevant factors. MPNet’s ability to model contextual dependencies and generate more accurate token representations provides an edge over traditional models like BERT, especially when dealing with complex and diverse medical texts. Once both ResNet50 and MPNet have processed their respective modalities and produced their vectorized outputs, the next step is to combine these two vectors into a single unified feature representation. This fusion of image and text data ensures that the model is utilizing all available information, combining the fine-grained visual analysis from the images with the rich, contextual information from the text. The feature vectors from both modalities are concatenated, creating a comprehensive representation that encapsulates the full scope of the data. Finally, to refine the combined feature vector and prepare it for classification, several dense layers are applied downstream. These dense layers help the model learn the most relevant patterns from the multimodal data. The final output from the dense layers is a classification label that distinguishes between the two target classes: AD and Non-AD. This multimodal approach effectively leverages both image and text data, improving the model’s robustness and accuracy by considering multiple facets of the data simultaneously, which is crucial in medical classification tasks. Clinical implications, strengths, and limitations of the multimodal AI model The image-only model achieved an accuracy of 87.50% on the training set and 90.13% on the test set ( Figure 1 ). Key performance metrics, including accuracy, precision, recall, and F1 score are presented in Figure 2 and Table 2 . The text-only model achieved 100% accuracy on both the training and validation sets. Following the fusion of both modalities, the overall accuracy increased significantly to 98.28% ( Figure 3 ). The multimodal AI approach employed in this study offers several advantages. First, the AI model can consistently analyze hundreds of microscopic visual features and textual patterns without fatigue, enabling the potential for high accuracy and sensitivity across diverse cases. In fact, numerous studies have demonstrated that AI performance in dermatological diagnosis can match or even surpass that of dermatology specialists for certain specific tasks. 27 For instance, a recent meta-analysis by Salinas et al. (2024) on skin cancer diagnosis reported AI algorithms achieving a sensitivity of 87% and specificity of 77%, comparable to expert dermatologists (sensitivity 84%, specificity 74%). 28 In the context of AD, the ResNet50 model, when specifically trained, has outperformed conventional models and approached expert-level performance in assessing AD severity. 29 By integrating anamnesis data, AI can also account for factors typically gathered through patient interviews, thereby allowing for more clinically informed decision-making. AI systems can also process multiple cases simultaneously, supporting mass screening or triage workflows, thereby allowing physicians to prioritize complex cases. Moreover, multimodal AI reduces subjectivity: decisions are derived from patterns learned across hundreds of examples, rather than individual intuition, which can vary among physicians. With a reported accuracy of 98.28%, this system has strong potential as a reliable diagnostic aid, offering second opinions to clinicians and enhancing general practitioners’ confidence in correctly identifying AD. 30 Nevertheless, several important considerations must be addressed. First, the model’s outstanding performance in a controlled setting may not necessarily reflect its effectiveness in real-world clinical practice. Generalizability remains a common challenge in AI models, as they may learn patterns specific to a particular hospital’s dataset, potentially resulting in reduced accuracy when applied to different patient populations or images captured with other camera devices. While 10-fold cross-validation provides a comprehensive internal evaluation, external validation using data from independent clinics is essential to ensure the model is not overfitting. The high accuracy of 98.28% raises a concern that the model may have been overtrained on a limited dataset. In this study, external validation was conducted using datasets from multiple hospitals to ensure that the model maintains reliable and consistent performance. In future work, explainable AI (XAI) techniques could be employed to enhance interpretability, allowing the model’s decision-making process to be visually explained and verified against clinical reasoning. 31 , 32 Another key issue is interpretability. Although AI can achieve high levels of accuracy, it remains limited in its ability to explain the rationale behind a given prediction. Physicians, by contrast, can justify a diagnosis based on observable clinical features (e.g., “there is excoriation due to intense itching, a typical distribution pattern on the infant’s cheeks, and a positive family history of atopy, consistent with AD”). AI models require XAI techniques to offer similar justifications. Without such interpretability, trust in AI-generated recommendations—both among physicians and patients—may be diminished. Moreover, broader clinical context is often necessary for final decision-making. Physicians may rely on direct physical examination (e.g., palpating the skin texture), additional diagnostic tests, or further clinical history. AI models, on the other hand, can only process the limited input they are provided (i.e., images and structured textual data), making their reasoning less flexible than that of physicians. Clinicians can pose follow-up questions, revise diagnostic hypotheses in real time, and manage atypical or complex cases not represented in the training data—for example, a patient presenting with two concurrent skin conditions. Finally, physicians possess critical strengths in empathy and clinical ethics—for example, delivering a diagnosis and treatment plan in a psychologically appropriate and compassionate manner. This human element lies beyond the scope of AI models. Therefore, AI should be viewed as a complementary tool that supports physicians, rather than as a full replacement. AI is intended to serve as a decision support system, not a substitute for clinical judgment. Collaborative use of AI and physicians has been shown to improve diagnostic accuracy compared to either working alone. 33 In practice, AI can provide a rapid second opinion, while the final decision and any necessary contextual adjustments remain the responsibility of the physician. Discussion Accuracy of 98.28% and its relevance in current literature The final accuracy of 98.28% achieved by the multimodal ResNet50 and MPNet model in distinguishing between AD and non-AD cases represents an exceptionally high performance. To assess its relevance, this result must be compared with recent studies in the field of computer-aided dermatological diagnosis. In general, AI models for skin lesion classification typically achieve accuracies above 80–90%. For example, Wu et al., (2020) developed and validated an image-based DL model, AIDDA, using the EfficientNet-b4 convolutional neural network architecture to automate the diagnosis of common inflammatory skin diseases, including psoriasis, eczema, and AD. Trained on a dataset of 4,740 expert-labeled clinical images, the model achieved high diagnostic performance, with an overall accuracy of 95.8%, sensitivity of 94.4%, and specificity of 97.2%. Therefore, the 98.28% accuracy achieved in this study warrants attention as a highly promising result. It highlights the potential advantage of a multimodal approach. By incorporating additional clinical data, the model may resolve ambiguities that remain when relying on image analysis alone, allowing for near-perfect classification across samples. Other multimodal studies have also reported strong performance. Adebiyi et al. (2024), for instance, integrated lesion images with patient metadata and achieved an area under the curve (AUC) of 0.94 (94%) on the HAM10000 dataset—an improvement over image-only models. 34 In addition, recent developments in transformer-based fusion approaches, such as TFormer, have been specifically designed to deeply integrate multimodal information and have demonstrated enhanced diagnostic accuracy across various types of skin lesions. 17 Nevertheless, the scientific community emphasizes the necessity of validating AI models in real-world clinical scenarios. Burlando et al. (2024), in a recent meta-analysis, stressed the importance of external validation across diverse populations and collaborative decision-making between AI and clinicians. 28 Near-perfect accuracy may indicate model excellence, but also raises the concern of potential data leakage or bias. For instance, if structured anamnesis texts contain inadvertently predictive features (e.g., specific keywords unique to AD cases), the model might overfit to non-clinical artifacts. Thus, transparent methodological reporting—such as details on 10-fold cross-validation and feature importance analyses—is essential for interpreting these results responsibly. The 98.28% accuracy is consistent with previous studies reporting that advanced DL models, particularly those utilizing multimodal inputs, can achieve diagnostic performance comparable to or exceeding that of experienced clinicians in specific tasks. 19 This parallels recent innovations in digital dermatology, such as the PanDerm foundation model, trained on millions of multimodal images, which outperformed dermatologists in early melanoma detection. 35 Similarly, generative models like SkinGPT-4 (2024) now integrate ViT with large language models to generate diagnostic reports that approximate physician reasoning. 36 In this context, our findings contribute compelling evidence that multimodal AI has the potential to reshape dermatological diagnostics, provided that it is demonstrated to be consistent in larger-scale studies. Several limitations warrant consideration. First, the model was trained on anamnesis written in Bahasa Indonesia using a language-specific version of MPNet. Although MPNet has multilingual variants, the one applied here may not generalize effectively to English or other languages. Moreover, differences in documentation style (e.g., brief vs. narrative notes) could also impact model performance. Future implementations should consider language adaptation or employ inherently multilingual models for broader applicability. 37 Second, the differential diagnosis in the present study was restricted to four conditions: lichen simplex chronicus, psoriasis vulgaris, nummular dermatitis, and contact dermatitis. In clinical reality, AD mimickers may also include conditions such as scabies, fungal infections, or seborrheic dermatitis, which were not represented in the training data. This raises concerns about generalizability when the model is applied to unfamiliar cases. Expanding the dataset to encompass a broader spectrum of dermatoses, or transitioning to a multiclass classification model, could improve both utility and clinical relevance. Third, real-world deployment of this system would require regulatory approval, robust documentation of safety and reliability, and integration with electronic health records to ensure seamless clinical workflow. This would necessitate interdisciplinary collaboration among clinicians, engineers, and policy makers. However, to successfully implement AI, key barriers need to be addressed. Efforts should focus on ensuring algorithm transparency and adequate regulation of algorithms. Simultaneously, improving knowledge about AI could reduce the fear of replacement. Conclusion The multimodal approach combining ResNet50 and MPNet represents a breakthrough in the automated diagnosis of AD. By integrating image and textual data, the model is able to emulate a holistic diagnostic approach similar to that of clinicians, as demonstrated by its near-perfect internal accuracy. Compared to baseline physician assessments, this model offers the potential for greater consistency in diagnosis. However, its adoption in clinical practice must be supported by robust external validation and improved interpretability to gain trust within the medical community. The reported 98.28% accuracy reflects the promise of multimodal AI in dermatology, echoing broader trends in the field toward increasingly sophisticated diagnostic systems. Nonetheless, it is essential to remain critical of the limitations and challenges involved in real-world implementation. With continued advancement in AI research, collaboration between AI and clinicians holds great promise for improving diagnostic accuracy and the overall quality of care, particularly for patients with AD and other dermatologic conditions. 38 , 39 Ethical considerations Ethical approval for the study was obtained from the Health Research Ethics Committee, Faculty of Medicine, Universitas Indonesia–Cipto Mangunkusumo Hospital (certificate number KET-1477/UN2.F1/ETIK/PPM.00.02/2024). All participants provided written informed consent prior to data collection. For minor participants, written consent was obtained from their legal guardians. Ethical approval was obtained from the Ethics Committee of the Faculty of Medicine, Universitas Indonesia–Cipto Mangunkusumo Hospital. Patient data and images were anonymized before use, and no identifiable information was included in the analysis. This diagnostic study did not involve any interventional procedures. Reporting guidelines Figshare: STARD checklist for “ Multimodal Machine Learning Approach for Diagnosing Atopic Dermatitis ” https://doi.org/10.6084/m9.figshare.29925533 Data are available under the terms of the Creative Commons Attribution 4.0 International license (CC-BY 4.0). Software availability Source code available from: • https://github.com/AlidaWidiawaty/multimodal-skin-lesion-classification 41 • https://github.com/AlidaWidiawaty/multimodal-dermatitis-classification-anamnesys 42 Archived software availabile from: • https://doi.org/10.5281/zenodo.16983448 43 • https://doi.org/10.5281/zenodo.16983460 44 License: MIT License Data availability Underlying data Figshare: Multimodal Machine Learning Approach for Diagnosing Atopic Dermatitis . 40 https://doi.org/10.6084/m9.figshare.29925533 The project contains the following underlying data: • Clinical data of AD and non-AD research samples from phases 1 and 2.xlsx. Extended data Figshare: Multimodal Machine Learning Approach for Diagnosing Atopic Dermatitis . 40 https://doi.org/10.6084/m9.figshare.29925533 The project contains the following underlying data: • Questionnaires in the form of a Google Form containing clinical data of AD and non-AD patients • Translated and signed informed consent forms obtained from participants prior to lesion photography • Tables and Figures Acknowledgements The authors would like to thank the board-certified dermatologists, participating hospitals, and patients for their contributions. References 1. Langan SM, Mulick AR, Rutter CE, et al. : Trends in eczema prevalence in children and adolescents: A Global Asthma Network Phase I Study. Clin Exp Allergy. 2023 Mar; 53 (3): 337–352. Publisher Full Text 2. Hadi HA, Tarmizi AI, Khalid KA, et al. : The Epidemiology and Global Burden of Atopic Dermatitis: A Narrative Review. Life (Basel). 2021 Sept 9; 11 (9): 936. Publisher Full Text 3. Urban K, Mehrmal S, Uppal P, et al. : The global burden of skin cancer: A longitudinal analysis from the Global Burden of Disease Study, 1990-2017. JAAD Int. 2021 Mar; 2 : 98–108. PubMed Abstract | Publisher Full Text | Free Full Text 4. Kelly KA, Balogh EA, Kaplan SG, et al. : Skin Disease in Children: Effects on Quality of Life, Stigmatization, Bullying, and Suicide Risk in Pediatric Acne, Atopic Dermatitis, and Psoriasis Patients. Children (Basel). 2021 Nov 16; 8 (11): 1057. Publisher Full Text 5. Abdel-Mageed HM: Atopic dermatitis: a comprehensive updated review of this intriguing disease with futuristic insights. Inflammopharmacol. 2025 Mar 1; 33 (3): 1161–1187. PubMed Abstract | Publisher Full Text | Free Full Text 6. Hon KL, Chu S, Leung AKC: Quality of Life for Children with Allergic Skin Diseases. Curr. Pediatr. Rev. 2022; 18 (3): 191–196. Publisher Full Text 7. Jeskey J, Kurien C, Blunk H, et al. : Atopic Dermatitis: A Review of Diagnosis and Treatment. J. Pediatr. Pharmacol. Ther. 2024 Dec; 29 (6): 587–603. PubMed Abstract | Publisher Full Text | Free Full Text 8. Fyhrquist N, Yang Y, Karisola P, et al. : Endotypes of atopic dermatitis. J. Allergy Clin. Immunol. 2025 July; 156 (1): 24–40.e4. PubMed Abstract | Publisher Full Text 9. Criado PR, Miot HA, Bueno-Filho R, et al. : Update on the pathogenesis of atopic dermatitis. An. Bras. Dermatol. 2024; 99 (6): 895–915. PubMed Abstract | Publisher Full Text | Free Full Text 10. Eichenfield LF, Tom WL, Berger TG, et al. : Guidelines of care for the management of atopic dermatitis: section 2. Management and treatment of atopic dermatitis with topical therapies. J. Am. Acad. Dermatol. 2014 July; 71 (1): 116–132. PubMed Abstract | Publisher Full Text | Free Full Text 11. Johansson EK, Bergström A, Kull I, et al. : Prevalence and characteristics of atopic dermatitis among young adult females and males-report from the Swedish population-based study BAMSE. J. Eur. Acad. Dermatol. Venereol. 2022 May; 36 (5): 698–704. PubMed Abstract | Publisher Full Text | Free Full Text 12. Napolitano M, Fabbrocini G, Martora F, et al. : Children atopic dermatitis: Diagnosis, mimics, overlaps, and therapeutic implication. Dermatol. Ther. 2022 Dec; 35 (12): e15901. PubMed Abstract | Publisher Full Text 13. Cao F, Yang Y, Guo C, et al. : Advancements in artificial intelligence for atopic dermatitis: diagnosis, treatment, and patient management. Ann. Med. 2025 Dec; 57 (1): 2484665. PubMed Abstract | Publisher Full Text | Free Full Text 14. Tran H, Chen K, Lim AC, et al. : Assessing diagnostic skill in dermatology: a comparison between general practitioners and dermatologists. Australas. J. Dermatol. 2005 Nov; 46 (4): 230–234. PubMed Abstract | Publisher Full Text 15. Chopra R, Vakharia PP, Sacotte R, et al. : Relationship between EASI and SCORAD severity assessments for atopic dermatitis. J. Allergy Clin. Immunol. 2017 Dec; 140 (6): 1708–1710.e1. PubMed Abstract | Publisher Full Text | Free Full Text 16. Chan S, Reddy V, Myers B, et al. : Machine Learning in Dermatology: Current Applications, Opportunities, and Limitations. Dermatol Ther (Heidelb). 2020 June; 10 (3): 365–386. PubMed Abstract | Publisher Full Text | Free Full Text 17. Zhang Y, Xie F, Chen J: TFormer: A throughout fusion transformer for multi-modal skin lesion diagnosis. Comput. Biol. Med. 2023 May; 157 : 106712. PubMed Abstract | Publisher Full Text 18. Escalé-Besa A, Yélamos O, Vidal-Alaball J, et al. : Exploring the potential of artificial intelligence in improving skin lesion diagnosis in primary care. Sci. Rep. 2023 Mar 15; 13 (1): 4293. PubMed Abstract | Publisher Full Text | Free Full Text 19. Wu H, Yin H, Chen H, et al. : A deep learning, image based approach for automated diagnosis for inflammatory skin diseases. Ann Transl Med. 2020 May; 8 (9): 581. PubMed Abstract | Publisher Full Text | Free Full Text 20. Dautovic A, Dondras B, Dervisbegovic F, et al. : Diagnosis of Atopic dermatitis Using Artificial Neural Network. IFAC PapersOnLine. 2022; 55 (4): 51–55. Publisher Full Text 21. Luo N, Zhong X, Su L, et al. : Artificial intelligence-assisted dermatology diagnosis: From unimodal to multimodal. Comput. Biol. Med. 2023 Oct; 165 : 107413. PubMed Abstract | Publisher Full Text 22. Yu Y, Jia H, Zhang L, et al. : Deep multi-modal skin-imaging based information-switching network for skinlesion recognition. Bioengineering. 2025; 12 : 282. PubMed Abstract | Publisher Full Text | Free Full Text 23. Mohamed EH, Abdu N, Khalil M, et al. : MiSC: A hybrid multi-modal deep learning approach for accurate skin cancer detection. Multimed. Tools Appl. 2025 June 4 [cited 2025 Aug 15]. Publisher Full Text 24. Abid MH, Ashraf R, Mahmood T, et al. : Multi-modal medical image classification using deep residual network and genetic algorithm. PLoS One. 2023; 18 (6): e0287786. PubMed Abstract | Publisher Full Text | Free Full Text 25. Musthafa MM, Mahesh TR, Vinoth Kumar V, et al. : Enhanced skin cancer diagnosis using optimized CNN architecture and checkpoints for automated dermatological lesion classification. BMC Med. Imaging. 2024 Aug 2; 24 (1): 201. PubMed Abstract | Publisher Full Text | Free Full Text 26. Kolb L, Ferrer-Bruker SJ: Atopic Dermatitis. StatPearls. Treasure Island (FL): StatPearls Publishing; 2025 [cited 2025 Aug 15]. Reference Source 27. Mevorach L, Farcomeni A, Pellacani G, et al. : A Comparison of Skin Lesions’ Diagnoses Between AI-Based Image Classification, an Expert Dermatologist, and a Non-Expert. Diagnostics (Basel). 2025 Apr 28; 15 (9): 1115. PubMed Abstract | Publisher Full Text | Free Full Text 28. Salinas MP, Sepúlveda J, Hidalgo L, et al. : A systematic review and meta-analysis of artificial intelligence versus clinicians for skin cancer diagnosis. npj Digit Med. 2024 May 14; 7 (1): 125. PubMed Abstract | Publisher Full Text | Free Full Text 29. Maulana A, Noviandy TR, Suhendra R, et al. : Evaluation of atopic dermatitis severity using artificial intelligence. Narra J. 2023 Dec; 3 (3): e511. PubMed Abstract | Publisher Full Text | Free Full Text 30. Park H, Woo CY, Lim S, et al. : Comparisons between a Large Language Model-based Real-Time Compound Diagnostic Medical AI Interface and Physicians for Common Internal Medicine Cases using Simulated Patients. arXiv. 2025 [cited 2025 June 19]. Reference Source 31. de Hond AAH , Leeuwenberg AM, Hooft L, et al. : Guidelines and quality criteria for artificial intelligence-based prediction models in healthcare: a scoping review. npj Digit Med. 2022 Jan 10; 5 (1): 2. PubMed Abstract | Publisher Full Text | Free Full Text 32. Liopyris K, Gregoriou S, Dias J, et al. : Artificial Intelligence in Dermatology: Challenges and Perspectives. Dermatol Ther (Heidelb). 2022 Oct 28; 12 (12): 2637–2651. PubMed Abstract | Publisher Full Text | Free Full Text 33. Verghese A, Shah NH, Harrington RA: What This Computer Needs Is a Physician: Humanism and Artificial Intelligence. JAMA. 2018 Jan 2; 319 (1): 19–20. Publisher Full Text 34. Raza A, Penuel WR, Sumner T: Designing Visual Learning Analytics for Supporting Equity in STEM Classrooms. arXiv.org. 2024 [cited 2025 June 19]: 1–14. Publisher Full Text Reference Source 35. Yan S, Yu Z, Primiero C, et al. : A multimodal vision foundation model for clinical dermatology. Nat. Med. 2025 June 6; 1–12. 36. Zhou J, He X, Sun L, et al. : Pre-trained multimodal large language model enhances dermatological diagnosis using SkinGPT-4. Nat. Commun. 2024 July 5; 15 (1): 5649. PubMed Abstract | Publisher Full Text | Free Full Text 37. Muennighoff N, Tazi N, Magne L, et al. : MTEB: Massive Text Embedding Benchmark. arXiv. 2023 [cited 2025 June 19]. Reference Source 38. Daneshjou R, Kovarik C, Ko JM: Towards Realization of Augmented Intelligence in Dermatology: Advances and Future Directions. arXiv.org. 2021 [cited 2025 June 19]. Reference Source 39. Kaczmarczyk R, Wilhelm TI, Martin R, et al. : Evaluating multimodal AI in medical diagnostics. npj Digit Med. 2024 Aug 7; 7 (1): 205. PubMed Abstract | Publisher Full Text | Free Full Text 40. Multimodal Machine Learning Approach for Diagnosing Atopic Dermatitis. figshare 2025 [cited 2025 Aug 17]. Reference Source 41. AlidaWidiawaty: AlidaWidiawaty/multimodal-skin-lesion-classification.2025 [cited 2025 Aug 29]. Reference Source 42. AlidaWidiawaty: AlidaWidiawaty/multimodal-dermatitis-classification-anamnesys.2025 [cited 2025 Aug 29]. Reference Source 43. AlidaWidiawaty: AlidaWidiawaty/multimodal-skin-lesion-classification: v1.0.0. Zenodo. 2025 [cited 2025 Aug 29]. Reference Source 44. AlidaWidiawaty: AlidaWidiawaty/multimodal-dermatitis-classification-anamnesys: v1.0.0. Zenodo. 2025 [cited 2025 Aug 29]. Reference Source Comments on this article Comments (0) Version 2 VERSION 2 PUBLISHED 19 Sep 2025 ADD YOUR COMMENT Comment Author details Author details 1 Faculty of Medicine, Universitas Riau, Pekanbaru, Riau, Indonesia 2 Medical Science, Doctoral Study Program, Universitas Indonesia, Jakarta Pusat, Jakarta, Indonesia 3 Department of Dermatology and Venereology, Universitas Indonesia, Jakarta Pusat, Jakarta, Indonesia 4 Faculty of Computer Science, Universitas Indonesia, Depok, West Java, Indonesia 5 Occupational Medicine, Universitas Indonesia, Jakarta Pusat, Jakarta, Indonesia 6 Department of Dermatology and Venereology, Universitas Padjadjaran, Bandung, West Java, Indonesia 7 Faculty of Mechanical and Aerospace Engineering, Institut Teknologi Bandung, Bandung, West Java, Indonesia Alida Widiawaty Roles: Conceptualization, Methodology, Resources, Software, Writing – Original Draft Preparation, Writing – Review & Editing Wresti Indriatmi Roles: Conceptualization, Writing – Original Draft Preparation, Writing – Review & Editing Wisnu Jatmiko Roles: Writing – Original Draft Preparation, Writing – Review & Editing Endi Novianto Roles: Resources, Writing – Original Draft Preparation, Writing – Review & Editing Aria Kekalih Roles: Methodology, Writing – Review & Editing Hendra Gunawan Roles: Writing – Review & Editing Pramudita Satria Palar Roles: Writing – Review & Editing Muhammad Febrian Rachmadi Roles: Software Sherly Dermawan Roles: Writing – Review & Editing Tengku Laras Malahayati Roles: Software Alif Wicaksana Ramadhan Roles: Software Competing interests No competing interests were disclosed. Grant information This study was supported by the Indonesian Education Scholarship, the Center for Higher Education Funding and Assessment, and the Indonesian Endowment Fund for Education. The funders had no role in study design, data collection and analysis, decision to publish, or preparation of the manuscript. Article Versions (2) version 2 Revised Published: 09 Feb 2026, 14:952 https://doi.org/10.12688/f1000research.169102.2 version 1 Published: 19 Sep 2025, 14:952 https://doi.org/10.12688/f1000research.169102.1 Copyright © 2025 Widiawaty A et al . This is an open access article distributed under the terms of the Creative Commons Attribution License , which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited. Download Export To Sciwheel Bibtex EndNote ProCite Ref. Manager (RIS) Sente metrics Views Downloads F1000Research - - PubMed Central info_outline Data from PMC are received and updated monthly. - - Citations open_in_new 0 open_in_new 0 open_in_new SEE MORE DETAILS CITE how to cite this article Widiawaty A, Indriatmi W, Jatmiko W et al. Multimodal Machine Learning Approach for Diagnosing Atopic Dermatitis [version 1; peer review: 1 approved, 1 approved with reservations] . F1000Research 2025, 14 :952 ( https://doi.org/10.12688/f1000research.169102.1 ) NOTE: If applicable, it is important to ensure the information in square brackets after the title is included in all citations of this article. COPY CITATION DETAILS track receive updates on this article Track an article to receive email alerts on any updates to this article. TRACK THIS ARTICLE Share Open Peer Review Current Reviewer Status: ? Key to Reviewer Statuses VIEW HIDE Approved The paper is scientifically sound in its current form and only minor, if any, improvements are suggested Approved with reservations A number of small changes, sometimes more significant revisions are required to address specific details and improve the papers academic merit. Not approved Fundamental flaws in the paper seriously undermine the findings and conclusions Version 1 VERSION 1 PUBLISHED 19 Sep 2025 Views 0 Cite How to cite this report: Krzywicki T. Reviewer Report For: Multimodal Machine Learning Approach for Diagnosing Atopic Dermatitis [version 1; peer review: 1 approved, 1 approved with reservations] . F1000Research 2025, 14 :952 ( https://doi.org/10.5256/f1000research.186388.r446710 ) The direct URL for this report is: https://f1000research.com/articles/14-952/v1#referee-response-446710 NOTE: it is important to ensure the information in square brackets after the title is included in this citation. Close Copy Citation Details Reviewer Report 16 Jan 2026 Tomasz Krzywicki , University of Warmia and Mazury in Olsztyn, Olsztyn, Warmian-Masurian Voivodeship, Poland Approved with Reservations VIEWS 0 https://doi.org/10.5256/f1000research.186388.r446710 The article concerns the proposal of a solution in the form of a multimodal neural network model supporting skin diagnostics by aggregating clinical information from photos and texts. The idea of aggregation of many modalities in modelling a clinical ... Continue reading READ ALL The article concerns the proposal of a solution in the form of a multimodal neural network model supporting skin diagnostics by aggregating clinical information from photos and texts. The idea of aggregation of many modalities in modelling a clinical decision is already well known in the scientific literature, and the authors used in this case the common generic families of neural network architectures: ResNet and BERT. While the article itself looks interesting, I have noticed a few flaws that the authors should refer to. It is worth specifying at the beginning what kind of clinical information was included in the text data. Was there information that was unobservable from the point of view of the visual skin analysis, which meant that it was not correlated with the information contained in the photos? It is worth clarifying what experience the specialists have had in describing the data. Is it worth clarifying how the ground truth of the photo descriptions was selected? What would be the procedure if the specialists (with a completely independent evaluation) assigned different ratings to the photos? Sections regarding descriptions of dataset characteristics, details of training models and initial data preparation should be moved from "Results" to "Methods" or create a separate chapter, e.g. "Materials". The details of the training do not apply to the results. This chapter should contain the final results. Table 2 should be included in the paragraph with the first reference to. In this table, the authors present the result of the comparison of the accuracy of the classification obtained on the ViT and ResNet architectures. It is worth mentioning that these results, with the current data set, should not be summarised with each other. One of the important requirements of the Transformer architecture is a sufficiently large set of training data, where most often the minimum requirements apply to several hundred thousand images, and reasonably, at least a million. With such a small dataset, the ViT architecture is doomed to failure. With such a small dataset, other CNN-based architectures should be compared, e.g. ResNet, Inception and Xception. The article lacks a coherent scheme presenting the final multimodal architecture and information about the training. Yes, Figure 3 presents a complete flow from data collection stage to inference. However, there is no information about the final model itself. Were the models that process the image and text learned together with the final classifier, jointly correcting errors? Or is the final classifier a separate model that classifies independent image and text inputs? Figures 1 and 2 only provide information about how the quality of the classification indicators changed during the training iterations. In my opinion, they do not contribute anything significant to the results. In addition, Figure 1 shows the features of overfitting model based on the ResNet architecture, which raises serious doubts about the reliability of the results. The dataset used in the experiment was unbalanced in terms of the number of photos in decision classes. The authors do not specify how they solved this problem in the context of training and evaluating model results. According to the names of the quality measures, the authors refer to their global versions intended for balanced datasets. Figures 4 and 5 are trivial and contribute nothing but to the repetition of the content of the previous paragraphs. The final results of the accuracy of clinical models are standard given in confidence intervals at least using typical statistical indicators: sensitivity, specificity, PPV and NPV. For better reception, it is worth listing them in the table. Is the work clearly and accurately presented and does it cite the current literature? Yes Is the study design appropriate and is the work technically sound? No Are sufficient details of methods and analysis provided to allow replication by others? No If applicable, is the statistical analysis and its interpretation appropriate? Partly Are all the source data underlying the results available to ensure full reproducibility? No Are the conclusions drawn adequately supported by the results? Partly Competing Interests: No competing interests were disclosed. Reviewer Expertise: computer vision, deep learning, reinforcement learning, biomedical engineering, parallel processing I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard, however I have significant reservations, as outlined above. Close READ LESS CITE CITE HOW TO CITE THIS REPORT Krzywicki T. Reviewer Report For: Multimodal Machine Learning Approach for Diagnosing Atopic Dermatitis [version 1; peer review: 1 approved, 1 approved with reservations] . F1000Research 2025, 14 :952 ( https://doi.org/10.5256/f1000research.186388.r446710 ) The direct URL for this report is: https://f1000research.com/articles/14-952/v1#referee-response-446710 NOTE: it is important to ensure the information in square brackets after the title is included in all citations of this article. COPY CITATION DETAILS Report a concern Author Response 09 Feb 2026 Alida Widiawaty , Faculty of Medicine, Universitas Riau, Pekanbaru, Indonesia 09 Feb 2026 Author Response Dear Tomasz Krzywicki University of Warmia and Mazury in Olsztyn, Olsztyn, Warmian-Masurian Voivodeship, Poland We thank the reviewer for the thorough evaluation of our manuscript and for the constructive ... Continue reading Dear Tomasz Krzywicki University of Warmia and Mazury in Olsztyn, Olsztyn, Warmian-Masurian Voivodeship, Poland We thank the reviewer for the thorough evaluation of our manuscript and for the constructive comments that have substantially improved the clarity, transparency, and methodological rigor of the study. All points raised have been carefully addressed, and the manuscript has been revised accordingly. 1. Clarification of clinical information Reviewer comment: It is worth specifying at the beginning what kind of clinical information was included in the text data. Was there information that was unobservable from the point of view of the visual skin analysis, which meant that it was not correlated with the information contained in the photos? Response: Thank you for this valuable suggestion. We have clarified the clinical variables included in the textual modality at the beginning of the Methods section. Specifically, clinical information incorporated into the text data for non–atopic dermatitis (non-AD) cases comprised sex, age, chief complaint with onset, history of exposure to allergens or irritants, source of infection, current triggering factors, duration of illness, lesion location, past medical history, and family medical history. For atopic dermatitis (AD) cases, additional inputs included major and minor diagnostic criteria. Importantly, several of these variables—such as symptom onset, exposure history, triggering factors, and family history—are not directly observable from visual skin analysis and therefore provide complementary, non-visual clinical context beyond the information contained in the images. 2. Clarification of the specialists' experience Reviewer comment: It is worth clarifying what experience the specialists have had in describing the data. Response: Thank you for this suggestion. We have clarified the expertise of the annotators in the Methods section. Specifically, all images were independently annotated by two board-certified dermatologists, each with over 20 years of clinical experience in inflammatory dermatoses, achieving 100% inter-rater agreement. 3. Clarification of how the photo descriptions was selected Reviewer comment: Is it worth clarifying how the ground truth of the photo descriptions was selected? What would be the procedure if the specialists (with a completely independent evaluation) assigned different ratings to the photos? Response: Thank you for this comment. Ground truth photo descriptions were established based on independent annotations performed by two board-certified dermatologists. Complete inter-rater agreement (100%) was achieved across all images; therefore, all annotated photo descriptions were retained for analysis. We have added clarification that, in the event of discrepant ratings, images with discordant annotations and their associated clinical data would have been excluded from the dataset to avoid introducing ambiguity in the ground truth labels. 4. Revision of the results section Reviewer comment: Sections regarding descriptions of dataset characteristics, details of training models and initial data preparation should be moved from "Results" to "Methods" or create a separate chapter, e.g. "Materials". The details of the training do not apply to the results. This chapter should contain the final results. Response: Thank you for this comment. We have revised the manuscript structure by moving the descriptions of dataset characteristics, model training details, and initial data preparation from the Results section to a separate chapter entitled Materials, as suggested. The Results section has been streamlined to present only the final performance outcomes of the models. 5. Clarification of the comparison between ResNet and Vision Transformer (ViT) Reviewer comment: Table 2 should be included in the paragraph with the first reference to. In this table, the authors present the result of the comparison of the accuracy of the classification obtained on the ViT and ResNet architectures. It is worth mentioning that these results, with the current data set, should not be summarised with each other. One of the important requirements of the Transformer architecture is a sufficiently large set of training data, where most often the minimum requirements apply to several hundred thousand images, and reasonably, at least a million. With such a small dataset, the ViT architecture is doomed to failure. With such a small dataset, other CNN-based architectures should be compared, e.g. ResNet, Inception and Xception. Response: Thank you for this valuable comment. Table 2 has been relocated to appear immediately after its first mention in the text. In response to the reviewer’s concern, the direct performance comparison with the Vision Transformer (ViT) architecture has been removed from Table 2. We have also revised the Methods section to clarify that the ViT model was included for exploratory purposes only. Given the limited dataset size, ViT was not expected to achieve optimal performance, as transformer-based architectures generally require substantially larger training datasets. Accordingly, ViT results were not used as a basis for direct performance comparison with CNN-based models. In addition, the Discussion section has been expanded to explicitly state that any comparison between CNN-based architectures and ViT should be interpreted with caution. The relatively small dataset in this study likely constrained the performance of the ViT model, consistent with the known data requirements of transformer-based approaches. 6. Clarification of the final multimodal architecture and information about the training Reviewer comment: The article lacks a coherent scheme presenting the final multimodal architecture and information about the training. Yes, Figure 3 presents a complete flow from data collection stage to inference. However, there is no information about the final model itself. Were the models that process the image and text learned together with the final classifier, jointly correcting errors? Or is the final classifier a separate model that classifies independent image and text inputs? Response: Thank you for this comment. We have clarified the final multimodal architecture and training strategy in the Methods section. Once ResNet50 and MPNet processed their respective modalities and generated modality-specific feature embeddings, the resulting vectors were concatenated to form a unified multimodal representation. This late-fusion strategy integrates fine-grained visual information from images with contextual information derived from clinical text. The image and text encoders were trained independently, and their parameters were kept fixed during multimodal training. The concatenated feature vector was subsequently passed through several fully connected layers, which were trained as a separate classifier to distinguish between atopic dermatitis (AD) and non–atopic dermatitis (non-AD) cases. No end-to-end joint optimization across modalities was performed. 7. Revision of results section and removal of redundant figures Reviewer comment: Figures 1 and 2 only provide information about how the quality of the classification indicators changed during the training iterations. In my opinion, they do not contribute anything significant to the results. In addition, Figure 1 shows the features of overfitting model based on the ResNet architecture, which raises serious doubts about the reliability of the results. Response: Thank you for this insightful comment. We agree that Figures 1 and 2 primarily illustrate training dynamics rather than final model performance and do not add substantial value to the presentation of the results. Moreover, as the learning curves may raise concerns regarding overfitting, we have removed Figures 1 and 2 from the revised manuscript. The Results section has been refocused on the final evaluation metrics obtained on the test set, which more accurately reflect the clinical performance of the proposed models. 8. Handling Class Imbalance and Evaluation Metrics Reviewer comment: The dataset used in the experiment was unbalanced in terms of the number of photos in decision classes. The authors do not specify how they solved this problem in the context of training and evaluating model results. According to the names of the quality measures, the authors refer to their global versions intended for balanced datasets. Response: Thank you for this comment. The dataset was imbalanced with respect to the number of samples per class. To address this issue during model development, we have added information indicating that stratified splitting was applied to preserve class proportions across the training, validation, and test sets. For performance evaluation, class-imbalance–aware metrics were used, including weighted precision, weighted recall, and weighted F1-score, in addition to overall accuracy. These weighted metrics compute class-wise scores and aggregate them according to class prevalence, thereby providing a more reliable assessment under imbalanced data conditions. 9. Inclusion of research flow diagrams Reviewer comment: Figures 4 and 5 are trivial and contribute nothing but to the repetition of the content of the previous paragraphs. Response: Thank you for this comment. Figures 2 and 3 (previously Figures 4 and 5) were included to comply with the STARD 2015 reporting guidelines, specifically the recommended flow of participants diagram. These figures provide a transparent visual summary of the study flow, including participant inclusion and data processing steps, which may not be fully conveyed through narrative text alone. 10. Addition of confidence intervals and diagnostic performance table Reviewer comment: The final results of the accuracy of clinical models are standard given in confidence intervals at least using typical statistical indicators: sensitivity, specificity, PPV and NPV. For better reception, it is worth listing them in the table. Thank you for this important comment. We have revised the manuscript to report the final diagnostic performance of the multimodal ResNet50–MPNet model using standard clinical metrics, including accuracy, sensitivity, specificity, PPV, and NPV, each accompanied by 95% confidence intervals. The final accuracy of 98.28% (95% confidence interval = 96.93 - 99.65), sensitivity of 99.71% (95% confidence interval = 99.14 - 100), specificity of 97.21% (95% confidence interval = 95.01 - 99.41), Negative Predictive Value (NPV) 99.5% and Positive Predictive Value (PPV) 98.3%. These results are now summarized in a dedicated table entitled “Diagnostic Performance of the Multimodal ResNet50–MPNet Model” to improve clarity and clinical interpretability. We have revised the manuscript in accordance with all the reviewers’ comments. Thank you once again for your constructive guidance. Please let us know if any further clarification or revisions are required. Warm regards, Alida Widiawaty Faculty of Medicine, Universitas Riau, Pekanbaru, 28133, Indonesia The Doctoral Program in Medical Sciences, Faculty of Medicine Universitas Indonesia, Jakarta, 10430, Indonesia Dear Tomasz Krzywicki University of Warmia and Mazury in Olsztyn, Olsztyn, Warmian-Masurian Voivodeship, Poland We thank the reviewer for the thorough evaluation of our manuscript and for the constructive comments that have substantially improved the clarity, transparency, and methodological rigor of the study. All points raised have been carefully addressed, and the manuscript has been revised accordingly. 1. Clarification of clinical information Reviewer comment: It is worth specifying at the beginning what kind of clinical information was included in the text data. Was there information that was unobservable from the point of view of the visual skin analysis, which meant that it was not correlated with the information contained in the photos? Response: Thank you for this valuable suggestion. We have clarified the clinical variables included in the textual modality at the beginning of the Methods section. Specifically, clinical information incorporated into the text data for non–atopic dermatitis (non-AD) cases comprised sex, age, chief complaint with onset, history of exposure to allergens or irritants, source of infection, current triggering factors, duration of illness, lesion location, past medical history, and family medical history. For atopic dermatitis (AD) cases, additional inputs included major and minor diagnostic criteria. Importantly, several of these variables—such as symptom onset, exposure history, triggering factors, and family history—are not directly observable from visual skin analysis and therefore provide complementary, non-visual clinical context beyond the information contained in the images. 2. Clarification of the specialists' experience Reviewer comment: It is worth clarifying what experience the specialists have had in describing the data. Response: Thank you for this suggestion. We have clarified the expertise of the annotators in the Methods section. Specifically, all images were independently annotated by two board-certified dermatologists, each with over 20 years of clinical experience in inflammatory dermatoses, achieving 100% inter-rater agreement. 3. Clarification of how the photo descriptions was selected Reviewer comment: Is it worth clarifying how the ground truth of the photo descriptions was selected? What would be the procedure if the specialists (with a completely independent evaluation) assigned different ratings to the photos? Response: Thank you for this comment. Ground truth photo descriptions were established based on independent annotations performed by two board-certified dermatologists. Complete inter-rater agreement (100%) was achieved across all images; therefore, all annotated photo descriptions were retained for analysis. We have added clarification that, in the event of discrepant ratings, images with discordant annotations and their associated clinical data would have been excluded from the dataset to avoid introducing ambiguity in the ground truth labels. 4. Revision of the results section Reviewer comment: Sections regarding descriptions of dataset characteristics, details of training models and initial data preparation should be moved from "Results" to "Methods" or create a separate chapter, e.g. "Materials". The details of the training do not apply to the results. This chapter should contain the final results. Response: Thank you for this comment. We have revised the manuscript structure by moving the descriptions of dataset characteristics, model training details, and initial data preparation from the Results section to a separate chapter entitled Materials, as suggested. The Results section has been streamlined to present only the final performance outcomes of the models. 5. Clarification of the comparison between ResNet and Vision Transformer (ViT) Reviewer comment: Table 2 should be included in the paragraph with the first reference to. In this table, the authors present the result of the comparison of the accuracy of the classification obtained on the ViT and ResNet architectures. It is worth mentioning that these results, with the current data set, should not be summarised with each other. One of the important requirements of the Transformer architecture is a sufficiently large set of training data, where most often the minimum requirements apply to several hundred thousand images, and reasonably, at least a million. With such a small dataset, the ViT architecture is doomed to failure. With such a small dataset, other CNN-based architectures should be compared, e.g. ResNet, Inception and Xception. Response: Thank you for this valuable comment. Table 2 has been relocated to appear immediately after its first mention in the text. In response to the reviewer’s concern, the direct performance comparison with the Vision Transformer (ViT) architecture has been removed from Table 2. We have also revised the Methods section to clarify that the ViT model was included for exploratory purposes only. Given the limited dataset size, ViT was not expected to achieve optimal performance, as transformer-based architectures generally require substantially larger training datasets. Accordingly, ViT results were not used as a basis for direct performance comparison with CNN-based models. In addition, the Discussion section has been expanded to explicitly state that any comparison between CNN-based architectures and ViT should be interpreted with caution. The relatively small dataset in this study likely constrained the performance of the ViT model, consistent with the known data requirements of transformer-based approaches. 6. Clarification of the final multimodal architecture and information about the training Reviewer comment: The article lacks a coherent scheme presenting the final multimodal architecture and information about the training. Yes, Figure 3 presents a complete flow from data collection stage to inference. However, there is no information about the final model itself. Were the models that process the image and text learned together with the final classifier, jointly correcting errors? Or is the final classifier a separate model that classifies independent image and text inputs? Response: Thank you for this comment. We have clarified the final multimodal architecture and training strategy in the Methods section. Once ResNet50 and MPNet processed their respective modalities and generated modality-specific feature embeddings, the resulting vectors were concatenated to form a unified multimodal representation. This late-fusion strategy integrates fine-grained visual information from images with contextual information derived from clinical text. The image and text encoders were trained independently, and their parameters were kept fixed during multimodal training. The concatenated feature vector was subsequently passed through several fully connected layers, which were trained as a separate classifier to distinguish between atopic dermatitis (AD) and non–atopic dermatitis (non-AD) cases. No end-to-end joint optimization across modalities was performed. 7. Revision of results section and removal of redundant figures Reviewer comment: Figures 1 and 2 only provide information about how the quality of the classification indicators changed during the training iterations. In my opinion, they do not contribute anything significant to the results. In addition, Figure 1 shows the features of overfitting model based on the ResNet architecture, which raises serious doubts about the reliability of the results. Response: Thank you for this insightful comment. We agree that Figures 1 and 2 primarily illustrate training dynamics rather than final model performance and do not add substantial value to the presentation of the results. Moreover, as the learning curves may raise concerns regarding overfitting, we have removed Figures 1 and 2 from the revised manuscript. The Results section has been refocused on the final evaluation metrics obtained on the test set, which more accurately reflect the clinical performance of the proposed models. 8. Handling Class Imbalance and Evaluation Metrics Reviewer comment: The dataset used in the experiment was unbalanced in terms of the number of photos in decision classes. The authors do not specify how they solved this problem in the context of training and evaluating model results. According to the names of the quality measures, the authors refer to their global versions intended for balanced datasets. Response: Thank you for this comment. The dataset was imbalanced with respect to the number of samples per class. To address this issue during model development, we have added information indicating that stratified splitting was applied to preserve class proportions across the training, validation, and test sets. For performance evaluation, class-imbalance–aware metrics were used, including weighted precision, weighted recall, and weighted F1-score, in addition to overall accuracy. These weighted metrics compute class-wise scores and aggregate them according to class prevalence, thereby providing a more reliable assessment under imbalanced data conditions. 9. Inclusion of research flow diagrams Reviewer comment: Figures 4 and 5 are trivial and contribute nothing but to the repetition of the content of the previous paragraphs. Response: Thank you for this comment. Figures 2 and 3 (previously Figures 4 and 5) were included to comply with the STARD 2015 reporting guidelines, specifically the recommended flow of participants diagram. These figures provide a transparent visual summary of the study flow, including participant inclusion and data processing steps, which may not be fully conveyed through narrative text alone. 10. Addition of confidence intervals and diagnostic performance table Reviewer comment: The final results of the accuracy of clinical models are standard given in confidence intervals at least using typical statistical indicators: sensitivity, specificity, PPV and NPV. For better reception, it is worth listing them in the table. Thank you for this important comment. We have revised the manuscript to report the final diagnostic performance of the multimodal ResNet50–MPNet model using standard clinical metrics, including accuracy, sensitivity, specificity, PPV, and NPV, each accompanied by 95% confidence intervals. The final accuracy of 98.28% (95% confidence interval = 96.93 - 99.65), sensitivity of 99.71% (95% confidence interval = 99.14 - 100), specificity of 97.21% (95% confidence interval = 95.01 - 99.41), Negative Predictive Value (NPV) 99.5% and Positive Predictive Value (PPV) 98.3%. These results are now summarized in a dedicated table entitled “Diagnostic Performance of the Multimodal ResNet50–MPNet Model” to improve clarity and clinical interpretability. We have revised the manuscript in accordance with all the reviewers’ comments. Thank you once again for your constructive guidance. Please let us know if any further clarification or revisions are required. Warm regards, Alida Widiawaty Faculty of Medicine, Universitas Riau, Pekanbaru, 28133, Indonesia The Doctoral Program in Medical Sciences, Faculty of Medicine Universitas Indonesia, Jakarta, 10430, Indonesia Competing Interests: No competing interests were disclosed. Close Report a concern Respond or Comment COMMENTS ON THIS REPORT Author Response 09 Feb 2026 Alida Widiawaty , Faculty of Medicine, Universitas Riau, Pekanbaru, Indonesia 09 Feb 2026 Author Response Dear Tomasz Krzywicki University of Warmia and Mazury in Olsztyn, Olsztyn, Warmian-Masurian Voivodeship, Poland We thank the reviewer for the thorough evaluation of our manuscript and for the constructive ... Continue reading Dear Tomasz Krzywicki University of Warmia and Mazury in Olsztyn, Olsztyn, Warmian-Masurian Voivodeship, Poland We thank the reviewer for the thorough evaluation of our manuscript and for the constructive comments that have substantially improved the clarity, transparency, and methodological rigor of the study. All points raised have been carefully addressed, and the manuscript has been revised accordingly. 1. Clarification of clinical information Reviewer comment: It is worth specifying at the beginning what kind of clinical information was included in the text data. Was there information that was unobservable from the point of view of the visual skin analysis, which meant that it was not correlated with the information contained in the photos? Response: Thank you for this valuable suggestion. We have clarified the clinical variables included in the textual modality at the beginning of the Methods section. Specifically, clinical information incorporated into the text data for non–atopic dermatitis (non-AD) cases comprised sex, age, chief complaint with onset, history of exposure to allergens or irritants, source of infection, current triggering factors, duration of illness, lesion location, past medical history, and family medical history. For atopic dermatitis (AD) cases, additional inputs included major and minor diagnostic criteria. Importantly, several of these variables—such as symptom onset, exposure history, triggering factors, and family history—are not directly observable from visual skin analysis and therefore provide complementary, non-visual clinical context beyond the information contained in the images. 2. Clarification of the specialists' experience Reviewer comment: It is worth clarifying what experience the specialists have had in describing the data. Response: Thank you for this suggestion. We have clarified the expertise of the annotators in the Methods section. Specifically, all images were independently annotated by two board-certified dermatologists, each with over 20 years of clinical experience in inflammatory dermatoses, achieving 100% inter-rater agreement. 3. Clarification of how the photo descriptions was selected Reviewer comment: Is it worth clarifying how the ground truth of the photo descriptions was selected? What would be the procedure if the specialists (with a completely independent evaluation) assigned different ratings to the photos? Response: Thank you for this comment. Ground truth photo descriptions were established based on independent annotations performed by two board-certified dermatologists. Complete inter-rater agreement (100%) was achieved across all images; therefore, all annotated photo descriptions were retained for analysis. We have added clarification that, in the event of discrepant ratings, images with discordant annotations and their associated clinical data would have been excluded from the dataset to avoid introducing ambiguity in the ground truth labels. 4. Revision of the results section Reviewer comment: Sections regarding descriptions of dataset characteristics, details of training models and initial data preparation should be moved from "Results" to "Methods" or create a separate chapter, e.g. "Materials". The details of the training do not apply to the results. This chapter should contain the final results. Response: Thank you for this comment. We have revised the manuscript structure by moving the descriptions of dataset characteristics, model training details, and initial data preparation from the Results section to a separate chapter entitled Materials, as suggested. The Results section has been streamlined to present only the final performance outcomes of the models. 5. Clarification of the comparison between ResNet and Vision Transformer (ViT) Reviewer comment: Table 2 should be included in the paragraph with the first reference to. In this table, the authors present the result of the comparison of the accuracy of the classification obtained on the ViT and ResNet architectures. It is worth mentioning that these results, with the current data set, should not be summarised with each other. One of the important requirements of the Transformer architecture is a sufficiently large set of training data, where most often the minimum requirements apply to several hundred thousand images, and reasonably, at least a million. With such a small dataset, the ViT architecture is doomed to failure. With such a small dataset, other CNN-based architectures should be compared, e.g. ResNet, Inception and Xception. Response: Thank you for this valuable comment. Table 2 has been relocated to appear immediately after its first mention in the text. In response to the reviewer’s concern, the direct performance comparison with the Vision Transformer (ViT) architecture has been removed from Table 2. We have also revised the Methods section to clarify that the ViT model was included for exploratory purposes only. Given the limited dataset size, ViT was not expected to achieve optimal performance, as transformer-based architectures generally require substantially larger training datasets. Accordingly, ViT results were not used as a basis for direct performance comparison with CNN-based models. In addition, the Discussion section has been expanded to explicitly state that any comparison between CNN-based architectures and ViT should be interpreted with caution. The relatively small dataset in this study likely constrained the performance of the ViT model, consistent with the known data requirements of transformer-based approaches. 6. Clarification of the final multimodal architecture and information about the training Reviewer comment: The article lacks a coherent scheme presenting the final multimodal architecture and information about the training. Yes, Figure 3 presents a complete flow from data collection stage to inference. However, there is no information about the final model itself. Were the models that process the image and text learned together with the final classifier, jointly correcting errors? Or is the final classifier a separate model that classifies independent image and text inputs? Response: Thank you for this comment. We have clarified the final multimodal architecture and training strategy in the Methods section. Once ResNet50 and MPNet processed their respective modalities and generated modality-specific feature embeddings, the resulting vectors were concatenated to form a unified multimodal representation. This late-fusion strategy integrates fine-grained visual information from images with contextual information derived from clinical text. The image and text encoders were trained independently, and their parameters were kept fixed during multimodal training. The concatenated feature vector was subsequently passed through several fully connected layers, which were trained as a separate classifier to distinguish between atopic dermatitis (AD) and non–atopic dermatitis (non-AD) cases. No end-to-end joint optimization across modalities was performed. 7. Revision of results section and removal of redundant figures Reviewer comment: Figures 1 and 2 only provide information about how the quality of the classification indicators changed during the training iterations. In my opinion, they do not contribute anything significant to the results. In addition, Figure 1 shows the features of overfitting model based on the ResNet architecture, which raises serious doubts about the reliability of the results. Response: Thank you for this insightful comment. We agree that Figures 1 and 2 primarily illustrate training dynamics rather than final model performance and do not add substantial value to the presentation of the results. Moreover, as the learning curves may raise concerns regarding overfitting, we have removed Figures 1 and 2 from the revised manuscript. The Results section has been refocused on the final evaluation metrics obtained on the test set, which more accurately reflect the clinical performance of the proposed models. 8. Handling Class Imbalance and Evaluation Metrics Reviewer comment: The dataset used in the experiment was unbalanced in terms of the number of photos in decision classes. The authors do not specify how they solved this problem in the context of training and evaluating model results. According to the names of the quality measures, the authors refer to their global versions intended for balanced datasets. Response: Thank you for this comment. The dataset was imbalanced with respect to the number of samples per class. To address this issue during model development, we have added information indicating that stratified splitting was applied to preserve class proportions across the training, validation, and test sets. For performance evaluation, class-imbalance–aware metrics were used, including weighted precision, weighted recall, and weighted F1-score, in addition to overall accuracy. These weighted metrics compute class-wise scores and aggregate them according to class prevalence, thereby providing a more reliable assessment under imbalanced data conditions. 9. Inclusion of research flow diagrams Reviewer comment: Figures 4 and 5 are trivial and contribute nothing but to the repetition of the content of the previous paragraphs. Response: Thank you for this comment. Figures 2 and 3 (previously Figures 4 and 5) were included to comply with the STARD 2015 reporting guidelines, specifically the recommended flow of participants diagram. These figures provide a transparent visual summary of the study flow, including participant inclusion and data processing steps, which may not be fully conveyed through narrative text alone. 10. Addition of confidence intervals and diagnostic performance table Reviewer comment: The final results of the accuracy of clinical models are standard given in confidence intervals at least using typical statistical indicators: sensitivity, specificity, PPV and NPV. For better reception, it is worth listing them in the table. Thank you for this important comment. We have revised the manuscript to report the final diagnostic performance of the multimodal ResNet50–MPNet model using standard clinical metrics, including accuracy, sensitivity, specificity, PPV, and NPV, each accompanied by 95% confidence intervals. The final accuracy of 98.28% (95% confidence interval = 96.93 - 99.65), sensitivity of 99.71% (95% confidence interval = 99.14 - 100), specificity of 97.21% (95% confidence interval = 95.01 - 99.41), Negative Predictive Value (NPV) 99.5% and Positive Predictive Value (PPV) 98.3%. These results are now summarized in a dedicated table entitled “Diagnostic Performance of the Multimodal ResNet50–MPNet Model” to improve clarity and clinical interpretability. We have revised the manuscript in accordance with all the reviewers’ comments. Thank you once again for your constructive guidance. Please let us know if any further clarification or revisions are required. Warm regards, Alida Widiawaty Faculty of Medicine, Universitas Riau, Pekanbaru, 28133, Indonesia The Doctoral Program in Medical Sciences, Faculty of Medicine Universitas Indonesia, Jakarta, 10430, Indonesia Dear Tomasz Krzywicki University of Warmia and Mazury in Olsztyn, Olsztyn, Warmian-Masurian Voivodeship, Poland We thank the reviewer for the thorough evaluation of our manuscript and for the constructive comments that have substantially improved the clarity, transparency, and methodological rigor of the study. All points raised have been carefully addressed, and the manuscript has been revised accordingly. 1. Clarification of clinical information Reviewer comment: It is worth specifying at the beginning what kind of clinical information was included in the text data. Was there information that was unobservable from the point of view of the visual skin analysis, which meant that it was not correlated with the information contained in the photos? Response: Thank you for this valuable suggestion. We have clarified the clinical variables included in the textual modality at the beginning of the Methods section. Specifically, clinical information incorporated into the text data for non–atopic dermatitis (non-AD) cases comprised sex, age, chief complaint with onset, history of exposure to allergens or irritants, source of infection, current triggering factors, duration of illness, lesion location, past medical history, and family medical history. For atopic dermatitis (AD) cases, additional inputs included major and minor diagnostic criteria. Importantly, several of these variables—such as symptom onset, exposure history, triggering factors, and family history—are not directly observable from visual skin analysis and therefore provide complementary, non-visual clinical context beyond the information contained in the images. 2. Clarification of the specialists' experience Reviewer comment: It is worth clarifying what experience the specialists have had in describing the data. Response: Thank you for this suggestion. We have clarified the expertise of the annotators in the Methods section. Specifically, all images were independently annotated by two board-certified dermatologists, each with over 20 years of clinical experience in inflammatory dermatoses, achieving 100% inter-rater agreement. 3. Clarification of how the photo descriptions was selected Reviewer comment: Is it worth clarifying how the ground truth of the photo descriptions was selected? What would be the procedure if the specialists (with a completely independent evaluation) assigned different ratings to the photos? Response: Thank you for this comment. Ground truth photo descriptions were established based on independent annotations performed by two board-certified dermatologists. Complete inter-rater agreement (100%) was achieved across all images; therefore, all annotated photo descriptions were retained for analysis. We have added clarification that, in the event of discrepant ratings, images with discordant annotations and their associated clinical data would have been excluded from the dataset to avoid introducing ambiguity in the ground truth labels. 4. Revision of the results section Reviewer comment: Sections regarding descriptions of dataset characteristics, details of training models and initial data preparation should be moved from "Results" to "Methods" or create a separate chapter, e.g. "Materials". The details of the training do not apply to the results. This chapter should contain the final results. Response: Thank you for this comment. We have revised the manuscript structure by moving the descriptions of dataset characteristics, model training details, and initial data preparation from the Results section to a separate chapter entitled Materials, as suggested. The Results section has been streamlined to present only the final performance outcomes of the models. 5. Clarification of the comparison between ResNet and Vision Transformer (ViT) Reviewer comment: Table 2 should be included in the paragraph with the first reference to. In this table, the authors present the result of the comparison of the accuracy of the classification obtained on the ViT and ResNet architectures. It is worth mentioning that these results, with the current data set, should not be summarised with each other. One of the important requirements of the Transformer architecture is a sufficiently large set of training data, where most often the minimum requirements apply to several hundred thousand images, and reasonably, at least a million. With such a small dataset, the ViT architecture is doomed to failure. With such a small dataset, other CNN-based architectures should be compared, e.g. ResNet, Inception and Xception. Response: Thank you for this valuable comment. Table 2 has been relocated to appear immediately after its first mention in the text. In response to the reviewer’s concern, the direct performance comparison with the Vision Transformer (ViT) architecture has been removed from Table 2. We have also revised the Methods section to clarify that the ViT model was included for exploratory purposes only. Given the limited dataset size, ViT was not expected to achieve optimal performance, as transformer-based architectures generally require substantially larger training datasets. Accordingly, ViT results were not used as a basis for direct performance comparison with CNN-based models. In addition, the Discussion section has been expanded to explicitly state that any comparison between CNN-based architectures and ViT should be interpreted with caution. The relatively small dataset in this study likely constrained the performance of the ViT model, consistent with the known data requirements of transformer-based approaches. 6. Clarification of the final multimodal architecture and information about the training Reviewer comment: The article lacks a coherent scheme presenting the final multimodal architecture and information about the training. Yes, Figure 3 presents a complete flow from data collection stage to inference. However, there is no information about the final model itself. Were the models that process the image and text learned together with the final classifier, jointly correcting errors? Or is the final classifier a separate model that classifies independent image and text inputs? Response: Thank you for this comment. We have clarified the final multimodal architecture and training strategy in the Methods section. Once ResNet50 and MPNet processed their respective modalities and generated modality-specific feature embeddings, the resulting vectors were concatenated to form a unified multimodal representation. This late-fusion strategy integrates fine-grained visual information from images with contextual information derived from clinical text. The image and text encoders were trained independently, and their parameters were kept fixed during multimodal training. The concatenated feature vector was subsequently passed through several fully connected layers, which were trained as a separate classifier to distinguish between atopic dermatitis (AD) and non–atopic dermatitis (non-AD) cases. No end-to-end joint optimization across modalities was performed. 7. Revision of results section and removal of redundant figures Reviewer comment: Figures 1 and 2 only provide information about how the quality of the classification indicators changed during the training iterations. In my opinion, they do not contribute anything significant to the results. In addition, Figure 1 shows the features of overfitting model based on the ResNet architecture, which raises serious doubts about the reliability of the results. Response: Thank you for this insightful comment. We agree that Figures 1 and 2 primarily illustrate training dynamics rather than final model performance and do not add substantial value to the presentation of the results. Moreover, as the learning curves may raise concerns regarding overfitting, we have removed Figures 1 and 2 from the revised manuscript. The Results section has been refocused on the final evaluation metrics obtained on the test set, which more accurately reflect the clinical performance of the proposed models. 8. Handling Class Imbalance and Evaluation Metrics Reviewer comment: The dataset used in the experiment was unbalanced in terms of the number of photos in decision classes. The authors do not specify how they solved this problem in the context of training and evaluating model results. According to the names of the quality measures, the authors refer to their global versions intended for balanced datasets. Response: Thank you for this comment. The dataset was imbalanced with respect to the number of samples per class. To address this issue during model development, we have added information indicating that stratified splitting was applied to preserve class proportions across the training, validation, and test sets. For performance evaluation, class-imbalance–aware metrics were used, including weighted precision, weighted recall, and weighted F1-score, in addition to overall accuracy. These weighted metrics compute class-wise scores and aggregate them according to class prevalence, thereby providing a more reliable assessment under imbalanced data conditions. 9. Inclusion of research flow diagrams Reviewer comment: Figures 4 and 5 are trivial and contribute nothing but to the repetition of the content of the previous paragraphs. Response: Thank you for this comment. Figures 2 and 3 (previously Figures 4 and 5) were included to comply with the STARD 2015 reporting guidelines, specifically the recommended flow of participants diagram. These figures provide a transparent visual summary of the study flow, including participant inclusion and data processing steps, which may not be fully conveyed through narrative text alone. 10. Addition of confidence intervals and diagnostic performance table Reviewer comment: The final results of the accuracy of clinical models are standard given in confidence intervals at least using typical statistical indicators: sensitivity, specificity, PPV and NPV. For better reception, it is worth listing them in the table. Thank you for this important comment. We have revised the manuscript to report the final diagnostic performance of the multimodal ResNet50–MPNet model using standard clinical metrics, including accuracy, sensitivity, specificity, PPV, and NPV, each accompanied by 95% confidence intervals. The final accuracy of 98.28% (95% confidence interval = 96.93 - 99.65), sensitivity of 99.71% (95% confidence interval = 99.14 - 100), specificity of 97.21% (95% confidence interval = 95.01 - 99.41), Negative Predictive Value (NPV) 99.5% and Positive Predictive Value (PPV) 98.3%. These results are now summarized in a dedicated table entitled “Diagnostic Performance of the Multimodal ResNet50–MPNet Model” to improve clarity and clinical interpretability. We have revised the manuscript in accordance with all the reviewers’ comments. Thank you once again for your constructive guidance. Please let us know if any further clarification or revisions are required. Warm regards, Alida Widiawaty Faculty of Medicine, Universitas Riau, Pekanbaru, 28133, Indonesia The Doctoral Program in Medical Sciences, Faculty of Medicine Universitas Indonesia, Jakarta, 10430, Indonesia Competing Interests: No competing interests were disclosed. Close Report a concern COMMENT ON THIS REPORT Views 0 Cite How to cite this report: Sitaru S. Reviewer Report For: Multimodal Machine Learning Approach for Diagnosing Atopic Dermatitis [version 1; peer review: 1 approved, 1 approved with reservations] . F1000Research 2025, 14 :952 ( https://doi.org/10.5256/f1000research.186388.r420623 ) The direct URL for this report is: https://f1000research.com/articles/14-952/v1#referee-response-420623 NOTE: it is important to ensure the information in square brackets after the title is included in this citation. Close Copy Citation Details Reviewer Report 29 Oct 2025 Sebastian Sitaru , Technical University of Munich, Munich, Munich, Germany Approved VIEWS 0 https://doi.org/10.5256/f1000research.186388.r420623 In their manuscript, the authors describe the creation and validation of a multimodal image-text AI algorithm for the diagnosis of atopic dermatitis. The topic is highly relevant and the technical approach seems sound. The manuscript is overall ... Continue reading READ ALL In their manuscript, the authors describe the creation and validation of a multimodal image-text AI algorithm for the diagnosis of atopic dermatitis. The topic is highly relevant and the technical approach seems sound. The manuscript is overall well written and concise. It is commendable that the authors decided to share their source code. I have a couple of minor points which could be improved before Indexing: - In the methods it says, "Two board-certified dermatologists independently annotated all images". Do you mean all cases, so image+text? Or did they just annotate the images alone? - Was the skin tone of the patients recorded? Even if not, I think this point deserves a mention in the discussion Is the work clearly and accurately presented and does it cite the current literature? Yes Is the study design appropriate and is the work technically sound? Yes Are sufficient details of methods and analysis provided to allow replication by others? Yes If applicable, is the statistical analysis and its interpretation appropriate? Yes Are all the source data underlying the results available to ensure full reproducibility? Yes Are the conclusions drawn adequately supported by the results? Yes Competing Interests: No competing interests were disclosed. Reviewer Expertise: Data analysis and AI applications in dermatology I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard. Close READ LESS CITE CITE HOW TO CITE THIS REPORT Sitaru S. Reviewer Report For: Multimodal Machine Learning Approach for Diagnosing Atopic Dermatitis [version 1; peer review: 1 approved, 1 approved with reservations] . F1000Research 2025, 14 :952 ( https://doi.org/10.5256/f1000research.186388.r420623 ) The direct URL for this report is: https://f1000research.com/articles/14-952/v1#referee-response-420623 NOTE: it is important to ensure the information in square brackets after the title is included in all citations of this article. COPY CITATION DETAILS Report a concern Author Response 09 Feb 2026 Alida Widiawaty , Faculty of Medicine, Universitas Riau, Pekanbaru, Indonesia 09 Feb 2026 Author Response Dear Sebastian Sitaru Technical University of Munich, Munich, Germany We thank the reviewer for the thorough evaluation of our manuscript and for the constructive comments that have substantially improved ... Continue reading Dear Sebastian Sitaru Technical University of Munich, Munich, Germany We thank the reviewer for the thorough evaluation of our manuscript and for the constructive comments that have substantially improved the clarity, transparency, and methodological rigor of the study. All points raised have been carefully addressed, and the manuscript has been revised accordingly. 1. Clarification of annotation scope Reviewer comment: In the methods it says, "Two board-certified dermatologists independently annotated all images". Do you mean all cases, so image + text? Or did they just annotate the images alone? Response: Thank you for this insightful comment. We have clarified this point in the manuscript to state that two board-certified dermatologists independently annotated both the clinical images and the corresponding text data for all cases. 2. Clarification of patients' skin tone Reviewer comment: Was the skin tone of the patients recorded? Even if not, I think this point deserves a mention in the discussion Response: Thank you for this comment. Skin tone was not explicitly recorded as a standalone variable in this study. However, the study population predominantly consisted of Indonesian patients, who generally fall within Fitzpatrick skin phototypes III–IV. Within this relatively homogeneous skin tone range, no systematic variation in clinical presentation or image-based model performance attributable to skin tone was observed. Therefore, skin tone was not considered a confounding factor influencing the study outcomes. Nonetheless, we acknowledge in the Discussion that external validation in cohorts with a broader range of Fitzpatrick skin types would be valuable to confirm the model’s robustness across more diverse populations. We have revised the manuscript in accordance with all the reviewers’ comments. Thank you once again for your constructive guidance. Please let us know if any further clarification or revisions are required. Warm regards, Alida Widiawaty Faculty of Medicine, Universitas Riau, Pekanbaru, 28133, Indonesia The Doctoral Program in Medical Sciences, Faculty of Medicine Universitas Indonesia, Jakarta, 10430, Indonesia Dear Sebastian Sitaru Technical University of Munich, Munich, Germany We thank the reviewer for the thorough evaluation of our manuscript and for the constructive comments that have substantially improved the clarity, transparency, and methodological rigor of the study. All points raised have been carefully addressed, and the manuscript has been revised accordingly. 1. Clarification of annotation scope Reviewer comment: In the methods it says, "Two board-certified dermatologists independently annotated all images". Do you mean all cases, so image + text? Or did they just annotate the images alone? Response: Thank you for this insightful comment. We have clarified this point in the manuscript to state that two board-certified dermatologists independently annotated both the clinical images and the corresponding text data for all cases. 2. Clarification of patients' skin tone Reviewer comment: Was the skin tone of the patients recorded? Even if not, I think this point deserves a mention in the discussion Response: Thank you for this comment. Skin tone was not explicitly recorded as a standalone variable in this study. However, the study population predominantly consisted of Indonesian patients, who generally fall within Fitzpatrick skin phototypes III–IV. Within this relatively homogeneous skin tone range, no systematic variation in clinical presentation or image-based model performance attributable to skin tone was observed. Therefore, skin tone was not considered a confounding factor influencing the study outcomes. Nonetheless, we acknowledge in the Discussion that external validation in cohorts with a broader range of Fitzpatrick skin types would be valuable to confirm the model’s robustness across more diverse populations. We have revised the manuscript in accordance with all the reviewers’ comments. Thank you once again for your constructive guidance. Please let us know if any further clarification or revisions are required. Warm regards, Alida Widiawaty Faculty of Medicine, Universitas Riau, Pekanbaru, 28133, Indonesia The Doctoral Program in Medical Sciences, Faculty of Medicine Universitas Indonesia, Jakarta, 10430, Indonesia Competing Interests: No competing interests were disclosed. Close Report a concern Respond or Comment COMMENTS ON THIS REPORT Author Response 09 Feb 2026 Alida Widiawaty , Faculty of Medicine, Universitas Riau, Pekanbaru, Indonesia 09 Feb 2026 Author Response Dear Sebastian Sitaru Technical University of Munich, Munich, Germany We thank the reviewer for the thorough evaluation of our manuscript and for the constructive comments that have substantially improved ... Continue reading Dear Sebastian Sitaru Technical University of Munich, Munich, Germany We thank the reviewer for the thorough evaluation of our manuscript and for the constructive comments that have substantially improved the clarity, transparency, and methodological rigor of the study. All points raised have been carefully addressed, and the manuscript has been revised accordingly. 1. Clarification of annotation scope Reviewer comment: In the methods it says, "Two board-certified dermatologists independently annotated all images". Do you mean all cases, so image + text? Or did they just annotate the images alone? Response: Thank you for this insightful comment. We have clarified this point in the manuscript to state that two board-certified dermatologists independently annotated both the clinical images and the corresponding text data for all cases. 2. Clarification of patients' skin tone Reviewer comment: Was the skin tone of the patients recorded? Even if not, I think this point deserves a mention in the discussion Response: Thank you for this comment. Skin tone was not explicitly recorded as a standalone variable in this study. However, the study population predominantly consisted of Indonesian patients, who generally fall within Fitzpatrick skin phototypes III–IV. Within this relatively homogeneous skin tone range, no systematic variation in clinical presentation or image-based model performance attributable to skin tone was observed. Therefore, skin tone was not considered a confounding factor influencing the study outcomes. Nonetheless, we acknowledge in the Discussion that external validation in cohorts with a broader range of Fitzpatrick skin types would be valuable to confirm the model’s robustness across more diverse populations. We have revised the manuscript in accordance with all the reviewers’ comments. Thank you once again for your constructive guidance. Please let us know if any further clarification or revisions are required. Warm regards, Alida Widiawaty Faculty of Medicine, Universitas Riau, Pekanbaru, 28133, Indonesia The Doctoral Program in Medical Sciences, Faculty of Medicine Universitas Indonesia, Jakarta, 10430, Indonesia Dear Sebastian Sitaru Technical University of Munich, Munich, Germany We thank the reviewer for the thorough evaluation of our manuscript and for the constructive comments that have substantially improved the clarity, transparency, and methodological rigor of the study. All points raised have been carefully addressed, and the manuscript has been revised accordingly. 1. Clarification of annotation scope Reviewer comment: In the methods it says, "Two board-certified dermatologists independently annotated all images". Do you mean all cases, so image + text? Or did they just annotate the images alone? Response: Thank you for this insightful comment. We have clarified this point in the manuscript to state that two board-certified dermatologists independently annotated both the clinical images and the corresponding text data for all cases. 2. Clarification of patients' skin tone Reviewer comment: Was the skin tone of the patients recorded? Even if not, I think this point deserves a mention in the discussion Response: Thank you for this comment. Skin tone was not explicitly recorded as a standalone variable in this study. However, the study population predominantly consisted of Indonesian patients, who generally fall within Fitzpatrick skin phototypes III–IV. Within this relatively homogeneous skin tone range, no systematic variation in clinical presentation or image-based model performance attributable to skin tone was observed. Therefore, skin tone was not considered a confounding factor influencing the study outcomes. Nonetheless, we acknowledge in the Discussion that external validation in cohorts with a broader range of Fitzpatrick skin types would be valuable to confirm the model’s robustness across more diverse populations. We have revised the manuscript in accordance with all the reviewers’ comments. Thank you once again for your constructive guidance. Please let us know if any further clarification or revisions are required. Warm regards, Alida Widiawaty Faculty of Medicine, Universitas Riau, Pekanbaru, 28133, Indonesia The Doctoral Program in Medical Sciences, Faculty of Medicine Universitas Indonesia, Jakarta, 10430, Indonesia Competing Interests: No competing interests were disclosed. Close Report a concern COMMENT ON THIS REPORT Comments on this article Comments (0) Version 2 VERSION 2 PUBLISHED 19 Sep 2025 ADD YOUR COMMENT Comment keyboard_arrow_left keyboard_arrow_right Open Peer Review Reviewer Status info_outline Alongside their report, reviewers assign a status to the article: Approved The paper is scientifically sound in its current form and only minor, if any, improvements are suggested Approved with reservations A number of small changes, sometimes more significant revisions are required to address specific details and improve the papers academic merit. Not approved Fundamental flaws in the paper seriously undermine the findings and conclusions Reviewer Reports Invited Reviewers 1 2 Version 2 (revision) 09 Feb 26 read Version 1 19 Sep 25 read read Sebastian Sitaru , Technical University of Munich, Munich, Germany Tomasz Krzywicki , University of Warmia and Mazury in Olsztyn, Olsztyn, Poland Comments on this article All Comments (0) Add a comment Sign up for content alerts Sign Up You are now signed up to receive this alert Browse by related subjects keyboard_arrow_left Back to all reports Reviewer Report 0 Views copyright © 2026 Krzywicki T. This is an open access peer review report distributed under the terms of the Creative Commons Attribution License , which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited. 17 Feb 2026 | for Version 2 Tomasz Krzywicki , University of Warmia and Mazury in Olsztyn, Olsztyn, Warmian-Masurian Voivodeship, Poland 0 Views copyright © 2026 Krzywicki T. This is an open access peer review report distributed under the terms of the Creative Commons Attribution License , which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited. format_quote Cite this report speaker_notes Responses (0) Approved info_outline Alongside their report, reviewers assign a status to the article: Approved The paper is scientifically sound in its current form and only minor, if any, improvements are suggested Approved with reservations A number of small changes, sometimes more significant revisions are required to address specific details and improve the papers academic merit. Not approved Fundamental flaws in the paper seriously undermine the findings and conclusions I thank the authors for addressing my comments. The article now looks much better. I have no further comments. Competing Interests No competing interests were disclosed. Reviewer Expertise computer vision, deep learning, reinforcement learning, biomedical engineering, parallel processing I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard. reply Respond to this report Responses (0) Krzywicki T. Peer Review Report For: Multimodal Machine Learning Approach for Diagnosing Atopic Dermatitis [version 1; peer review: 1 approved, 1 approved with reservations] . F1000Research 2025, 14 :952 ( https://doi.org/10.5256/f1000research.195755.r456887) NOTE: it is important to ensure the information in square brackets after the title is included in this citation. The direct URL for this report is: https://f1000research.com/articles/14-952/v2#referee-response-456887 keyboard_arrow_left Back to all reports Reviewer Report 0 Views copyright © 2026 Krzywicki T. This is an open access peer review report distributed under the terms of the Creative Commons Attribution License , which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited. 16 Jan 2026 | for Version 1 Tomasz Krzywicki , University of Warmia and Mazury in Olsztyn, Olsztyn, Warmian-Masurian Voivodeship, Poland 0 Views copyright © 2026 Krzywicki T. This is an open access peer review report distributed under the terms of the Creative Commons Attribution License , which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited. format_quote Cite this report speaker_notes Responses (1) Approved With Reservations info_outline Alongside their report, reviewers assign a status to the article: Approved The paper is scientifically sound in its current form and only minor, if any, improvements are suggested Approved with reservations A number of small changes, sometimes more significant revisions are required to address specific details and improve the papers academic merit. Not approved Fundamental flaws in the paper seriously undermine the findings and conclusions The article concerns the proposal of a solution in the form of a multimodal neural network model supporting skin diagnostics by aggregating clinical information from photos and texts. The idea of aggregation of many modalities in modelling a clinical decision is already well known in the scientific literature, and the authors used in this case the common generic families of neural network architectures: ResNet and BERT. While the article itself looks interesting, I have noticed a few flaws that the authors should refer to. It is worth specifying at the beginning what kind of clinical information was included in the text data. Was there information that was unobservable from the point of view of the visual skin analysis, which meant that it was not correlated with the information contained in the photos? It is worth clarifying what experience the specialists have had in describing the data. Is it worth clarifying how the ground truth of the photo descriptions was selected? What would be the procedure if the specialists (with a completely independent evaluation) assigned different ratings to the photos? Sections regarding descriptions of dataset characteristics, details of training models and initial data preparation should be moved from "Results" to "Methods" or create a separate chapter, e.g. "Materials". The details of the training do not apply to the results. This chapter should contain the final results. Table 2 should be included in the paragraph with the first reference to. In this table, the authors present the result of the comparison of the accuracy of the classification obtained on the ViT and ResNet architectures. It is worth mentioning that these results, with the current data set, should not be summarised with each other. One of the important requirements of the Transformer architecture is a sufficiently large set of training data, where most often the minimum requirements apply to several hundred thousand images, and reasonably, at least a million. With such a small dataset, the ViT architecture is doomed to failure. With such a small dataset, other CNN-based architectures should be compared, e.g. ResNet, Inception and Xception. The article lacks a coherent scheme presenting the final multimodal architecture and information about the training. Yes, Figure 3 presents a complete flow from data collection stage to inference. However, there is no information about the final model itself. Were the models that process the image and text learned together with the final classifier, jointly correcting errors? Or is the final classifier a separate model that classifies independent image and text inputs? Figures 1 and 2 only provide information about how the quality of the classification indicators changed during the training iterations. In my opinion, they do not contribute anything significant to the results. In addition, Figure 1 shows the features of overfitting model based on the ResNet architecture, which raises serious doubts about the reliability of the results. The dataset used in the experiment was unbalanced in terms of the number of photos in decision classes. The authors do not specify how they solved this problem in the context of training and evaluating model results. According to the names of the quality measures, the authors refer to their global versions intended for balanced datasets. Figures 4 and 5 are trivial and contribute nothing but to the repetition of the content of the previous paragraphs. The final results of the accuracy of clinical models are standard given in confidence intervals at least using typical statistical indicators: sensitivity, specificity, PPV and NPV. For better reception, it is worth listing them in the table. Is the work clearly and accurately presented and does it cite the current literature? Yes Is the study design appropriate and is the work technically sound? No Are sufficient details of methods and analysis provided to allow replication by others? No If applicable, is the statistical analysis and its interpretation appropriate? Partly Are all the source data underlying the results available to ensure full reproducibility? No Are the conclusions drawn adequately supported by the results? Partly Competing Interests No competing interests were disclosed. Reviewer Expertise computer vision, deep learning, reinforcement learning, biomedical engineering, parallel processing I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard, however I have significant reservations, as outlined above. reply Respond to this report Responses (1) Author Response 09 Feb 2026 Alida Widiawaty, Faculty of Medicine, Universitas Riau, Pekanbaru, Indonesia Dear Tomasz Krzywicki University of Warmia and Mazury in Olsztyn, Olsztyn, Warmian-Masurian Voivodeship, Poland We thank the reviewer for the thorough evaluation of our manuscript and for the constructive comments that have substantially improved the clarity, transparency, and methodological rigor of the study. All points raised have been carefully addressed, and the manuscript has been revised accordingly. 1. Clarification of clinical information Reviewer comment: It is worth specifying at the beginning what kind of clinical information was included in the text data. Was there information that was unobservable from the point of view of the visual skin analysis, which meant that it was not correlated with the information contained in the photos? Response: Thank you for this valuable suggestion. We have clarified the clinical variables included in the textual modality at the beginning of the Methods section. Specifically, clinical information incorporated into the text data for non–atopic dermatitis (non-AD) cases comprised sex, age, chief complaint with onset, history of exposure to allergens or irritants, source of infection, current triggering factors, duration of illness, lesion location, past medical history, and family medical history. For atopic dermatitis (AD) cases, additional inputs included major and minor diagnostic criteria. Importantly, several of these variables—such as symptom onset, exposure history, triggering factors, and family history—are not directly observable from visual skin analysis and therefore provide complementary, non-visual clinical context beyond the information contained in the images. 2. Clarification of the specialists' experience Reviewer comment: It is worth clarifying what experience the specialists have had in describing the data. Response: Thank you for this suggestion. We have clarified the expertise of the annotators in the Methods section. Specifically, all images were independently annotated by two board-certified dermatologists, each with over 20 years of clinical experience in inflammatory dermatoses, achieving 100% inter-rater agreement. 3. Clarification of how the photo descriptions was selected Reviewer comment: Is it worth clarifying how the ground truth of the photo descriptions was selected? What would be the procedure if the specialists (with a completely independent evaluation) assigned different ratings to the photos? Response: Thank you for this comment. Ground truth photo descriptions were established based on independent annotations performed by two board-certified dermatologists. Complete inter-rater agreement (100%) was achieved across all images; therefore, all annotated photo descriptions were retained for analysis. We have added clarification that, in the event of discrepant ratings, images with discordant annotations and their associated clinical data would have been excluded from the dataset to avoid introducing ambiguity in the ground truth labels. 4. Revision of the results section Reviewer comment: Sections regarding descriptions of dataset characteristics, details of training models and initial data preparation should be moved from "Results" to "Methods" or create a separate chapter, e.g. "Materials". The details of the training do not apply to the results. This chapter should contain the final results. Response: Thank you for this comment. We have revised the manuscript structure by moving the descriptions of dataset characteristics, model training details, and initial data preparation from the Results section to a separate chapter entitled Materials, as suggested. The Results section has been streamlined to present only the final performance outcomes of the models. 5. Clarification of the comparison between ResNet and Vision Transformer (ViT) Reviewer comment: Table 2 should be included in the paragraph with the first reference to. In this table, the authors present the result of the comparison of the accuracy of the classification obtained on the ViT and ResNet architectures. It is worth mentioning that these results, with the current data set, should not be summarised with each other. One of the important requirements of the Transformer architecture is a sufficiently large set of training data, where most often the minimum requirements apply to several hundred thousand images, and reasonably, at least a million. With such a small dataset, the ViT architecture is doomed to failure. With such a small dataset, other CNN-based architectures should be compared, e.g. ResNet, Inception and Xception. Response: Thank you for this valuable comment. Table 2 has been relocated to appear immediately after its first mention in the text. In response to the reviewer’s concern, the direct performance comparison with the Vision Transformer (ViT) architecture has been removed from Table 2. We have also revised the Methods section to clarify that the ViT model was included for exploratory purposes only. Given the limited dataset size, ViT was not expected to achieve optimal performance, as transformer-based architectures generally require substantially larger training datasets. Accordingly, ViT results were not used as a basis for direct performance comparison with CNN-based models. In addition, the Discussion section has been expanded to explicitly state that any comparison between CNN-based architectures and ViT should be interpreted with caution. The relatively small dataset in this study likely constrained the performance of the ViT model, consistent with the known data requirements of transformer-based approaches. 6. Clarification of the final multimodal architecture and information about the training Reviewer comment: The article lacks a coherent scheme presenting the final multimodal architecture and information about the training. Yes, Figure 3 presents a complete flow from data collection stage to inference. However, there is no information about the final model itself. Were the models that process the image and text learned together with the final classifier, jointly correcting errors? Or is the final classifier a separate model that classifies independent image and text inputs? Response: Thank you for this comment. We have clarified the final multimodal architecture and training strategy in the Methods section. Once ResNet50 and MPNet processed their respective modalities and generated modality-specific feature embeddings, the resulting vectors were concatenated to form a unified multimodal representation. This late-fusion strategy integrates fine-grained visual information from images with contextual information derived from clinical text. The image and text encoders were trained independently, and their parameters were kept fixed during multimodal training. The concatenated feature vector was subsequently passed through several fully connected layers, which were trained as a separate classifier to distinguish between atopic dermatitis (AD) and non–atopic dermatitis (non-AD) cases. No end-to-end joint optimization across modalities was performed. 7. Revision of results section and removal of redundant figures Reviewer comment: Figures 1 and 2 only provide information about how the quality of the classification indicators changed during the training iterations. In my opinion, they do not contribute anything significant to the results. In addition, Figure 1 shows the features of overfitting model based on the ResNet architecture, which raises serious doubts about the reliability of the results. Response: Thank you for this insightful comment. We agree that Figures 1 and 2 primarily illustrate training dynamics rather than final model performance and do not add substantial value to the presentation of the results. Moreover, as the learning curves may raise concerns regarding overfitting, we have removed Figures 1 and 2 from the revised manuscript. The Results section has been refocused on the final evaluation metrics obtained on the test set, which more accurately reflect the clinical performance of the proposed models. 8. Handling Class Imbalance and Evaluation Metrics Reviewer comment: The dataset used in the experiment was unbalanced in terms of the number of photos in decision classes. The authors do not specify how they solved this problem in the context of training and evaluating model results. According to the names of the quality measures, the authors refer to their global versions intended for balanced datasets. Response: Thank you for this comment. The dataset was imbalanced with respect to the number of samples per class. To address this issue during model development, we have added information indicating that stratified splitting was applied to preserve class proportions across the training, validation, and test sets. For performance evaluation, class-imbalance–aware metrics were used, including weighted precision, weighted recall, and weighted F1-score, in addition to overall accuracy. These weighted metrics compute class-wise scores and aggregate them according to class prevalence, thereby providing a more reliable assessment under imbalanced data conditions. 9. Inclusion of research flow diagrams Reviewer comment: Figures 4 and 5 are trivial and contribute nothing but to the repetition of the content of the previous paragraphs. Response: Thank you for this comment. Figures 2 and 3 (previously Figures 4 and 5) were included to comply with the STARD 2015 reporting guidelines, specifically the recommended flow of participants diagram. These figures provide a transparent visual summary of the study flow, including participant inclusion and data processing steps, which may not be fully conveyed through narrative text alone. 10. Addition of confidence intervals and diagnostic performance table Reviewer comment: The final results of the accuracy of clinical models are standard given in confidence intervals at least using typical statistical indicators: sensitivity, specificity, PPV and NPV. For better reception, it is worth listing them in the table. Thank you for this important comment. We have revised the manuscript to report the final diagnostic performance of the multimodal ResNet50–MPNet model using standard clinical metrics, including accuracy, sensitivity, specificity, PPV, and NPV, each accompanied by 95% confidence intervals. The final accuracy of 98.28% (95% confidence interval = 96.93 - 99.65), sensitivity of 99.71% (95% confidence interval = 99.14 - 100), specificity of 97.21% (95% confidence interval = 95.01 - 99.41), Negative Predictive Value (NPV) 99.5% and Positive Predictive Value (PPV) 98.3%. These results are now summarized in a dedicated table entitled “Diagnostic Performance of the Multimodal ResNet50–MPNet Model” to improve clarity and clinical interpretability. We have revised the manuscript in accordance with all the reviewers’ comments. Thank you once again for your constructive guidance. Please let us know if any further clarification or revisions are required. Warm regards, Alida Widiawaty Faculty of Medicine, Universitas Riau, Pekanbaru, 28133, Indonesia The Doctoral Program in Medical Sciences, Faculty of Medicine Universitas Indonesia, Jakarta, 10430, Indonesia View more View less Competing Interests No competing interests were disclosed. reply Respond Report a concern Krzywicki T. Peer Review Report For: Multimodal Machine Learning Approach for Diagnosing Atopic Dermatitis [version 1; peer review: 1 approved, 1 approved with reservations] . F1000Research 2025, 14 :952 ( https://doi.org/10.5256/f1000research.186388.r446710) NOTE: it is important to ensure the information in square brackets after the title is included in this citation. The direct URL for this report is: https://f1000research.com/articles/14-952/v1#referee-response-446710 keyboard_arrow_left Back to all reports Reviewer Report 0 Views copyright © 2025 Sitaru S. This is an open access peer review report distributed under the terms of the Creative Commons Attribution License , which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited. 29 Oct 2025 | for Version 1 Sebastian Sitaru , Technical University of Munich, Munich, Munich, Germany 0 Views copyright © 2025 Sitaru S. This is an open access peer review report distributed under the terms of the Creative Commons Attribution License , which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited. format_quote Cite this report speaker_notes Responses (1) Approved info_outline Alongside their report, reviewers assign a status to the article: Approved The paper is scientifically sound in its current form and only minor, if any, improvements are suggested Approved with reservations A number of small changes, sometimes more significant revisions are required to address specific details and improve the papers academic merit. Not approved Fundamental flaws in the paper seriously undermine the findings and conclusions In their manuscript, the authors describe the creation and validation of a multimodal image-text AI algorithm for the diagnosis of atopic dermatitis. The topic is highly relevant and the technical approach seems sound. The manuscript is overall well written and concise. It is commendable that the authors decided to share their source code. I have a couple of minor points which could be improved before Indexing: - In the methods it says, "Two board-certified dermatologists independently annotated all images". Do you mean all cases, so image+text? Or did they just annotate the images alone? - Was the skin tone of the patients recorded? Even if not, I think this point deserves a mention in the discussion Is the work clearly and accurately presented and does it cite the current literature? Yes Is the study design appropriate and is the work technically sound? Yes Are sufficient details of methods and analysis provided to allow replication by others? Yes If applicable, is the statistical analysis and its interpretation appropriate? Yes Are all the source data underlying the results available to ensure full reproducibility? Yes Are the conclusions drawn adequately supported by the results? Yes Competing Interests No competing interests were disclosed. Reviewer Expertise Data analysis and AI applications in dermatology I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard. reply Respond to this report Responses (1) Author Response 09 Feb 2026 Alida Widiawaty, Faculty of Medicine, Universitas Riau, Pekanbaru, Indonesia Dear Sebastian Sitaru Technical University of Munich, Munich, Germany We thank the reviewer for the thorough evaluation of our manuscript and for the constructive comments that have substantially improved the clarity, transparency, and methodological rigor of the study. All points raised have been carefully addressed, and the manuscript has been revised accordingly. 1. Clarification of annotation scope Reviewer comment: In the methods it says, "Two board-certified dermatologists independently annotated all images". Do you mean all cases, so image + text? Or did they just annotate the images alone? Response: Thank you for this insightful comment. We have clarified this point in the manuscript to state that two board-certified dermatologists independently annotated both the clinical images and the corresponding text data for all cases. 2. Clarification of patients' skin tone Reviewer comment: Was the skin tone of the patients recorded? Even if not, I think this point deserves a mention in the discussion Response: Thank you for this comment. Skin tone was not explicitly recorded as a standalone variable in this study. However, the study population predominantly consisted of Indonesian patients, who generally fall within Fitzpatrick skin phototypes III–IV. Within this relatively homogeneous skin tone range, no systematic variation in clinical presentation or image-based model performance attributable to skin tone was observed. Therefore, skin tone was not considered a confounding factor influencing the study outcomes. Nonetheless, we acknowledge in the Discussion that external validation in cohorts with a broader range of Fitzpatrick skin types would be valuable to confirm the model’s robustness across more diverse populations. We have revised the manuscript in accordance with all the reviewers’ comments. Thank you once again for your constructive guidance. Please let us know if any further clarification or revisions are required. Warm regards, Alida Widiawaty Faculty of Medicine, Universitas Riau, Pekanbaru, 28133, Indonesia The Doctoral Program in Medical Sciences, Faculty of Medicine Universitas Indonesia, Jakarta, 10430, Indonesia View more View less Competing Interests No competing interests were disclosed. reply Respond Report a concern Sitaru S. Peer Review Report For: Multimodal Machine Learning Approach for Diagnosing Atopic Dermatitis [version 1; peer review: 1 approved, 1 approved with reservations] . F1000Research 2025, 14 :952 ( https://doi.org/10.5256/f1000research.186388.r420623) NOTE: it is important to ensure the information in square brackets after the title is included in this citation. The direct URL for this report is: https://f1000research.com/articles/14-952/v1#referee-response-420623 Alongside their report, reviewers assign a status to the article: Approved - the paper is scientifically sound in its current form and only minor, if any, improvements are suggested Approved with reservations - A number of small changes, sometimes more significant revisions are required to address specific details and improve the papers academic merit. Not approved - fundamental flaws in the paper seriously undermine the findings and conclusions Adjust parameters to alter display View on desktop for interactive features Includes Interactive Elements View on desktop for interactive features Competing Interests Policy Provide sufficient details of any financial or non-financial competing interests to enable users to assess whether your comments might lead a reasonable person to question your impartiality. Consider the following examples, but note that this is not an exhaustive list: Examples of 'Non-Financial Competing Interests' Within the past 4 years, you have held joint grants, published or collaborated with any of the authors of the selected paper. You have a close personal relationship (e.g. parent, spouse, sibling, or domestic partner) with any of the authors. You are a close professional associate of any of the authors (e.g. scientific mentor, recent student). You work at the same institute as any of the authors. You hope/expect to benefit (e.g. favour or employment) as a result of your submission. You are an Editor for the journal in which the article is published. Examples of 'Financial Competing Interests' You expect to receive, or in the past 4 years have received, any of the following from any commercial organisation that may gain financially from your submission: a salary, fees, funding, reimbursements. You expect to receive, or in the past 4 years have received, shared grant support or other funding with any of the authors. You hold, or are currently applying for, any patents or significant stocks/shares relating to the subject matter of the paper you are commenting on. Stay Updated Sign up for content alerts and receive a weekly or monthly email with all newly published articles Register with F1000Research Already registered? Sign in Not now, thanks close PLEASE NOTE If you are an AUTHOR of this article, please check that you signed in with the account associated with this article otherwise we cannot automatically identify your role as an author and your comment will be labelled as a “User Comment”. If you are a REVIEWER of this article, please check that you have signed in with the account associated with this article and then go to your account to submit your report, please do not post your review here. If you do not have access to your original account, please contact us . All commenters must hold a formal affiliation as per our Policies . The information that you give us will be displayed next to your comment. User comments must be in English, comprehensible and relevant to the article under discussion. We reserve the right to remove any comments that we consider to be inappropriate, offensive or otherwise in breach of the User Comment Terms and Conditions . Commenters must not use a comment for personal attacks. When criticisms of the article are based on unpublished data, the data should be made available. I accept the User Comment Terms and Conditions Please confirm that you accept the User Comment Terms and Conditions. Affiliation ✕ refresh Please enter your institution. Note: To add your institution or organisation, start typing the name and then select the correct name from the list. Where applicable, the name will appear in both the original language and in English. Do not paste in the name. If the name does not appear in the drop-down list, we will display the information you have entered. ✕ refresh Country/Region * USA UK Canada China France Germany Afghanistan Aland Islands Albania Algeria American Samoa Andorra Angola Anguilla Antarctica Antigua and Barbuda Argentina Armenia Aruba Australia Austria Azerbaijan Bahamas Bahrain Bangladesh Barbados Belarus Belgium Belize Benin Bermuda Bhutan Bolivia Bosnia and Herzegovina Botswana Bouvet Island Brazil British Indian Ocean Territory British Virgin Islands Brunei Bulgaria Burkina Faso Burundi Cambodia Cameroon Canada Cape Verde Cayman Islands Central African Republic Chad Chile China Christmas Island Cocos (Keeling) Islands Colombia Comoros Congo Cook Islands Costa Rica Cote d'Ivoire Croatia Cuba Cyprus Czech Republic Democratic Republic of the Congo Denmark Djibouti Dominica Dominican Republic Ecuador Egypt El Salvador Equatorial Guinea Eritrea Estonia Ethiopia Falkland Islands Faroe Islands Federated States of Micronesia Fiji Finland France French Guiana French Polynesia French Southern Territories Gabon Georgia Germany Ghana Gibraltar Greece Greenland Grenada Guadeloupe Guam Guatemala Guernsey Guinea Guinea-Bissau Guyana Haiti Heard Island and Mcdonald Islands Holy See (Vatican City State) Honduras Hong Kong Hungary Iceland India Indonesia Iran Iraq Ireland Israel Italy Jamaica Japan Jersey Jordan Kazakhstan Kenya Kiribati Kosovo (Serbia and Montenegro) Kuwait Kyrgyzstan Lao People's Democratic Republic Latvia Lebanon Lesotho Liberia Libya Liechtenstein Lithuania Luxembourg Macao Madagascar Malawi Malaysia Maldives Mali Malta Marshall Islands Martinique Mauritania Mauritius Mayotte Mexico Minor Outlying Islands of the United States Moldova Monaco Mongolia Montenegro Montserrat Morocco Mozambique Myanmar Namibia Nauru Nepal Netherlands Antilles New Caledonia New Zealand Nicaragua Niger Nigeria Niue Norfolk Island North Korea North Macedonia Northern Mariana Islands Norway Oman Pakistan Palau Palestinian Territory Panama Papua New Guinea Paraguay Peru Philippines Pitcairn Poland Portugal Puerto Rico Qatar Reunion Romania Russian Federation Rwanda Saint Helena Saint Kitts and Nevis Saint Lucia Saint Pierre and Miquelon Saint Vincent and the Grenadines Samoa San Marino Sao Tome and Principe Saudi Arabia Senegal Serbia Seychelles Sierra Leone Singapore Slovakia Slovenia Solomon Islands Somalia South Africa South Georgia and the South Sandwich Is South Korea South Sudan Spain Sri Lanka Sudan Suriname Svalbard and Jan Mayen Swaziland Sweden Switzerland Syria Taiwan Tajikistan Tanzania Thailand The Gambia The Netherlands Timor-Leste Togo Tokelau Tonga Trinidad and Tobago Tunisia Turkey Turkmenistan Turks and Caicos Islands Tuvalu UK USA Uganda Ukraine United Arab Emirates United States Virgin Islands Uruguay Uzbekistan Vanuatu Venezuela Vietnam Wallis and Futuna West Bank and Gaza Strip Western Sahara Yemen Zambia Zimbabwe Please select your country/region. You must enter a comment. Competing Interests Please disclose any competing interests that might be construed to influence your judgment of the article's or peer review report's validity or importance. Competing Interests Policy Provide sufficient details of any financial or non-financial competing interests to enable users to assess whether your comments might lead a reasonable person to question your impartiality. Consider the following examples, but note that this is not an exhaustive list: Examples of 'Non-Financial Competing Interests' Within the past 4 years, you have held joint grants, published or collaborated with any of the authors of the selected paper. You have a close personal relationship (e.g. parent, spouse, sibling, or domestic partner) with any of the authors. You are a close professional associate of any of the authors (e.g. scientific mentor, recent student). You work at the same institute as any of the authors. You hope/expect to benefit (e.g. favour or employment) as a result of your submission. You are an Editor for the journal in which the article is published. Examples of 'Financial Competing Interests' You expect to receive, or in the past 4 years have received, any of the following from any commercial organisation that may gain financially from your submission: a salary, fees, funding, reimbursements. You expect to receive, or in the past 4 years have received, shared grant support or other funding with any of the authors. You hold, or are currently applying for, any patents or significant stocks/shares relating to the subject matter of the paper you are commenting on. Please state your competing interests The comment has been saved. An error has occurred. Please try again. Cancel Post var lTitle = "Multimodal Machine Learning Approach for...".replace("'", ''); var linkedInUrl = "http://www.linkedin.com/shareArticle?url=https://f1000research.com/articles/14-952/v1" + "&title=" + encodeURIComponent(lTitle) + "&summary=" + encodeURIComponent('Read the article by '); var deliciousUrl = "https://del.icio.us/post?url=https://f1000research.com/articles/14-952/v1&title=" + encodeURIComponent(lTitle); var redditUrl = "http://reddit.com/submit?url=https://f1000research.com/articles/14-952/v1" + "&title=" + encodeURIComponent(lTitle); linkedInUrl += encodeURIComponent('Widiawaty A et al.'); var offsetTop = /chrome/i.test( navigator.userAgent ) ? 4 : -10; var addthis_config = { ui_offset_top: offsetTop, services_compact : "facebook,twitter,www.linkedin.com,www.mendeley.com,reddit.com", services_expanded : "facebook,twitter,www.linkedin.com,www.mendeley.com,reddit.com", services_custom : [ { name: "LinkedIn", url: linkedInUrl, icon:"/img/icon/at_linkedin.svg" }, { name: "Mendeley", url: "http://www.mendeley.com/import/?url=https://f1000research.com/articles/14-952/v1/mendeley", icon:"/img/icon/at_mendeley.svg" }, { name: "Reddit", url: redditUrl, icon:"/img/icon/at_reddit.svg" }, ] }; var addthis_share = { url: "https://f1000research.com/articles/14-952", templates : { twitter : "Multimodal Machine Learning Approach for Diagnosing Atopic Dermatitis. Widiawaty A et al., published by " + "@F1000Research" + ", https://f1000research.com/articles/14-952/v1" } }; if (typeof(addthis) != "undefined"){ addthis.addEventListener('addthis.ready', checkCount); addthis.addEventListener('addthis.menu.share', checkCount); } $(".f1r-shares-twitter").attr("href", "https://twitter.com/intent/tweet?text=" + addthis_share.templates.twitter); $(".f1r-shares-facebook").attr("href", "https://www.facebook.com/sharer/sharer.php?u=" + addthis_share.url); $(".f1r-shares-linkedin").attr("href", addthis_config.services_custom[0].url); $(".f1r-shares-reddit").attr("href", addthis_config.services_custom[2].url); $(".f1r-shares-mendelay").attr("href", addthis_config.services_custom[1].url); function checkCount(){ setTimeout(function(){ $(".addthis_button_expanded").each(function(){ var count = $(this).text(); if (count !== "" && count != "0") $(this).removeClass("is-hidden"); else $(this).addClass("is-hidden"); }); }, 1000); } close How to cite this report {{reportCitation}} Cancel Copy Citation Details $(function(){R.ui.buttonDropdowns('.dropdown-for-downloads');}); $(function(){R.ui.toolbarDropdowns('.toolbar-dropdown-for-downloads');}); $.get("/articles/acj/169102/186388") new F1000.Clipboard(); new F1000.ThesaurusTermsDisplay("articles", "article", "186388"); $(document).ready(function() { $( "#frame1" ).on('load', function() { var mydiv = $(this).contents().find("div"); var h = mydiv.height(); console.log(h) }); var tooltipLivingFigure = jQuery(".interactive-living-figure-label .icon-more-info"), titleLivingFigure = tooltipLivingFigure.attr("title"); tooltipLivingFigure.simpletip({ fixed: true, position: ["-115", "30"], baseClass: 'small-tooltip', content:titleLivingFigure + " " }); tooltipLivingFigure.removeAttr("title"); $("body").on("click", ".cite-living-figure", function(e) { e.preventDefault(); var ref = $(this).attr("data-ref"); $(this).closest(".living-figure-list-container").find("#" + ref).fadeIn(200); }); $("body").on("click", ".close-cite-living-figure", function(e) { e.preventDefault(); $(this).closest(".popup-window-wrapper").fadeOut(200); }); $(document).on("mouseup", function(e) { var metricsContainer = $(".article-metrics-popover-wrapper"); if (!metricsContainer.is(e.target) && metricsContainer.has(e.target).length === 0) { $(".article-metrics-close-button").click(); } }); var articleId = $('#articleId').val(); if($("#main-article-count-box").attachArticleMetrics) { $("#main-article-count-box").attachArticleMetrics(articleId, { articleMetricsView: true }); } }); var figshareWidget = $(".new_figshare_widget"); if (figshareWidget.length > 0) { window.figshare.load("f1000", function(Widget) { // Select a tag/tags defined in your page. In this tag we will place the widget. _.map(figshareWidget, function(el){ var widget = new Widget({ articleId: $(el).attr("figshare_articleId") //height:300 // this is the height of the viewer part. [Default: 550] }); widget.initialize(); // initialize the widget widget.mount(el); // mount it in a tag that's on your page // this will save the widget on the global scope for later use from // your JS scripts. This line is optional. //window.widget = widget; }); }); } close Error Close Add Reset F1000.MICROSERVICES.AFFILIATION = ''; $(document).ready(function () { $('.js-affiliations-form').each((index, form) => { new AffiliationForm({ formId: form.id, institutionErrorSelector: '.comment-enter-institution', departmentErrorSelector: '.comment-enter-department', placeSelector: '.js-add-comment-place', stateSelector: '.js-add-comment-state', zipCodeSelector: '.js-add-comment-zipcode', countrySelector: '.js-add-comment-country', countryErrorSelector: '.comment-enter-country', }); }); }); $(document).ready(function () { var reportIds = { "420615": 0, "416900": 0, "416898": 0, "416899": 0, "416896": 0, "416897": 0, "420622": 0, "420623": 39, "420620": 0, "420621": 0, "420618": 0, "420619": 0, "420616": 0, "420617": 0, "420624": 0, "456886": 0, "425910": 0, "456887": 35, "425911": 0, "425908": 0, "425909": 0, "425906": 0, "425907": 0, "425904": 0, "425905": 0, "425912": 0, "425913": 0, "441286": 0, "441287": 0, "441294": 0, "441295": 0, "441292": 0, "441293": 0, "441290": 0, "441291": 0, "441288": 0, "441289": 0, "457966": 0, "424046": 0, "446702": 0, "457967": 0, "424047": 0, "446703": 0, "457964": 0, "424044": 0, "457965": 0, "424045": 0, "424042": 0, "457963": 0, "424043": 0, "424041": 0, "446710": 21, "446711": 0, "457972": 0, "446708": 0, "446709": 0, "457970": 0, "424050": 0, "446706": 0, "457971": 0, "446707": 0, "457968": 0, "424048": 0, "446704": 0, "457969": 0, "424049": 0, "446705": 0, "416894": 0, "416895": 0, "416892": 0, "416893": 0, "416891": 0, }; $(".referee-response-container,.js-referee-report").each(function(index, el) { var reportId = $(el).attr("data-reportid"), reportCount = reportIds[reportId] || 0; $(el).find(".comments-count-container,.js-referee-report-views").html(reportCount); }); var uuidInput = $("#article_uuid"), oldUUId = uuidInput.val(), newUUId = "ed9ad1f6-58ba-4fff-b168-876d4144fb95"; uuidInput.val(newUUId); $("a[href*='article_uuid=']").each(function(index, el) { var newHref = $(el).attr("href").replace(oldUUId, newUUId); $(el).attr("href", newHref); }); }); An innovative open access publishing platform offering rapid publication and open peer review, whilst supporting data deposition and sharing. Browse Gateways Collections How it Works Contact For Developers Cookie Notice Privacy Notice RSS Submit Your Research Follow us © 2012-2026 F1000 Research Ltd. ISSN 2046-1402 | Legal | Partner of Research4Life • CrossRef • ORCID • FAIRSharing R.templateTests.simpleTemplate = R.template(' $text $text $text $text $text '); R.templateTests.runTests(); var F1000platform = new F1000.Platform({ name: "f1000research", displayName: "F1000Research", hostName: "f1000research.com", id: "1", editorialEmail: "
[email protected]", infoEmail: "
[email protected]", usePmcStats: true }); $(function(){R.ui.dropdowns('.dropdown-for-authors, .dropdown-for-about, .dropdown-for-myresearch');}); // $(function(){R.ui.dropdowns('.dropdown-for-referees');}); $(document).ready(function () { if ($(".cookie-warning").is(":visible")) { $(".sticky").css("margin-bottom", "35px"); $(".devices").addClass("devices-and-cookie-warning"); } $(".cookie-warning .close-button").click(function (e) { $(".devices").removeClass("devices-and-cookie-warning"); $(".sticky").css("margin-bottom", "0"); }); $("#tweeter-feed .tweet-message").each(function (i, message) { var self = $(message); self.html(linkify(self.html())); }); $(".partner").on("mouseenter mouseleave", function() { $(this).find(".gray-scale, .colour").toggleClass("is-hidden"); }); }); Sign In Remember me Forgotten your password? Sign In Cancel Email or password not correct. Please try again Please wait... $(function(){ // Note: All the setup needs to run against a name attribute and *not* the id due the clonish // nature of facebox... $("a[id=googleSignInButton]").click(function(event){ event.preventDefault(); $("input[id=oAuthSystem]").val("GOOGLE"); $("form[id=oAuthForm]").submit(); }); $("a[id=facebookSignInButton]").click(function(event){ event.preventDefault(); $("input[id=oAuthSystem]").val("FACEBOOK"); $("form[id=oAuthForm]").submit(); }); $("a[id=orcidSignInButton]").click(function(event){ event.preventDefault(); $("input[id=oAuthSystem]").val("ORCID"); $("form[id=oAuthForm]").submit(); }); }); If you've forgotten your password, please enter your email address below and we'll send you instructions on how to reset your password. The email address should be the one you originally registered with F1000. Email address not valid, please try again You registered with F1000 via Google, so we cannot reset your password. To sign in, please click here . If you still need help with your Google account password, please click here . You registered with F1000 via Facebook, so we cannot reset your password. To sign in, please click here . If you still need help with your Facebook account password, please click here . Code not correct, please try again Reset password Cancel Email us for further assistance. Server error, please try again. If your email address is registered with us, we will email you instructions to reset your password. If you think you should have received this email but it has not arrived, please check your spam filters and/or contact for further assistance. Please wait... Register $(document).ready(function () { signIn.createSignInAsRow($("#sign-in-form-gfb-popup")); $(".target-field").each(function () { var uris = $(this).val().split("/"); if (uris.pop() === "login") { $(this).val(uris.toString().replace(",","/")); } }); });
Text is read by the "Ask this paper" AI Q&A widget below.
Extraction quality varies by source — PMC NXML preserves structure
cleanly, OA-HTML may include some navigation residue, and OA-PDF can
have broken hyphenation. The publisher copy
(via DOI)
is the canonical version.