Full text
40,527 characters
· extracted from
preprint-html
· click to expand
Automated Deep Learning-Based 3D-to-2D Segmentation of Geographic Atrophy in Optical Coherence Tomography Data | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search Automated Deep Learning-Based 3D-to-2D Segmentation of Geographic Atrophy in Optical Coherence Tomography Data Hasenin Al-khersan , View ORCID Profile Jonathan Oakley , Daniel Russakoff , Jessica Cao , Stanley Saju , Avery Zhou , Simrat Sodhi , Niveditha Pattathil , Netan Choudhry , David Boyer , Charles Wykoff doi: https://doi.org/10.1101/2025.07.07.25330902 Hasenin Al-khersan 1 Retina Consultants of Texas , Houston, TX, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Jonathan Oakley 2 Voxeleron Inc. , TX, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Jonathan Oakley For correspondence: jonathan{at}voxeleron.com Daniel Russakoff 2 Voxeleron Inc. , TX, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Jessica Cao 1 Retina Consultants of Texas , Houston, TX, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Stanley Saju 1 Retina Consultants of Texas , Houston, TX, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Avery Zhou 1 Retina Consultants of Texas , Houston, TX, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Simrat Sodhi 3 University of Cambridge Find this author on Google Scholar Find this author on PubMed Search for this author on this site Niveditha Pattathil 4 Vitreous Retina Macula Specialists of Toronto , Etobicoke, ON, Canada Find this author on Google Scholar Find this author on PubMed Search for this author on this site Netan Choudhry 4 Vitreous Retina Macula Specialists of Toronto , Etobicoke, ON, Canada Find this author on Google Scholar Find this author on PubMed Search for this author on this site David Boyer 5 Retina Vitreous Associates Medical Group , Beverly Hills, CA, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Charles Wykoff 1 Retina Consultants of Texas , Houston, TX, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Abstract Full Text Info/History Metrics Data/Code Preview PDF Abstract Purpose We report on a deep learning-based approach to the segmentation of geographic atrophy (GA) in patients with advanced age-related macular degeneration (AMD). Method Three-dimensional (3D) optical coherence tomography (OCT) data was collected from two instruments at two different retina practices. This totaled 367 and 348 volumes, respectively, of routinely collected clinical data. For all data, the accuracy of a 3D-to-2D segmentation model was assessed relative to ground-truth manual labeling. Results Dice Similarity Scores (DSC) averaged 0.824 and 0.826 for each data set. Correlations (r 2 ) between manual and automated areas were 0.883 and 0.906, respectively. The inclusion of near Infra-red imagery as an additional information channel to the algorithm did not notably improve performance. Conclusion Accurate assessment of GA in real-world clinical OCT data can be achieved using deep learning. In the advent of therapeutics to slow the rate of GA progression, reliable, automated assessment is a clinical objective and this work validates one such method. Introduction Geographic atrophy (GA) is a late-stage manifestation of non-exudative age-related macular degeneration (AMD), representing one of the leading causes of vision loss in adults over 50 years of age. GA is characterized by the progressive degeneration of the retinal pigment epithelium (RPE) and overlying photoreceptors, resulting in irreversible central vision loss [ Sarda 2021 ]. Recently, two intravitreal anti-complement therapies, pegcetacoplan and avacincaptad pegol, were introduced in the United States for the treatment of GA. These therapies were approved by the Food and Drug Administration based on structural endpoints. Both therapies demonstrated a slower rate of progression of GA relative to sham though neither showed a visual acuity benefit [ Heier 2023 ]. Given the introduction of these therapies, the identification of GA and its progression is of heightened importance. GA is typically diagnosed using non-invasive imaging techniques including optical coherence tomography (OCT), fundus autofluorescence (FAF), and fundus photography. OCT is particularly useful for identifying GA due to its widespread availability in clinical practice, ability to identify subtle morphological changes in early disease, and ease of capture. In 2018, OCT was proposed as the gold standard to diagnose GA by the international expert Consensus Definition for Atrophy Associated with Age-Related Macular Degeneration on OCT group [ Sadda 2018 ]. Specific OCT criteria to diagnose complete RPE and outer retinal atrophy (cRORA) were proposed. While these criteria may accurately define GA, they are challenging for ophthalmologists to methodically apply across hundreds to thousands of B-scans in routine clinical practice. Toward this end, artificial intelligence (AI) can serve to simplify the process by automating the identification of GA. Different approaches to segmenting GA in image data have been developed by both device manufacturers and research groups. For OCT, the only software with clinical approval in the US is the advanced retinal pigment epithelial (RPE) analysis tool (ARPET; Carl Zeiss Meditec, CA, USA). Marketed now as a GA tool kit, it was approved to automatically segment sub-RPE “increased illumination” based on an en face view generated using a layer-based limited integration range [ K111157 2012 ]. The success of any 2D approach based on a limited axial integration of the 3D volume is entirely dependent on the relevance and location of the automatically generated integration limits. The approval of this method for clinical use was based on repeatability (precision) and, interestingly, correlation to the sum areas of manually segmented GA in FAF images, but not to the location accuracy of those areas as could be reported using the Dice similarity coefficient (DSC). This is the same in a study of the algorithm, where the intraclass correlation coefficient (ICC) was 0.795, but no accuracy of segmentation localization was reported [ Yehoshua 2013 ]. The advent of deep learning has resulted in several fully automated applications. Available via the Heidelberg AppWay product, users in the EU may access the GA model developed by RetinAI (Bern, Switzerland). The method is based on segmenting each B-scan using a U-Net individually to yield a 2D probability image of the atrophic region [ Derradji 2021 ]. This result is then integrated axially to form a 1d signal that, when combined with all other B-scan-based 1d signals, reconstructs the final 2D image of GA. Using a training set of 44 volumes, the authors are able to demonstrate high DSCs of 0.881 and 0.844 relative to two graders on a test set of 18 volumes. The method’s advantage is its simplicity; its disadvantage is it not making full use of the 3D data set, which can result in discontinuities in the final segmentation as each B-scan is segmented independently. A very similar approach has been used by [ Zhang 2021 ], but a far larger data set of 984 OCT volumes was used, and the median DCS was very high at 0.96. [ Lachinov 2021 ] overcomes some limitations of the aforementioned approaches by working directly with the 3D data using a then novel architecture that modifies a U-Net to encode in 3D and decode in 2D. In this approach, the skip connections, common to the U-Net architecture, drop one dimension from the data and go from 3D to 2D. Our extension to that method adds residual blocks to allow for better feature representations [ He 2016 ]. In the following we examine the ability of this 3D U-Net-type architecture to identify GA on OCT data from real-world patient data. Methods Data Collection and Grading Data was collected from two sites retrospectively, the Retina Consultants of Texas (RCTX) and Retina-Vitreous Associates (RVA), from 2016 and 2022. Inclusion criteria included a confirmed diagnosis of GA with accompanying OCT imaging; eyes with GA and concurrent nAMD were included. Institutional review board approval was obtained from Advarra. The present study was conducted in accordance with the Declaration of Helsinki. Optical coherence tomography imaging was performed on the Heidelberg Spectralis (Heidelberg Engineering, Heidelberg, Germany) at RCTX and the Zeiss Cirrus (Carl Zeiss Meditec, CA, USA) at RVA as part of routine clinical care. Both used similar protocols for capturing data at the macula using a 20 degree (∼6mm^2) lateral field of view (FOV). For Spectralis, the macular scan protocol was used with ART setting of up to 10 averaged frames. The volumes comprised 49 slices, where each B-scan was 512 by 496 pixels. The Spectralis data included near-infrared (nIR) images, which were across a 30-degree FOV and used 100 frame averaging. A quality index of at least 25 was required for inclusion. For Cirrus data, the macular protocol included 200 B-scans, each with 200 by 1024 pixels. The Zeiss macular protocol does not use frame averaging. A minimal signal score of 5 was required for inclusion. No associated nIR data was collected by the device. Grading Manual grading was performed by expert graders who delineated areas of complete retinal pigment epithelial and outer retinal atrophy (cRORA) on OCT based on the Classification of Atrophy Meetings (CAM) criteria as previously described. 1 Graders marked areas of cRORA using the Orion (Voxeleron Inc., TX, USA) application [Alex 2021]. Specifically, graders marked the bounds of atrophy on the B-scan cross-sections ( Figure 1 ). The delineated areas are subsequently represented two-dimensionally on the OCT en face view for confirmation of correct demarcation. Graders were masked to the nIR images collected in the Spectralis data set for consistency with the Cirrus labeling, which had no nIR data. Download figure Open in new tab Figure 1. The graders used Orion to place landmarks at each of the end points of the atrophy in each B-scan. The resulting 2D mask (area) is shown in the OCT en face view (top right). Once the editing is complete, the results file is saved and the mask exported as our ground truth area delineation. Deep Learning Architecture A 3D U-Net architecture was used for the deep learning with the output modified to generate a 2D mask. It extends the approach of [ Lachinov 2021 ] by adding attention blocks to the architecture in an effort to better localize the region in which the atrophy is imaged. Explicit localization is done in both [ Yehoshua 2013 ] and [ Derradji 2021 ] using layer segmentation, but here we do this in 3D and in a single architecture with the localization learned. A schematic of the 3D-to-2D U-Net is given in Figure 2 . Download figure Open in new tab Figure 2. Schematic of the CNN-based 3D to 2D neural network used for this study. To alleviate memory management issues caused by large 3D volumes, in the Spectralis data the volume was sub-sampled to 128-by-128-by-64 pixels (i.e., to 64 B-scans each of 128^2 pixels). The Cirrus data, due to the more isotropic distribution, was sub-sampled instead to 128-by-128-by-128 pixels (i.e., to 128 B-scans each of 128^2 pixels). The output was a 2D mask of GA at a resolution of 128-by-64 pixels and 128-by-128 pixels for Spectralis and Cirrus, respectively. For the Spectralis implementation, the architecture was also capable of receiving the 2D nIR images in a second input channel to see if this additional information would improve the algorithm’s performance. The implementation used TensorFlow 2.15 running under a Linux system on a Dell Precision 7920 Workstation, housing two NVIDIA A6000s connected via the NVLINK system allowing for distributed learning and shared GPU memory. The parameters only differed in batch size as the Cirrus volumes were larger. The optimization algorithm used was AdamW, with a learning rate of 5e-5. The loss function used the DSC, with even weighting of 0.5 to each class (GA, non-GA). Training each of the models used 450 epochs with a batch size of 32 for Spectralis, and 20 for Cirrus data. A patience parameter was set to 70 meaning that, if after 70 iterations no improvement was seen in the performance relative to the validation split (a part of the training set), the learning stopped. Analysis Methods N-fold cross-validation was performed. In this scenario, data is split N times, where at each of the N-folds, 1/Nth of the entire data set is set aside for testing and the remaining for training. Training further splits the data into train and validate groups, where the latter is used to determine when the training iterations stop. For the present study, five folds were used. For repeat cases from the same subject, the folds were structured such that at no time was data from a single subject represented both in the train and test sets. Dice Similarity Scores (DSC) and correlation (r 2 ) between manual and automated areas of atrophy were calculated. All final analysis was done using Matlab and its Statistics Toolbox (Mathworks, Natick, MA, USA). Results For the Spectralis data, 367 scans were used from 55 subject eyes and 33 subjects. The data was collected over a period of eight years. All 367 scans had confirmed GA: 267 demonstrated concurrent nAMD while the remaining 100 had GA without nAMD. The Cirrus data subset was comprised of 348 subject eyes from 326 subjects representing 348 total scans. All cases had confirmed GA, but 101 were also undergoing active treatment for fluid. For the Spectralis data, the mean DSC score was 0.826 and r 2 was 0.906 ( Table 1 – Summary analysis results for all data and experiments.). There was little change in the mean DSC score (0.829) and r 2 (0.908) with the addition of nIR data. For the Cirrus data, the mean DSC score was 0.824 and r 2 was 0.883. Splitting the Spectralis results into GA only and GA and concurrent nAMD, we interestingly see an increase in DSC scores where nAMD is present, but far better area correlations in GA only cases. In the case of the average correlation scores, the difference was notable in the Spectralis data; for the DSC scores the changes were only slight. View this table: View inline View popup Table 1. Summary analysis results for all data and experiments. Figure 3 shows the scatter plot and Bland-Altman plot for automated and manual measurements. Figures 4 and 5 show the same but for the Spectralis using just the OCT data, and using OCT + nIR data, respectively. Figures 6 through 9 show example segmentations for both the Spectralis and Cirrus data. Download figure Open in new tab Figure 3. Correlation of area measurements for the Cirrus data set. Left: scatter plot showing the manual area measurements (y axis) versus the automated measurements (x-axis) and their resulting correlation (r 2 = 0.88). Right: Bland-Altman plot showing the limits of agreement (LOA) between automated and manual measurements. The y axis shows the difference between the manual and automated measurements; the x-axis their average. Download figure Open in new tab Figure 4. Correlation of area measurements for the Spectralis data set. Left: scatter plot showing the manual area measurements (y axis) versus the automated measurements (x-axis) and their resulting correlation (r 2 = 0.92). Right: Bland-Altman plot showing the limits of agreement (LOA) between automated and manual measurements. The y axis shows the difference between the manual and automated measurements; the x-axis their average. Download figure Open in new tab Figure 5. Correlation of area measurements for the Spectralis OCT + nIR data set. Left: scatter plot showing the manual area measurements (y axis) versus the automated measurements (x-axis) and their resulting correlation (r 2 = 0.91). Right: Bland-Altman plot showing the limits of agreement (LOA) between automated and manual measurements. The y axis shows the difference between the manual and automated measurements; the x-axis their average. Download figure Open in new tab Figure 6. Example Spectralis data. Clockwise from top left we have: input nIR en face image; manual area delineation (blue) and automated area delineation (red); example B-scan showing the manual atrophy delineation; example B-scan showing the automated delineation; final automated mask and dashed line showing the location of the presented B-scan; final manual mask and a dashed line showing the location of its presented B-scan. Discussion The FDA has recognized the area of geographic atrophy as a primary endpoint in the development of treatments for GA. This important designation means that GA area, as measured using imaging, is considered relevant and clinically meaningful. This designation is, however, limited to using fundus autofluorescence which works by detecting natural fluorescence emitted by lipofuscin, a pigment that accumulates in the retinal pigment epithelium (RPE). This modality, however, offers no cross-sectional information and obscures foveal involvement that can lead to misinterpretation of the extent of the GA and risk to vision. Within a clinical setting, OCT is the standard of care and, given its depth resolution, is capable of revealing outer retinal disruption that is prognostic of GA progression [ Vogl 2023 ]. In the advent of complement inhibitor-based treatments for slowing the progression of GA is it important that clinicians have the tools to measure the endpoint of GA area automatically and thereby gauge the effectiveness of the treatments they are using. The current work has presented a means for doing this automatic monitoring, looking at how well the automated approach compares to expertly labeled data. Importantly, we have used two widely used OCT devices from two different manufacturers, where the data has been collected from two different sites. Important also is the fact that this is real-world clinical data, and not data from a clinical trial. Relative to ground truth assessment, we have shown for both devices excellent correlation, narrow limits of agreement, and very high DSC scores. This is also true in cases of different ocular comorbidities, as was predominantly seen in the data from the Cirrus device. The results are encouraging with respect to the presence concurrent nAMD and other comorbidities that involve fluid. This, perhaps, is due to the fact that fluid reflects very little light and does not, therefore, attenuate the signal that penetrates through to the choroid. It is the hyperreflectivity that is such a distinctive feature of cRORA in OCT volumes. Ground truth data is, of course, subjective and while the grading was strictly based on adherence to the CAM classification’s definition of cRORA, it is difficult for graders to be consistent across large data sets of variant image quality. This, however, is a general limitation and is confirmed in the variability seen in other studies [ Chandra 2022 , Schmitz-Valckenberg 2023 ], and something that we have not investigated in this study. The approach adopted in this study takes the entire OCT volume as input and returns a 2D area as a result. To do this we have created a quite bespoke architecture based around a residual U-Net. An alternate approach is to process each 2D B-scan separately and combine outputs to produce a final result. These approaches are based on segmenting each B-scan to yield a 2D probability image of the atrophic region [ Derradji 2021 , Zhang 2021 ]. This result is then integrated axially to form a 1d signal that, when combined with all other B-scan-based 1d signals, reconstructs the final 2D image of GA. This has the advantage of having a low overhead in terms of memory requirements, but the disadvantage in losing the context of the 3D data. Subsequently, this can result in segmentation areas having discontinuities between slices. While solving for this, the 3D data processing we have chosen incurs significant overhead in terms of memory requirements for model building. Our solution has been to reduce the size of the volumes by sub-sampling. But while this can have a nice denoising effect, the fidelity of the data comes into question, meaning detail may be lost, which is possibly the case in Figure 7 . This can be circumvented through better memory management or indeed larger GPUs, and can be immediately solved by using large server clusters. However, these solutions come at a high financial cost. Interestingly though, where the data was more isotropic, that is the Cirrus used 128 B-scans as opposed to the Spectralis’ 64 B-scans, this issue goes away ( Figure 8 ). For 3D processing, isotropic data is far more preferrable. The Spectralis protocol collects at least as much data, but gives preference to averaging often sparsely spaced B-scans as opposed to creating a dense, but unaveraged cube. Download figure Open in new tab Figure 7. Example Spectralis data. Clockwise from top left we have: input nIR en face image; manual area delineation (blue) and automated area delineation (red); example B-scan showing the manual atrophy delineation; example B-scan showing the automated delineation; final automated mask and dashed line showing the location of the presented B-scan; final manual mask and a dashed line showing the location of its presented B-scan. Download figure Open in new tab Figure 8. Example Cirrus data. Clockwise from top left we have: input OCT en face image; manual area delineation (blue) and automated area delineation (red); example B-scan showing the manual atrophy delineation; example B-scan showing the automated delineation; final automated mask and dashed line showing the location of the presented B-scan; final manual mask and a dashed line showing the location of its presented B-scan. Our study is not, however, without some limitations that must be considered in interpreting these results. For the Spectralis grading it was a design decision not to use the nIR images during the grading. Given this image data is quite unique to that device, this would go against the ultimate objectives of having a device agnostic automated approach. This, however, will reduce a grader’s ability to accurately assess GA as additional modalities are complementary and supportive of a final assessment. This leads to the question of accuracy of the ground truth data when not all information was available. Indeed, we have seen in the work of [Lachinov et al.], who used FAF in their grading, and just OCT in their segmentations, their performance dropped. It makes intuitive sense that the labeling task, the visual task, must use the same modality as that given to the segmentation algorithm. The main visual cues for cRORA are the absence of RPE and hyper transmission defects. It is possible that the network only learns the latter, but this might not be a limitation given that the appearance and growth of persistent choroidal hypertransmission defects in eyes with iAMD is an early sign of GA, making it a candidate for clinical trial endpoints [Liu2023]. And iRORA, cRORA both require hypertransmission defects and do not require a completely absent RPE. Using the OCT data alone likely has the consequence of a potential performance ceiling to the performance of the CNN. This was somewhat tested when nIR data was also given as input information to the network. In this case, we did not expect, therefore, that the CNN would improve its performance. If, however, we had graded with the user of nIR images, we might expect this to be different. It is beyond the scope of this current study to assess such permutations that incorporate different modalities, but it is an important consideration in both study design and ultimately clinical deployment to determine the appropriate combinations. We have instead adhered to two important tenets in this work: firstly, that OCT is the reference standard for diagnosis and staging of GA [Sadda 2018]; and secondly that the approach presented be applicable to any OCT device. Lastly, Spectralis data with a noise score below the manufacturers’ recommendations were excluded from this study. Not only because it causes a drop in algorithm performance, it results in data that is harder to grade, so performance targets become increasingly ambiguous. It is, however, an open question as to whether or not such data should be included in the training data given labeling inaccuracies, and one that is not addressed in this study. Data Availability All results produced in the present study are available upon reasonable request to the authors. References Alex V , Motevasseli T , Freeman WR , Jayamon JA , Bartsch DG , Borooah S. Assessing the validity of a cross-platform retinal image segmentation tool in normal and diseased retina . Sci Rep . 2021 Nov 8; 11 ( 1 ): 21784 . doi: 10.1038/s41598-021-01105-9 . PMID: 34750415 ; PMCID: PMC8575997 . OpenUrl CrossRef PubMed ↵ Chandra , S. , Rasheed , R. , Sen , P. et al. Inter-rater reliability for diagnosis of geographic atrophy using spectral domain OCT in age-related macular degeneration . Eye 36 , 392 – 397 ( 2022 ). OpenUrl PubMed Cheng QE et al. , “ Design Characteristics of Geographic Atrophy Treatment Trials: Systematic Review of Registered Trials in ClinicalTrials.gov ,” Ophthalmol Retina , 2 , 518 ( 2018 ). PMID: 31047604 . OpenUrl PubMed Csaky KG , Richman EA , Ferris 3rd FL . Report from the NEI/FDA Ophthalmic Clinical Trial Design and Endpoints Symposium . Invest Ophthalmol Vis Sci . 2008 ; 49 : 479 – 489 . OpenUrl FREE Full Text ↵ Derradji Y , Mosinska A , Apostolopoulos S , Ciller C , De Zanet S , Mantel I. Fully-automated atrophy segmentation in dry age-related macular degeneration in optical coherence tomography . Sci Rep . 2021 Nov 8; 11 ( 1 ): 21893 . doi: 10.1038/s41598-021-01227-0 . PMID: 34751189 ; PMCID: PMC8575929 . OpenUrl CrossRef PubMed Giocanti-Auregan A. Tadayoni R. Fajnkuchen F. et al. Predictive value of outer retina en face OCT imaging for geographic atrophy progression . Invest Ophthalmol Vis Sci . 2015 ; 56 : 8325 – 8330 OpenUrl PubMed ↵ He , K. , Zhang , X. , Ren , S. , & Sun , J. ( 2016 ). Deep Residual Learning for Image Recognition . In Proceedings of the IEEE Conference on Computer Vision and Pattern Recognition (CVPR) . ↵ Heier JS , Lad EM , Holz FG , et al. Pegcetacoplan for the treatment of geographic atrophy secondary to age-related macular degeneration (OAKS and DERBY): two multicentre, randomised, double-masked, sham-controlled, phase 3 trials . Lancet . 2023 Oct 21; 402 ( 10411 ): 1434 – 1448 . doi: 10.1016/S0140-6736(23)01520-9 . PMID: 37865470 . OpenUrl CrossRef PubMed ↵ K111157 . 510(k) Premarket Notification: CIRRUS HD-OCT WITH RETINAL NERVE FIBER LAYER, MACULAR, OPTIC NERVE HEAD, and GANGLION CELL NORMATIVE DATABASES , 2012 . ↵ Lachinov , D. , Seeböck , P. , Mai , J. , Goldbach , F. , Schmidt-Erfurth , U. , Bogunovic , H. ( 2021 ). Projective Skip-Connections for Segmentation Along a Subset of Dimensions in Retinal OCT. In: de Bruijne, M., et al. Medical Image Computing and Computer Assisted Intervention – MICCAI 2021 . MICCAI 2021. Lecture Notes in Computer Science (), vol 12901 . Springer , Cham . doi: 10.1007/978-3-030-87193-2_41 OpenUrl CrossRef Liu J , Shen M , Laiginhas R et al. Onset and progression of persistent choroidal hypertransmission defects in intermediate AMD: a novel clinical trial endpoint: hypertransmission defects as a clinical trial endpoint . Am J Ophthalmol . 2023 ; 254 : 11 – 22 doi: 10.1016/j.ajo.2023.03.012 OpenUrl CrossRef PubMed Morano J , Aresta G , Lachinov D et al. , Self-supervised learning via inter-modal reconstruction and feature projection networks for label-efficient 3D-to-2D segmentation https://arxiv.org/abs/2307.03008 Najman L and Schmitt M. Watershed of a continuous function . In Signal Processing (Special issue on Mathematical Morphology .), Vol. 38 ( 1994 ), pages 99 – 112 OpenUrl Pfau M , Schmitz-Valckenberg S Ribeiro R et al. Association of complement C3 inhibitor pegcetacoplan with reduced photoreceptor degeneration beyond areas of geographic atrophy . Sci Rep . 2022 ; 12 : 17870 doi: 10.1038/s41598-022-22404-9 OpenUrl CrossRef PubMed Riedl S , Vogl WD , Mai J , et al. The effect of pegcetacoplan treatment on photoreceptor maintenance in geographic atrophy monitored by artificial intelligence-based OCT analysis . Ophthalmol Retina . 2022 ; 6 ( 11 ): 1009e1018 . OpenUrl Reumueller A , Sacu S , Karantonis MG , Steiner I , Weigert G , Schmidt-Erfurth U. Semi-automated quantification of geographic atrophy with blue-light autofluorescence and spectral-domain optical coherence tomography: a comparison between the region finder and the advanced retinal pigment epithelium tool in the clinical setting . Acta Ophthalmol . 2019 Sep ; 97 ( 6 ): e887 – e895 . doi: 10.1111/aos.14085 . Epub 2019 Mar 24. PMID: 30907074 ; PMCID: PMC6767530 . OpenUrl CrossRef PubMed ↵ Sadda SR , Guymer R , Holz FG , Schmitz-Valckenberg S , Curcio CA , Bird AC , Blodi BA , Bottoni F , Chakravarthy U , Chew EY , Csaky K , Danis RP , Fleckenstein M , Freund KB , Grunwald J , Hoyng CB , Jaffe GJ , Liakopoulos S , Monés JM , Pauleikhoff D , Rosenfeld PJ , Sarraf D , Spaide RF , Tadayoni R , Tufail A , Wolf S , Staurenghi G. Consensus Definition for Atrophy Associated with Age-Related Macular Degeneration on OCT: Classification of Atrophy Report 3 . Ophthalmology . 2018 Apr ; 125 ( 4 ): 537 – 548 . doi: 10.1016/j.ophtha.2017.09.028 . Epub 2017 Nov 2. Erratum in: Ophthalmology. 2019 Jan;126(1):177. doi: 10.1016/j.ophtha.2018.10.038. PMID: 29103793 . OpenUrl CrossRef PubMed ↵ Sarda SP , Heyes A , Bektas M , Thakur T , Chao W , Intorcia M , Wronski S , Jones DL . Humanistic and Economic Burden of Geographic Atrophy: A Systematic Literature Review . Clin Ophthalmol . 2021 Dec 8; 15 : 4629 – 4644 . doi: 10.2147/OPTH.S338253 . PMID: 34916775 ; PMCID: PMC8667751 . OpenUrl CrossRef PubMed ↵ Schmitz-Valckenberg , Steffen , et al. “ Interreader agreement and longitudinal progression of incomplete/complete retinal pigment epithelium and outer retinal atrophy in age-related macular degeneration .” Ophthalmology Retina 7 . 12 ( 2023 ): 1059 – 1068 . OpenUrl PubMed Seeböck P , Vogl WD , Waldstein SM , Orlando JI , Baratsits M , Alten T , Arikan M , Mylonas G , Bogunović H , Schmidt-Erfurth U. Linking Function and Structure with ReSensNet: Predicting Retinal Sensitivity from OCT using Deep Learning . Ophthalmol Retina . 2022 Jun ; 6 ( 6 ): 501 – 511 . doi: 10.1016/j.oret.2022.01.021 . Epub 2022 Feb 5. PMID: 35134543 . OpenUrl CrossRef PubMed Shmueli , O. ; Szeskin , A. ; Benhamou , I. ; Joskowicz , L. ; Shwartz , Y. ; Levy , J. Measuring Geographic Atrophy Area Using Column-Based Machine Learning Software on Spectral-Domain Optical Coherence Tomography versus Fundus Auto Fluorescence . Bioengineering 2024 , 11 , 849 . doi: 10.3390/bioengineering11080849 OpenUrl CrossRef PubMed Vallino V , Berni A , Coletto A , Serafino S , Bandello F , Reibaldi M , Borrelli E. Structural OCT and OCT angiography biomarkers associated with the development and progression of geographic atrophy in AMD . Graefes Arch Clin Exp Ophthalmol . 2024 Apr 30. doi: 10.1007/s00417-024-06497-8 . Epub ahead of print. PMID: 38689123 . OpenUrl CrossRef PubMed Velaga SB , Nittala MG , Hariri A , Sadda SR . Correlation between Fundus Autofluorescence and En Face OCT Measurements of Geographic Atrophy . Ophthalmol Retina . 2022 Aug ; 6 ( 8 ): 676 – 683 . doi: 10.1016/j.oret.2022.03.017 . Epub 2022 Mar 23. PMID: 35338026 . OpenUrl CrossRef PubMed ↵ Vogl W-D , Riedl S , Mai J et al. , Predicting Topographic Disease Progression and Treatment Response of Pegcetacoplan in Geographic Atrophy Quantified by Deep Learning , Ophthalmology Retina , Volume 7 , Issue 1 , 2023 . Wu Z , Luu CD , Ayton LN , Goh JK , Lucci LM , Hubbard WC , Hageman JL , Hageman GS , Guymer RH . Optical coherence tomography-defined changes preceding the development of drusen-associated atrophy in age-related macular degeneration . Ophthalmology . 2014 Dec ; 121 ( 12 ): 2415 – 22 . doi: 10.1016/j.ophtha.2014.06.034 . Epub 2014 Aug 8. PMID: 25109931 . OpenUrl CrossRef PubMed Web of Science ↵ Yehoshua Z , Garcia Filho CA , Penha FM , Gregori G , Stetson PF , Feuer WJ , Rosenfeld PJ . Comparison of geographic atrophy measurements from the OCT fundus image and the sub-RPE slab image . Ophthalmic Surg Lasers Imaging Retina . 2013 Mar -Apr; 44 ( 2 ): 127 – 32 . doi: 10.3928/23258160-20130313-05 . PMID: 23510038 . OpenUrl CrossRef PubMed Web of Science ↵ Zhang , Gongyu et al. Clinically relevant deep learning for detection and quantification of geographic atrophy from optical coherence tomography: a model development and external validation study , The Lancet Digital Health , Volume 3 , Issue 10 , e665 – e675 , 2021 . OpenUrl View the discussion thread. Back to top Previous Next Posted July 07, 2025. Download PDF Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Automated Deep Learning-Based 3D-to-2D Segmentation of Geographic Atrophy in Optical Coherence Tomography Data Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Automated Deep Learning-Based 3D-to-2D Segmentation of Geographic Atrophy in Optical Coherence Tomography Data Hasenin Al-khersan , Jonathan Oakley , Daniel Russakoff , Jessica Cao , Stanley Saju , Avery Zhou , Simrat Sodhi , Niveditha Pattathil , Netan Choudhry , David Boyer , Charles Wykoff medRxiv 2025.07.07.25330902; doi: https://doi.org/10.1101/2025.07.07.25330902 Share This Article: Copy Citation Tools Automated Deep Learning-Based 3D-to-2D Segmentation of Geographic Atrophy in Optical Coherence Tomography Data Hasenin Al-khersan , Jonathan Oakley , Daniel Russakoff , Jessica Cao , Stanley Saju , Avery Zhou , Simrat Sodhi , Niveditha Pattathil , Netan Choudhry , David Boyer , Charles Wykoff medRxiv 2025.07.07.25330902; doi: https://doi.org/10.1101/2025.07.07.25330902 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Ophthalmology Subject Areas All Articles Addiction Medicine (567) Allergy and Immunology (863) Anesthesia (297) Cardiovascular Medicine (4411) Dentistry and Oral Medicine (443) Dermatology (380) Emergency Medicine (606) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1505) Epidemiology (15205) Forensic Medicine (30) Gastroenterology (1119) Genetic and Genomic Medicine (6574) Geriatric Medicine (666) Health Economics (994) Health Informatics (4511) Health Policy (1365) Health Systems and Quality Improvement (1608) Hematology (537) HIV/AIDS (1263) Infectious Diseases (except HIV/AIDS) (15903) Intensive Care and Critical Care Medicine (1103) Medical Education (620) Medical Ethics (144) Nephrology (666) Neurology (6573) Nursing (345) Nutrition (998) Obstetrics and Gynecology (1139) Occupational and Environmental Health (954) Oncology (3319) Ophthalmology (968) Orthopedics (369) Otolaryngology (420) Pain Medicine (435) Palliative Medicine (129) Pathology (662) Pediatrics (1689) Pharmacology and Therapeutics (691) Primary Care Research (710) Psychiatry and Clinical Psychology (5422) Public and Global Health (9205) Radiology and Imaging (2191) Rehabilitation Medicine and Physical Therapy (1367) Respiratory Medicine (1191) Rheumatology (593) Sexual and Reproductive Health (709) Sports Medicine (529) Surgery (709) Toxicology (99) Transplantation (288) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'9feb7afb8f44df94',t:'MTc3OTI4MTU2Ng=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();
Text is read by the "Ask this paper" AI Q&A widget below.
Extraction quality varies by source — PMC NXML preserves structure
cleanly, OA-HTML may include some navigation residue, and OA-PDF can
have broken hyphenation. The publisher copy
(via DOI)
is the canonical version.