Full text
48,892 characters
· extracted from
preprint-html
· click to expand
Appendix300: A multi-institutional laparoscopic appendectomy video dataset for computational modeling tasks | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search Appendix300: A multi-institutional laparoscopic appendectomy video dataset for computational modeling tasks View ORCID Profile Fiona R. Kolbinger , Max Kirchner , Kevin Pfeiffer , View ORCID Profile Sebastian Bodenstedt , View ORCID Profile Alexander C. Jenke , Julia Barthel , Matthias Carstens , Karolin Dehlke , Sophia Dietz , Sotirios Emmanouilidis , Guido Fitze , Martin Freitag , Fabian Holderried , Thorsten Jacobi , Weam Kanjo , Linda Leitermann , Sören Torge Mees , Steffen Pistorius , Conrad Prudlo , Astrid Seiberth , View ORCID Profile Jurek Schultz , Karolin Thiel , Daniel Ziehn , View ORCID Profile Stefanie Speidel , Jürgen Weitz , View ORCID Profile Jakob Nikolas Kather , View ORCID Profile Marius Distler , View ORCID Profile Oliver Lester Saldanha doi: https://doi.org/10.1101/2025.09.05.25335174 Fiona R. Kolbinger 1 Department of Visceral, Thoracic and Vascular Surgery, University Hospital and Faculty of Medicine Carl Gustav Carus, TUD Dresden University of Technology , Dresden, Germany 2 Else Kroener Fresenius Center for Digital Health, Faculty of Medicine and University Hospital Carl Gustav Carus, TUD Dresden University of Technology , Dresden, Germany 3 Weldon School of Biomedical Engineering, Purdue University , West Lafayette, IN, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Fiona R. Kolbinger For correspondence: fiona.kolbinger{at}uniklinikum-dresden.de oliverlester.saldanha{at}tu-dresden.de Max Kirchner 4 Department of Translational Surgical Oncology, National Center for Tumor Diseases (NCT), NCT/UCC Dresden, a partnership between DKFZ, Faculty of Medicine and University Hospital Carl Gustav Carus, TUD Dresden University of Technology, and Helmholtz-Zentrum Dresden-Rossendorf (HZDR) , Germany Find this author on Google Scholar Find this author on PubMed Search for this author on this site Kevin Pfeiffer 2 Else Kroener Fresenius Center for Digital Health, Faculty of Medicine and University Hospital Carl Gustav Carus, TUD Dresden University of Technology , Dresden, Germany Find this author on Google Scholar Find this author on PubMed Search for this author on this site Sebastian Bodenstedt 4 Department of Translational Surgical Oncology, National Center for Tumor Diseases (NCT), NCT/UCC Dresden, a partnership between DKFZ, Faculty of Medicine and University Hospital Carl Gustav Carus, TUD Dresden University of Technology, and Helmholtz-Zentrum Dresden-Rossendorf (HZDR) , Germany 5 Centre for Tactile Internet with Human-in-the-Loop (CeTI), TUD Dresden University of Technology , Dresden, Germany Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Sebastian Bodenstedt Alexander C. Jenke 4 Department of Translational Surgical Oncology, National Center for Tumor Diseases (NCT), NCT/UCC Dresden, a partnership between DKFZ, Faculty of Medicine and University Hospital Carl Gustav Carus, TUD Dresden University of Technology, and Helmholtz-Zentrum Dresden-Rossendorf (HZDR) , Germany Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Alexander C. Jenke Julia Barthel 1 Department of Visceral, Thoracic and Vascular Surgery, University Hospital and Faculty of Medicine Carl Gustav Carus, TUD Dresden University of Technology , Dresden, Germany Find this author on Google Scholar Find this author on PubMed Search for this author on this site Matthias Carstens 1 Department of Visceral, Thoracic and Vascular Surgery, University Hospital and Faculty of Medicine Carl Gustav Carus, TUD Dresden University of Technology , Dresden, Germany Find this author on Google Scholar Find this author on PubMed Search for this author on this site Karolin Dehlke 1 Department of Visceral, Thoracic and Vascular Surgery, University Hospital and Faculty of Medicine Carl Gustav Carus, TUD Dresden University of Technology , Dresden, Germany 11 Asklepios-ASB Krankenhaus Radeberg , Radeberg, Germany Find this author on Google Scholar Find this author on PubMed Search for this author on this site Sophia Dietz 1 Department of Visceral, Thoracic and Vascular Surgery, University Hospital and Faculty of Medicine Carl Gustav Carus, TUD Dresden University of Technology , Dresden, Germany 11 Asklepios-ASB Krankenhaus Radeberg , Radeberg, Germany Find this author on Google Scholar Find this author on PubMed Search for this author on this site Sotirios Emmanouilidis 6 Department of General, Visceral and Thoracic Surgery, St. Elisabethen-Klinikum Ravensburg , Ravensburg, Germany Find this author on Google Scholar Find this author on PubMed Search for this author on this site Guido Fitze 7 Department of Pediatric Surgery, University Hospital and Faculty of Medicine Carl Gustav Carus, TUD Dresden University of Technology , Dresden, Germany Find this author on Google Scholar Find this author on PubMed Search for this author on this site Martin Freitag 8 Krankenhaus St. Joseph-Stift Dresden GmbH , Dresden, Germany Find this author on Google Scholar Find this author on PubMed Search for this author on this site Fabian Holderried 6 Department of General, Visceral and Thoracic Surgery, St. Elisabethen-Klinikum Ravensburg , Ravensburg, Germany Find this author on Google Scholar Find this author on PubMed Search for this author on this site Thorsten Jacobi 9 Diakonissenkrankenhaus Dresden , Dresden, Germany Find this author on Google Scholar Find this author on PubMed Search for this author on this site Weam Kanjo 8 Krankenhaus St. Joseph-Stift Dresden GmbH , Dresden, Germany Find this author on Google Scholar Find this author on PubMed Search for this author on this site Linda Leitermann 10 Department of General and Visceral Surgery, Dresden-Friedrichstadt General Hospital , Dresden, Germany Find this author on Google Scholar Find this author on PubMed Search for this author on this site Sören Torge Mees 10 Department of General and Visceral Surgery, Dresden-Friedrichstadt General Hospital , Dresden, Germany Find this author on Google Scholar Find this author on PubMed Search for this author on this site Steffen Pistorius 1 Department of Visceral, Thoracic and Vascular Surgery, University Hospital and Faculty of Medicine Carl Gustav Carus, TUD Dresden University of Technology , Dresden, Germany 11 Asklepios-ASB Krankenhaus Radeberg , Radeberg, Germany Find this author on Google Scholar Find this author on PubMed Search for this author on this site Conrad Prudlo 7 Department of Pediatric Surgery, University Hospital and Faculty of Medicine Carl Gustav Carus, TUD Dresden University of Technology , Dresden, Germany Find this author on Google Scholar Find this author on PubMed Search for this author on this site Astrid Seiberth 10 Department of General and Visceral Surgery, Dresden-Friedrichstadt General Hospital , Dresden, Germany Find this author on Google Scholar Find this author on PubMed Search for this author on this site Jurek Schultz 7 Department of Pediatric Surgery, University Hospital and Faculty of Medicine Carl Gustav Carus, TUD Dresden University of Technology , Dresden, Germany Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Jurek Schultz Karolin Thiel 6 Department of General, Visceral and Thoracic Surgery, St. Elisabethen-Klinikum Ravensburg , Ravensburg, Germany Find this author on Google Scholar Find this author on PubMed Search for this author on this site Daniel Ziehn 9 Diakonissenkrankenhaus Dresden , Dresden, Germany Find this author on Google Scholar Find this author on PubMed Search for this author on this site Stefanie Speidel 4 Department of Translational Surgical Oncology, National Center for Tumor Diseases (NCT), NCT/UCC Dresden, a partnership between DKFZ, Faculty of Medicine and University Hospital Carl Gustav Carus, TUD Dresden University of Technology, and Helmholtz-Zentrum Dresden-Rossendorf (HZDR) , Germany 5 Centre for Tactile Internet with Human-in-the-Loop (CeTI), TUD Dresden University of Technology , Dresden, Germany Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Stefanie Speidel Jürgen Weitz 1 Department of Visceral, Thoracic and Vascular Surgery, University Hospital and Faculty of Medicine Carl Gustav Carus, TUD Dresden University of Technology , Dresden, Germany 5 Centre for Tactile Internet with Human-in-the-Loop (CeTI), TUD Dresden University of Technology , Dresden, Germany Find this author on Google Scholar Find this author on PubMed Search for this author on this site Jakob Nikolas Kather 2 Else Kroener Fresenius Center for Digital Health, Faculty of Medicine and University Hospital Carl Gustav Carus, TUD Dresden University of Technology , Dresden, Germany 12 Department of Medicine I, Faculty of Medicine and University Hospital Carl Gustav Carus, TUD Dresden University of Technology , 01307 Dresden, Germany 13 Medical Oncology, National Center for Tumor Diseases (NCT), University Hospital Heidelberg , Heidelberg, Germany Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Jakob Nikolas Kather Marius Distler 1 Department of Visceral, Thoracic and Vascular Surgery, University Hospital and Faculty of Medicine Carl Gustav Carus, TUD Dresden University of Technology , Dresden, Germany Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Marius Distler Oliver Lester Saldanha 2 Else Kroener Fresenius Center for Digital Health, Faculty of Medicine and University Hospital Carl Gustav Carus, TUD Dresden University of Technology , Dresden, Germany 13 Medical Oncology, National Center for Tumor Diseases (NCT), University Hospital Heidelberg , Heidelberg, Germany Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Oliver Lester Saldanha For correspondence: fiona.kolbinger{at}uniklinikum-dresden.de oliverlester.saldanha{at}tu-dresden.de Abstract Full Text Info/History Metrics Supplementary material Data/Code Preview PDF Structured Abstract Background The limited availability of diverse and representative training data poses a critical barrier to the development of clinically relevant computational tools for intraoperative surgical decision support. Surgical procedures are not routinely recorded, and annotation requires domain expertise, resulting in a scarcity of open-access surgical video datasets with high-quality annotations. Existing datasets are typically limited to single institutions and specific procedures, such as cholecystectomy, and rarely comprise patient-level metadata like demographic characteristics, disease history, or laboratory parameters. Methods The Appendix300 dataset comprises 330 laparoscopic surgery recordings, including 325 full-length laparoscopic appendectomies and 5 control recordings from non-appendectomy procedures in pediatric and adult patients treated at five German centers. The dataset includes patient-level clinical metadata (demographics, medical history, clinical symptoms, laboratory parameters, and histopathological findings), as well as standardized expert annotations of the laparoscopic grade of appendicitis. Results Appendix300 currently represents the largest publicly available collection of surgical video data with patient metadata and the first curated dataset of laparoscopic appendectomies. It enables novel validation tasks for computer vision in surgery, including the classification of appendicitis severity and the detection of appendiceal perforation. Technical validation of the laparoscopic appendicitis grade annotations showed substantial interrater agreement (weighted Cohen’s κ = 0.615). Conclusion The Appendix300 dataset expands the scope of surgical data science by integrating video data with clinical and pathological metadata across institutions. It enables new and clinically relevant patient-level validation tasks for computer vision in laparoscopic surgery and facilitates decentralized learning approaches, overall enhancing the breadth and translational relevance of AI-based surgical video analysis. Dataset Description Appendix300 is a multi-institutional dataset comprising 330 laparoscopic surgery recordings, including 325 appendectomies and 5 control cases, detailed patient-level metadata (demographics, medical history, clinical symptoms, laboratory parameters, and histopathological findings), and expert annotations of appendicitis severity. It enables novel validation tasks for surgical AI, such as inflammation grading and perforation detection, and supports decentralized learning across diverse patient populations. Background & Summary Computational analysis of medical imaging and clinical data has the potential to improve diagnostic accuracy and treatment stratification across medical fields. Increasing evidence from prospective clinical trials supports the clinical applicability and benefit of Artificial Intelligence (AI)-based tools. 1 For example, computational tools have demonstrated expert-level performance for polyp detection during colonoscopy 2 , the detection of pulmonary nodules in chest X-rays 3 , and mammogram interpretation for breast cancer screening 4 . Computational model performance and generalizability depend on the availability of large and diverse sets of clinical training and test data. Some clinical fields produce imaging as a means of documentation that becomes a component of patient records and is repetitively reviewed after acquisition for diagnostic follow-up or therapeutic decision-making (i.e., electrocardiograms in cardiology, X-rays in radiology, pictures of polyps in colonoscopy). In contrast, surgical video data is more complex to acquire and store in a standardized way due to its large file size. Reviewing and annotating surgical video data are time-consuming and require surgical domain knowledge. 5 While surgical video recordings represent an objective documentation of a surgical procedure and capture information that could be used for educational and prognostic purposes 6 – 8 , surgeries are not routinely recorded, and retrospectively written operation notes remain the sole standard at most clinical institutions 9 . The largest available open-access datasets of intraoperative imaging comprise data from about 100 patients and cover a limited variety of procedures, including cholecystectomy (i.e., Cholec80 10 , CholecT50 11 ) and cataract surgeries (i.e., Cataract-101 12 , CATARACTS 13 ). Most datasets exclusively comprise spatial or categorical annotations of the surgical scene (i.e., presence of tools and anatomical structures in a video frame) rather than patient-level or clinical data, allowing for a limited number of surgical AI validation tasks that insufficiently represent the breadth of clinical reasoning tasks in surgery. 14 To increase the diversity of annotated surgical video data and validation tasks for surgical data science 15 approaches, we curated the Appendix300 dataset, comprising 330 video recordings of laparoscopic appendectomies and healthy control surgeries (i.e., appendix recordings from non-appendectomy laparoscopic surgeries) performed at five centers, as well as matched clinical metadata and annotations of the intraoperative grade of appendicitis ( Figure 1 ). Appendix300 currently represents the largest publicly available collection of surgical video data with patient metadata and the first curated dataset of laparoscopic appendectomies. By combining patient-level clinical data and pathology-related annotations with laparoscopic video data, this dataset connects a range of structured data types along the diagnostic and therapeutic pathway, facilitating pathophysiology-related investigations. Furthermore, the multicentric nature of the dataset allows for the evaluation of decentralized learning approaches. In the context of acute appendicitis, potential future applications include the development of intraoperative assistance systems for quality control and a harmonization of the intraoperative inflammation grade and the histopathological phenotype, which are often discordant 16 . Relation with preoperative imaging 17 and postoperative outcome data (i.e., surgical complications) are possible future extensions that are beyond the scope of this clinical use case but will need to be generated for other clinical use cases. Download figure Open in new tab Figure 1. Dataset Overview. The Appendix300 dataset covers preoperative, intraoperative, and postoperative data of 325 patients with suspected appendicitis undergoing laparoscopic appendectomy and 5 patients undergoing non-appendectomy laparoscopic surgery at five surgical centers. Preoperative data comprise demographics, select medical history details, clinical symptoms of acute appendicitis, laboratory parameters, and recent antibiotic medication history. The surgery video recording was temporally annotated with regard to the timepoint of complete appendix visibility before appendix dissection, the laparoscopic grade of appendicitis, and perforation. Two surgeons independently annotated the laparoscopic grade and major disagreements were resolved through a third independent annotation. Postoperative metadata include the histopathological grade of appendicitis as well as the presence or absence of an appendiceal carcinoid. Abbreviations: CRP (C-reactive protein), PMN (polymorphonuclear). Methods This dataset comprises laparoscopic video recordings of 325 laparoscopic appendectomies and 5 non-appendectomy laparoscopic surgeries, matched clinical metadata along the preoperative and postoperative treatment pathway, and annotations of the intraoperative grade of appendicitis ( Figure 1 , Figure 2 ). Download figure Open in new tab Figure 2. Data preprocessing and annotation of the intraoperative grade of appendicitis. (a) Schematic representation of the data processing steps. Following the deidentification of extracorporeal laparoscopic video sequences, each appendectomy recording was labeled with a temporal label (timestamp) marking the beginning of appendiceal dissection. Up to 200 equidistant frames were sampled from a 100-second key video sequence spanning 50 seconds before and after the timestamp. (b) Intraoperative grades of appendicitis were defined based on Gomes et al . (2012) 19 . Based on an annotation protocol ( Supplementary Material 3 ), each video was classified by the surgical team. For technical validation, a second reviewer performed a second annotation of the intraoperative grade of appendicitis. In case of major disagreement, a third independent annotation was acquired to adjust the ground truth where necessary. Video Recording Between June 2023 and September 2024, video data from 325 laparoscopic appendectomies and 5 non-appendectomy laparoscopic surgeries were gathered at five German surgical centers. The participating centers comprise four public hospitals (Asklepios-ASB Krankenhaus Radeberg, Diakonissenkrankenhaus Dresden, Krankenhaus St. Joseph Stift Dresden, St. Elisabethen-Krankenhaus Ravensburg) and one academic surgical department (Department of Pediatric Surgery, University Hospital Carl Gustav Carus Dresden). All included patients had a clinical indication for the surgical procedure. Appendectomy recordings and clinical metadata were consecutively gathered in clinical routine. Patients with an indication of laparoscopic appendectomy for suspected acute appendicitis and documented histopathologic inflammation grade were included in the appendectomy dataset. Exclusion criteria comprised conversion to open surgery, incomplete surgery recordings, and cases with corrupted files. Surgeries were performed, recorded, and saved using locally available laparoscopic hardware ( Table 1 ). View this table: View inline View popup Download powerpoint Table 1: Recording infrastructure and technical details of the dataset for all contributing centers. Acquisition of Clinical Labels and Annotations A graphical user interface ( Supplementary Material 1 ) was implemented to save raw surgery recordings, corresponding clinical labels, and original annotations of the laparoscopic grade of appendicitis on local hardware in anonymized form. This process was identical for laparoscopic appendectomy recordings and appendix recordings from non-appendectomy laparoscopic surgeries. The graphical user interface was implemented in Python using tkinter and integrates a custom video playback component based on PyAV and Pillow for frame-accurate seeking, stereo video handling, and consistent frame rate rendering. It supports hospital-specific configurations (e.g., multi-video workflows, stereo cropping) via a centralized config structure and allows for timestamp annotation and structured metadata input through predefined form elements. All annotations and associated videos were saved to a defined output structure, with the metadata stored in a standardized CSV file, enabling reproducible and site-adaptive data extraction. Clinical labels were derived from routine documentation based on a clinical labeling protocol ( Supplementary Material 2 ). Following this protocol, the following parameters were preoperatively gathered: Sex, age, body-mass index (BMI), clinical symptoms based on the Alvarado score 18 (migration of abdominal pain to the right lower quadrant, anorexia or acetone in the urine, nausea/vomiting, point tenderness in the right lower quadrant, rebound peritonism in the right iliac fossa, body temperature), preoperative laboratory parameters (hemoglobin, leukocytes, granulocytes, proportion of polymorphonuclear cells, C-reactive protein), select medical history details (history of intraabdominal surgery, active tumor disease, pregnancy), and the duration of preoperative antibiotic treatment ( Figure 1 ). Using the graphical user interface’s video review function ( Supplementary Material 1 ), a timestamp, at which the appendix is fully visible prior to invasive preparation, was documented by the contributing surgery residents and attendings (FRK, JB, KD, SD, FH, WK, LL, JS, AS, DZ). Based on this timestamp, a 100-second video snippet was extracted from the full video recording, which covers 50 seconds before and after the timepoint of full appendix visibility ( Figure 2 a ). The intraoperative grade of appendicitis and the presence of perforation were classified by the surgical teams carrying out the procedure based on an annotation protocol ( Supplementary Material 3, Figure 2 b ), which follows the intraoperative classification proposed by Gomes et al . 19 (annotation 1). Annotation 1 represents the original ground truth annotation. For technical validation and to identify outliers and possible annotation errors, a second reviewer (general surgery resident with 4 years of experience in laparoscopic surgery) independently annotated the intraoperative grade of appendicitis for all recordings (annotation 2). Outliers were defined as a disagreement of at least three appendicitis grades between annotation 1 and annotation 2 (e.g., grade 2 and grade 5; grade 3A and grade 4B). We report the interrater agreement between annotation 1 and annotation 2 quantitatively using weighted Cohen’s kappa 20 ( Table 2 , Figure 3 a ), and qualitatively through a review of divergent ratings ( Figure 3 b ). View this table: View inline View popup Download powerpoint Table 2: Summary of patient characteristics and surgery-related data. Download figure Open in new tab Figure 3. Technical validation of the laparoscopic grade of appendicitis annotations. Confusion matrices (a) indicate the agreement between the original annotation by the operating surgeon (annotation 1) and the independent second annotation (annotation 2) for all patients. (b) Of all 330 cases, 30 outlier cases with a disagreement of more than two appendicitis grades between annotation 1 and annotation 2 were subjected to a third independent annotation, and ground truth labels were adjusted as necessary. Case indices (x-axis ticks) comprise the center number and the case number, separated by a dash. To adjust the ground truth where necessary, outliers were subjected to a third independent annotation by a general surgery resident with 7 years of experience in laparoscopic surgery (annotation 3). In case of a major disagreement between annotation 1 and annotation 3 (i.e., a disagreement of 3 or more appendicitis grades), the ground truth was adjusted to annotation 3. If annotation 3 was in agreement with annotation 1 (i.e., disagreement of up to 2 appendicitis grades), the ground truth was not adjusted ( Figure 3 b ). Table 2 summarizes patient characteristics and appendicitis grade annotations for all surgeries. Ethics Statement This dataset was collected in accordance with the Declaration of Helsinki and its later amendments. All data were compiled in an anonymized fashion using the described user interface. The responsible Institutional Review Boards reviewed and approved this study on August 4th, 2022 (ethics committee at the Technical University Dresden, approval number BO-EK-332072022), September 13th, 2023 (ethics committee of the Sächsische Landesärztekammer, approval number EK-BR-75/23-1), and December 23rd, 2023 (ethics committee of the Landesärztekammer Baden-Württemberg, approval number B-F-2023-023). The trial, in the context of which this dataset was acquired, was prospectively registered at the German Clinical Trials Register (Deutsches Register Klinischer Studien, DRKS) on December 9th, 2022 (trial registration ID: DRKS00030874). Patients were informed about the anonymized acquisition, analysis, and publication of data from their inpatient treatment. Following local legislation, no written informed consent was required for anonymized acquisition, analysis, and publication of clinical data. Data Records The Appendix300 dataset comprises 100-second video snippets from 330 surgery video recordings, along with patient metadata and annotations. These video snippets cover 50 seconds before and after the annotated timepoint of full appendix visibility. Due to the large file size of the deidentified full-length surgery recordings, they are made available to interested researchers upon reasonable request. To access the full-length surgery recordings, data requestors must sign a data use agreement. During the peer review process, the data are accessible via the following link: https://nextcloud.tso.ukdd.de/s/mitAaKT8RiPqw3p . The dataset is publicly available for non-commercial use under the Creative Commons Attribution CC-BY. If readers wish to use or reference this dataset, they should cite this paper. Description of the data folder structure The dataset is structured into two main directories: “Video_Snippets” and “Images”. Each of these directories is organized by contributing center, with data grouped into subfolders for each patient, such as “Center1_001”. The “Video_Snippets” directory contains patient subfolders with the respective 100-second video snippet covering 50 seconds before and after the annotated timepoint of full appendix visibility, following the same folder structure. In the “Images” directory, each patient subfolder includes a frames.zip archive with 200 frames extracted from the corresponding video snippet at 2 frames per second. At the top level of the dataset, an “overall_merged.csv” file is available to provide a consolidated view of all centers and patients, including metadata and annotations. Technical Validation For technical validation of the annotations of the intraoperative grade of appendicitis, an independent secondary annotation was acquired. The overall interrater agreement (weighted Cohen’s kappa) was 0.614, with variations across the contributing centers ( Table 2 , Figure 3 a ). Of 330 cases, 30 (9.1%) were classified as outliers or potential annotation errors based on a major disagreement between annotation 1 and annotation 2. Upon a third independent review of these 30 outlier cases (annotation 3), ground truths were adjusted to annotation 3 for 14 cases (4.2% of all cases) and original grade labels (annotation 1) were retained for 16 cases ( Figure 3 b ). These findings provide a baseline for interrater variability in laparoscopic grading of appendicitis. Usage Notes The Appendix300 dataset can be used for various purposes in the field of machine learning, either on its own or in combination with other, already existing datasets. Used on its own, it facilitates the training of computational models identifying the intraoperative grade of appendicitis as a classification task and differentiation of perforated and non-perforated appendicitis (binary classification task), which are new clinical use cases for algorithm validation in surgical data science. The multi-institutional nature of the Appendix300 dataset also facilitates the evaluation of decentralized and federated machine learning models for the above-mentioned validation tasks. We report the results of a benchmarking study evaluating Swarm Learning for decentralized, privacy-preserving collaboration in surgical video analysis in a separate publication. The Appendix300 dataset has three key limitations: First, some clinical data are incompletely available due to the manual entry of anonymized metadata at contributing centers. For example, no information about the BMI could be obtained from center 1 and center 3 ( Table 2 ). This limitation represents a common scenario in multi-institutional data collection efforts and could be overcome through direct access to electronic health records, which was not feasible in this work due to legal and administrative restrictions at the contributing centers. Second, the dataset does not include any preoperative imaging data or imaging-derived variables that have been identified as predictors of a complicated course, e.g., the presence of free intraabdominal air or an intra-abdominal abscess. 21 Similarly, no data on postoperative complications are available in this dataset. Third, annotations of the laparoscopic grade of appendicitis followed the Gomes classification, which, in itself, has limitations. 19 For example, this classification requires the presence of macroscopic necroses for the assignment of grade 3, and the presence of encapsulated abscesses or leakage of pus into the abdominal cavity for the assignment of grade 4 ( Figure 2 b , Supplementary Material 3 ). While it is applicable to most laparoscopic presentations of appendicitis, some intermediate cases may be particularly ambiguous to classify. For example, an appendix presenting with fibrin coverage, mild regional peritonitis, and small amounts of opaque (i.e., likely purulent) ascites, yet without macroscopic necroses or encapsulated abscesses, may fall into either grade 2 (fibrin) or grade 4B (regional peritonitis). This ambiguity and potential non-linearity of the clinical progression of appendicitis and its laparoscopic presentation have been acknowledged by previous research. 22 , 23 Despite these limitations, the Appendix300 dataset represents a considerable step towards clinically relevant applications for computational surgical video analysis, as it connects demographic, symptom-related, laparoscopic, and histopathological data for a large, multi-institutional patient cohort, and introduces a novel use case that will help diversify the clinical applications of research efforts in surgical data science. Data Availability Data will be made publicly available following the peer review process for non-commercial use under the Creative Commons Attribution CC-BY. If readers wish to use or reference this dataset, they should cite this paper. Code Availability No custom code was used in the generation or processing of this dataset. Author Contributions Conceptualization: FRK, JNK, MD, OLS; Methodology: FRK, SB, JS, SS, JNK, OLS; Software: MK, KP, SB, ACJ, OLS; Validation: FRK, MK, KP, SB, ACJ, MC, OLS; Formal analysis: FRK, MK, KP, OLS; Investigation: FRK, KP, SB, JB, MC, KD, SD, SE, FH, WK, LL, CP, AS, JS, DZ, MD, OLS; Resources: GF, MF, TJ, STM, SP, JS, KT, SS, JW, JNK, MD; Data Curation: FRK, MK, KP, SB, JB, MC, KD, SD, SE, FH, WK, LL, CP, AS, JS, DZ, MD, OLS; Writing - Original Draft: FRK; Writing - Review & Editing: MK, KP, SB, ACJ, JB, MC, KD, SD, SE, GF, MF, FH, TJ, WK, LL, STM, SP, CP, AS, JS, KT, DZ, SS, JW, JNK, MD; Visualization: FRK, MK; Supervision: FRK, SS, JW, JNK, MD, OLS; Project administration: FRK, OLS; Funding acquisition: FRK, SB, SS, JW, JNK, MD. Competing Interests FRK declares advisory roles for Radical Healthcare, USA; and the Surgical Data Science Collective (SDSC), USA. JNK declares consulting services for Bioptimus, France; Owkin, France; DoMore Diagnostics, Norway; Panakeia, UK; AstraZeneca, UK; Scailyte, Switzerland; Mindpeak, Germany; and MultiplexDx, Slovakia. Furthermore, he holds shares in StratifAI, Synagen, and Ignition Labs, Germany, has received a research grant by GSK, and has received honoraria by AstraZeneca, Bayer, Eisai, Janssen, MSD, BMS, Roche, Pfizer and Fresenius. MD declares advisory roles for AESCULAP AG, Germany; and Intuitive Surgical, USA, and has received honoraria from Medtronic. All other authors declare no competing interests. Acknowledgements The authors gratefully acknowledge administrative support from Sandra Korn, Ulrike Neckmann, Christian Praetorius, and Anika Stützer (Clinical Trial Center, Department of Visceral, Thoracic and Vascular Surgery, University Hospital and Faculty of Medicine Carl Gustav Carus Dresden, Dresden, Germany) and technical support from all participating institutions in locally setting up data collection infrastructure. This work was supported by the German Cancer Research Center (CoBot 2.0) and the German Research Foundation (Deutsche Forschungsgemeinschaft, DFG) as part of Germany’s Excellence Strategy (EXC 2050/1, Project ID 390696704) within the Cluster of Excellence “Centre for Tactile Internet with Human-in-the-Loop” (CeTI) of the Dresden University of Technology. FRK receives support from the Joachim Herz Foundation (Add-On Fellowship for Interdisciplinary Life Science), the Central Indiana Corporate Partnership AnalytiXIN Initiative, the Evan and Sue Ann Werling Pancreatic Cancer Research Fund, and the Indiana Clinical and Translational Sciences Institute (EPAR4157) funded, in part, by Grant Number UM1TR004402 from the National Institutes of Health, National Center for Advancing Translational Sciences, Clinical and Translational Sciences Award. MK and ACJ are supported by the European Union through NEARDATA under grant agreement ID 101092644. JNK is supported by the German Cancer Aid (DECADE, 70115166), the German Federal Ministry of Education and Research (PEARL, 01KD2104C; CAMINO, 01EO2101; SWAG, 01KD2215A; TRANSFORM LIVER, 031L0312A; TANGERINE, 01KT2302 through ERA-NET Transcan; Come2Data, 16DKZ2044A; DEEP-HCC, 031L0315A), the German Academic Exchange Service (SECAI, 57616814), the German Federal Joint Committee (TransplantKI, 01VSF21048) the European Union’s Horizon Europe and innovation programme (ODELIA, 101057091; GENIAL, 101096312), the European Research Council (ERC; NADIR, 101114631), the National Institutes of Health (EPICO, R01 CA263318) and the National Institute for Health and Care Research (NIHR, NIHR203331) Leeds Biomedical Research Centre. The views expressed are those of the author(s) and not necessarily those of the NHS, the National Institutes of Health, the NIHR, or the Department of Health and Social Care. This work was funded by the European Union. Views and opinions expressed are those of the authors only and do not necessarily reflect those of the European Union. Neither the European Union nor other granting authorities can be held responsible for them. Footnotes Correction of data distribution error References 1. ↵ Han , R. et al. Randomised controlled trials evaluating artificial intelligence in clinical practice: a scoping review . Lancet Digit Health 6 , e367 – e373 ( 2024 ). OpenUrl CrossRef 2. ↵ Repici , A. et al. Artificial intelligence and colonoscopy experience: lessons from two randomised trials . Gut 71 , 757 – 765 ( 2022 ). OpenUrl Abstract / FREE Full Text 3. ↵ Nam , J. G. et al. AI Improves Nodule Detection on Chest Radiographs in a Health Screening Population: A Randomized Controlled Trial . Radiology 307 , e221894 ( 2023 ). OpenUrl PubMed 4. ↵ Lång , K. et al. Artificial intelligence-supported screen reading versus standard double reading in the Mammography Screening with Artificial Intelligence trial (MASAI): a clinical safety analysis of a randomised, controlled, non-inferiority, single-blinded, screening accuracy study . Lancet Oncol . 24 , 936 – 944 ( 2023 ). OpenUrl CrossRef PubMed 5. ↵ Nyangoh Timoh , K. et al. A systematic review of annotation for surgical process model analysis in minimally invasive surgery based on video . Surg. Endosc . 37 , 4298 – 4314 ( 2023 ). OpenUrl PubMed 6. ↵ Jin , A. et al. Tool Detection and Operative Skill Assessment in Surgical Videos Using Region-Based Convolutional Neural Networks . in 2018 IEEE Winter Conference on Applications of Computer Vision (WACV) 691 – 699 ( IEEE , 2018 ). 7. Brown , J. A. et al. Video review reveals technical factors predictive of biliary stricture and cholangitis after robotic pancreaticoduodenectomy . HPB 23 , 144 – 153 ( 2021 ). OpenUrl PubMed 8. ↵ Varban , O. A. et al. Evaluating the Effect of Surgical Skill on Outcomes for Laparoscopic Sleeve Gastrectomy: A Video-based Study . Ann. Surg . 273 , 766 – 771 ( 2021 ). OpenUrl PubMed 9. ↵ Yiu , A. , Lam , K. , Simister , C. , Clarke , J. & Kinross , J. Adoption of routine surgical video recording: a nationwide freedom of information act request across England and Wales . EClinicalMedicine 70 , 102545 ( 2024 ). OpenUrl PubMed 10. ↵ Twinanda , A. P. et al. EndoNet: A Deep Architecture for Recognition Tasks on Laparoscopic Videos . IEEE Trans. Med. Imaging 36 , 86 – 97 ( 2016 ). OpenUrl PubMed 11. ↵ Nwoye , C. I. et al. Rendezvous: Attention mechanisms for the recognition of surgical action triplets in endoscopic videos . Med. Image Anal . 78 , 102433 ( 2022 ). OpenUrl PubMed 12. ↵ Schoeffmann , K. et al. Cataract-101: video dataset of 101 cataract surgeries . in Proceedings of the 9th ACM Multimedia Systems Conference 421 – 425 ( Association for Computing Machinery , New York, NY, USA , 2018 ). 13. ↵ Al Hajj , H. et al. CATARACTS: Challenge on automatic tool annotation for cataRACT surgery . Med. Image Anal . 52 , 24 – 41 ( 2019 ). OpenUrl PubMed 14. ↵ Carstens , M. et al. Artificial Intelligence for surgical scene understanding: A systematic review and reporting quality meta-analysis . medRxiv 2025.07.12.25330122 ( 2025 ) doi: 10.1101/2025.07.12.25330122 . OpenUrl Abstract / FREE Full Text 15. ↵ Maier-Hein , L. et al. Surgical data science – from concepts toward clinical translation . Med. Image Anal . 76 , 102306 – 102306 ( 2022 ). OpenUrl CrossRef PubMed 16. ↵ Bolmers , M. D. M. et al. Discrepancies between Intraoperative and Histological Evaluation of the Appendix in Acute Appendicitis . J. Gastrointest. Surg . 24 , 2088 – 2095 ( 2020 ). OpenUrl PubMed 17. ↵ Rajpurkar , P. et al. AppendiXNet: Deep Learning for Diagnosis of Appendicitis from A Small Dataset of CT Exams Using Video Pretraining . Sci. Rep . 10 , 3958 ( 2020 ). OpenUrl PubMed 18. ↵ Alvarado , A. A practical score for the early diagnosis of acute appendicitis . Ann. Emerg. Med . 15 , 557 – 564 ( 1986 ). OpenUrl CrossRef PubMed Web of Science 19. ↵ Gomes , C. A. , Nunes , T. A. , Fonseca Chebli , J. M. , Junior , C. S. & Gomes , C. C. Laparoscopy grading system of acute appendicitis: new insight for future trials . Surg. Laparosc. Endosc. Percutan. Tech . 22 , 463 – 466 ( 2012 ). OpenUrl PubMed 20. ↵ Yilmaz , A. E. & Demirhan , H. Weighted kappa measures for ordinal multi-class classification performance . Appl. Soft Comput . 134 , 110020 ( 2023 ). OpenUrl 21. ↵ Scheijmans , J. C. G. et al. Development and validation of the Scoring System of Appendicitis Severity 2.0 . JAMA surgery vol. 159 642 – 649 ( 2024 ). OpenUrl PubMed 22. ↵ Gomes , C. A. et al. Acute appendicitis: proposal of a new comprehensive grading system based on clinical, imaging and laparoscopic findings . World J. Emerg. Surg . 10 , 60 ( 2015 ). OpenUrl PubMed 23. ↵ Temple , C. , Huchcroft , S. & Temple , W. The natural history of appendicitis in adults A prospective study . Ann. Surg . 221 , 278 – 281 ( 1995 ). OpenUrl CrossRef PubMed Web of Science View the discussion thread. Back to top Previous Next Posted October 02, 2025. Download PDF Supplementary Material Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Appendix300: A multi-institutional laparoscopic appendectomy video dataset for computational modeling tasks Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Appendix300: A multi-institutional laparoscopic appendectomy video dataset for computational modeling tasks Fiona R. Kolbinger , Max Kirchner , Kevin Pfeiffer , Sebastian Bodenstedt , Alexander C. Jenke , Julia Barthel , Matthias Carstens , Karolin Dehlke , Sophia Dietz , Sotirios Emmanouilidis , Guido Fitze , Martin Freitag , Fabian Holderried , Thorsten Jacobi , Weam Kanjo , Linda Leitermann , Sören Torge Mees , Steffen Pistorius , Conrad Prudlo , Astrid Seiberth , Jurek Schultz , Karolin Thiel , Daniel Ziehn , Stefanie Speidel , Jürgen Weitz , Jakob Nikolas Kather , Marius Distler , Oliver Lester Saldanha medRxiv 2025.09.05.25335174; doi: https://doi.org/10.1101/2025.09.05.25335174 Share This Article: Copy Citation Tools Appendix300: A multi-institutional laparoscopic appendectomy video dataset for computational modeling tasks Fiona R. Kolbinger , Max Kirchner , Kevin Pfeiffer , Sebastian Bodenstedt , Alexander C. Jenke , Julia Barthel , Matthias Carstens , Karolin Dehlke , Sophia Dietz , Sotirios Emmanouilidis , Guido Fitze , Martin Freitag , Fabian Holderried , Thorsten Jacobi , Weam Kanjo , Linda Leitermann , Sören Torge Mees , Steffen Pistorius , Conrad Prudlo , Astrid Seiberth , Jurek Schultz , Karolin Thiel , Daniel Ziehn , Stefanie Speidel , Jürgen Weitz , Jakob Nikolas Kather , Marius Distler , Oliver Lester Saldanha medRxiv 2025.09.05.25335174; doi: https://doi.org/10.1101/2025.09.05.25335174 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Surgery Subject Areas All Articles Addiction Medicine (567) Allergy and Immunology (863) Anesthesia (297) Cardiovascular Medicine (4411) Dentistry and Oral Medicine (443) Dermatology (380) Emergency Medicine (606) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1505) Epidemiology (15205) Forensic Medicine (30) Gastroenterology (1119) Genetic and Genomic Medicine (6574) Geriatric Medicine (666) Health Economics (994) Health Informatics (4511) Health Policy (1365) Health Systems and Quality Improvement (1608) Hematology (537) HIV/AIDS (1263) Infectious Diseases (except HIV/AIDS) (15903) Intensive Care and Critical Care Medicine (1103) Medical Education (620) Medical Ethics (144) Nephrology (665) Neurology (6573) Nursing (345) Nutrition (998) Obstetrics and Gynecology (1139) Occupational and Environmental Health (954) Oncology (3319) Ophthalmology (967) Orthopedics (369) Otolaryngology (420) Pain Medicine (435) Palliative Medicine (129) Pathology (662) Pediatrics (1689) Pharmacology and Therapeutics (691) Primary Care Research (710) Psychiatry and Clinical Psychology (5421) Public and Global Health (9205) Radiology and Imaging (2191) Rehabilitation Medicine and Physical Therapy (1367) Respiratory Medicine (1191) Rheumatology (593) Sexual and Reproductive Health (709) Sports Medicine (529) Surgery (709) Toxicology (99) Transplantation (288) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'9fe8f05e2e58c13d',t:'MTc3OTI1NDkxNg=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();
Text is read by the "Ask this paper" AI Q&A widget below.
Extraction quality varies by source — PMC NXML preserves structure
cleanly, OA-HTML may include some navigation residue, and OA-PDF can
have broken hyphenation. The publisher copy
(via DOI)
is the canonical version.