Full text
67,156 characters
· extracted from
preprint-html
· click to expand
Pan genome clustering identifies a novel mosaic prophage specific to Salmonella Enteritidis lineage associated with the invasive disease in India | medRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-P4HH5NV'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search Pan genome clustering identifies a novel mosaic prophage specific to Salmonella Enteritidis lineage associated with the invasive disease in India Jobin John Jacob , Aravind Velmurugan , Dhanalakshmi Solaimalai , Ramya Iyadurai , Karthik Gunasekaran , Jansi Rani Malaiyappan , M Yesudoss , M Vasuki , Binesh Lal , Jacob John , Kamini Walia , View ORCID Profile Balaji Veeraraghavan doi: https://doi.org/10.1101/2025.05.08.25327125 Jobin John Jacob 1 Department of Clinical Microbiology, Christian Medical College , Vellore, India Find this author on Google Scholar Find this author on PubMed Search for this author on this site Aravind Velmurugan 1 Department of Clinical Microbiology, Christian Medical College , Vellore, India Find this author on Google Scholar Find this author on PubMed Search for this author on this site Dhanalakshmi Solaimalai 1 Department of Clinical Microbiology, Christian Medical College , Vellore, India Find this author on Google Scholar Find this author on PubMed Search for this author on this site Ramya Iyadurai 2 Department of Medicine Unit V, Christian Medical College , Vellore, India Find this author on Google Scholar Find this author on PubMed Search for this author on this site Karthik Gunasekaran 2 Department of Medicine Unit V, Christian Medical College , Vellore, India Find this author on Google Scholar Find this author on PubMed Search for this author on this site Jansi Rani Malaiyappan 1 Department of Clinical Microbiology, Christian Medical College , Vellore, India Find this author on Google Scholar Find this author on PubMed Search for this author on this site M Yesudoss 1 Department of Clinical Microbiology, Christian Medical College , Vellore, India Find this author on Google Scholar Find this author on PubMed Search for this author on this site M Vasuki 1 Department of Clinical Microbiology, Christian Medical College , Vellore, India Find this author on Google Scholar Find this author on PubMed Search for this author on this site Binesh Lal 1 Department of Clinical Microbiology, Christian Medical College , Vellore, India Find this author on Google Scholar Find this author on PubMed Search for this author on this site Jacob John 3 Department of Community Medicine, Christian Medical College , Vellore, India Find this author on Google Scholar Find this author on PubMed Search for this author on this site Kamini Walia 4 Division of Epidemiology and Communicable Diseases, Indian Council of Medical Research , New Delhi, India Find this author on Google Scholar Find this author on PubMed Search for this author on this site Balaji Veeraraghavan 1 Department of Clinical Microbiology, Christian Medical College , Vellore, India Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Balaji Veeraraghavan For correspondence: vbalaji{at}cmcvellore.ac.in Abstract Full Text Info/History Metrics Supplementary material Data/Code Preview PDF Abstract Salmonella enterica serovar Enteritidis is a leading cause of bloodstream infections (BSIs), particularly in sub-Saharan Africa (sSA). While typhoidal salmonellosis is well documented in South Asia, the burden and genomic characteristics of non-typhoidal Salmonella (NTS)-associated BSIs remain understudied. This study investigates the clinical presentation, phylogenetic relationships, invasive potential, and transmission dynamics of S. Enteritidis causing BSIs in India. Clinical data were collected from 101 bloodstream infection cases caused by S . Enteritidis (2012–2022). Representative isolates of S . Enteritidis originating from other clinical samples and livestock samples ( n=17 ) were also included for comparative analysis. Study isolates were subjected to whole genome sequencing (WGS) using the Illumina platform and phylogenetic structure, invasiveness index, prophage profiles, and transmission dynamics were analyzed through comparative genomics. Clinical data indicated that infants and immunosuppressed individuals were at the highest risk of S. Enteritidis BSI. Phylogenetic analysis revealed four major lineages, with most study BSI isolates clustering in the Global Intermediate Clade, a novel lineage defined by our study.. This clade exhibited the second-highest invasiveness index (median: 0.221, SD: 0.013), following the West African Clade (median: 0.253, SD: 0.25). Isolates originated from poultry samples clustered separately and were not associated with human BSI strains. Pan-genome analysis revealed that the Global Intermediate Clade acquired a novel mosaic prophage, incorporating genetic elements from Salmonella and Vibrio phages, suggesting a role in host adaptation and virulence. This study provides contemporary insights into the genomic and clinical dynamics of S. Enteritidis BSIs in India. The distinct phylogenetic placement, high invasiveness index, and unique prophage acquisition of the Global Intermediate Clade indicate its potential for extraintestinal adaptation and human-specific transmission. Further research is required to delineate environmental reservoirs and transmission pathways contributing to the persistence of this emerging lineage. Author Summary In this study, we investigated Salmonella enterica serovar Enteritidis, a major cause of invasive bloodstream infections (BSIs), particularly among infants and immunocompromised individuals in India. While invasive non-typhoidal Salmonella (iNTS) is well-documented in sub-Saharan Africa, its burden in South Asia remains understudied. By analyzing clinical and genomic data from BSI patients over a decade, we identified a distinct genetic lineage associated with BSI infections, which we named the “Global Intermediate Clade.” This lineage harbors a unique mosaic prophage—a viral DNA segment integrated into its genome—that may enhance its ability to cause invasive disease. Our findings show that this clade has a high potential for causing severe infections, similar to strains found in Africa. Notably, S . Enteritidis isolates from poultry in India were genetically distinct from those causing BSI, suggesting limited direct transmission from animals to humans. This highlights the need for enhanced genomic surveillance to track emerging pathogen lineages and understand their evolution. By identifying this previously unrecognized clade, our study provides critical insights that could inform public health strategies for controlling Salmonella infections in high-risk populations. Future research should explore the role of this prophage in virulence and its implications for vaccine and treatment development. Introduction Nontyphoidal Salmonella (NTS) are a significant cause of gastrointestinal infections which are generally self-limiting and resolve without any clinical interventions [ 1 , 2 ]. However, over the past few decades, some serovars of NTS have emerged as a leading cause of BSI particularly in sub-Saharan African (sSA) countries [ 3 , 4 ]. As of 2017, sub-Saharan Africa accounted for 79% of the 535,000 global cases of invasive NTS (iNTS) disease and 85% of the 77,500 associated deaths [ 5 ]. iNTS infections are strongly associated with immunocompromised individuals, including those with HIV, malaria, malnutrition, and hematologic malignancies [ 6 , 7 ]. Clinical presentation often includes non-specific febrile illness, closely resembling typhoid fever or malaria, making diagnosis particularly challenging in resource-limited settings [ 8 ]. Although a wide range of Salmonella serovars have been reported to cause iNTS diseases, the majority of infections in sub-Saharan Africa are caused by two dominant serovars: Salmonella enterica serovar Typhimurium (ST313) and Salmonella enterica serovar Enteritidis (ST11) [ 9 , 10 ]. These endemic African lineages have been identified as the primary drivers of iNTS infections in the region [ 11 ]. Phylogenetic analysis based on single nucleotide polymorphisms (SNPs) has identified three distinct lineages (L1, L2, and L3) of S . Typhimurium ST313, which have evolved over time to exhibit increased human adaptation and invasiveness [ 12 ]. Similarly, the African clade of ST11 S . Enteritidis has been predicted to be more invasive than the global epidemic clone and global outlier cluster isolates [ 13 ]. While iNTS disease in sub-Saharan Africa has been studied extensively, isolates from other low-income settings have received less attention. In South Asian countries, the prevalence of iNTS has been largely underestimated due to limited surveillance data and underreporting [ 14 , 15 ]. Furthermore, the transmission dynamics of NTS serovars between humans, animals, and the environment in a One Health context remain poorly characterized [ 16 ]. Previously, a retrospective analysis of blood cultures collected at our tertiary care hospital in southern India region between 2000 and 2020 revealed that S . Typhimurium (49%) and S . Enteritidis (29%) were the most prevalent serovars causing iNTS infections [ 17 ]. Of these two, S . Typhimurium has been relatively well characterized, largely due to its use as an experimental model for human typhoid fever. However, the clinical presentation, antimicrobial resistance patterns, and genomic features of S . Enteritidis infections in our setting remain poorly documented. In this study, we conducted a retrospective analysis of S . Enteritidis isolates obtained from BSI at a tertiary-care hospital in Vellore, India. Clinical characteristics and disease outcomes of these infections were also assessed. Additionally, S . Enteritidis isolates from livestock sources were included to investigate potential zoonotic transmission dynamics between humans and animals. Whole-genome sequencing (WGS) and comparative genomic analysis were performed to determine the phylogenetic relationships, genetic diversity, and invasive potential of these isolates within a global isolate collection. Furthermore, pan-genome analysis was performed to shed to understand evolutionary trajectory, host adaptation mechanisms, and pathogenicity determinants of S . Enteritidis, in order to shed light on its potential for human infection and dissemination. Methods Study design and data collection This retrospective study was conducted between January 2012 and December 2022 at the Christian Medical College (CMC), Vellore, India. CMC Vellore is a 2,234-bed, multispecialty, tertiary-care teaching hospital that serves as a referral center for various medical disciplines. Data were retrieved from the hospital’s electronic medical records system (Clinical Workstation). Clinical information was collected for patients admitted with Salmonella Enteritidis bloodstream infections (BSI), including sociodemographic details, presenting clinical features, co-infections, antibiotic use, and patient outcomes. Additionally, underlying conditions such as HIV status, autoimmune disorders, chronic diseases, malignancies, and the use of steroids, cytotoxic drugs, and other relevant comorbidities were documented. Patient outcomes including length of hospital stay, discharge status, and mortality rates were also assessed. All the patient identifying variables in the data were removed before the analysis. This study received ethical approval from the Institutional Research Board and Ethics Committee of CMC Vellore (IRB Min. No. 11878 dated 27 th February, 2019). As the required data had been collected as part of the standard of care for diagnosis, informed consent waiver was granted by the IRB committee CMC, Vellore. Bacterial isolates, identification and antimicrobial susceptibility testing (AST) Archived S . Enteritidis bloodstream infection (BSI) isolates (n = 101), collected between 2012 and 2022, were revived by culturing. Eight representative isolates from other clinical specimens (Feaces, Pus etc) were included in the study for the purpose of comparison. Isolates originating from poultry specimen was included to investigate potential zoonotic transmission. From poultry samples (rectal swabs and droppings), Salmonella sp. was selectively enriched by culturing in buffered peptone water and individual colonies were isolated using MSRV (Modified semi-solid Rappaport-Vassiliadis) media [ 18 ]. The isolates were further confirmed as S . Enteritidis by standard biochemical and sero-agglutination tests based on the Kauffmann-White scheme [ 19 ]. The isolates were further confirmed as Salmonella Enteritidis through seven-gene multilocus sequence typing (MLST) and comparison with the EnteroBase database ( https://enterobase.warwick.ac.uk ) [ 20 ]. AST (disk diffusion) was performed against ampicillin (10 μg), chloramphenicol (30 μg), co-trimoxazole (1.25/23.75 μg), ciprofloxacin (5 μg), and ceftriaxone (30 μg). Clinical breakpoints followed Clinical and Laboratory Standards Institute (CLSI) guidelines, 2022 [ 21 ]. Escherichia coli ATCC 25922 served as the quality control strain. DNA extraction and whole genome sequencing A total of 48 clinical S . Enteritidis isolates were selected for WGS based on temporal distribution and phenotypic antimicrobial susceptibility profiles, while the remaining clinical isolates were excluded. Additionally, 17 poultry-derived isolates were included, resulting in a final set of 65 isolates for WGS. Genomic DNA was extracted using a Wizard DNA purification kit (Promega, Madison, USA) as per the manufacturer’s instructions. Paired-end fragment libraries were prepared using a Nextera XT DNA sample preparation kit following the manufacturer’s instructions (Illumina, Inc., San Diego, USA). The pooled libraries were diluted at a final concentration of 1.8 pM and sequenced on an Illumina Nextseq 500 platform with 150-cycle paired-end chemistry. Genome Assembly, Annotation and genotyping Sequencing reads were evaluated with FastQC v0.12.0 ( https://www.bioinformatics.babraham.ac.uk/projects/fastqc/ ) and reads with low sequencing quality were trimmed and removed using. Trimmomatic v0.39 ( https://github.com/usadellab/Trimmomatic ) was used to trim adapters and the internally corrected high-quality reads were subjected to genome assembly using SKESA v.2.4.0 ( https://github.com/ncbi/SKESA ). The assemblies were analysed for contamination using Kraken v2.1.3 ( https://github.com/DerrickWood/kraken2 ) and quality was assessed via QUAST v5.2.0 ( https://github.com/ablab/quast ). Draft genome assemblies were examined using Seqsero v2.0 ( https://github.com/denglab/SeqSero2 ) to confirm the antigenic profile of the serotype [ 22 ]. Sequence types were assigned in silico for all the isolates using the Multilocus sequence typing (MLST) pipeline available in the Center for Genomic Epidemiology (CGE) ( https://cge.food.dtu.dk/services/MLST/ ). Antimicrobial resistance genes were screened using NCBI AMRFinderPlus v3.11.20 ( https://github.com/ncbi/amr ). Plasmids were identified from the genome data by searching against the PlasmidFinder database ( https://cge.food.dtu.dk/services/PlasmidFinder/ ). The presence of pSEN-like plasmids and their associated genes was identified by performing BLAST comparisons against reference plasmids pSEN (HG970000) and pSENV (JN885080). Genome annotations were performed using Prokka v1.14.5 ( https://github.com/tseemann/prokka ) based on a custom genus database ( https://github.com/tseemann/prokka?tab=readme-ov-file#crazy-person ). Pangenome derived phylogeny Annotated genomes (GFF3 files) generated by Prokka comprising study isolates ( n=65 ) and a global representation of S . Enteritidis ( n=420 ) were used as input to evaluate pan-genome diversity using Panaroo v1.3.4 ( https://github.com/gtonkinhill/panaroo ) [ 23 ]. Panaroo was run with standard parameters with ‘remove invalid genes’ enabled. Subsequently, single nucleotide polymorphisms (SNPs) were extracted from the core gene alignment generated by Panaroo using SNP-sites ( http://sanger-pathogens.github.io/snp-sites/ ). A Maximum likelihood tree was constructed using IQTree2 (TVM+F+ASC+R2; bootstrap replicates = 100) [ 24 ] and visualized with iTOL ( https://itol.embl.de/ ). Subsequently, distantly related outgroup isolates belonging to diverse sequence types were removed and a phylogenetic tree was reconstructed ( n=475 ) to improve the cladistic structure. Phylogenetic clusters were assigned using rhierBAPS ( https://github.com/gtonkinhill/rhierbaps ) in its default mode (two cluster levels with 30 initial clusters). Minimum spanning trees (MSTs) were created and visualized using GrapeTree ( https://achtman-lab.github.io/GrapeTree/MSTree_holder.html ) from the core genome phylogeny [ 25 ]. Tree nodes were positioned through dynamic rendering and node style was adjusted by fine-tuning the node size and kurtosis. Nodes were coloured by the source of the isolates and node sizes were drawn proportionally to the number of isolates. Pangenome clustering The gene presence or absence matrix created by Panaroo was clustered according to the four major phylogroups using the twilight analysis package ( https://github.com/ghoresh11/twilight ) using the default thresholds [ 26 ]. The pan genome reference FASTA file (pan_genome_reference.fa) generated by Panaroo, which encompasses all the genes within the dataset, was clustered using CD-HIT-EST. [ 27 ] with a 90% identity and 90% sequence length coverage. Finally, clustered phage-associated genes were predicted using PHASTEST database using default settings [ 28 ]. The prophage regions were further characterized through comparative analysis by aligning against reference sequences from the prophageDB database [ 29 ]. The predicted prophage regions were then manually curated to determine their gene composition and structural organization. Interactive visualization of the phylogenetic tree and PHASTER summary data was carried out in Phandango v1.3.0 [ 30 ]. Lineage wise mutation profiling Mutations were identified using in-silico analysis of single nucleotide polymorphisms (SNPs) using Snippy v4.6.0 mapping and variant calling pipeline ( https://github.com/tseemann/snippy ). To obtain the SNPs, we mapped the draft genomes ( n=475 ) against the annotated features of the reference genome P125109 (NC_011294.1). We utilized custom-written bash scripts to extract the pattern of mutation accumulation with respect to the phylogenetic lineages. Genes that contained either frameshift mutation or a premature stop codon were manually curated and classified as hypothetically disrupted coding sequences (HDCS) or pseudogenes. Invasiveness index calculation The potential of S . Enteritidis to cause invasive disease was calculated based on a machine learning pre trained invasive index predictive model ( https://github.com/Gardner-BinfLab/invasive_salmonella ) [ 31 ]. This approach classifies the genomes of invasive and gastrointestinal Salmonella by scoring deleterious mutations in 196 top predictor genes. The distribution of invasiveness index values for four major phylogroups was compared using the Kruskal-Wallis H Test. Statistical analysis Statistical analysis was performed to investigate the potential association between severe immunosuppression and the clinical characteristics of S . Enteritidis infection. Data analysis was performed using GraphPad Prism 5.0 for Windows (GraphPad Software Inc). Continuous variables were represented as median ± interquartile range (IQR). Categorical variables were presented as either numbers or percentages. To compare these categorical variables, we employed either Fisher’s exact test or the Chi-squared test, as appropriate for the specific analysis. We calculated the odds ratio (OR) along with its corresponding 95% confidence intervals (CI). Statistical significance was determined by a P-value < 0.05 (two-tailed). Results Infants and immunosuppressed are more susceptible to S . Enteritidis BSI The patient records indicated a total of 506 patients diagnosed with blood culture-positive iNTS disease between January 2012 and December 2022. Of these, 131 cases were confirmed to be caused by S . Enteritidis by conventional microbiological methods. After excluding 30 cases due to the absence of relevant clinical data and duplicate isolates (repeated samples from the same patient within 14 days), hospital records for 101 S . Enteritidis bacteraemia cases were analysed. The median age of affected patients was 34.5 years (IQR: 9–54.5 years) (Table 1). Notably, pediatric patients (<16 years) accounted for 27.72% (28/101) of cases, with infants (<12 months) comprising 13.86% (14/101), highlighting increased susceptibility in younger age groups. The most common presenting symptoms on admission included fever (75.25%), anemia/unhealthy appearance (59.41%), diarrhea (35.64%), and cough (30.69). Among 86 inpatients, the median fever duration was 6 days (IQR: 3–10 days). Male patients accounted for 65.34% (66/101) of cases. We examined the impact of immunosuppressive conditions on S . Enteritidis bacteremia by comparing patients with these conditions to those without them. Among the 101 patients with S . Enteritidis bacteremia, 57.42% (58/101) had immunosuppressive conditions, including cancer/malignancy (24.75%), autoimmune disorders (21.78%), HIV infection (8.91%), and chronic steroid or chemotherapy use (39.6%) (Table 2). Among non-immunosuppressed patients (n=43), the pediatric population was disproportionately affected (44.18%), further emphasizing the vulnerability of children. Septic shock was significantly more frequent in immunosuppressed patients (27.59% vs. 9.3%; p = 0.025; OR = 3.71, 95% CI: 0.2 ± 0.078), indicating a higher risk of severe disease outcomes. To evaluate treatment strategies and patient outcomes, we analyzed antibiotic therapy and recovery rates among affected individuals. A total of 65.34% (66/101) of patients received more than one antibiotic, primarily consisting of β-lactams (carbapenems, third-generation cephalosporins, β-lactam/β-lactamase inhibitors) and azithromycin. Clinical outcomes showed an overall recovery rate of 83.17% (84/101), while 10.89% (11/101) of patients died. Although mortality was higher in immunosuppressed patients (13.79%) compared to non-immunosuppressed patients (6.98%), this difference was not statistically significant (p = 0.345; OR = 2.13, 95% CI: 0.11 ± 0.0605). Phenotypic characterization S . Enteritidis ( n=101 ) strains were revived from the archived collections at the Department of Clinical Microbiology, CMC Vellore. Study isolates that were confirmed to be S . Enteritidis by biochemical testing and serotyping were subjected to AST. The results demonstrated that all isolates were susceptible to first-line antibiotics, (ampicillin, chloramphenicol, trimethoprim/sulfamethoxazole), and ceftriaxone. However, there was a decrease in susceptibility to fluoroquinolones, with 26.7% (27/101) of the isolates exhibiting non-susceptibility to ciprofloxacin. Population structure of S . Enteritidis consists of four major phylogenetic clades The phylogenetic tree of 486 genomes was established by sequencing 65 isolates of S . Enteritidis (both clinical and poultry) and 421 publicly available genome sequences ( Fig. S1 ). The metadata of isolates selected were described in Table S1 . To improve branch length resolution, outgroup genomes belonging to diverse sequence types (ST180, ST1975, ST3304) were excluded, resulting in an abbreviated ML tree of 475 genomes. This dataset included 59 study isolates 42 from clinical sources and 17 from poultry along with genomes retrieved from public databases, allowing for a detailed assessment of the population structure of S . Enteritidis. Phylogenetic analysis based on 13,876 core gene SNPs revealed that S . Enteritidis genomes clustered into four major phylogeneticclades ( Figure 1 ). Clustering using RhierBAPS (Level 1) identified six BAPS clusters, four of which corresponded to the major phylogroups. In addition to previously defined groups namely the African lineage (BAPS Cluster 3), the global outlier/Atlantic lineage (Cluster 4), and the global epidemic clade (Cluster 1)—we identified a distinct phylogroup (BAPS Cluster 2), separated by 163 unique SNPs ( Table S2 ). This novel cluster, which displays a geographically widespread global distribution, is hereafter referred to as the ‘Global Intermediate Clade’. Phylogenetically, this clade emerges as a paraphyletic group derived from the global outlier lineage, mirroring the evolutionary trajectory of the global epidemic clade. The study isolates were distributed between the Global Intermediate Clade (44.07%; 26/59), Global epidemic clade (28.8%; 17/59) and Global outlier clade (27.12%; 16/59). Notably, the majority of isolates were assigned to Sequence Type (ST)11, irrespective of their phylogenetic classification. Additionally, single-locus variants (SLVs) of ST11, including ST745, ST1479, and ST1974, were identified across the four primary clades. Download figure Open in new tab Figure 1: Maximum likelihood phylogenetic tree of Salmonella Enteritidis was constructed using 13,876 SNPs from 3,661 core genes (>95% presence) identified through pan-genome analysis with Panaroo ( https://github.com/gtonkinhill/panaroo ). The midpoint-rooted phylogeny was inferred using IQ-TREE2 ( http://www.iqtree.org/ ), with bootstrap support values calculated from 100 replicates. The analysis included 475 S . Enteritidis genomes, of which 59 were isolates from this study. The phylogenetic tree reveals the distribution of S . Enteritidis within four main clusters, corresponding to distinct phylogroups. Study isolates are highlighted with red branch symbols. Metadata annotations are displayed as color strips: (1) BAPS clusters, (2) source of isolates, and (3) geographic location. Resistance profiles and key virulence genes are represented as heatmaps, while the invasiveness index for each genome is plotted as an external bar plot. The scale bar indicates substitutions per site. The tree was visualized and annotated using iTOL ( https://itol.embl.de/ ). The geographic distribution of S . Enteritidis phylogroups revealed distinct regional patterns. While some lineages exhibit global distribution, others appear geographically restricted. For instance, the African lineage includes West African and East African sub-lineages, both associated with iNTS disease. In contrast, the Global Outlier and Epidemic clusters contain isolates from diverse sources and geographic regions, spanning collections from 1925 to 2024 ( Table S3 ). Notably, the Global Intermediate Clade appears to have originated in North America, with its earliest known isolate dating back to 1950 (SRR5819753). Ancestral strains of this lineage have been traced to the early 2000s, suggesting a subsequent expansion into Europe and Asia, reflecting its potential role in global S . Enteritidis dissemination. S . Enteritidis isolates from poultry were genetically distinct from those causing BSI Comparative genome analysis was performed to investigate the genetic relationship between human and livestock isolates of S . Enteritidis and to assess potential zoonotic transmission pathways. Phylogenetic analysis revealed that 82.35% (14/17) of poultry isolates were assigned to the global outlier cluster while the remaining were grouped with the quinolone non-susceptible subcluster within global epidemic clade ( Figure S2) . Among the poultry isolates clustered in the global outlier cluster, 13 formed a distinct subcluster that showed no direct genetic association with clinical isolates, suggesting limited direct transmission between poultry and human cases in this study. Notably, none of the poultry isolates of S. Enteritidis from the study area were found to be associated with the Global Intermediate clade ( Figure 1 ). Limited antimicrobial resistance and plasmids among S . Enteritidis Among the S . Enteritidis study isolates, we identified only a few genetic determinants of acquired antibiotic resistance. With the exception of one isolate, none of the study isolates contained detectable AMR genes, indicating a low prevalence of acquired resistance within this dataset. To provide a broader context, phylogroup-wise AMR screening was conducted on a global collection of isolates. Multidrug resistance (MDR) markers, including bla TEM , cat , sul , and dfrA , which confer resistance to first-line antibiotics, were primarily associated with East and West African clades. In contrast, AMR determinants showed variable prevalence across other phylogroups, regardless of their geographic origin. While the Global Epidemic Lineage occasionally carried genetic markers conferring resistance to ampicillin and co-trimoxazole, AMR genes were otherwise infrequent in non-African phylogroups. Unlike other NTS serovars, the majority of S . Enteritidis isolates remained susceptible to fluoroquinolones. However, quinolone resistance-conferring mutations in gyrA (S83Y or D87G) were identified in 25.42% (15/59) of study isolates, all of which belonged to the Global Epidemic Clade, suggesting the emergence of fluoroquinolone resistance within this lineage. The pSEN-like virulence plasmid was commonly detected among global S . Enteritidis isolates. As expected, the pSENV plasmid and its associated replicon were identified in all isolates within the East African sub-clade. In contrast, a few of isolates from other phylogenetic clusters lacked the pSEN-like plasmid, though this absence appeared to be sporadic and not linked to phylogenetic lineage ( Figure S3 ). Further analysis revealed the widespread presence of plasmid-encoded virulence factors (VFs) commonly associated with S . Enteritidis, including fimbrial adhesion genes ( pef ABCD), type III secretion system (T3SS)-secreted effector genes, ( spv BCD) encoded within Salmonella pathogenicity island 2 (SPI-2), and additional virulence genes ( mig-5 and rck ) ( Figure 1 ). Notably, the newly defined Global Intermediate Clade exhibited a high prevalence of these plasmid-associated virulence determinants, with 93.5% (58/62) of isolates carrying all eight genes, underscoring the potential role of this lineage in plasmid-mediated pathogenicity. African and Intermediate clade contained high levels of genome degradation Frameshift mutations and premature stop codons leading to highly degraded coding sequences hypothetically disrupted coding sequences (HDCS) were analyzed across major phylogenetic clusters in the dataset ( Table S4 ). Genomes within the African cluster, including both West African and East African sub-lineages, exhibited the highest number of HDCS (n=9) compared to isolates from the Global Epidemic and Global Outlier clusters (n=2). Additionally, representative genomes from the East African cluster contained an extra 16 HDCS, although none were associated with virulence genes. Isolates belonging to the Global intermediate clade were distinguished by eight lineage-defining HDCS ( Table S4 ). Global intermediate clade has the second-highest invasiveness index, following the west African cluster The invasiveness of S. Enteritidis phylogroups was evaluated using machine-learning based Invasive index calculator. This pipeline utilizes a random forest classifier model to produce predictive scores, denoted as delta bitscores (DBS). It accomplishes this by examining mutations within a previously defined set of 196 genes, as explained earlier. The potential of different phylogroups to cause extra-intestinal infection was compared using Wilcoxon– Mann–Whitney test. The results indicate that all examined S. Enteritidis phylogroups remain to be gastrointestinal (DBS <0.5). Nonetheless, the invasiveness index varies among these phylogroups ( Figure 2 ). We observed a high invasiveness index (median = 0.253, SD = 0.25) for isolates belonging to West African clade while the global epidemic clade had the lowest (median = 0.188, SD = 0.01). The global intermediate clade also exhibited a relatively high invasiveness index (median 0.221, SD= 0.013) compared to East African and outlier clusters. Download figure Open in new tab Figure 2: The lineage wise invasiveness index for all Salmonella Enteritidis genomes analyzed in this study was determined using the approach described by Wheeler et al. The median and standard deviation (SD) values for each lineage are as follows: East African (median = 0.217, SD = 0.010), West African (median = 0.253, SD = 0.026), Global Outlier (median = 0.208, SD = 0.011), Global Intermediate (median = 0.221, SD = 0.013), and Global Epidemic (median = 0.1883, SD = 0.010). Mann-Whitney U-test was used to compare differences between groups. In the boxplot, boxes represent the interquartile range (IQR), whiskers extend to 1.5× IQR, and outliers are shown as points. The Kruskal-Wallis test revealed significant differences across lineages (p < 0.0001, H = 257.92). Pan-genome clustering suggests the evolution of S . Enteritidis is largely driven by the acquisition of prophage genes Pan-genome analysis of Salmonella Enteritidis, excluding highly divergent phylogroups (e.g., ST1975), identified 8,098 gene families. The core genome, comprising genes present in >99% of analyzed genomes, consisted of 3,672 genes, representing 73.8% of the total 5,344 genes. Analysis of the accessory genome revealed distinct gene family distribution patterns among established phylogroups ( Figure S4 ). Lineage-specific gene gain and loss events were particularly pronounced. The Global intermediate clade uniquely harbors a 56.9 kbp novel prophage ( Figure 3 ), a mosaic structure exhibiting homology with Salmonella phage Sal3 (NC_031940) and Vibrio phage X29 (NC_024369). This prophage contains 62 coding sequences (CDS), including the virulence-associated msgE gene, suggesting a potential role in pathogenic adaptation. As reported previously, the African lineage has similarly acquired prophage, closely related to Enterobacter phage P88, in addition to the well-characterized Gifsy-1 prophage. In contrast, the emergence of the Global Epidemic Clade is associated with the acquisition of prophage ΦSE20, reinforcing the role of phage-mediated genetic changes in the evolution of epidemic S . Enteritidis strains. Download figure Open in new tab Figure 3: Prophage Map of Major Salmonella Enteritidis Lineages. The position of prophage regions identified in representative S . Enteritidis ST11 strains from each major lineage using PHASTER ( https://phaster.ca/ ). The panel illustrates the genetic organization of a mosaic prophage identified in the global intermediate clade. Comparative genomic analysis of this mosaic prophage was performed using Proksee ( https://proksee.ca/ ), showing its similarity to closest prophage homologs Salmonella phage Sal3 (NC_031940) and Vibrio phage X29 (NC_024369). Discussion The increasing global incidence of iNTS infections, particularly BSI caused by S . Enteritidis, has been extensively documented in sSA [ 3 , 6 , 32 , 33 ], However, its epidemiology in South Asia, including India, remains poorly characterized. In India, S . Enteritidis is the second most common iNTS serovar causing BSI, with prior studies also linking it to severe foodborne outbreaks (17, 34, 35]. This study presents the first comprehensive genomic and clinical analysis of S . Enteritidis isolates associated with BSIs in India, offering critical insights into their clinical features, phylogenetic relationships, and evolutionary mechanisms. Many studies have identified immunosuppressive conditions such as HIV, malnutrition, and chronic illnesses as major risk factors for iNTS infections [ 14 , 36 , 37 ]. However, most of this evidence derives from African populations [ 6 , 38 ]. Our study expands this understanding to the Indian context, demonstrating that infants and immunocompromised individuals (e.g., those with malignancies, autoimmune disorders, or undergoing invasive procedures) are at high risk of S . Enteritidis associated BSIs. Unlike in sub-Saharan Africa, where HIV coinfection drives iNTS [ 6 ], our cohort showed non-HIV-related immunosuppression as the dominant risk factor (Table 2). Pediatric cases comprised 27.7% of infections, with infants (<12 months) accounting for nearly half. Additionally, the high mortality rate (10.9%) and frequent empiric treatment with typhoid regimens (ceftriaxone-azithromycin) underscore the need for improved diagnostics and tailored management strategies for immunosuppressed and pediatric patients in India. Recent genomic advancements have significantly improved our understanding of S. Enteritidis, elucidating its phylogenetic diversity, transmission dynamics, and mechanisms of virulence and antimicrobial resistance [ 13 , 39 – 41 ]. Globally, sequence type (ST) 11 dominates, representing 90–94% of publicly available S . Enteritidis genomes [ 40 ], a trend reflected in our study, where the majority of isolates were assigned to ST11 ( Table S1 ). Given the limited resolution of traditional 7-gene MLST classification, higher-resolution approaches such as core gene SNP based phylogenetics or core genome MLST (cgMLST) have enabled fine-scale differentiation of ST11 into distinct phylogenetic subclusters [ 13 , 40 ]. Our phylogenetic analysis corroborates the presence of previously established global clades, including the regionally adapted East African and West African Clades (BAPS Cluster 5), the globally disseminated Outlier/Atlantic Clade (Cluster 2), and the Epidemic Clade (Cluster 4) ( Figure 1 ) [ 13 , 40 , 42 ]. Interestingly, a substantial proportion of isolates from this study clustered within a previously undefined lineage (Cluster 1), which appears to have evolved from closely related progenitors within global lineages. EnteroBase metadata analysis (n=293) suggests that this lineage is widely distributed, with a significant proportion of isolates originating from Europe (n=109/293) and North America (n=80/293) ( Table S3 ). Based on its unique phylogenetic placement and broad geographic distribution, we designate this lineage as the “Global Intermediate” Clade, with its earliest known isolate dating back to 1950s (SRR5819753). Among the established S . Enteritidis clades the Central/East African and West African subclades exhibit distinct evolutionary trajectories, shaped by prophage acquisition, AMR determinants, and lineage-specific genomic degradation, all contributing to enhanced human host adaptation [ 13 , 43 ]. For instance, the Central/East African Clade harbors 77 unique genes, including 33 plasmid-encoded (pSENV) virulence factors and 40 genes within a Fels-2-like prophage, while the West African clade contains 15 distinct genes, with 11 associated with a virulence plasmid. Notably, both African clades carry a ∼90 Kb virulence plasmid, nearly twice the size of the 58 Kb plasmid found in the Global Epidemic Clade, and encoding multiple AMR genes [ 44 ]. Similarly, the Global Epidemic Clade is distinguished by the presence of prophage φSE20, which is hypothesized to facilitate colonization in chickens, thereby enhancing transmission to humans and increasing disease potential [ 45 ]. These differences in prophage composition serve as key markers for distinguishing between major S . Enteritidis lineages [ 43 , 46 ]. In contrast, the Global Intermediate Clade shares ROD21 and φSE12 prophages with the two other global lineages but also harbors a distinctive mosaic prophage ( Figure 3 ). Genomic analysis of this novel prophage suggests that it may have diversified through horizontal gene transfer, acquiring genetic material from Salmon 118970 Sal3, Vibrio X29 and other prophages, while also maintaining unique genetic arrangement with no known similarity in current prophage databases. Given that this mosaic prophage is a defining feature of the Global Intermediate Clade, its emergence and diversification may have been driven majorly by phage-associated gene flux [ 47 ]. The genetic basis of invasive Salmonella lineages remains incompletely understood; however functional diversification through genome degradation and acquisition of virulence factors appears to be key drivers of host adaptation [ 48 ]. In our study, the Global intermediate clade displayed an elevated invasiveness index (DBS), closer to the two African Clades ( Figure 2 ) , suggesting that these lineages may have undergone adaptive genomic changes favoring extraintestinal survival and infection. Since loss-of-function mutations and the accumulation of HDCS are hallmarks of host-adapted Salmonella lineages [ 49 ] the increased invasive index divergence in the intermediate clade, coupled with evidence of genomic degradation, supports its potential adaptation to infect humans. These findings, alongside epidemiological landscape of ST313 S . Typhimurium, strongly suggest that the S. Enteritidis Global intermediate clade has diversified from global epidemic clade for enhanced human infectivity [ 12 ]. The global spread of S . Enteritidis is closely linked to contaminated poultry products, which played a key role in its introduction and worldwide dissemination (42, 46]. Genome-based source tracking suggests a centralized origin, likely emerging during the early industrialization of poultry production [ 16 , 50 ]. Comparative genomic analysis of S . Enteritidis isolates from clinical and poultry sources in India reveals that poultry-derived isolates cluster within the Outlier/Atlantic and Global Epidemic Clades, aligning with previous reports linking these lineages to poultry-driven transmission [ 42 ]. Notably, no contemporary poultry isolates are associated with the Global Intermediate Clade, which predominantly comprises Indian bloodstream infection (BSI) isolates. This pattern mirrors the African epidemic lineages, where invasive human-adapted strains evolved independently of poultry-associated strains. Thus, the Global Intermediate Clade appears to be primarily linked to human infections, while poultry isolates cluster within region-specific subclades of the Outlier and Global Epidemic lineages. Our study has several limitations. First, clinical data originate from a single Indian hospital, limiting generalizability to the national disease burden. Second, most clinical variables lacked statistical association with infection outcomes. Third, phylogenetic analysis included 65 of 101 isolates from the study period, with underrepresentation of poultry-derived isolates restricting epidemiological inferences. Finally, functional characterization of the identified prophages, though beyond this study’s scope, is needed to confirm their evolutionary significance. Despite these limitations, our data provide a robust evaluation of global phylogenomics for this understudied pathogen. Conclusion Our findings align with current knowledge regarding the clinical presentation, evolutionary processes, and transmission patterns of S . Enteritidis. Severely immunosuppressed individuals are at higher risk of BSI caused by NTS serovars, reinforcing the opportunistic nature of these infections. Our phylogenomic analyses reveal that Indian invasive S . Enteritidis isolates mostly belong to an emerging lineage, which we designate as the Global Intermediate Clade. This clade exhibited high invasiveness, second only to the West African Clade, and was characterized by a distinct prophage repertoire and extensive genomic degradation. Given its genetic divergence from poultry-associated strains, these findings suggest that this lineage may have undergone adaptation to cause bloodstream infections in humans. Further research is needed to better understand the environmental reservoirs and transmission pathways of the Global Intermediate Clade. Data Availability Raw read data were deposited in the European Nucleotide Archive (ENA) under project accession number: PRJEB87860. The individual sample accession numbers are listed in Table S1 https://www.ncbi.nlm.nih.gov/bioproject/PRJEB87860/ Ethical Clearance Institutional Review Board (IRB) of Christian Medical College (CMC), Vellore, India gave ethical approval for this work vide IRB Min no. 12626 dated 26.02.2020. As the required data had been collected as part of the standard of care for diagnosis, informed consent waiver was granted by the IRB committee CMC, Vellore. Contributors Conceptualization: JJJ, AV, BV and KW Methodology and Investigation: JJJ, AV, DS, RI, KG, JRM, YM, VM and BLY Data analysis: JJJ and AV Visualization: JJJ and AV Funding acquisition: BV and KW Project administration: JJJ, DS, YM, FA, MPT, SK Supervision: DS, BV and KW Original draft: JJJ, AV Review & editing: JJ, BV and KW Funding The study has been funded by the Indian Council of Medical Research, New Delhi, India (Ref. No: AMR/Adoc/186/2019-ECD-II dated 26/08/2019). Disclaimer The funders had no role in the design and conduct of the study; collection, management, analysis, and interpretation of the data; preparation, review, or approval of the manuscript; and decision to submit the manuscript for publication. Competing interests The authors have declared that no competing interests exist. Patient consent for publication Not required. Figure S1: Pan-genome based core genome phylogenetic tree of 486 S . Enteritidis showing the comparative phylogenetic clustering by MLST. Study isolates are highlighted with red branch symbols. MLST are displayed as color strips. The tree was visualized and labeled using iTOL ( https://itol.embl.de/ ). Figure S2: Minimum spanning tree (MST) of S . Enteritidis isolates ( n=475 ) constructed and visualized using GrapeTree ( https://achtman-lab.github.io/GrapeTree/MSTree_holder.html ). Each node represents a unique ST or Clonal group, and node size is proportional to the number of isolates with that ST. Node color indicates the source from which the isolate was obtained. Tree nodes were positioned through dynamic rendering and node style was adjusted by fine-tuning the node size and kurtosis. Figure S3: Phandango heatmap illustration (Hadfield et al. 2018) focusing on the presence of AMR genes, virulence genes and pSEN-like plasmid associated genes across phylogenetic lineages. The orange indicates the presence of a gene and purple indicates its absence. Figure S4: Pangenome analysis of 475 S . Enteritidis isolates indicates the diversity in accessory genomes among the different phylogenetic lineages. Phandango heatmap illustration (Hadfield et al. 2018) of gene presence and absence matrix (right side) against Maximum likelihood phylogenetic tree (Left side) with clades correlate with the observation derived from phylogenetic analysis. The orange indicates the presence of a gene and purple indicates its absence. A highlighted region (white dashed rectangle) indicates a cluster of lineage-specific genes. Acknowledgements We express our heartfelt gratitude to the Department of Clinical Microbiology, Christian Medical College, Vellore, for providing the essential facilities and support that made this study possible. We extend our sincere appreciation to the clinicians, Dr. Jithin Joy and Dr. Suriya Chandran, for their efforts in contributing to the clinical data collection. We are also grateful to Ms. Baby Abirami Shankar and Mr. Ayyanraj N. for their valuable assistance with phenotypic testing, stock culture maintenance, and sequencing. Special thanks go to Ms. Agila K. Pragasam for her expert guidance and support in the genomic analysis. Reference 1. ↵ Acheson D , Hohmann EL . Nontyphoidal salmonellosis . Clin Infect Dis . 2001 Jan 15 ; 32 ( 2 ): 263 – 9 . OpenUrl CrossRef PubMed Web of Science 2. ↵ Uche IV , MacLennan CA , Saul A . A systematic review of the incidence, risk factors and case fatality rates of invasive nontyphoidal Salmonella (iNTS) disease in Africa (1966 to 2014) . PLoS Negl Trop Dis . 2017 Jan 5 ; 11 ( 1 ): e0005118 . OpenUrl CrossRef PubMed 3. ↵ Kariuki S , Gordon MA , Feasey N , Parry CM . Antimicrobial resistance and management of invasive Salmonella disease . Vaccine . 2015 Jun 19 ; 33 Suppl 3 : C21 – 9 . OpenUrl CrossRef PubMed 4. ↵ Mahon BE , Fields PI . Invasive infections with nontyphoidal Salmonella in sub-Saharan Africa . Microbiol Spectr . 2016 Jun ; 4 ( 3 ): 341 – 57 . OpenUrl 5. ↵ Stanaway JD , Parisi A , Sarkar K , Blacker BF , Reiner RC , Hay SI , et al. The global burden of non-typhoidal Salmonella invasive disease: a systematic analysis for the Global Burden of Disease Study 2017 . Lancet Infect Dis . 2019 Dec ; 19 ( 12 ): 1312 – 24 . OpenUrl CrossRef PubMed 6. ↵ Feasey NA , Dougan G , Kingsley RA , Heyderman RS , Gordon MA . Invasive non-typhoidal Salmonella disease: an emerging and neglected tropical disease in Africa . Lancet . 2012 Jun 30 ; 379 (9835): 2489 -99. OpenUrl CrossRef PubMed Web of Science 7. ↵ Biggs HM , Lester R , Nadjm B , Mtove G , Todd JE , Kinabo GD , et al. Invasive Salmonella infections in areas of high and low malaria transmission intensity in Tanzania . Clin Infect Dis . 2014 Mar ; 58 ( 5 ): 638 – 47 . OpenUrl CrossRef PubMed 8. ↵ Marchello CS , Fiorino F , Pettini E , Crump JA , Martin LB , Breghi G , et al. Incidence of non-typhoidal Salmonella invasive disease: a systematic review and meta-analysis . J Infect . 2021 Nov ; 83 ( 5 ): 523 – 32 . OpenUrl CrossRef PubMed 9. ↵ Kingsley RA , Msefula CL , Thomson NR , Kariuki S , Holt KE , Gordon MA , et al. Epidemic multiple drug resistant Salmonella Typhimurium causing invasive disease in sub-Saharan Africa have a distinct genotype . Genome Res . 2009 Dec ; 19 ( 12 ): 2279 – 87 . OpenUrl Abstract / FREE Full Text 10. ↵ Park SE , Pham DT , Pak GD , Panzner U , Espinoza LM , von Kalckreuth V , et al. The genomic epidemiology of multi-drug resistant invasive non-typhoidal Salmonella in selected sub-Saharan African countries . BMJ Glob Health . 2021 Aug ; 6 ( 8 ): e005659 . OpenUrl Abstract / FREE Full Text 11. ↵ Kariuki S , Owusu-Dabo E . Research on invasive nontyphoidal Salmonella disease and developments towards better understanding of epidemiology, management, and control strategies . Clin Infect Dis . 2020 Jul 29 ; 71 ( Suppl 2 ): S127 – 9 . OpenUrl PubMed 12. ↵ Pulford CV , Perez-Sepulveda BM , Canals R , Bevington JA , Bengtsson RJ , Wenner N , et al. Stepwise evolution of Salmonella Typhimurium ST313 causing bloodstream infection in Africa . Nat Microbiol . 2021 Mar ; 6 ( 3 ): 327 – 38 . OpenUrl PubMed 13. ↵ Feasey NA , Hadfield J , Keddy KH , Dallman TJ , Jacobs J , Deng X , et al. Distinct Salmonella Enteritidis lineages associated with enterocolitis in high-income settings and invasive disease in low-income settings . Nat Genet . 2016 Oct ; 48 ( 10 ): 1211 – 7 . OpenUrl CrossRef PubMed 14. ↵ Phu Huong Lan , Le Thi Phuong T , Nguyen Huu H , Thuy L , Mather AE , Park SE , et al. Invasive non-typhoidal Salmonella infections in Asia: clinical observations, disease outcome and dominant serovars from an infectious disease hospital in Vietnam . PLoS Negl Trop Dis . 2016 Aug 11 ; 10 ( 8 ): e0004857 . OpenUrl CrossRef PubMed 15. ↵ Jacob JJ , Solaimalai D , Muthuirulandi Sethuvel DP , Rachel T , Jeslin P , Anandan S , et al. A nineteen-year report of serotype and antimicrobial susceptibility of enteric non-typhoidal Salmonella from humans in Southern India: changing facades of taxonomy and resistance trend . Gut Pathog . 2020 Dec ; 12 : 1 – 9 . OpenUrl CrossRef PubMed 16. ↵ Liu B , Zhang X , Ding X , Bin P , Zhu G . The vertical transmission of Salmonella Enteritidis in a One-Health context . One Health . 2022 Dec 5 ; 15 : 100469 . 17. ↵ Jacob JJ , Solaimalai D , Rachel T , Pragasam AK , Sugumar S , Jeslin P , et al. A secular trend in invasive non-typhoidal Salmonella in South India, 2000–2020: identification challenges and antibiogram . Indian J Med Microbiol. 2022 Oct-Dec ; 40 ( 4 ): 536 – 40 . OpenUrl PubMed 18. ↵ De Smedt JM , Bolderdijk RF , Rappold H , Lautenschlaeger D . Rapid Salmonella detection in foods by motility enrichment on a modified semi-solid Rappaport-Vassiliadis medium . J Food Prot . 1986 Jul ; 49 ( 7 ): 510 – 4 . OpenUrl PubMed 19. ↵ Popoff MY , Bockemühl J , Gheesling LL . Supplement 2002 (no. 46) to the Kauffmann-White scheme . Res Microbiol . 2004 Sep ; 155 ( 7 ): 568 - 70 . OpenUrl CrossRef PubMed Web of Science 20. ↵ Achtman M , Wain J , Weill FX , Nair S , Zhou Z , Sangal V , et al. Multilocus sequence typing as a replacement for serotyping in Salmonella enterica . PLoS Pathog . 2012 Jun ; 8 ( 6 ): e1002776 . OpenUrl CrossRef PubMed 21. ↵ Clinical and Laboratory Standards Institute . Performance standards for antimicrobial susceptibility testing, M100. 32nd ed . Wayne, PA : CLSI ; 2022 . 22. ↵ Zhang S , den Bakker HC , Li S , Chen J , Dinsmore BA , Lane C , et al. SeqSero2: rapid and improved Salmonella serotype determination using whole-genome sequencing data . Appl Environ Microbiol . 2019 Dec 1 ; 85 ( 23 ): e01746 – 19 . OpenUrl CrossRef PubMed 23. ↵ Tonkin-Hill G , MacAlasdair N , Ruis C , Weimann A , Horesh G , Lees JA , et al. Producing polished prokaryotic pangenomes with the Panaroo pipeline . Genome Biol . 2020 Dec ; 21 ( 1 ): 180 . OpenUrl CrossRef PubMed 24. ↵ Minh BQ , Schmidt HA , Chernomor O , Schrempf D , Woodhams MD , von Haeseler A , et al. IQ-TREE 2: new models and efficient methods for phylogenetic inference in the genomic era . Mol Biol Evol . 2020 May 1 ; 37 ( 5 ): 1530 – 4 . OpenUrl CrossRef PubMed 25. ↵ Zhou Z , Alikhan NF , Sergeant MJ , Luhmann N , Vaz C , Francisco AP , et al. GrapeTree: visualization of core genomic relationships among 100,000 bacterial pathogens . Genome Res . 2018 Sep ; 28 ( 9 ): 1395 – 404 . OpenUrl Abstract / FREE Full Text 26. ↵ Horesh G , Taylor-Brown A , McGimpsey S , Lassalle F , Corander J , Heinz E , et al. Different evolutionary trends form the twilight zone of the bacterial pan-genome . Microb Genom . 2021 Sep ; 7 ( 9 ): 000670 . OpenUrl PubMed 27. ↵ Huang Y , Niu B , Gao Y , Fu L , Li W . CD-HIT Suite: a web server for clustering and comparing biological sequences . Bioinformatics . 2010 Mar 1 ; 26 ( 5 ): 680 – 2 . OpenUrl CrossRef PubMed Web of Science 28. ↵ Wishart DS , Han S , Saha S , Oler E , Peters H , Grant JR , et al. PHASTEST: faster than PHASTER, better than PHAST . Nucleic Acids Res . 2023 Jul 5 ; 51 ( W1 ): W443 – 50 . OpenUrl CrossRef PubMed 29. ↵ Dieppa-Colón E , Martin C , Kosmopoulos JC , Anantharaman K . Prophage-DB: a comprehensive database to explore diversity, distribution, and ecology of prophages . Environ Microbiome . 2025 Jan 13 ; 20 ( 1 ): 5 . OpenUrl CrossRef PubMed 30. ↵ Hadfield J , Croucher NJ , Goater RJ , Abudahab K , Aanensen DM , Harris SR . Phandango: an interactive viewer for bacterial population genomics . Bioinformatics . 2018 Jan 15 ; 34 ( 2 ): 292 – 3 . OpenUrl CrossRef PubMed 31. ↵ Wheeler NE , Gardner PP , Barquist L . Machine learning identifies signatures of host adaptation in the bacterial pathogen Salmonella enterica . PLoS Genet . 2018 May ; 14 ( 5 ): e1007333 . OpenUrl CrossRef PubMed 32. ↵ Ao TT , Feasey NA , Gordon MA , Keddy KH , Angulo FJ , Crump JA . Global burden of invasive nontyphoidal Salmonella disease, 2010 . Emerg Infect Dis. 2015 Jun ; 21 ( 6 ): 941 - 9 . OpenUrl CrossRef PubMed 33. ↵ Balasubramanian R , Im J , Lee JS , Jeon HJ , Mogeni OD , Kim JH , et al. The global burden and epidemiology of invasive non-typhoidal Salmonella infections . Hum Vaccin Immunother . 2019 ; 15 ( 6 ): 1421 – 6 . OpenUrl CrossRef PubMed 34. Oommen S , Nair S , Nair K , Pillai S . Epidemiology of non-typhoidal Salmonella among patients attending a tertiary care centre in central Kerala . J Acad Clin Microbiol . 2015 Jan ; 17 ( 1 ): 12 – 5 . OpenUrl 35. Deepanjali S , Jharna M , Chanaveerappa B , Sarumathi D , Gopichand P , Anupriya K . An outbreak of Salmonella Enteritidis food poisoning following consumption of chicken shawarma: a brief epidemiological investigation . F1000Res . 2021 ; 10 : 664 . OpenUrl 36. ↵ Dhanoa A , Fatt QK . Non-typhoidal Salmonella bacteraemia: epidemiology, clinical characteristics and its association with severe immunosuppression . Ann Clin Microbiol Antimicrob . 2009 Dec ; 8 : 15 . 37. ↵ Marchello CS , Birkhold M , Crump JA , Martin LB , Ansah MO , Breghi G , et al. Complications and mortality of non-typhoidal Salmonella invasive disease: a global systematic review and meta-analysis . Lancet Infect Dis . 2022 May ; 22 ( 5 ): 1457 – 70 . OpenUrl 38. ↵ Piccini G , Montomoli E . Pathogenic signature of invasive non-typhoidal Salmonella in Africa: implications for vaccine development . Hum Vaccin Immunother . 2020 Sep 1 ; 16 ( 9 ): 2056 – 71 . OpenUrl PubMed 39. ↵ Graham RM , Hiley L , Rathnayake IU , Jennison AV . Comparative genomics identifies distinct lineages of S . Enteritidis from Queensland, Australia . PLoS One . 2018 Jan 16 ; 13 ( 1 ): e0191042 . OpenUrl PubMed 40. ↵ Cao G , Zhao S , Kuang D , Hsu CH , Yin L , Luo Y , et al. Geography shapes the genomics and antimicrobial resistance of Salmonella enterica serovar Enteritidis isolated from humans . Sci Rep . 2023 Jan 24 ; 13 ( 1 ): 1331 . OpenUrl CrossRef PubMed 41. ↵ Aldrich C , Hartman H , Feasey N , Chattaway MA , Dekker D , Al-Emran HM , et al. Emergence of phylogenetically diverse and fluoroquinolone resistant Salmonella Enteritidis as a cause of invasive nontyphoidal Salmonella disease in Ghana . PLoS Negl Trop Dis . 2019 Jun 20 ; 13 ( 6 ): e0007485 . OpenUrl PubMed 42. ↵ Li S , He Y , Mann DA , Deng X . Global spread of Salmonella Enteritidis via centralized sourcing and international trade of poultry breeding stocks . Nat Commun . 2021 Aug 25 ; 12 ( 1 ): 5109 . OpenUrl PubMed 43. ↵ Gallichan S , Perez-Sepulveda BM , Feasey NA , Hinton JC , Thomas J , Smith AM . Multiplex PCR assay for clade typing of Salmonella enterica serovar Enteritidis . Microbiol Spectr . 2022 Dec 21 ; 10 ( 6 ): e03182 – 22 . OpenUrl PubMed 44. ↵ Worley MJ . Salmonella bloodstream infections . Trop Med Infect Dis . 2023 Oct 27 ; 8 ( 11 ): 487 . OpenUrl PubMed 45. ↵ Campioni F , Cao G , Kastanis G , Janies DA , Bergamini AM , Rodrigues DD , et al. Changing of the genomic pattern of Salmonella Enteritidis strains isolated in Brazil over a 48-year period revealed by whole genome SNP analyses . Sci Rep . 2018 Jul 11 ; 8 ( 1 ): 10478 . OpenUrl CrossRef PubMed 46. ↵ Mascitti AK , Kipper D , Dos Reis RO , da Silva JS , Fonseca AS , Ikuta N , et al. Retrospective whole-genome comparison of Salmonella enterica serovar Enteritidis from foodborne outbreaks in Southern Brazil . Braz J Microbiol . 2021 Sep ; 52 ( 3 ): 1523 – 33 . OpenUrl PubMed 47. ↵ Yates CR , Nguyen A , Liao J , Cheng RA . What’s on a prophage: analysis of Salmonella spp. prophages identifies a diverse range of cargo with multiple virulence-and metabolism-associated functions . mSphere . 2024 Jun 25 ; 9 ( 6 ): e00031 – 24 . OpenUrl PubMed 48. ↵ Spencer CC , Tyerman J , Bertrand M , Doebeli M . Adaptation increases the likelihood of diversification in an experimental bacterial lineage . Proc Natl Acad Sci U S A . 2008 Feb 5 ; 105 ( 5 ): 1585 – 9 . OpenUrl Abstract / FREE Full Text 49. ↵ Tanner JR , Kingsley RA . Evolution of Salmonella within hosts . Trends Microbiol . 2018 Dec ; 26 ( 12 ): 986 – 98 . OpenUrl CrossRef PubMed 50. ↵ Yang Y , Ricke SC , Tellez G , Kwon YM . Quantitative tracking of Salmonella Enteritidis transmission routes using barcode-tagged isogenic strains in chickens: proof-of-concept study . Front Vet Sci . 2017 Feb 14 ; 4 : 15 . View the discussion thread. Back to top Previous Next Posted May 09, 2025. Download PDF Supplementary Material Data/Code Email Thank you for your interest in spreading the word about medRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Pan genome clustering identifies a novel mosaic prophage specific to Salmonella Enteritidis lineage associated with the invasive disease in India Message Subject (Your Name) has forwarded a page to you from medRxiv Message Body (Your Name) thought you would like to see this page from the medRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Pan genome clustering identifies a novel mosaic prophage specific to Salmonella Enteritidis lineage associated with the invasive disease in India Jobin John Jacob , Aravind Velmurugan , Dhanalakshmi Solaimalai , Ramya Iyadurai , Karthik Gunasekaran , Jansi Rani Malaiyappan , M Yesudoss , M Vasuki , Binesh Lal , Jacob John , Kamini Walia , Balaji Veeraraghavan medRxiv 2025.05.08.25327125; doi: https://doi.org/10.1101/2025.05.08.25327125 Share This Article: Copy Citation Tools Pan genome clustering identifies a novel mosaic prophage specific to Salmonella Enteritidis lineage associated with the invasive disease in India Jobin John Jacob , Aravind Velmurugan , Dhanalakshmi Solaimalai , Ramya Iyadurai , Karthik Gunasekaran , Jansi Rani Malaiyappan , M Yesudoss , M Vasuki , Binesh Lal , Jacob John , Kamini Walia , Balaji Veeraraghavan medRxiv 2025.05.08.25327125; doi: https://doi.org/10.1101/2025.05.08.25327125 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Infectious Diseases (except HIV/AIDS) Subject Areas All Articles Addiction Medicine (570) Allergy and Immunology (863) Anesthesia (301) Cardiovascular Medicine (4442) Dentistry and Oral Medicine (444) Dermatology (383) Emergency Medicine (609) Endocrinology (including Diabetes Mellitus and Metabolic Disease) (1511) Epidemiology (15231) Forensic Medicine (30) Gastroenterology (1126) Genetic and Genomic Medicine (6610) Geriatric Medicine (668) Health Economics (998) Health Informatics (4542) Health Policy (1370) Health Systems and Quality Improvement (1613) Hematology (543) HIV/AIDS (1266) Infectious Diseases (except HIV/AIDS) (15924) Intensive Care and Critical Care Medicine (1103) Medical Education (623) Medical Ethics (147) Nephrology (668) Neurology (6608) Nursing (346) Nutrition (999) Obstetrics and Gynecology (1146) Occupational and Environmental Health (957) Oncology (3338) Ophthalmology (974) Orthopedics (369) Otolaryngology (420) Pain Medicine (436) Palliative Medicine (130) Pathology (665) Pediatrics (1693) Pharmacology and Therapeutics (692) Primary Care Research (712) Psychiatry and Clinical Psychology (5449) Public and Global Health (9240) Radiology and Imaging (2203) Rehabilitation Medicine and Physical Therapy (1370) Respiratory Medicine (1196) Rheumatology (596) Sexual and Reproductive Health (714) Sports Medicine (530) Surgery (712) Toxicology (99) Transplantation (289) Urology (265) (function(){function c(){var b=a.contentDocument||a.contentWindow.document;if(b){var d=b.createElement('script');d.innerHTML="window.__CF$cv$params={r:'a02061ea8b48ad07',t:'MTc3OTgzNjI4NA=='};var a=document.createElement('script');a.src='/cdn-cgi/challenge-platform/scripts/jsd/main.js';document.getElementsByTagName('head')[0].appendChild(a);";b.getElementsByTagName('head')[0].appendChild(d)}}if(document.body){var a=document.createElement('iframe');a.height=1;a.width=1;a.style.position='absolute';a.style.top=0;a.style.left=0;a.style.border='none';a.style.visibility='hidden';document.body.appendChild(a);if('loading'!==document.readyState)c();else if(window.addEventListener)document.addEventListener('DOMContentLoaded',c);else{var e=document.onreadystatechange||function(){};document.onreadystatechange=function(b){e(b);'loading'!==document.readyState&&(document.onreadystatechange=e,c())}}}})();
Text is read by the "Ask this paper" AI Q&A widget below.
Extraction quality varies by source — PMC NXML preserves structure
cleanly, OA-HTML may include some navigation residue, and OA-PDF can
have broken hyphenation. The publisher copy
(via DOI)
is the canonical version.