PhageAI: a new approach to predicting the lifestyle of bacteriophages using proteinBERT and convolutional neural networks

preprint OA: closed
📄 Open PDF Full text JSON View at publisher
Full text 25,436 characters · extracted from preprint-html · click to expand
PhageAI: a new approach to predicting the lifestyle of bacteriophages using proteinBERT and convolutional neural networks | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results PhageAI: a new approach to predicting the lifestyle of bacteriophages using proteinBERT and convolutional neural networks View ORCID Profile Maria Urbanowicz , View ORCID Profile Arkadiusz Guziński , View ORCID Profile Żaneta Szulc doi: https://doi.org/10.1101/2025.09.02.673651 Maria Urbanowicz 1 PhageAI SA , 93-134 Lodz, Poland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Maria Urbanowicz For correspondence: maria.dorota.urbanowicz{at}gmail.com Arkadiusz Guziński 1 PhageAI SA , 93-134 Lodz, Poland 2 Proteon Pharmaceuticals SA , 93-134 Lodz, Poland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Arkadiusz Guziński Żaneta Szulc 1 PhageAI SA , 93-134 Lodz, Poland Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Żaneta Szulc Abstract Full Text Info/History Metrics Supplementary material Preview PDF Abstract Bacteriophages are viruses that infect bacteria, including temperate, virulent and chronic phages. In the current times of increasing resistance to antibiotics (AMR), it is necessary to quickly find phages and determine their lifecycle, therefore computational methods in the first phase of composing phage preparations are necessary to find such sequences. The challenge in building such tools is the lack of good quality and correctly labeled data from multiple reference databases, which are necessary to select sequences to create cocktails that should contain complete and replication-capable phages. Current published models also do not support chronic phages, which constitute a small but significant group of phages. Another problem is explainability, current models are black-box models where we cannot observe what actually influences the model’s predictions, this may result in the model overlooking features that are truly associated with the phage life cycle. In the presented tool, however, these issues have been explicitly addressed. The presented tool was also compared to other lifecycle prediction models: Phatyp, PhagePred, Bacphlip and Phacts. Introduction Phages are organisms that infect bacteria. Bacteriophages exhibit three main types of lifecycles. One of them is the temperate lifecycle, in which phages infect bacterial cells and integrate into their genome, remaining in a dormant state with the potential to enter the lytic cycle under favorable conditions ( Mirzaei et al., 2017 ). In contrast, virulent phages exclusively follow the lytic cycle, rapidly lysing the host cell upon infection and releasing progeny virions ( Shkoporov et al., 2018 ), while chronic phages are bacteriophage that replicates within the host cell without causing its lysis. New virions are released gradually leading to a persistent infection of the bacterium ( Hobbs et al., 2016 ). Apart from the classical virulent, chronic and temperate phages, bacteriophages may also undergo pseudolysogeny, in which the phage genome remains in the cell in the carrier state, representing a stable coexistence of the virus with a bacterial population. Knowledge about bacteriophages lifecycles is continuously evolving (Chevallereau & Westra, 2021). Bacteriophages are increasingly being considered a last-resort therapeutic option for individuals with antibiotic-resistant bacterial infections ( Zalewska-Piątek, 2023 ). They are also applied in targeted therapies as vectors for genetic material ( Hosseinidoust, 2017 ) and as modifiers of the intestinal microbiota ( Mirzaei et al., 2022 ). In addition, their use in animal husbandry has been explored as an alternative or adjunct to antibiotics ( Kahn et al., 2019 ). High costs of their isolation, cultivation and observation, while the costs of Next Generation Sequencing (NGS) are decreasing, especially in the case of phages from metagenomic samples, means that a rapid method of verifying their life cycle is needed to be able to quickly haracterize them and determine potential practical application (Knezevic et al., 2021). Currently, many attempts have been made to obtain a quick method of classification of bacteriophages. Among the available methods, we can mention PHACTS ( McNair et al., 2012 ), a classifier that uses a random forest algorithm based on proteomic data, Bacphlip ( Hockenberry et al., 2021 ), which also uses a random forest algorithm but is based on proteins described in the literature as being associated with the temperate cycle. Other classifiers are PhagePred ( Song, 2020 ), which works based on Euclidean distance, using a Markov model based on k- mer frequency. There is also PhaTYP, which uses BERT as an algorithm that detects the patterns associated with a given phage life cycle based on the presence of phage protein clusters in sequences ( Shang et al., 2023 ). In this paper we present a novel, machine learning approach to classify bacteriophages into three groups: chronic, virulent and temperate on the basis of their proteomes. The novelty of the tool stems from its ability to incorporate the chronic cycle, explainability in the temperate virulent classification and usage of large protein embedding models to improve protein representation as described in detail in the Methods section. Our tool is available online at https://app.phage.ai/ . Methods Dataset For the training and testing sets, we used a dataset of 1,851 phages. To ensure representation of all possible genera, we selected representatives from 1,652 genera included in the Virus Metadata Resource (VMR) file (August 2022) from International Committee on Taxonomy of Viruses (ICTV), and we also included representatives for chronic phages. The chronic bacteriophages dataset also includes sequences derived from pig fecal samples ( Billaud et al., 2021 ). Subsequently, observations similar more than 70 % were removed from the collection using the VIRIDIC program ( Moraru et al., 2020 ) to ensure diversity and representativeness for each genus. Threshold 70% was established based on separation criteria of taxonomic groups for tailed phages ( Turner et al., 2021 ). Preprocessing The pre-filtered sequences were structurally annotated using the Glimmer program (Hyatt et al., 2017). The lifecycle labels for chronic phages were determined in case of morphogenesis protein (pI) or VP3 protein presence. Lifecycle labels for temperate and virulent phages were determined in the presence or absence of proteins associated with lysogenic lifecycle including integrase protein. All observations with labels are available in Supplementary Data (Table S3). The protein detection was performed using diamond ( Buchfink et al., 2021 ), hmmscan ( Eddy, 2011 ) and interproscan ( Blum et al., 2021 ) using default parameters. Model preparation For building model proteins sequences were used. Embedding was performed using the ProteinBertT5 model ( Nadav et al., 2022 ), which was used as the first layer of the neural network model as embedding layer in the convolutional neural network (CNN) model. Each protein was first represented as an embedding vector. For each phage, a sequence was then constructed in which every protein corresponds to a ‘word’ represented by its ProtBertT5 embedding. These sequences were subsequently used as inputs for the model. The procedure diagram is available below ( Fig. 1 ). Phage classification in our solution is based on two independent models. The first step is to classify bacteriophages into chronic and non-chronic phages, and the next step is to classify them into virulent and temperate phages ( Fig. 2 ). For training both models, training and test sets were prepared independently. In each model, a random split of 80:20 was considered, taking into account the proportions of both classes for training models. Download figure Open in new tab Figure 1. The technical model pipeline: genes were first detected using Glimmer, after which embeddings were generated for all bacteriophage proteins. A feature matrix was then constructed for classification, and model explainability was applied to distinguish virulent from temperate phages. Download figure Open in new tab Figure 2. The PhageAI pipeline: the proposed methodology for bacteriophage life cycle recognition involves an initial classification of chronic versus non-chronic phages, followed by a subsequent classification into virulent or temperate classes. Explainability analysis The integrated gradient (IG) method ( Sundararajan et al., 2017 ) was used for explainability analyses, then the results from the IG analysis were combined using annotation from the diamond ( Buchfink et al., 2021 ), hmmscan ( Eddy, 2011 ) and interproscan ( Blum et al., 2021 ) using default parameters programs to obtain a label for selected key proteins in the analysis. The annotation process was identical to the description of life cycle sets. Results The results of the model were evaluated on the basis of an independent test set, for this purpose the following statistics were used: Precision (TP/TP+FP), Recall (TP/TP+FN)and F1-score (2 × (Precision × Recall) / (Precision + Recall)) and ROC-AUC curve. The original results were obtained on the test set of the classifier by comparing it with the available tools: Bacphlip, PhagePred, PhaTYP, Phacts. The ROC curve analysis indicated that the best overall results were achieved using Bacphlip and PhageAI model. The results are also confirmed by precision, recall and F1-score statistics. Results for this comparison are available in Supplementary Data (Table S1). The added value of the publication is the result of explainability analyses for temperate and virulent bacteriophages, where proteins annotated as the integrases stand for 90% of the observations as the most important feature supporting predictions of temperate lifecycle, other proteins that were important for explainability analysis are listed in Supplementary Data (Table S2) for every bacteriophage from test set. Additionally, the table and figure contain results for chronic class, where evaluation on the test set demonstrates that the model attains highly satisfactory results across all performance metrics. ( Fig. 3 ). Download figure Open in new tab Figure 3. The ROC curve comparison on the test set. The value shown in the legend is AUCROC score. PhageAI and Bacphlip has the best performance (A). Proportion of the most important features for classification of temperate bacteriophages (B). The ROC curve for chronic-non chronic classificatory (C). View this table: View inline View popup Download powerpoint Table 1. The performance comparison on the test set. Discussion In an era of increased access to sequencing technology and a noticeable increase in the number of phage sequences published in databases ( Fig. 4 ), the use of predictive models to answer one of the key questions: “What life cycle does a bacteriophage lead?” is beginning to gain importance. Download figure Open in new tab Figure 4. The number of phage sequences published in GenBank between 2014 and 2024. The figure shows an increase in the number of sequences since 2019, when the number exceeded 2,000 per year and has remained above that level since then. Through our work, we wanted to address the opportunities offered by introducing AI/ML to phage science and the benefits it can bring. Working with models requires a large, well-characterized dataset. For this reason, we created the PhageAI service and adapted our bioinformatics pipelines to create the first datasets that could be used to create predictive models. We have achieved high levels of confidence and model explainability, something that is new for AI-based solutions and phage science. Our models utilized validated data and complete bacteriophages, focusing on nearly all currently described genera, ensuring the greatest possible diversity. This also allowed us to determine phage life cycles in taxonomic groups that were previously poorly described. When comparing our model to existing approaches used in benchmarking, the model most closely aligned with our results is Bacphlip. This similarity is likely due to Bacphlip’s utilization of protein-level information and accurate annotation, which facilitates a better understanding of the factors influencing predictions. Properly annotated training data ensures that the assigned labels are accurate, improving model performance. A limitation of Bacphlip, however, is its inability to support chronic phages. Interestingly, comparison with Phatyp yielded suboptimal results on our dataset. This may be attributed to its training on publicly available databases without prior validation, potentially leading to lower predictive accuracy on curated data. PhagePred and Phacts, being older models, likely show reduced performance due to reliance on outdated datasets and limited knowledge regarding bacteriophage lifecycle annotation at the time of their development. Notably, none of the published models support chronic phages, despite the availability of current datasets that allow for the construction of representative training sets. Another challenge is the lack of model explainability, which prevents us from understanding the underlying basis of predictions. This limitation, especially when training and testing datasets are highly similar, can lead to potential bias or overestimation of model performance. One of the limitations we see in presented model is the need to switch to amino acid sequences and the need to use additional programs for sequence annotation, which in itself may introduce errors in the form of predicting on incorrectly annotated proteins. On the other hand, by training the model on proteins, we managed to introduce methods of explaining the model’s indications that are understandable to humans. As our analyses show, the main determinant is the presence of integrase on the bacteriophage genome for most bacteriophages and those are results which met our expectations. Our next step will be to configure an input data pipeline, which will allow us to ensure early on that the model is making predictions based on clean, complete phage sequences. Currently, the model will attempt to process a sequence regardless of whether it comes from a phage, bacteria, or other organism, which can lead to misunderstandings of results. We anticipate that our work will facilitate research by accelerating bioinformatics analyses and making these approaches more accessible to researchers without extensive expertise in bioinformatics. Declarations Ethics approval and consent to participate Not applicable. Consent for publication Not applicable. Competing interests The authors are employees of PhageAI S.A., which developed the tool described in this article. Funding This work was supported by PhageAI S.A. Data availability The dataset information can be found in Supplementary Data.xlsx Funder Information Declared PhageAI S.A. References 1. ↵ Blum , M. , Chang , H. Y. , Chuguransky , S. , Grego , T. , Kandasaamy , S. , Mitchell , A. , … & Finn , R. D. ( 2021 ). The InterPro protein families and domains database: 20 years on . Nucleic acids research , 49 ( D1 ), D344 – D354 . OpenUrl CrossRef PubMed 2. ↵ Buchfink , B. , Reuter , K. , & Drost , H. G. ( 2021 ). Sensitive protein alignments at tree-of-life scale using DIAMOND . Nature methods , 18 ( 4 ), 366 – 368 . OpenUrl PubMed 3. ↵ Eddy , S. R. ( 2011 ). Accelerated profile HMM searches . PLoS computational biology , 7 ( 10 ), e1002195 . OpenUrl 4. ↵ Hobbs , Z. , & Abedon , S. T. ( 2016 ). Diversity of phage infection types and associated terminology: the problem with ‘Lytic or lysogenic’ . FEMS microbiology letters , 363 ( 7 ), fnw047 . OpenUrl CrossRef PubMed 5. ↵ Hockenberry , A. J. , & Wilke , C. O. ( 2021 ). BACPHLIP: predicting bacteriophage lifestyle from conserved protein domains . PeerJ , 9 , e11396 . OpenUrl CrossRef PubMed 6. ↵ Hosseinidoust , Z. ( 2017 ). Phage-mediated gene therapy . Current Gene Therapy , 17 ( 2 ), 120 – 126 . OpenUrl PubMed 7. Hyatt , D. , Chen , G. L. , LoCascio , P. F. , Land , M. L. , Larimer , F. W. , & Hauser , L. J. ( 2010 ). Prodigal: prokaryotic gene recognition and translation initiation site identification . BMC bioinformatics , 11 , 1 – 11 . OpenUrl CrossRef PubMed 8. ↵ Kahn , L. H. , Bergeron , G. , Bourassa , M. W. , De Vegt , B. , Gill , J. , Gomes , F. , … & Topp , E. ( 2019 ). From farm management to bacteriophage therapy: strategies to reduce antibiotic use in animal agriculture . Annals of the New York Academy of Sciences , 1441 ( 1 ), 31 – 39 . OpenUrl CrossRef PubMed 9. Knežević , P. , Hoyle , N. S. , Matsuzaki , S. , & Gorski , A. ( 2021 ). Advances in phage therapy: present challenges and future perspectives . Frontiers in microbiology , 12 , 701898 . OpenUrl PubMed 10. Mäntynen , S. , Laanto , E. , Oksanen , H. M. , Poranen , M. M. , & Díaz-Muñoz , S. L. ( 2021 ). Black box of phage–bacterium interactions: exploring alternative phage infection strategies . Open biology , 11 ( 9 ), 210188 . OpenUrl CrossRef PubMed 11. ↵ McNair , K. , Bailey , B. A. , & Edwards , R. A. ( 2012 ). PHACTS, a computational approach to classifying the lifestyle of phages . Bioinformatics , 28 ( 5 ), 614 – 618 . OpenUrl CrossRef PubMed Web of Science 12. ↵ Mirzaei , M. K. , & Deng , L. ( 2022 ). New technologies for developing phage-based tools to manipulate the human microbiome . Trends in microbiology , 30 ( 2 ), 131 – 142 . OpenUrl CrossRef PubMed 13. ↵ Mirzaei , M. K. , & Maurice , C. F. ( 2017 ). Ménage à trois in the human gut: interactions between host, bacteria and phages . Nature Reviews Microbiology , 15 ( 7 ), 397 – 408 . OpenUrl CrossRef PubMed 14. ↵ Moraru , C. , Varsani , A. , & Kropinski , A. M. ( 2020 ). VIRIDIC—A novel tool to calculate the intergenomic similarities of prokaryote-infecting viruses . Viruses , 12 ( 11 ), 1268 . OpenUrl CrossRef PubMed 15. ↵ Nadav Brandes , Dan Ofer , Yam Peleg , Nadav Rappoport , Michal Linial , ProteinBERT: a universal deep-learning model of protein sequence and function , Bioinformatics , Volume 38 , Issue 8 , March 2022 , Pages 2102 – 2110 , doi: 10.1093/bioinformatics/btac020 OpenUrl CrossRef PubMed 16. ↵ Shang , J. , Tang , X. , & Sun , Y. ( 2023 ). PhaTYP: predicting the lifestyle for bacteriophages using BERT . Briefings in Bioinformatics , 24 ( 1 ), bbac487 . OpenUrl CrossRef PubMed 17. ↵ Shkoporov , A. N. , Khokhlova , E. V. , Fitzgerald , C. B. , Stockdale , S. R. , Draper , L. A. , Ross , R. P. , & Hill , C. ( 2018 ). ΦCrAss001 represents the most abundant bacteriophage family in the human gut and infects Bacteroides intestinalis . Nature communications , 9 ( 1 ), 4781 . OpenUrl PubMed 18. ↵ Song , K. ( 2020 ). Classifying the lifestyle of metagenomically-derived phages sequences using alignment-free methods . Frontiers in microbiology , 11 , 567769 . OpenUrl PubMed 19. ↵ Sundararajan , M. , Taly , A. , & Yan , Q. ( 2017 , July ). Axiomatic attribution for deep networks . In International conference on machine learning (pp. 3319 – 3328 ). PMLR . 20. ↵ Turner , D. , Kropinski , A. M. , & Adriaenssens , E. M. ( 2021 ). A roadmap for genome-based phage taxonomy . Viruses , 13 ( 3 ), 506 . OpenUrl CrossRef PubMed 21. ↵ Zalewska-Piątek , B. ( 2023 ). Phage therapy—challenges, opportunities, and future prospects . Pharmaceuticals , 16 ( 12 ), 1638 . OpenUrl PubMed 22. ↵ Billaud , M. , Lamy-Besnier , Q. , Lossouarn , J. , Moncaut , E. , Dion , M. B. , Moineau , S. , … & Petit , M. A. ( 2021 ). Analysis of viromes and microbiomes from pig fecal samples reveals that phages and prophages rarely carry antibiotic resistance genes . ISME communications , 1 ( 1 ), 55 . OpenUrl PubMed View the discussion thread. Back to top Previous Next Posted September 06, 2025. Download PDF Supplementary Material Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following PhageAI: a new approach to predicting the lifestyle of bacteriophages using proteinBERT and convolutional neural networks Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share PhageAI: a new approach to predicting the lifestyle of bacteriophages using proteinBERT and convolutional neural networks Maria Urbanowicz , Arkadiusz Guziński , Żaneta Szulc bioRxiv 2025.09.02.673651; doi: https://doi.org/10.1101/2025.09.02.673651 Share This Article: Copy Citation Tools PhageAI: a new approach to predicting the lifestyle of bacteriophages using proteinBERT and convolutional neural networks Maria Urbanowicz , Arkadiusz Guziński , Żaneta Szulc bioRxiv 2025.09.02.673651; doi: https://doi.org/10.1101/2025.09.02.673651 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Bioinformatics Subject Areas All Articles Animal Behavior and Cognition (7643) Biochemistry (17717) Bioengineering (13910) Bioinformatics (42017) Biophysics (21480) Cancer Biology (18628) Cell Biology (25537) Clinical Trials (138) Developmental Biology (13392) Ecology (19935) Epidemiology (2067) Evolutionary Biology (24356) Genetics (15617) Genomics (22530) Immunology (17755) Microbiology (40438) Molecular Biology (17200) Neuroscience (88705) Paleontology (667) Pathology (2840) Pharmacology and Toxicology (4832) Physiology (7657) Plant Biology (15171) Scientific Communication and Education (2046) Synthetic Biology (4304) Systems Biology (9828) Zoology (2272)

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00