Full text
21,722 characters
· extracted from
preprint-html
· click to expand
Towards Modeling in Large-Scale Genetic and Metabolic Networks | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results Towards Modeling in Large-Scale Genetic and Metabolic Networks View ORCID Profile Marco Polo Castillo-Villalba doi: https://doi.org/10.1101/2025.11.11.687908 Marco Polo Castillo-Villalba 1 Department of Molecular Biology and Biotechnology, Institute of Biomedical Research UNAM , Circuito Universitario 04510 CDMX, Mexico Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Marco Polo Castillo-Villalba For correspondence: mpolocv{at}gmail.com Abstract Full Text Info/History Metrics Supplementary material Preview PDF A bstract Mathematical modeling of large-scale genetic and metabolic networks remains an open area of research with profound implications for understanding biochemical signaling systems in both prokaryotic and eukaryotic organisms. In this work, we extend the biochemical modeling framework based on the Power Law formalism , originally developed by M.A. Savageau to elucidate design principles in small bacterial networks. This formalism captures gene regulation and metabolic fluxes through two fundamental sets of parameters: kinetic parameters and kinetic orders . The kinetic parameters determine the magnitudes of fluxes, while the kinetic orders appearing as exponents in the power-law representation encode the regulatory structure of the system. We propose a mathematical technique to characterize the entire family of systems associated with the space of kinetic orders. We show that this exponent space possesses a well-defined structure in toric geometry and can therefore be modeled using algebraic varieties . To represent large-scale networks, we associate a toric variety with each polynomial equation of the system and then use geometric techniques to coherently combine these varieties into a global structure, or fan . This construction enables a modular and geometrically consistent representation of complex biochemical networks. 1. Introduction 2. Theoretical Background: Biochemical Networks as Toric S-systems One of the main ideas behind the analysis of biochemical systems is the conservation of mass in reactions. In addition, the Michaelis–Menten rate law is one of the fundamental concepts in biochemical systems. However, in recent decades, this law has been refined to provide more detailed biochemical information about the biomolecules participating in the network. For example, it is now possible to consider reactions with arbitrary orders, such as the number of binding sites in gene operator regions or activation parameters from Hill functions. This is the basis of the Power Law formalism [ 11 ], which, through parametric extensions, allows for the simultaneous modeling of both metabolism and gene regulation. The formal expression of this model is given below: Here, the kinetic parameters α ik and β ik capture the rate constants for production and degradation, respectively, of each species or biomolecule in the network. The kinetic orders g ijk and h ijk represent genotypic information, such as binding sites and the kinetic orders of catalyzed reactions or multimeric regulation sub units in protein structures. Therefore, Equation (2.1) captures all the information required to analyze genetic–metabolic networks. Definition 2.1. (S-systems). We define the number of combinations of dominant terms in Equation (2.1) as: which partitions the space of concentrations ( X 1 , …, X n ). Each partition corresponds to a dominant term, or S-system , as defined in [ 13 ], [ 11 ], [ 7 ], [ 8 ], [ 9 ]. This is expressed as follows: In the context of this formalism, an S-system defines a quantitative phenotype and corresponds to a biological reality in molecular biology. These systems are not merely mathematical artifacts; they represent rates of change in molecular concentrations derived from this formal gradient. 2.1. Toric S-systems In this section, we highlight the importance of studying the exponents and in an S-system. We assert that the monomial map represents a Genotype–Phenotype relationship with properties of great interest for further study. This central idea forms the foundation of our research. Below, we briefly summarize the definitions introduced in well-known works such as [ 7 ], [ 13 ], [ 11 ], and [ 7 ]. Definition 2.2. (Exponent Space or Support) For an S-system defined by , we define the exponent space of , also formally known as the support of a polynomial, as: Using the support of any S-system supp , we can construct all linear combinations from the two vectors in the support, and . The set of all such vector combinations defines the cone associated with , as described in [ 4 ]. Definition 2.3. (Cone) Let be an S-system as defined above. We define the cone associated with it as: This cone represents the linear space generated by all combinations of the vectors in the support space, including addition, subtraction, and scalar multiplication. If the vectors consist only of integer entries, the cone is called a lattice cone [ 4 ]. Definition 2.4. (Dual Cone) Let σ ⊆ℤ n be a lattice cone. The dual cone σ ∨ is defined as: as described in [ 4 ]. Definition 2.5. (Monoid) By intersecting the dual cone with the n -dimensional integer lattice, we obtain: which we call a monoid . This monoid, denoted by M , has rank n and is isomorphic to ℤ n [ 4 ]. Lemma (Gordan’s Lemma and the Hilbert Basis) Given a cone σ , the intersection of its dual with the n -dimensional integer space, forms a monoid that has a finite set of generators. This generating set is called the Hilbert basis [ 17 ], [ 4 ]. Definition 2.6. (Fan or topological environment) Given a collection of dual cones we define the fan as the union of all these cones. We denote this fan by Σ ⊆ ℤ n [ 4 ]. Finally, we construct a coordinate polynomial ring for S-systems. Let be an S-system defined for any i -th species in a metabolic network. Given the support of this polynomial supp( f ) and its associated cone σ , we define the polynomial ring: In other words, the exponents of an S-system (i.e., the kinetic orders) are embedded in a geometric space. We will explore new topological properties that arise from this geometric object in the following sections. Definition 2.7. (Toric Ideal). A toric ideal is the set of prime binomials defined by I = , where H is the Hilbert basis of the polynomials generated from I , [ 17 ], [ 3 ]. Definition 2.8. (Toric Variety). We define a toric variety associated with a polynomial f as follows: Here, the notation Spec ( R σ ) denotes the set of all prime polynomials (i.e., non-divisible polynomials) { f 1 , …, f k } in the ring R σ for some integer k , see [ 4 ]. Definition 2.9. (Environment Cone). Let f be an S-system representing the rate law for the change in concentration of any species in a gene–metabolic network. We compute the support of f and the cone associated with it, σ ⊆ℤ n . Since supp( f ) ⊆ σ , we define the environment cone associated with f as the dual cone σ ∨ of σ . Thus, we have the inclusion relation: Relevance in Enzyme Kinetics Up to this point, we have equipped the set of vectors associated with the kinetic orders of an S-system with new geometric properties. We have defined cones, polynomial rings, and toric varieties. The most important result arises from Gordan’s Lemma [ 4 ], which guaranties the existence of a generator basis (the Hilbert basis ) for the entire kinetic order space defined for any species in the network. Next, we will explore how to exploit the properties induced by this Hilbert basis. Toric S-systems and Dominant Fluxes Given the Hilbert basis H = { h 1 , …, h k }, we represent it in matrix form considering each h i as a row vector: We can use this matrix to represent the variables X i in a new coordinate system using the following monomial transformation: as discussed in [ 4 ], [ 17 ], and [ 3 ]. This transformation reveals dynamical properties encoded within the S-systems through the Hilbert basis [ 17 ], [ 5 ]. This matrix representation allows embedding all S-system equations into a new system of monomial coordinates. Hence, we extend the analysis of molecular networks toward large-scale genetic and metabolic systems. Theorem 2.10. (Toric S-system). If we substitute the above change of coordinates into Equation (2.2), the original S-system equations, we obtain the following expression, valid for all i = 1, …, n: Proof . Given an S-system representation of molecular networks as in Equation (2.2), and applying Hironaka’s theorem together with the algorithmic construction of the Hilbert basis (a finite number of times) to the S-system equations [ 1 ], [ 6 ], [ 5 ], we find that every S-system is toric and can be described by: Or, more compactl: We thus define a Toric S-system according to the expression above, where h j is an element of the Hilbert basis for some j. We assert that the binomials constructed from the Hilbert basis H , with and , are toric binomials. q.e.d . The monomial transformation, represents, in this geometric framework, the Genotype–Phenotype relationship . These are the coordinate transformations of the geometric basis corresponding to the kinetic orders such as the number of binding sites in regulatory genomic sequences, the order of biochemical reactions in metabolism, or the degree of multimeric regulation in proteins. The monomials represent the chemical concentrations of the species or biomolecules described by the S-system X i . The coordinates u ij encode information derived from the genome sequence, which is then expressed through the phenotypic gradient: Thus, the mapping of dynamical behavior occurs through this gradient, linking genotypic parameters to phenotypic observables. 3. Discussion We have presented new topological properties of biochemical networks by exploiting the structural features of the Power Law and S-system modeling frameworks. In particular, we emphasize the significance of the monomial map: , which provides a bridge between biochemical kinetics and algebraic geometry. By focusing our analysis on the exponent space of S-systems, we study the kinetic orders using computational algebraic geometry techniques. This allows us to identify geometric bases that constrain and characterize the possible values of these parameters, thereby facilitating the solution of large systems of differential equations. The central open questions that can be addressed with this approach are as follows: Under what conditions are these geometrical regions valid for assigning values to the kinetic orders? Which of these regions represent true biological information and which are merely mathematical artifacts? Another advantage of the proposed methodology is its potential to model the dynamics of large-scale metabolic and gene-regulatory networks. The monomial map has a formal justification through the mathematical concept of a toric variety . Although toric varieties are abstract algebraic objects, they serve as powerful tools for modular analysis: each variety corresponds to a submodule of the biochemical network, and the full network can be reconstructed by gluing together these varieties using geometric techniques. While a single toric variety may provide limited insight into the overall biochemical system, the ensemble of all varieties properly joined captures the global dynamics of large-scale genetic and metabolic networks. This modular, geometrically grounded framework thus offers a new perspective for understanding and simulating the complex interplay between genotype and phenotype. Finally, we have included in the Supplementary Information the complete set of equations used for the toric analysis of a gene–metabolic network in the allosteric system of the tetrameric protein TrpR (tryptophan repressor) in E. coli K-12. In a future work, we will solve the complete dynamics using toric varieties such as biochemical modules. Declaration of Interest Statement The author declares that he has no personal, financial, professional, or academic conflicts of interest. Support information Download figure Open in new tab Figure 1. Tryptophan genetic and metabolic network Download figure Open in new tab Figure 2. Toric S-system equations for tetrameric tryptophan protein. 4. Acknowledgment Marco Polo Castillo Villalba is a doctoral student from the Programa de Doctorado en Ciencias Biomédicas, Universidad Nacional Autónoma de México (UNAM) and has received the CONAHCYT fellowship 754050. We acknowledge funding from UNAM and from the National Institutes of Health (grant number 5R01GM110597-03). I give a special thanks to Michael A. Savageau for all technical comments during my scholar stay with him, Pedro Miramontes Vidal and Julio Collado-Vides and technical contribution by Laura Gómez Romero. Funder Information Declared CONAHCYT , 754050 National Institutes of Health, US. , 5R01GM110597- 03 Footnotes Email address: mpolocv{at}gmail.com Only it was included support information files, to clarify the applications to molecular networks within of this new framework. References [1]. ↵ M.F. Atiyah . Resolution of Singularities and Division of Distributions, Communications On Pure and Applied Mathematics , vol. XXIII , 145 – 150 ( 1970 ). OpenUrl [2]. D. Cox , J. Little and D. O’Shea . Using Algebraic Geometry . Springer , 2nd . Edition, August , 2004 . [3]. ↵ D. Cox , J. Little and H. Schenck . Toric Varieties Department Of Mathematics, Amherst College, Amherst MA 01002 , 2010 . [4]. ↵ G. Ewald . Combinatorial Convexity and Algebraic Geometry ., Springer-Verlag , New York, Inc ., 1996 . [5]. ↵ Henk M , Weismantel R. On Hilbert bases of polyhedral cones . Konrad-Zuse-Zentrum für Informationstechnik ; 2010 . [6]. ↵ T. Fukui . Introduction to Toric Modifications With an Application to Real Singularities . Department Of Mathematics, Faculty Of Science, Saitama University. 255 Shimo-Okubo, Urawa 338-8570 , Japan , pag. 96 – 114 , 2000 . [7]. ↵ J. G. Lomnitz , M. A. Savageau . Phenotypic deconstruction of gene circuitry Chaos . Vol. 23 , Issue 2 , May 21, 2013 . [8]. ↵ J. G. Lomnitz , M. A. Savageau . Strategy Revealing Phenotypic Differences among Synthetic Oscillator Designs . ACS Synth. Biol . Volume 3 , 686701 , July 14, 2014 . OpenUrl [9]. ↵ J. G. Lomnitz , M. A. Savageau . Elucidating the genotype-phenotype map by automatic enumeration and analysis of the phenotypic repertoire . npj Systems Biology and Applications . Vol 1 , 15003 ; doi: 10.1038/npjsba.2015.3 ; published online 28 September 2015 . OpenUrl CrossRef PubMed [10]. J. G. Lomnitz , M. A. Savageau . Design Space Toolbox V2: Automated Software Enabling a Novel Phenotype-Centric Modeling Strategy for Natural and Synthetic Biological Systems . Frontiers in Genetics . Vol 27 , article 117, 12 July , 2015 . [11]. ↵ Biochemical Systems Analysis : “ A Study of Function and Design in Molecular Biology ”. Biochemical Systems Analysis ., volume 1 . Addison-Wesley Inc, Reading, Mass , USA , 1976 . [12]. Savageau MA . Optimal design of feedback control by inhibition. Dynamic considerations . J Mol Evol . 1975 ; 5 : 199 – 222 . OpenUrl CrossRef PubMed Web of Science [13]. ↵ M. A. Savageau and E. O. Voit . Recasting Nonlinear Differential Equations as S-Systems: A Canonical Nonlinear Form . Mathematical Biosciences ., Volume 87 , Issue 1 , pages 83 – 115 , November 1987 . OpenUrl CrossRef Web of Science [14]. M. A. Savageau , H. O. Voit and D. H. Irvine . Biochemical Systems Theory and Metabolic Control Theory: 1. Fundamental Similarities and Differences . Mathematical Biosciences ., Volume 86 , Issue( 2 ), pages 127 – 145 , October 1987 . OpenUrl CrossRef [15]. M. A. Savageau . Design principles for elementary gene circuits: Elements, methods, and examples . Chaos ., Volume 11 , Issue 1 , December ( 2001 ). [16]. M. A. Savageau , P. M. B. M. Coelho , R. A. Fasani and A. Salvador . Phenotypes and tolerances in the design space of biochemical systems . PNAS . Vol. 106 , no. 16 , 6435 – 6440 , April 21, 2009 . OpenUrl Abstract / FREE Full Text [17]. ↵ B. Sturmfels . Grobner Bases and Convex Polytopes . American Mathematical Society. Providence, RI , 1996 . [18]. Voit , E. O. Non Linear Canonical Modeling . S-system Approach To Understanding Complexity . New York . New Nonstrand Reinold , ( 1991 ). View the discussion thread. Back to top Previous Next Posted November 14, 2025. Download PDF Supplementary Material Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Towards Modeling in Large-Scale Genetic and Metabolic Networks Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Towards Modeling in Large-Scale Genetic and Metabolic Networks Marco Polo Castillo-Villalba bioRxiv 2025.11.11.687908; doi: https://doi.org/10.1101/2025.11.11.687908 Share This Article: Copy Citation Tools Towards Modeling in Large-Scale Genetic and Metabolic Networks Marco Polo Castillo-Villalba bioRxiv 2025.11.11.687908; doi: https://doi.org/10.1101/2025.11.11.687908 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Systems Biology Synthetic Biology Subject Areas All Articles Animal Behavior and Cognition (7629) Biochemistry (17660) Bioengineering (13881) Bioinformatics (41910) Biophysics (21436) Cancer Biology (18576) Cell Biology (25480) Clinical Trials (138) Developmental Biology (13368) Ecology (19887) Epidemiology (2067) Evolutionary Biology (24302) Genetics (15598) Genomics (22482) Immunology (17726) Microbiology (40360) Molecular Biology (17163) Neuroscience (88534) Paleontology (666) Pathology (2830) Pharmacology and Toxicology (4821) Physiology (7637) Plant Biology (15129) Scientific Communication and Education (2045) Synthetic Biology (4290) Systems Biology (9817) Zoology (2269)
Text is read by the "Ask this paper" AI Q&A widget below.
Extraction quality varies by source — PMC NXML preserves structure
cleanly, OA-HTML may include some navigation residue, and OA-PDF can
have broken hyphenation. The publisher copy
(via DOI)
is the canonical version.