One model to rule them all: unification of voltage-gated potassium channel models via deep non-linear mixed effects modelling

doi:10.1101/2025.04.24.650426

One model to rule them all: unification of voltage-gated potassium channel models via deep non-linear mixed effects modelling

2025 · doi:10.1101/2025.04.24.650426

preprint OA: closed

📄 Open PDF Full text JSON View at publisher

Full text 92,476 characters · extracted from preprint-html · click to expand

One model to rule them all: unification of voltage-gated potassium channel models via deep non-linear mixed effects modelling | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results One model to rule them all: unification of voltage-gated potassium channel models via deep non-linear mixed effects modelling View ORCID Profile Domas Linkevicius , Angus Chadwick , Melanie I. Stefan , View ORCID Profile David C. Sterratt doi: https://doi.org/10.1101/2025.04.24.650426 Domas Linkevicius 1 Institute for Adaptive and Neural Computation, School of Informatics, University of Edinburgh , Edinburgh, United Kingdom Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Domas Linkevicius For correspondence: domas.l{at}proton.me Angus Chadwick 1 Institute for Adaptive and Neural Computation, School of Informatics, University of Edinburgh , Edinburgh, United Kingdom Find this author on Google Scholar Find this author on PubMed Search for this author on this site Melanie I. Stefan 2 Faculty of Medicine, Medical School Berlin , Berlin, Germany Find this author on Google Scholar Find this author on PubMed Search for this author on this site David C. Sterratt 1 Institute for Adaptive and Neural Computation, School of Informatics, University of Edinburgh , Edinburgh, United Kingdom Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for David C. Sterratt Abstract Full Text Info/History Metrics Preview PDF Abstract Ion channels are essential for signal processing and propagation in neural cells. Voltage-gated ion channels permeable to potassium (K v ) form one of the most prominent channel families. Techniques used to model the voltage-dependent gating of K v channels date back to Hodgkin and Huxley (1952). Different K v types can display radically different kinetic properties, requiring different mathematical models. However, the construction of Hodgkin-Huxley-like (HH-like) models is generally complex and time consuming due to the number of parameters, their tuning and having to choose functional forms to model gating. In addition to the between-K v type heterogeneity, there can be significant within-K v type kinetic heterogeneity between different cells with genetically identical channels. Since HH-like models do not account for such variability, extensions to it are necessary. We use scientific machine learning (SciML), the integration of machine learning methodologies with existing scientific models, and non-linear mixed effects (NLME) modelling to bypass the limitations of HH-like modelling. NLME is a modelling methodology that takes into account both within- and between-subject variability. These tools allowed us to complement the HH-like modelling and construct a unified SciML HH-like model that fits the recordings from 20 different K v types. The unified SciML HH-like model produced closer fits to the data compared to a set of seven previous HH-like models and was able to represent the highly heterogeneous data from different cells. Our model may be the first step in producing a SciML foundation model for ion channels that would be capable of modelling the gating kinetics of any ion channel type. Author summary Ion channels are complex molecules embedded in the membranes of neurons – the cells responsible for signal propagation and processing in the brain. Ion channels can open and close in response to various types of stimuli, in particular the voltage difference across the cell membrane. Computational modelling, usage of mathematical techniques to represent a system and algorithmically solve for its dynamics, has been previously used to understand the dynamics of voltage-gated ion channels. However, computational modelling of voltage-gated ion channels requires costly and complex optimization routines to optimize their structure and parameters. We utilize two tools new to the modelling of voltage-gated ion channels – scientific machine learning and non-linear mixed effects modelling – to bypass some limitations associated with the existing methods. By using scientific machine learning and non-linear mixed effects modelling we were able to create a unified model capable of modelling the gating dynamics of 20 different ion channels. This is in stark contrast to the existing modelling approaches, where each channel requires its own model. Moreover, our unified model performed better than seven existing ion channel gating models. Therefore, the tools we used and the model we created is a significant step forward in facilitating the modelling of ion channel gating. Future work could include even more ion channels types within the scope of our unified model. Introduction Ion channels are ubiquitous in cellular membranes and essential for various forms of signal transduction. There are multiple different mechanisms by which ion channels can be activated, such as different ligands, mechanical stimulation, and voltage, whereas some channels are passively open [ 1 ]. Voltage-gated ion channels are important because they are one of the main means of signal conduction in the nervous system and neural cells [ 2 , 3 ]. An important feature of voltage-gated ion channels is their permeability to one dominant ion type, with sodium, potassium and calcium being the most prominent [ 1 ]. Moreover, even among voltage-gated channels that are permeable to the same ion, there is significant functional and structural heterogeneity [ 4 ]. For example, there are 40 different voltage-gated potassium channels expressed in the mammalian brain, divided into 12 subfamilies called K v 1-12 [ 5 ]. Different voltage-gated ion channel types show different voltage dependencies, making their role in electrical signalling functionally distinct, yet overlapping [ 6 ]. One way to understand the functional complexity resulting from the abundance of different voltage-gated ion channel types is computational modelling. Mathematical models of ion channels found in the central nervous system can be used in compartmental models of neurons to elucidate the importance and interactions between various channel types, as well as the interaction between electrical and biochemical signalling [ 7 , 8 ]. One of the most prominent and widespread paradigms of voltage-gated ion channel modelling was first published in the pioneering work of Hodgkin and Huxley [ 2 ]. Hodgkin and Huxley used various experimental manipulations to characterize the voltage dependencies of the sodium and potassium channel gating in the squid giant axon. The essence of their method is computational modelling of hypothesised gating variables via differential equations. Following the notation in [ 9 ], two voltage-dependent functions describe the dynamics of the i th gating variable m i : the steady-state probability of the gate being open m i ,∞ ( V ) and the time-constant of the kinetics τ i ( V ), where V is the membrane potential. These functions are used in an ordinary differential equation system which can be solved numerically to obtain the dynamics of the gating variables over time m i ( t ). The gating dynamics can then be used to obtain the current conducted over time I ( t ). There are many possible functional forms used for m i ,∞ ( V ) and τ i ( V ) (see various models in https://modeldb.science/ [ 7 ] for examples). Even though the HH modelling paradigm was a breakthrough, its application can be complex: 1) finding and tuning the parameters of the often numerically unstable functional forms of m i ,∞ ( V ) and τ i ( V ) that can easily exhibit extreme behaviours; 2) setting up an appropriate m i structure often requiring either expensive discrete optimization routines or manual hand-tuning; 3) assumption of independence between the gating variables that may make it difficult to fit the data. The first two difficulties are not unique to the HH paradigm, they also apply if Markov models, which are a generalization of the kinetic schemes used by Hodgking and Huxley [ 2 ], are used. Markov models offers more flexibility, but can often result in parameter and kinetic scheme structure unidentifiablity [ 10 ]. The difficulties of the Hodgkin-Huxley model were highlighted with the publication of a data set described in Ranjan et al. [ 4 ]. The data recorded by Ranjan et al. [ 4 ] (see https://channelpedia.epfl.ch/expdata ) contains automated voltage-clamp recordings of 40 different K v channels, one at a time expressed in CHO cells. They used a set of voltage-clamping protocols to probe the activation, inactivation, deactivation and recovery of K v channels, as well as their response to ramp and action potential-like stimuli. One of the key insights from the Ranjan et al. [ 4 ] data is the inherent kinetic heterogeneity of some K v subtypes: even though the K v channels expressed in the cells were genetically the same, the recordings showed significant variability for some channel types, e.g. for K v 1.3 or K v 3.4. The data showed variability in what using the HH paradigm would be modelled as m i ,∞ , as well as τ i . The challenge posed by the data in Ranjan et al. [ 4 ] to the HH and Markov paradigms is that the basic models have one set of parameters and are not built for handling heterogeneity, i.e., different functional forms for m i ,∞ ( V ) and τ i ( V ) and number of gates m i with different functions may be required for different cells. Fitting a model to a single current recording is a challenging task; fitting many such models via the classical HH paradigm may be prohibitively expensive. Although there are purpose-built approaches to identifying the Markov gating structure of a given current recording [ 11 ], to the best of our knowledge, no approach currently used in computational neuroscience can efficiently handle the challenge of data heterogeneity. To address the challenge of heterogeneous channel behaviour, we apply modelling tools used in pharmacokinetics and pharmacodynamics (PK/PD), where heterogeneous populations of patients and complex dynamics are commonplace. The nonlinear mixed effects (NLME) modelling [ 12 ] framework is common in PK/PD literature and is well-suited to model complex dynamics in heterogeneous populations. NLME is a hierarchical framework with the population level parameters (fixed effects) at the highest level and individualized parameters (random effects) at the lowest level (see Figure 2 ). This structure allows to both individualize predictions in the presence of significant individual differences (for example, people in clinical trials), as well as extract average, population level models useful for future predictions. Moreover, the NLME approach allows for arbitrary nonlinear functions to be used, so long as the gradient vectors with respect to both fixed and random effects can be calculated. NLME modelling has been applied widely in PK/PD (e.g. see [ 13 ]), and infectious disease modelling [ 14 ], but it is also gaining popularity in other domains, for example, individualized predictions of mood [ 15 ], repeated measurements of individualized gaze estimation [ 16 ] and many other applications where the hierarchical structure is more faithful to reality than a single level structure. Download figure Open in new tab Fig 1. Visual representation of data processing pipeline. Each row represents the processing undertaken by some sample sweeps for each protocol: top row – activation, second row – deactivation, third row – inactivation, fourth row – recovery. The legends for each row are given in the last column. The plot for MAPE exclusion for the activation protocol is not shown because this step is not applied to the activation protocol. The down-sampling was not applied to the deactivation protocol because MAPE > 0.05. The normalization and rescaling column contains the relevant activation trace to which the other protocols were rescaled to. Download figure Open in new tab Fig 2. Visual representation of an NLME model, rectangle nodes in the top box denote parameters (fixed effects), circles denote random quantities which are either latent (unfilled) or observed (filled), diamonds are deterministic given the inputs, and nodes without a border are constant. Given nonlinear functions powerful enough to model any m i ,∞ ( V ) and τ i ( V ) present in the data and enough gates m i , the NLME approach would serve as a suitable tool to handle the heterogeneity observed in the Ranjan et al. [ 4 ] data. We use NLME and neural networks, which are universal function approximators [ 17 ], to represent m i ,∞ ( V ) and τ i ( V ) and fit a single HH-like model for all K v channels for which Ranjan et al. [ 4 ] provide data. We first fit a unified K v channel model by pooling data from different channel types into a single data set, relying on the power of neural networks to provide functional flexibility and the random effects to capture the heterogeneity present in the data. We then utilize the channel type and recording temperature information of individual recordings to predict a portion of variability inherent to the channel type and temperature that was initially captured by the random effects. This step also allows the derivation of average models for different K v types. We then compare our unified model performance against multiple existing single channel model baselines. We show that the predictions of our unified model result in lower RMSE values than ones from models used in existing publications, even if random effects are added to their parameters. This comparison proves that our unified model that uses neural networks to represent m i ,∞ ( V ) and τ i ( V ) learns representations that can model the K v dynamics in response to protocols presented in the data more accurately than the bespoke models. Moreover, the benefits of having a unified model are shown via the superior performance of the unified model against multiple separate models using the same neural network-based approach. We hypothesize that the unified approach outperforms the multiple single channel modelling approach due to the sharing of information and between similar K v types, especially when data is more limited, and finding more universal m i ,∞ ( V ) and τ i ( V ) forms. Finally, we analyse the m i ,∞ ( V ) and τ i ( V ) functions, and the temperature dependence of different K v types. Our results are practically useful in many ways, for example, by providing a significantly simpler and more efficient way to represent different K v models, by providing a workflow of voltage-gated ion channel model development that is significantly faster and more powerful than the previously used methods and a set of heterogeneous K v channel fits that are usable in traditional computational neuroscience simulators, such as NEURON [ 18 ]. Finally, our results point to a set of new higher level possibilities, such as a unified channel model representing both potassium and sodium channels, as well as being able to more easily integrate information of how different cellular factors affect channel dynamics. Methods Raw data We downloaded the data for all cells that were classified as active by Ranjan et al. [ 4 ] for further processing locally. For a full description of the data and the recording conditions see the original publication. The raw current recording data used in this study has been downloaded in the neurodata without borders ( .nwb ) format from https://channelpedia.epfl.ch/expdata for the following 20 channel types: K v 1.1, K v 1.2, K v 1.3, K v 1.4, K v 1.5, K v 1.6, K v 1.8, K v 2.1, K v 2.2, K v 3.1, K v 3.1, K v 3.3, K v 3.4, K v 4.1, K v 4.2, K v 4.3, K v 10.1, K v 10.2, K v 12.1, and K v 12.3. These channel types were chosen based on a preliminary inspection of the number of cell recordings that showed a good signal to noise ratio in a sufficient number of recordings over different temperatures (15°C, 25°C and 35°C). Voltage-clamp protocols used in Ranjan et al The current recordings in Ranjan et al. [ 4 ] were obtained by applying (often multiple times) six voltage-clamp protocols. Each protocol began with a 100ms baseline period, where in the first 40ms each cell was held at − 80mV, then the holding voltage was set to − 90mV for 10ms and from 50ms to 100ms the voltage was set back to −80mV. After this initial baseline period, each cell was exposed to one of six voltage clamp protocols – activation, deactivation, inactivation, recovery, ramp and action potential-like stimulation – meant to probe different K v channel properties. Each protocol consisted of a specific number of sweeps where a single feature of the protocol was varied. After each sweep, the cell was held at −80mV for the final 100ms. Generally, after the initial activation protocol, the protocols in Ranjan et al. [ 4 ] were applied in a consistent order (potentially multiple times): activation, ramp, deactivation, AP, inactivation. After the repetition of these five protocols, the recovery protocol was applied, potentially multiple times. Due to the limitations of Pumas.jl (its usage is described below), which disallows continuously applied time-varying negative stimuli, we only used the first four protocols – activation, deactivation, inactivation and recovery, described briefly below; for full description, see Ranjan et al. [ 4 ]. Activation The activation protocol consists of 18 sweeps at different holding voltages meant to measure the steady state activation levels of K v channels. Specifically, after the baseline period, cells were held between −90mV and +80mV (10mV increments) for 500ms. Deactivation The deactivation protocol consists of 12 sweeps meant to probe the deactivation kinetics of K v channels. Each sweep includes two different voltage levels: during the first 300ms the cells were clamped at +70mV, whereas for the subsequent 200ms the cells were held at voltages between −80mV to +30mV (10mV increments). Inactivation The inactivation protocol consists of 12 sweeps meant to probe the inactivation kinetics of K v channels. Each sweep includes two different voltage levels. During the first 1500ms the cells were held at voltages between − 40mV to +70mV (10mV increments). Afterwards, the holding voltage is switched to +30mV for 100ms. Recovery The recovery protocol consists of 16 sweeps intended to investigate the kinetics of K v recovery after activation. For the first 1500ms the cells were held at +50mV to induce channel activation and, potentially, inactivation. Then, each cell was held at − 80mV for a time period ranging between 50ms to 2300ms (150ms increments) during which the channels recovered. Finally, the cells were held at +50mV for 200ms to measure the levels of channel recovery after the recovery period. Data processing In order to make the data in Ranjan et al. [ 4 ] suitable for model training we undertook a series of data processing steps ( Figure 1 ). First, we filtered out inconsistent data. We then applied a time series smoothing algorithm to reduce the noise levels, followed by setting the current baseline to 0, normalization of the current, rescaling, exclusion of systematic data artifacts and downsampling. All data processing, modelling and analyses in this paper were performed using the Julia v1.10.4 programming language [ 19 ]. Filtering out inconsistent data We included only the second repetition of the activation protocol and the first repetition of each other protocol for further processing instead of averaging the different repetitions. We chose this approach due to frequent inconsistencies of current amplitudes or time constants between subsequent repetitions. We assumed that the earlier repetitions are of higher quality due to suffering from rundown less. First, we visually inspected the second repetition of the activation protocol for all of the cells and if any systematic irregularities were detected, we manually excluded the cells from further usage. This left a total of 2969 cells for further processing. For a more detailed summary of the number of sweeps left after the data processing see Table 1 . View this table: View inline View popup Download powerpoint Table 1. Number of sweeps of the data remaining after filtering of inconsistent data and irregularities. Since the activation sweeps were recorded first, we treated them as the standard reference point against which subsequent data is to be compared and scaled to. We compared the sweeps from other protocols to the relevant parts of the activation protocol using the mean absolute percentage error (MAPE), where m is the length of the time series being compared, x is the reference time series and y is the time series being evaluated: Using cell and sweep-specific references we then excluded any subsequent sweeps that were not consistent with the relevant activation sweep according to the following criteria: Deactivation – after the initial baseline period of 100ms, for the next 300ms in all sweeps in the deactivation protocol the cells are held at +70mV. If after setting the baseline to 0 (by subtracting the mean of the current during the first 40ms of the baseline period), and scaling of the peak current to match the activation protocol peak at +70mV, MAPE > 0.05, the sweep is not used. Inactivation – after the initial baseline period of 100ms, cells are held at voltages ranging from − 40mV to +70mV, which is a subset of the voltages used in the activation sweeps. Therefore, we took the first 500ms post-baseline from the inactivation sweeps and the activation sweeps held at the same voltage. We then set both of their baselines to 0 (by subtracting the mean of the current during the first 40ms of the baseline period) and scaled both inactivation and activation sweeps by the ratio of the activation peak at +80mV divided by the peak of the respective sweep (inactivation or activation). If MAPE > 0.05 for the inactivation protocol compared against the matching activation protocol, the inactivation sweep was not used. We chose to scale both sweeps to the activation peak at +80mV, which introduces a systematic bias, instead of the peak at the matching activation voltage to avoid introducing additional noise which often resulted in inconsistencies in inactivation peaks, where clamping to lower voltages resulting in higher current peaks compared to higher voltages. Recovery – after the initial baseline period of 100ms, cells are held at +50mV for the first 1500ms. Therefore, we took the first 500ms of that 1500ms and compared against the 500ms of activation protocol at +50mV. We set the baseline of both sweeps to 0, scaled both sweeps by the ratio of activation peak at +80mV divided by the peak of the given sweep and calculated the MAPE values. Moreover, there were multiple cases where the recovery sweeps were internally inconsistent; some traces showed significantly different current values at the end the 1500ms. Therefore, we calculated the median current value at 1500ms post-baseline over all the sweeps of a given cell and we used recovery sweep only if MAPE < 0.05 and the current value at 1500ms post-baseline was within one standard deviation of the median. These consistency checks were necessary to ensure that we kept only the sweeps that were internally consistent with the activation sweeps, for example there were no significant differences in time constants or large recording artifacts, etc. Usage of inconsistent data would have significantly hampered model training by requiring additional model mechanisms capable of accounting for the inconsistencies. Smoothing After the filtering of the sweeps inconsistent with the second repetition of the activation protocol, we smoothed the data using the Julia KissSmoothing.jl v1.0.8 package (see https://github.com/francescoalemanno/KissSmoothing.jl ). It implements a smoothing function called denoise which transforms the signal using the discrete cosine transform and convolves it with an Gaussian function (similar to the method outlined in [ 20 ]). We use denoise with default parameters, except for setting the smoothing intensity to factor=1.0 . Setting the baseline Since the raw current recordings were often offset from 0 at 80mV, when there should be no significant potassium current (due to the voltage being close to the reversal potential and channels generally being closed), we calculated the mean of the first 40ms of each sweep and subtracted it from the full sweep to set the mean during the baseline period to 0. Normalization Since we were only interested in the channel gating dynamics, we normalized each sweep by the current peak I max of activation sweep when the cell was held at +80mV. This allows us to model only the gating dynamics, reducing the number of parameters that need to be fit. Rescaling For each sweep of each protocol other than activation, it was rescaled by ratio of the matching activation sweep peak current divided by the given sweep peak current before normalization by I max . Concretely, each sweep of the deactivation protocol was rescaled by the activation sweep peak when the cell is held at +70mV. Each trace of the inactivation protocol was rescaled by the matching activation sweep. Finally, each sweep of the recovery protocol was rescaled by the activation sweep peak when the cell is held at +50mV. Excluding systematic recording artifacts A significant number of sweeps showed fast negative deflection artifacts whenever voltage-clamping level was changed. This behavior does not arise from channel gating dynamics, therefore, after taking the previously described data processing steps, we excluded any points that are more negative than − 0.01. This is to avoid the model being penalized for not fitting the data it by construction can not reproduce. Down-sampling of sweeps In order to speed up model training we down-sampled all the sweeps by using the M4 down-sampler. The M4 down-sampler was chosen because of its simplicity, efficiency and preservation of extrema [ 21 ]. More specifically, for a given time-series x and number of bins b , the M4 down-sampling algorithm starts by dividing x into b non-overlapping bins and then takes the first and the last values in that bin, as well as the maximal and the minimal remaining values. Therefore, the M4 down-sampler reduces the length of a time-series from the initial length k to 4 b . Each initial 100ms baseline recording was reduced from 1000 to 9 points: 3 points from the first 40ms, 3 points from 40ms to 50ms and 3 points from 50ms to 98ms, all spaced equidistantly within each of these periods. The final 100ms was also down-sampled to 3 equidistant points. For the activation protocol, the 4000 points starting from 100ms to 600ms were down-sampled to 120 points. For the deactivation protocol, the 3000 points between 100ms to 400ms were down-sampled to 72 points, while the points between 400ms to 600ms were down-sampled to 48 points. For the inactivation protocol the 15000 points between 100ms and 1500ms were down-sampled to 360 points, whereas the 1000 points between 1600ms to 1700ms were down-sampled to 24 points. Finally, for the recovery protocol, the 15000 points between 100ms and 1600ms were down-sampled to 360 points, the period between the initial +50mV and the test +50mV that was of variable length was down-sampled to 3 points spaced equidistantly, and the second +50mV period of 150ms was down-sampled to 48 points. Down-sampling was the final step of our data processing pipeline. The data remaining at this point was split into training, validation and test data sets (described below). The full raw and the processed data are available to be downloaded at [ 22 ]. Next we move on to describe the general nonlinear mixed effects modelling approach. Nonlinear mixed effects (NMLE) modelling We adapt the definitions of NLME provided in [ 23 , 24 ]. The NLME modelling framework comprises a two level hierarchical structure ( Fig 2 ) with fixed effects Θ at the upper level which do not vary between recorded entities. Fixed effects can be broadly grouped into model parameters θ random effect prior distribution parameters Ω observation model noise parameters σ The lower level consists of random effects η n which account for the inter-individual variability of the observations by individualizing the model parameters θ for the n th individual. In this study the inter-individual variability is between the recorded currents y n for the n th cell. Furthermore, a set of covariates Z n (which are known at the outset) are associated with the n th cell, namely, the temperature of the recording (but see below), as well as the channel type. These three sets of values (Θ, η n and Z n ) are collated via the parameter model g (note the similar but distinct notation for the maximal channel conductance) into the dynamical parameter vector p n of the n th cell The dynamical parameters p n are then fed into the structural model (e.g. an ordinary differential equation (ODE) system) where u n are the dynamical variables being solved for, e.g. the gating variables in the Hodgkin-Huxley formalism. The final step is to link the numerical solution of the ODE system to the experimentally observed quantities y nj , where j denotes the number of different observed quantities for the n th individual. In this study the only observable quantity is the recorded normalized current defined in Equation 10 . After numerically solving Equation 3 , the appropriate variables are derived and passed through a Gaussian observational model to account for observational noise, giving y nj (in this study there is only one observed quantity, therefore j is omitted) where is defined in Equation 10 . In all following equations the dependence of y n on time will be omitted to reduce visual clutter. There are many ways to fit NLME models, both frequentist and Bayesian [ 25 ]. In this study we used both the maximum a posteriori (MAP) conditional log-likelihood objective which can be stated as as well as the maximum a posteriori (MAP) first order conditional estimate (FOCE) of the marginal likelihood [ 9 ] with the random effects for individual cells set to their empirical Bayes estimate (EBE n values defined as In both definitions Θ * is the mode of the fixed effects and p (Θ) is the fixed effect prior distribution. We specify how we used both of these objectives below. K v channel models In this study we use four types of models which we evaluate and fit to the Ranjan et al. [ 4 ] data, all of which follow the general HH equations for the gating variables m i which form the function f in Equation 3 : These equations can be solved numerically to obtain the current I ( t ) conducted by the channels over time. I ( t ) is the product of the gating variables m i ( t ), the maximum channel conductance , the ionic reversal potential E and the gating variable power n i Since we are only interested in the channel gating dynamics captured by m i , instead we derive the normalized current where and by definition. We next describe the four types of HH models that we used, which differ in their scope, the functional forms used for m i ,∞ ( V ) and τ i ( V ), the inclusion of the gating power n i and the inclusion of random effects. The first model type, which we call the classical HH models, is a set of K v models from https://modeldb.science/ . Since a systematic evaluation of existing K v channel models is outside the scope of this work, we selected a number of models based on preliminary tests of their quality of fitting the Ranjan et al. [ 4 ] data for the K v channel being modelled. The K v channels for which we found reasonably good baseline models are K v 1.1 [ 4 ], K v 1.2 [ 26 ], K v 1.5 [ 27 ], K v 3.1 [ 28 ], K v 3.3, K v 3.4 and K v 4.3 which are all from [ 29 ] (see respective publications for specific model structure). The classical HH models serve as the exemplars of the class of models that are currently among the most prominent in computational neuroscience. Since none of the classical HH models included random effects, in addition to the original models, we also analysed the same models with random effects added on their parameters. We used a standard multivariate Gaussian random effect prior and only fitted the EBE n for these models using the FOCE objective (see Eq. 6 ). Addition of random effects allowed for a fairer comparison with the next two types of models and the baseline models, helping to isolate the impact of using alternative functional forms for m i ,∞ ( V ) and τ i ( V ). We call this group of models the classical HH models with random effects. Our third model type is the individual SciML HH models. For this model type, we use neural network-based m i ,∞ ( V ) and τ i ( V ) functions. The models follow the classical HH formalism from Equation 8 , but in this case and where V is voltage, η i,f are the random effects for the appropriate function f, θ i ,∞ and θ i,τ are neural network weights and biases of the i th respective neural network, and are specific types of neural network architecture and T n is the normalized temperature for the n th cell. Specifically, is capped off with a sigmoid nonlinearity and outputs in the range of (0, 1), whereas is capped off with a softplus nonlinearity and outputs in the range of (0, ∞). For all models we used i = 2 gates, therefore there were four vectors of neural network weights per model for a K v type, where each neural network had two hidden layers of 5 units each with L1 regularization of the weights with λ = 10 −4 . Moreover, we used 8 random effects, two for each function. The fourth type of model we use is the unified SciML HH model. This model type is used to model all of the K v types via the same set of fixed effects Θ, largely following the neural network-based and functions used in the individual SciML HH models (including the same hyper-parameters). However, in this case the random effects η i,f contain two components, the truly random effects η * and the augmentation random effects η † which are added element-wise, i.e. .The augmentation random effects for the n th cell are based on the channel type c n (encoded as a 19 dimensional one-hot vector), as well as the normalized temperature ,assuming that the temperature is a noisy estimate of the true temperature by adding a random effect η temp ∼ 𝒩 (0, 1). The observation that the temperature is a noisy estimate is based on the recordings of the electrode tip temperature available in the original data set. We then pass the channel type vector and the normalized temperature to an augmentation neural network where θ aug is the set of neural network weights. This model structure allows the inherent heterogeneity present in the data to be accounted for, while capturing the portion of its variance attributable to different K v types and temperatures via NN aug . Data splitting into training, validation and test data sets For the individual SciML HH model training we split the processed data using a 60% / 20% / 20% fraction for training, validation and test. We took the appropriate fractions from each temperature for each channel type, rather than pooling the temperatures together. The validation and test data derived in this fashion were used for the validation and testing of all model types. However, the training data set for the unified SciML HH model, due to its size, required a different approach. For the unified SciML HH model, we took seven cells for each of the three measured temperatures for each channel type, except for K v 1.8, K v 4.2, K v 12.3. We took seven cells because that was the maximal number of cells that we could take for each channel type such that the resulting data set would be balanced for each temperature and each channel type. This resulted in 357 cells in the training data. We left K v 1.8, K v 4.2, K v 12.3 out of the training data in order to establish whether the unified SciML model could generalize to channel types which were not in the training data set. Model fitting We use the Pumas.jl [ 23 ] and DeepPumas.jl [ 30 ] Julia packages to solve Equations 5 and 6 . Pumas.jl contains efficient and powerful algorithms for NLME modelling, whereas DeepPumas.jl contains the code infrastructure necessary to incorporate neural networks into the NLME modelling. More specifically, it implements algorithms to solve equations 6 , 5 and 7 and uses forward-model automatic differentiation to allow gradient-based optimization techniques. We used the BFGS optimization algorithm from Optim.jl with the gradient calculations handled by Pumas.jl and DeepPumas.jl . Both the classical HH models with random effects and the individual SciML HH type models were fit to the individual K v channel type data, whereas the unified SciML HH model was fit to a unified data set described earlier. For the classical HH models with random effects, we fixed the θ and the Ω values and only fit the σ and the η n values to data. All fitting was done on the JuliaHub ( https://juliahub.com/ ) cloud computing platform using nodes with 8 vCPUs and 64GB of memory. Fits took between three and twenty-four hours, depending on the K v type and the amount of data which was used. All the code that was used to define the models, run the simulations and perform the analysis is accessible at https://github.com/dom-linkevicius/SciMLHHModels.jl.git . The first stage of fitting was shared between the individual and the unified SciML HH models. In the first step of the fitting we used the conditional likelihood objective ( Eq. 5 ) to produce an initial fit of all of the fixed effects, except for the parameters of the random effect prior Ω which was initialized to be standard normal and was held constant throughout this step of the optimization. We ran the optimization for 300 epochs, saving the results every 15 epochs, evaluating the model performance on the validation data and selecting the set of parameters that had the best performance on the validation data. Conditional likelihood is much more numerically efficient due to Θ and η n being optimized jointly whereas, for example, marginal likelihood generally requires a two level optimization scheme. However, conditional likelihood requires appropriate handling of Ω to avoid overly broad random effect distributions which barely penalize extreme η n values and effectively result in different individual models due to the learning being offloaded mostly to the random effects. In the second stage, which was only applied to the unified SciML HH model, we held all of the fixed effect values constant, except for the random effect prior parameters Ω. Then we used the FOCE objective ( Equation 6 ) to fit the Ω. We ran the optimization for 10 iterations. The objective changed very minimally during the 10 iterations (so the quality of the data fit did not change), but the values in Ω were adjusted appropriately. Since the data fitting quality does not change in this step, we opted to omit the individual SciML HH models from this step because our main focus is on the unified SciML HH model (see Results and Discussion). This two stage optimization procedure utilizes the numerical efficiency of the conditional likelihood by first finding the neural network weights capable of representing the functions necessary to model the current conducted via the K v channels. It also safeguards against the over-fitting of the random effects by not allowing the penalty coming from the random effect prior to become negligible via Ω assuming arbitrarily large values. The second step in the optimization pipeline only optimizes Ω using an approximation to the marginal likelihood. This step is meant to calibrate the spread of the random effects in order to properly account for the inherent heterogeneity present in the data that is not due to the differences in temperature or channel types. Under ideal circumstances of large enough compute capabilities, joint fitting of all the fixed effects using only marginal likelihood would be preferable, but was not feasible in the present study. Results As described in detail in the Methods, we fitted two novel types of HH models to voltage clamp data from 20 K v channels collected by Ranjan et al. [ 4 ] and compared them against a set of classical HH models with and without random effects. The first set of seven classical HH models for different K v types was taken from the literature (see Methods). The second set of models was produced by taking the models from the first set and adding random effects on their parameters. The third set of 20 models was produced by using neural networks to represent the voltage-dependent gating functions m i ,∞ ( V ) and τ i ( V ) and we call it the individual SciML HH models. The final model again used neural networks to represent m i ,∞ ( V ) and τ i ( V ), but it was fitted to a joint data set of different K v channels, we call this model the unified SciML HH model. We present the results of both the individual and the unified SciML HH models that we fit, along with the performance of the classical HH models and the classical HH models with random effects. We only show the results of the best performing models found during the optimization. For more detailed results of model selection see S1 Appendix. Fig 3 shows the comparison of the different types of HH models for one example channel, K v 1.1, chosen because Ranjan et al. [ 4 ] compare a model for this channel to their data. The four leftmost plots in Fig 3 show the normalised voltage clamp currents (see Methods) for 10 sweeps of the activation protocol at +80mV (black lines) along with the respective model predictions (blue – unified SciML HH, yellow – individual SciML HH, green – classical HH without random effects, pink – classical HH with random effects. Visually, there is a clear difference between the fits for the SciML HH models and the HH models, with the classical HH models performing poorly, the SciML HH models fitting the data reasonably well. The box plots (rightmost plot in Fig 3 ) of the root mean square error (RMSE) show that the SciML HH models significantly outperform the classical HH models with or without random effects (for statistical test results see Table 2 ). The individual SciML HH model significantly outperforms the unified SciML HH model, but the size of the difference is small ( Table 2 ). View this table: View inline View popup Download powerpoint Table 2. Comparison of performance between different models on the test data set. Download figure Open in new tab Fig 3. Comparison of the four different HH model types for the K v 1.1 channel. Left-most panel shows box plots of the test data RMSE values (at the sweep level, e.g. activation at +80mV). The next four plots show 10 activation sweeps at +80mV (from different cells) from the test data set (black) and the matching model predictions (coloured lines), providing a visual link between the RMSE values in the box plot and traces. The classical HH model without random effects (green line) displays variance because even though the model parameters do not have random effects on them, the temperature used in it does. Fig 4 shows the (RMSE) box plots for different model predictions compared to normalised voltage clamp current at the protocol sweep level for individual channel types. The four types of models – unified SciML HH (blue), individual SciML HH (yellow), classical HH without random effects (green) and classical HH with random effects (pink) display a consistent pattern of performance across different K v channel types. Download figure Open in new tab Fig 4. RMSE box plots obtained by comparing the data against model predictions at the sweep level, e.g. Activation protocol at − 10mV. Different colours represent different HH model types: blue – unified SciML HH model, yellow – individual SciML HH models, green – classical HH models re-implemented from existing publications without random effects, pink – classical HH models re-implemented from existing publications but with random effects on their parameters. The number of different cells in the test data set is denoted by n and shown above each subplot. The channel types (K v 1.8, K v 4.2 and K v 12.3) not used in the training of the unified SciML HH model have a light red background to distinguish them from the rest. Note that outliers are not shown and the y axes are not identical between different subplots to enhance legibility. Firstly, the comparisons between the classical HH models with and without random effects confirms the utility of the NLME approach in modelling the K v channel data of Ranjan et al. [ 4 ]. In all seven cases (K v 1.1, K v 1.2, K v 1.5, K v 3.1, K v 3.3, K v 3.4 and K v 4.3) of the implemented classical HH models, the version of the model with random effects significantly outperformed the version without the random effect (see Table 2 for more details). Secondly, comparing the individual SciML models against the classical HH models with random effects allows us to determine which model contains more appropriate functional forms for modelling the K v currents. The functions used to model the gating variables in the classical HH models are constructed by hand and in some cases with biophysical support. We hypothesised that neural networks offer a more flexible and more powerful approach to constructing gating variable functions than the classical approach. As shown in Fig 4 and in Table 2 , the individual SciML HH models fit the data significantly better than the classical HH models with random effects in all seven cases. This comparison indicates that the flexibility in the voltage-dependent gating functions of individual SciML HH models supported better fits to the Ranjan et al. data than the classical HH models. Finally, we compare the unified SciML HH model and the individual SciML HH models. Under ideal circumstances, an individualised channel model would always outperform a more unified model due to its ability to specialize on a particular K v type. However, given that the data is limited and there are similarities between the different K v channel dynamics, a unified model may offer comparable or better performance along with the possibility of generalizing to channel types on which it was not trained. As shown in Fig 4 and in Table 2 , the unified SciMLHH model outperformed the individual SciML HH models in five out of 20 cases, gets outperformed in 11 out of 20 cases and in four out of 20 cases there is no significant difference. Therefore, the individual SciML HH models outperform the unified SciML HH model on the majority of K v channel types. However, looking at the effect sizes of the differences ( Table 2 ), the differences are generally small (Cohen’s d > 0.2), except for K v 10.1 where the difference is medium (Cohen’s d > 0.5). Importantly, the unified SciML HH model performs similarly well to the individual SciML HH models on data from channel types which were not in the training data (K v 1.8, K v 4.2, K v 12.3, see Fig 4 subplots with light red background). Therefore, despite the statistically significant better performance of the individual SciML HH models in a higher proportion of cases, since the effect sizes are generally small and the unified SciML HH model offers a much more parsimonious representation of the data with the ability to generalize to K v channels on which it was not trained, we conclude that the unified SciML HH model is practically preferable to the individual SciML HH models. Therefore, we will restrict further analyses to the unified SciML HH model. We show some example unified SciML HH model predictions on the test data for channel types which were in the training data ( Fig 5 ) and channel types which were not ( Fig 6 ) to illustrate the model’s ability to generalize well. Download figure Open in new tab Fig 5. Samples of the unified SciML HH model predictions for test data for the activation protocol for a subset of channel types used in training: K v 1.1, K v 2.2, K v 3.1, K v 4.1, K v 10.1 and K v 12.1. The model predictions are plotted as black lines, whereas the empirical data is colour coded by the temperature at which it was recorded – blue for 15°C, yellow for 15°C and green for 35°C. Each subplot represents measurements from a different cell. Download figure Open in new tab Fig 6. Samples of the unified SciML HH model predictions for the activation protocol of the test data for a subset of channel types not used in training (K v 1.8, K v 4.2, K v 12.3) and therefore represent the model’s ability to generalize. The model predictions are plotted as black lines, whereas the empirical data is colour coded by the temperature at which it was recorded – blue for 15°C, yellow for 25°C and green for 35°C. Each subplot represents measurements from a different cell. Unified SciML Hodgkin-Huxley model diagnostics To evaluate the model performance in an absolute sense, rather than relative to other types of models we examine a number of diagnostics. The first set of diagnostic plots investigates the distributions of pairs of Empirical Bayes Estimates of random effects (EBEs, defined in Equation 7 ) obtained by fitting them to the test data. As shown in the pair plots in Fig 7 (subplots below the diagonal), the EBEs have a varying range of values, e.g. η 5 or η 8 are relatively more concentrated than η 1 or η 2 . However, visually there seem to be relatively few, if any, correlations between the different η s. The subplots above the diagonal show the RMSE values associated with the pairs of EBEs, and could highlight regions of EBEs which would systematically have higher errors, but no such patterns emerged. We conclude that there is no significant mismatch between the random effect prior and the posterior. Download figure Open in new tab Fig 7. Pair plots of the Empirical Bayes estimates (EBEs) of random effects obtained on the cells in the test data set. The diagonal shows the histogram and a kernel density fit to the EBE distributions. Sub-diagonal subplots show the contour plots of the distribution of pairs of EBEs. Super-diagonal subplots show the scatter plot of the pairs of EBEs with points coloured by the RMSE at the sweep level to check if certain regions of the distributions contain high RMSE points. The second set of diagnostic plots ( Fig 8 ) are classical NLME residuals diagnostics. Fig 8A shows the relationship between the model population level predictions (i.e. not for a particular cell, but for a channel type) and all the observations for that channel type. An ideal model would have a Gaussian error around the yellow y = x line, which denotes a perfect relationship between the observed values and the values predicted by the model. The unified SciML HH model shows approximately this behaviour as both the local linear fits to the contour lines (LOESS, red line) and the global linear fit (OLS, green line) are very close to the ideal line of y = x (yellow line). The error distribution exhibits some heteroscedasticity – the width of the error distribution decreases with increasing x values. However, overall, given that the heteroscedasticity is mild, we conclude that the model fits the data reasonably well at the population level. Download figure Open in new tab Fig 8. Goodness of fit visualizations for the unified SciML HH model on the test data set. Panels contain: A – observations plotted against population predictions, B – observations plotted against individual predictions, C – weighted population residuals plotted against time, D – weighted individual residuals plotted against individual predictions. Each subplot contains either two or three lines: the yellow y = x line (where x is the prediction and y are the observed values), in the top two plots shows an ideal scenario, the green line represents a global ordinary least squares (OLS) fit and the red line represents the locally estimated scatter plot smoothing (LOESS) fit to the data shown in each subplot. The contour line levels represent the log 10 (# of points + 1) (differentiated by the intensity of the contour and shown in the colour bar on the right) and are based on approximately 3 million observed data points present in the test data set. Visually, the individual predictions ( Fig 8B ) are significantly more accurate than the population level predictions ( Fig 8A ). For the individual predictions, the global and local linear fits nearly coincide with the y = x line and there is a high concentration of contour lines around the y = x line with a relatively small standard deviation. Therefore, we conclude that the individual fits obtained via the unified SciML HH model are better than the population fits. Fig 8C analyses the population level residuals weighted by the inverse standard deviation of the observation model and their dependence on time. Therefore, in this plot the residuals can be larger than 1 if a model has a small σ value in the observational model. A well-performing model would show no dependence of the residuals on time, which is nearly true of the unified SciML HH model – the local and the global linear fits (red and green lines) are virtually overlapping and are on the y = 0 line. The wider distribution of the contour plot of the residuals at earlier times might indicate that there is a higher spread of the residuals during those times. However, the length of the recording from a cell was proportional to the number of stimulation protocols and sweeps which were of high enough quality. Therefore, since a significant amount of data was filtered out, there are more shorter recordings than longer ones, and the more numerous shorter recordings will tend display larger variability than the fewer long ones. Therefore, the higher spread of the contour lines at earlier times is most likely a feature of the data used, rather than biased model performance. Finally, Fig 8D plots individual predictions against weighted residuals of individual predictions. Under ideal circumstances the plot would show a 𝒩 (0, 1) distribution around the y = 0 line. The model results show the correct mean behaviour both locally and globally (red and green lines basically overlapping), but not ideal spread that is skewed towards the negative values with a standard deviation larger than one (similar skewness can also be noted in the bottom left plot). This skewness is most likely due to the model structure and normalization of the data. The model cannot produce negative normalized currents, whereas, due to the noise inherent in the data, current values can be negative and they get up-weighted by a small σ in the observational model. Therefore, these diagnostics support the conclusion that the unified SciML model predictions are generally unbiased, both at the population and the individual cell levels. The final set of diagnostics are the visual predictive checks (VPCs) shown in Fig 9 . The VPCs are given for each sweep of each protocol to provide a more granular diagnostic of the model’s performance. For a given model VPCs a produced by sampling k random effects which produces n populations. For each population of k samples we calculate the 95% confidence intervals for the 10%, 50% and 90% quantiles of the data (shaded areas) and then plot the actual observed quantiles. If the observed quantiles fall into the simulated 95% CI of the quantiles, the model is representative of the data to which it was fit. Download figure Open in new tab Fig 9. Visual predictive checks (VPCs) for the unified SciML HH model with one subplot for each sweep of each protocol. Each subplot contains three black lines representing the 10%, 50%, 90% quantiles of the data, as well as three light blue shaded areas for the simulated 95% confidence intervals for the 10%, 50%, 90% quantiles. The red shaded areas show where the observed quantile lines are outside the simulated quantiles. Overall, the VPCs support the conclusion that the unified SciML HH model fits the population level data reasonably well. However, most likely due to the differing amounts of data available for each protocol, there are some differences between the protocols. More specifically, the activation and deactivation protocols show mostly good VPCs, whereas the inactivation and the recovery protocols show still mostly good, but somewhat worse VPCs. Specifically, for the inactivation protocol the model consistently under-predicts the 10% quantile relative to the data. Similarly for the recovery protocol, the model systematically under-predicts the 10% quantile. Therefore, the VPCs indicate that some caution is warranted when the unified SciML HH model is used to simulate channel dynamics involving inactivation or recovery, but otherwise provides general support to the quality of the population predictions of the model. We have provided three model diagnostic plots for the unified SciML HH model, investigating different, if overlapping, aspects of its performance: whether the EBEs are correlated, the residuals and the VPCs. The diagnostics lend significant support to the conclusion that the model predictions for individual cells are highly accurate and the population level predictions are reasonably accurate. Unified SciML Hodgkin-Huxley model gating function behaviour Having established the quality of the unified SciML HH model, we now investigate its properties, starting by showing the fitted m i ,∞ ( V ) and τ i ( V ) functions. We plot the fitted functions for the individual cells for the test data set in Fig 10 and the population predictions in Fig 11 . We provide both plots to illustrate the variability of the gating functions in the test data, and to show the population level predictions made for temperatures not included in the training data. Download figure Open in new tab Fig 10. Individual predictions of the m i ,∞ ( V ) and τ i ( V ) functions with the EBEs for the cells in the test data. Each column represents one plots one function and its dependence on voltage and the plot is split into two groups, the left batch of K v channels and the right batch of K v channels, indicated by the names after the fourth and the eighth columns with the number of cells n in the test data for that channel type. Most cells had data in all three temperatures – 15°C (blue), 25°C (yellow) and 35°C (green). The solid lines represent the median and the shaded area is the 95% confidence interval. Download figure Open in new tab Fig 11. Population predictions of the m i ,∞ ( V ) and τ i ( V ) functions with the η = 0. Each column represents plots for one function and its dependence on voltage and the plot is split into two groups, the left batch of K v channels and the right batch of K v channels, indicated by the names after the fourth and the eighth columns. The colour bar on the right indicates the temperature at which the functions are evaluated. The individual fitted functions ( Fig 10 ) exhibits several patterns. Firstly, m 2,∞ ( V ) approximately follows the classical sigmoidal behaviour of an activation gate, increasing in value as the voltage increases, reaching the maximal value of 1 at different voltages for different K v types. It is notable that m 2,∞ ( V ) shows a small amount of temperature dependence. The steady state behaviour of the first gating particle, m 1,∞ ( V ), however, varies between cells, displaying three clusters of behaviours. Firstly, for some channel types (K v 10.1, K v 10.2, K v 12.1 and K v 12.3) m 1,∞ ( V ) does not show significant dynamics, implying that for those channel types a single gating variable would have been sufficient. Next, a few channel types display a classical inactivating behaviour that may reach close to full (K v 1.3 and K v 3.4) or partial inactivation (K v 1.5, K v 3.1 andK v 4.3). For all remaining channels, m 1,∞ ( V ) shows a mix of inactivating behaviour at low voltages and activating behaviour at high voltages (e.g. see K v 1.8 or K v 4.2, especially at 15°C). This behaviour illustrates the flexibility of the SciML approach. This behaviour may also indicate that adding a third gating variable may provide small improvements for the channel types showing this behaviour in m 1,∞ ( V ). Contrasting τ 1 ( V ), the time constant associated with m 1,∞ ( V ), and τ 2 ( V ), the time constant associated with m 2,∞ ( V ), it is clear that τ 1 ( V ) is generally either only as fast or significantly slower than τ 2 ( V ). Therefore, the main activation represented by m 2,∞ ( V ) is fast, and the gating dynamics modelled via m 1,∞ ( V ) are slow. Generally the τ i ( V ) behave as expected when temperature is increased, in they get smaller (i.e. the equilibration is faster). Recall that if the temperature is increased, reaction rates α i ( V ) and β i ( V ) tend to increase, decreasing the time constant τ i ( V ). Contrary to the results shown in Fig 10 which are based on actual fits using η obtained from individual cells in the test data set, the plots in Fig 11 are obtained by setting η = 0 and setting temperature T ∈ [ 15 , 20 , 25 , 30 , 35 ]. Therefore, Fig 11 provides predictions in cases where no data is available, specifically at temperatures other than 15°C, 25°C and 15°C. For both m 1,∞ ( V ) and m 2,∞ ( V ) their dynamics across temperatures are monotonic, suggesting that the model may generalize reasonably to other temperatures. It is notable that τ 1 ( V ) can take various different functional forms (e.g. see K v 1.8 or K v 3.4) across temperatures. Finally, τ 2 ( V ) shows a fairly consistent functional shape with the largest differences between channel types at higher temperatures. Finally, Fig 12 shows the Q 10 ( V ) values for ratios of the gating time constant functions evaluated at 15°C and 25°C (blue lines), and the ratios of functions evaluated at 25°C and 35°C (orange lines). The most striking feature of these plots is the Q 10 ( V ) values taken for the activation time constant τ 2 ( V ), e.g. 100 at +80mV for K v 3.3 and smaller (but still large) for other channel types. These Q 10 ( V ) values significantly exceed any previously used Q 10 values (e.g. 2-4, see [ 1 ]) used in models of ion channels, as well as empirical estimates provided in [ 4 ]. The Q 10 ( V ) values for τ 1 ( V ) are better aligned with the literature. Importantly, most channel types show significant voltage dependencies for Q 10 ( V ) that can be qualitatively different between the two calculated ratios. Data measured at a set of intermediate temperatures between 15°C and 35°C may be necessary to better constrain the Q 10 ( V ) values of the unified SciML HH model. Download figure Open in new tab Fig 12. Q 10 ( V ) values obtained by evaluating the unified SciML HH model with η = 0 and calculating the ratios of the gating time constant functions τ 1 ( V ), τ 2 ( V ) values evaluated at 15°C and 25°C (blue line) as well as 25°C and 35°C (orange lines). The plot is split into two blocks (two columns each) and each row within a block is for an individual K v channel type. Discussion In this study, we employed scientific machine learning (SciML) and non-linear mixed effects modelling (NLME) to address the challenge of modelling the gating kinetics of a diverse set of voltage-gated potassium ion (K v ) channels, using data from Ranjan et al. [ 4 ]. To our knowledge, no previous work has fully modelled this dataset. Traditional Hodgkin-Huxley-like (HH) approaches to modelling ion channel gating require assumptions (or costly optimization techniques) to determine the appropriate number of gating particles, the functional forms and parameters describing the voltage dependencies of these particles, and the exponents applied to the gating particles. In contrast, we utilized the SciML framework, replacing the traditional functional forms of m i ,∞ ( V ) and τ i ( V ) with neural networks that were appropriately constrained. This allowed us to preserve the general HH framework while only assuming the number of gating particles. All other parameters were then fitted using efficient, gradient-based optimization techniques [ 23 ]. The data we fit the models to showed significant heterogeneity [ 4 ]. In addition to the expected differences in gating kinetics between distinct K v channel types, variability was also observed within cells expressing the same K v type. This within-type variability is challenging to capture with conventional methods for modelling voltage-gated ion channels. However, the NLME approach is specifically designed to account for both between-type and within-type variability by modelling the latter as random effects. We explored two distinct SciML HH modelling approaches: (i) constructing individual SciML HH models for each K v type, and (ii) developing a unified SciML HH model that accommodates all K v types for which there was data, with channel type mapped onto the random effects through an additional neural network NN aug . To assess the relative performance of the SciML HH K v models, we compared them to a set of seven previously published HH models. Since the existing HH models do not account for within-K v -type variability, we incorporated random effects into the parameters of the seven published K v channels. This enabled us to isolate the contributions of the SciML approach – i.e. the data-driven learning of voltage-dependent functions – and evaluate the impact of incorporating random effects in fitting the Ranjan et al. [ 4 ] dataset. Our comparisons demonstrated that both the addition of random effects and the use of the SciML approach independently improved the fit of the K v models to the data (see Fig 4 ). The seven existing HH models fit significantly better when random effects were added. Furthermore, the HH models with random effects were significantly outperformed by the two SciML HH models, in which neural networks represented m i ,∞ ( V ) and τ i ( V ). The next question was whether the individual or unified SciML HH approach performed better. Comparing the two approaches revealed that the individual SciML HH models generally outperformed the unified model. This result is expected, as the neural network architectures used in both approaches were identical. The individual models could specialize more effectively to the specific gating dynamics of each K v type, whereas the unified model had to account for all types. However, while the differences between the individual and unified models were statistically significant, they were generally small. Notably, the unified SciML HH model was able to generalize to three additional K v types that it was not trained on. Given the small performance differences and the advantage of parsimony, we concluded that the unified SciML HH model is preferable. It is also highly extensible to many more voltage-gated channel types. Therefore, our primary contribution is the development, validation, and analysis of the unified SciML HH model, capable of modelling the gating dynamics of at least 20 different K v channel types. There are multiple ways to fit HH models to current recordings and it is worth comparing the software used in this study ( Pumas.jl and DeepPumas.jl ) to other available software packages. For example, Data2Dynamics ( https://github.com/Data2Dynamics/d2d ) is a MATLAB-based software package capable of optimizing the reaction rates of chemical reaction networks in an efficient manner [ 32 ]. This software suite was used in an attempt ( https://github.com/njohner/Kv-kinetic-models ) to model the K v data from Ranjan et al [ 23 ]. Even though Data2Dynamics offers powerful capabilities in optimizing the reaction rates of chemical reaction networks, it does not include algorithms for the optimization of the structure of the networks. Therefore, while powerful in certain use cases, the problem tackled in this study requires a richer set of functionalities, notably usage of neural networks. Another option that is more specialized to computational neuroscience is the Python-based BluePyOpt package [ 33 ]. It has been used in studies to optimize the conductances of ion channels along the dendritic tree of a compartmental neuron model [ 34 , 35 ]. It uses a set of evolutionary algorithms to fit various parameters, such as the maximal channel conductance, distribution of conductances along a dendrite, but it can also be used to optimize the parameters that determine the kinetic properties of individual channel types. However, BluePyOpt does not directly optimize the structure of the functions used for channel gating and therefore does not offer all the functionality necessary to tackle the current challenge. Without going into an extended review of the available tools for fitting chemical reaction networks to data, based on the two aforementioned examples, we conclude that Pumas.jl and DeepPumas.jl offer some of the currently most powerful and feature complete tools and were essential in modelling the different types of K v channels. Therefore, our second contribution is the application of a novel set of approaches, SciML and NLME, to a challenge in computational neuroscience. These tools can be applied to other challenges where significant variance between observed entities is present, for example, modelling of synaptic signalling stemming from highly variable proteomic structures [ 36 ]. The creation of a unified model for 20 different K v channels represents an important first step, but there are many potential directions for future development. The most immediate and promising future direction is extending the current unified model to include recently published data [ 4 ] on other major voltage-gated ion channels (K 2P , K ir , K Ca , Na v , Ca v , and HCN). While some families of voltage-gated channels, such as Kir and Nav, should integrate smoothly into the current unified model – potentially even falling within its existing predictive range – other families with more complex gating mechanisms (e.g. K Ca and Ca v ) will require more sophisticated adaptations. For these, additional components, such as calcium dynamics, may need to be incorporated into the model. Moreover, there is no theoretical limit to the number of temporally varying signals (such as neuromodulators, drugs, etc.) that could be fed as inputs to the neural networks representing the gating functions, depending on the available data. However, practical challenges arise when adding more dimensions or inputs to the neural networks, and alternative approaches would need to be explored to assess their feasibility. One of the potential challenges for the unified SciML HH model lies in its use of one-hot encoding to represent different channel types. If this encoding is naively extended by increasing its dimension, it may lead to an augmentation neural network NN aug with too many parameters, making the model prohibitively expensive to fit. A more practical long-term solution could involve a dimensionality reduction approach, perhaps based on factors like the 3D structure of the channel or its amino acid sequence. The latent representations derived from such an encoding could then be combined with the random effects or used to replace the current one-hot vector altogether. This approach could enable the model to predict the impact of point mutations or other modifications on channel kinetics. Furthermore, encoding the 3D structure or amino acid sequence would facilitate the creation of species-agnostic ion channel models, allowing for the integration of data from different species. A similar dimensionality reduction approach could be applied to external factors affecting channel kinetics, such as neuromodulators or drugs, before passing these latent representations into the neural networks that model the kinetics. In essence, the use of a foundation model – currently popular in deep learning – could be highly beneficial for modelling ion channel gating [ 37 ]. It remains to be seen what predictive and explanatory power such a model could offer. The HH approach to modelling ion channels – where channels are represented by a number of independent gating particles – is just one of several modelling paradigms. In fact, it is a subclass of the broader Markov models, where the gating particles may not be independent. For additional modelling approaches, see [ 38 ]. Recent studies have used single-channel patch-clamp recordings combined with deep learning to infer the most likely Markov schemes underlying the recorded data [ 11 , 39 ]. Although their approaches may initially appear similar to ours, there are several key differences. Firstly, the studies by [ 11 , 39 ] rely on single-channel patch-clamp recordings, which are more challenging to obtain compared to the whole-cell patch-clamp data used in Ranjan et al. [ 4 ]. Consequently, these approaches are suited to different types of questions. For instance, if the focus is on understanding the impact of phosphorylation on the gating of individual channels, the approach taken in [ 11 , 39 ] would likely be more appropriate. However, if the goal is to model the aggregate dynamics of many channels within a large patch of membrane, our approach is likely to provide more accurate predictions. Moreover, our approach is better equipped to handle variability from different sources, such as differences in gating kinetics between cells expressing the same K v type or across different K v types. Additionally, extending the gating mechanisms to include Ca 2+ or other ligands, in addition to voltage, may present more challenges for the Markov scheme approach due to the exponential growth in the number of states. Theoretically we could take different Markov schemes and represent the voltage-dependent gating functions as neural networks, but such an approach would require significant efforts to find an appropriate Markov scheme. Therefore, the approaches in [ 11 , 39 ] and ours may be complementary. If the HH formalism proves insufficiently expressive for modelling a broader range of ion channel types, the approach of [ 11 , 39 ] could provide a more universally appropriate Markov scheme. Our approach could then be applied to model the transition rates within it. In addition to its explanatory and predictive benefits, a foundational approach to modelling ion channel gating could offer practical advantages for modellers. Current detailed compartmental models of neurons (written in e.g. NEURON ) typically require multiple files, each representing a single type of ion channel. There is an abundance of such files in various repositories and databases (notably https://modeldb.science/ [ 7 ]), but these files often differ in their underlying models, even for the same ion channel type. Determining which model is most appropriate and provides the best fit to the data can be difficult and time-consuming. However, if a well-validated foundational model were available, this problem would be significantly alleviated. The burden of creating and maintaining a large number of files for each ion channel would be greatly reduced. Our unified SciML HH model could currently be used in a NEURON .MOD file by incorporating a pre-constructed lookup table for different K v types. However, a significant challenge arises from the inability to use multiple lookup tables within the same .MOD file. Other data formats, such as NeuroML [ 40 ], may present their own challenges when attempting to port our unified SciML HH model to them. If foundation channel gating models are developed in the future, it would be important to collaborate with software developers of compartmental neural modelling simulators. In conclusion, we successfully addressed a major challenge in neuroscience: the efficient and accurate modelling of voltage-gated potassium channel gating. By combining two novel approaches in computational neuroscience – scientific machine learning and non-linear mixed effects modelling – we developed a unified model capable of fitting the gating dynamics of 20 different K v types. Our work demonstrates how these approaches can be seamlessly integrated into existing computational neuroscience approaches. Moreover, the produced unified K v channel gating model may serve as the first step in creating a next generation foundation model that would be able to model all known voltage-gated channel families. The resulting gains in predictive and explanatory power, as well as computational efficiency could help to tackle complex challenges, such as investigating diseases related to ion channels [ 41 ]. Supporting information S1 Appendix. Hyper-parameter optimization . Footnotes ↵ * David.C.Sterratt{at}ed.ac.uk References 1. ↵ Hille B. Ionic Channels of Excitable Membranes . Sinauer ; 2001 . Available from: https://books.google.co.uk/books?id=8Vk-QwAACAAJ . 2. ↵ Hodgkin AL , Huxley AF . A quantitative description of membrane current and its application to conduction and excitation in nerve . The Journal of Physiology . 1952 ; 117 ( 4 ): 500 – 544 . doi: 10.1113/jphysiol.1952.sp004764 . OpenUrl CrossRef PubMed Web of Science 3. ↵ Thorpe SJ . Spike arrival times: A highly efficient coding scheme for neural networks ; 1990 .Available from: https://api.semanticscholar.org/CorpusID:59901370 . 4. ↵ Ranjan R , Logette E , Marani M , Herzog M , Tâche V , Scantamburlo E , et al. A Kinetic Map of the Homomeric Voltage-Gated Potassium Channel (Kv) Family . Frontiers in Cellular Neuroscience . 2019 ; 13 . doi: 10.3389/fncel.2019.00358 . OpenUrl CrossRef PubMed 5. ↵ Alexander SPH , Mathie AA , Peters JA , Veale EL , Striessnig J , Kelly E , et al. British Journal of Pharmacology . 2023 ; 180 ( S2 ): S145 – S222 . doi: 10.1111/bph.16178 . OpenUrl CrossRef PubMed 6. ↵ Johnston J , Forsythe ID , Kopp-Scheinpflug C. SYMPOSIUM REVIEW: Going native: voltage-gated potassium channels controlling neuronal excitability . The Journal of Physiology . 2010 ; 588 ( 17 ): 3187 – 3200 . doi: 10.1113/jphysiol.2010.191973 . OpenUrl CrossRef PubMed 7. ↵ McDougal RA , Morse TM , Carnevale T , Marenco L , Wang R , Migliore M , et al. Twenty years of ModelDB and beyond: building essential modeling tools for the future of neuroscience ; 2017 . 8. ↵ Maler O , Halász Á , Dang T , Piazza C Sterratt DC , Sorokina O , Armstrong JD . Integration of Rule-Based Models and Compartmental Models of Neurons . In: Maler O , Halász Á , Dang T , Piazza C , editors. Hybrid Systems Biology . Cham : Springer International Publishing ; 2015 . p. 143 – 158 . 9. ↵ Walch OJ , Eisenberg MC . Parameter identifiability and identifiable combinations in generalized Hodgkin–Huxley models . Neurocomputing . 2016 ; 199 : 137 – 143 . doi: 10.1016/j.neucom.2016.03.027 . OpenUrl CrossRef 10. ↵ Fink M , Noble D. Markov models for ion channels: Versatility versus identifiability and speed . Philosophical Transactions of the Royal Society A: Mathematical, Physical and Engineering Sciences . 2009 ; 367 : 2161 – 2179 . doi: 10.1098/rsta.2008.0301 . OpenUrl CrossRef PubMed 11. ↵ Oikonomou E , Kolan R , Kern L , Gruber T , Alzheimer C , Krauss P , et al. A deep-learning approach to quasi-instantaneous Markov-modeling of ion channel gating ; 2024 . Presented as poster in FENS2024 conference . Available from: https://fens2024.abstractserver.com/program/#/details/presentations/1099 . 12. ↵ Lindstrom MJ , Bates DM . Nonlinear Mixed Effects Models for Repeated Measures Data ; 1990 . Available from: https://www.jstor.org/stable/2532087?seq=1&cid=pdf- . 13. ↵ Lee JL , Mohamed Shah N , Makmor-Bakry M , Islahudin F , Alias H , Mohd Saffian S. A systematic review of population pharmacokinetic analyses of polyclonal immunoglobulin G therapy . International Immunopharmacology . 2021 ; 97 : 107721 . doi: 10.1016/j.intimp.2021.107721 . OpenUrl CrossRef PubMed 14. ↵ Adéoti OM , Agbla S , Diop A , Glèlè Kakaï R. Nonlinear mixed models and related approaches in infectious disease modeling: A systematic and critical review . Infectious Disease Modelling . 2025 ; 10 ( 1 ): 110 – 128 . doi: 10.1016/j.idm.2024.09.001 . OpenUrl CrossRef PubMed 15. ↵ Wörtwein T , Allen NB , Sheeber LB , Auerbach RP , Cohn JF , Morency LP . Neural Mixed Effects for Nonlinear Personalized Predictions . In: Proceedings of the 25th International Conference on Multimodal Interaction. ICMI ‘23 . New York, NY, USA : Association for Computing Machinery ; 2023 . p. 445 – 454 . Available from: https://doi.org/10.1145/3577190.3614115. 16. ↵ Xiong Y , Kim HJ , Singh V. Mixed Effects Neural Networks (MeNets) With Applications to Gaze Estimation . In: 2019 IEEE/CVF Conference on Computer Vision and Pattern Recognition (CVPR) ; 2019 . p. 7735 – 7744 . 17. ↵ Hornik K , Stinchcombe M , White H. Multilayer feedforward networks are universal approximators . Neural Networks . 1989 ; 2 ( 5 ): 359 – 366 . doi: 10.1016/0893-6080(89)90020-8 . OpenUrl CrossRef Web of Science 18. ↵ Awile O , Kumbhar P , Cornu N , Dura-Bernal S , King JG , Lupton O , et al. Modernizing the NEURON Simulator for Sustainability, Portability, and Performance . Frontiers in Neuroinformatics . 2022 ; 16 . doi: 10.3389/fninf.2022.884046 . OpenUrl CrossRef 19. ↵ Bezanson J , Edelman A , Karpinski S , Shah VB . Julia: A fresh approach to numerical computing . SIAM Review . 2017 ; 59 ( 1 ): 65 – 98 . doi: 10.1137/141000671 . OpenUrl CrossRef PubMed 20. ↵ Savitzky A , Golay MJE . Smoothing and Differentiation of Data by Simplified Least Squares Procedures . Analytical Chemistry . 1964 ; 36 ( 8 ): 1627 – 1639 . doi: 10.1021/ac60214a047 . OpenUrl CrossRef 21. ↵ Jugel U , Jerzak Z , Hackenbroich G , Markl V. M4: a visualization-oriented time series data aggregation . Proc VLDB Endow . 2014 ; 7 ( 10 ): 797 – 808 . doi: 10.14778/2732951.2732953 . OpenUrl CrossRef 22. ↵ Linkevicius D , Chadwick A , Stefan MI , C Sterratt D. Raw and processed data used in the publication “One model to rule them all: unification of voltage-gated potassium channel models via deep non-linear mixed effects modelling” ; 2025 . Available from: addurl. 23. ↵ Rackauckas C , Ma Y , Noack A , Dixit V , Mogensen PK , Elrod C , et al. Accelerated Predictive Healthcare Analytics with Pumas, A High Performance Pharmaceutical Modeling and Simulation Platform . bioRxiv . 2022 ; doi: 10.1101/2020.11.28.402297 . OpenUrl Abstract / FREE Full Text 24. ↵ Duchesne R , Guillemin A , Gandrillon O , Crauste F. Practical identifiability in the frame of nonlinear mixed effects models: the example of the in vitro erythropoiesis . BMC Bioinformatics . 2021 ; p. 1 – 21 . doi: 10.1186/s12859-021-04373-4 . OpenUrl CrossRef 25. ↵ Lee SY . Bayesian Nonlinear Models for Repeated Measurement Data: An Overview, Implementation, and Applications . Mathematics . 2022 ; 10 ( 6 ). doi: 10.3390/math10060898 . OpenUrl CrossRef 26. ↵ Shen W , Hernandez-Lopez S , Tkatch T , Held JE , Surmeier DJ . Kv1.2-Containing K+ Channels Regulate Subthreshold Excitability of Striatal Medium Spiny Neurons . Journal of Neurophysiology . 2004 ; 91 ( 3 ): 1337 – 1349 . doi: 10.1152/jn.00414.2003 . OpenUrl CrossRef PubMed Web of Science 27. ↵ Masoli S , Solinas S , D’Angelo E. Action potential processing in a detailed Purkinje cell model reveals a critical role for axonal compartmentalization . Frontiers in Cellular Neuroscience . 2015 ; 9 . doi: 10.3389/fncel.2015.00047 . OpenUrl CrossRef PubMed 28. ↵ Wang LY , Gan L , Forsythe ID , Kaczmarek LK . Contribution of the Kv3.1 potassium channel to high-frequency firing in mouse auditory neurones . The Journal of Physiology . 1998 ; 509 ( 1 ): 183 – 194 . doi: 10.1111/j.1469-7793.1998.183bo.x . OpenUrl CrossRef PubMed Web of Science 29. ↵ Beining M , Mongiat LA , Schwarzacher SW , Cuntz H , Jedlicka P. T2N as a new tool for robust electrophysiological modeling demonstrated for mature and adult-born dentate granule cells . eLife . 2017 ; 6 : e26517 . doi: 10.7554/eLife.26517 . OpenUrl CrossRef PubMed 30. ↵ Rackauskas Christopher IV . Neural-Embedded Nonlinear Mixed Effects Models (NENLME) in Pumas.jl . In: American Conference on Pharmacometrics ; 2019 . 31. Sawilowsky SS . Very large and huge effect sizes . Journal of Modern Applied Statistical Methods . 2009 ; 8 : 597 – 599 . doi: 10.22237/jmasm/1257035100 . OpenUrl CrossRef 32. ↵ Raue A , Steiert B , Schelker M , Kreutz C , Maiwald T , Hass H , et al. Data2Dynamics: A modeling environment tailored to parameter estimation in dynamical systems . Bioinformatics . 2015 ; 31 : 3558 – 3560 . doi: 10.1093/bioinformatics/btv405 . OpenUrl CrossRef PubMed 33. ↵ Geit WV , Gevaert M , Chindemi G , Rössert C , Courcol JD , Muller EB , et al. BluePyOpt: Leveraging open source software and cloud infrastructure to optimise model parameters in neuroscience . Frontiers in Neuroinformatics . 2016 ; 10 . doi: 10.3389/fninf.2016.00017 . OpenUrl CrossRef PubMed 34. ↵ Masoli S , Rizza MF , Sgritta M , Geit WV , Schürmann F , D’Angelo E. Single neuron optimization as a basis for accurate biophysical modeling: The case of cerebellar granule cells . Frontiers in Cellular Neuroscience . 2017 ; 11 . doi: 10.3389/fncel.2017.00071 . OpenUrl CrossRef PubMed 35. ↵ Migliore R , Lupascu CA , Bologna LL , Romani A , Courcol JD , Antonel S , et al. The physiological variability of channel density in hippocampal CA1 pyramidal cells and interneurons explored using a unified data-driven modeling workflow . PLoS Computational Biology . 2018 ; 14 . doi: 10.1371/journal.pcbi.1006423 . OpenUrl CrossRef 36. ↵ Roy M , Sorokina O , McLean C , Tapia-González S , DeFelipe J , Armstrong JD , et al. Regional diversity in the postsynaptic proteome of the mouse brain . Proteomes . 2018 ; 6 : 1 – 18 . doi: 10.3390/proteomes6030031 . OpenUrl CrossRef 37. ↵ Bommasani R , Hudson DA , Adeli E , Altman RB , Arora S , von Arx S , et al. On the Opportunities and Risks of Foundation Models . CoRR . 2021 ;abs/2108.07258. 38. ↵ Sansom MS , Ball FG , Kerry CJ , McGee R , Ramsey RL , Usherwood PN . Markov, fractal, diffusion, and related models of ion channel gating . A comparison with experimental data from two ion channels. Biophysical Journal . 1989 ; 56 ( 6 ): 1229 – 1243 . doi: 10.1016/S0006-3495(89)82770-5 . OpenUrl CrossRef PubMed Web of Science 39. ↵ Oikonomou E , Gruber T , Chandra AR , Höller S , Alzheimer C , Wellein G , et al. 2D-dwell-time analysis with simulations of ion-channel gating using high-performance computing . Biophysical Journal . 2023 ; 122 ( 7 ): 1287 – 1300 . doi: 10.1016/j.bpj.2023.02.023 . OpenUrl CrossRef PubMed 40. ↵ Goddard NH , Hucka M , Howell F , Cornelis H , Shankar K , Beeman D. Towards NeuroML: Model Description Methods for Collaborative Modelling in Neuroscience . Philosophical Transactions: Biological Sciences . 2001 ; 356 ( 1412 ): 1209 – 1228 . OpenUrl CrossRef PubMed 41. ↵ Musio C. Ion Channels and Neurological Disease . Life . 2024 ; 14 ( 6 ). doi: 10.3390/life14060758 . OpenUrl CrossRef View the discussion thread. Back to top Previous Next Posted April 26, 2025. Download PDF Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following One model to rule them all: unification of voltage-gated potassium channel models via deep non-linear mixed effects modelling Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share One model to rule them all: unification of voltage-gated potassium channel models via deep non-linear mixed effects modelling Domas Linkevicius , Angus Chadwick , Melanie I. Stefan , David C. Sterratt bioRxiv 2025.04.24.650426; doi: https://doi.org/10.1101/2025.04.24.650426 Share This Article: Copy Citation Tools One model to rule them all: unification of voltage-gated potassium channel models via deep non-linear mixed effects modelling Domas Linkevicius , Angus Chadwick , Melanie I. Stefan , David C. Sterratt bioRxiv 2025.04.24.650426; doi: https://doi.org/10.1101/2025.04.24.650426 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Neuroscience Subject Areas All Articles Animal Behavior and Cognition (7640) Biochemistry (17706) Bioengineering (13902) Bioinformatics (41978) Biophysics (21465) Cancer Biology (18611) Cell Biology (25528) Clinical Trials (138) Developmental Biology (13387) Ecology (19920) Epidemiology (2067) Evolutionary Biology (24332) Genetics (15615) Genomics (22519) Immunology (17747) Microbiology (40424) Molecular Biology (17194) Neuroscience (88662) Paleontology (667) Pathology (2838) Pharmacology and Toxicology (4827) Physiology (7650) Plant Biology (15160) Scientific Communication and Education (2046) Synthetic Biology (4302) Systems Biology (9826) Zoology (2271)

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

⚙ Ask this paper AI returns verbatim quotes from the full text · source: preprint-html ⓘ

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc: last seen: 2026-05-20T01:45:00.602351+00:00