Full text
92,595 characters
· extracted from
preprint-html
· click to expand
Atlas of the Bacterial Serine-Threonine Kinases expands the functional diversity of the kinome | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results Atlas of the Bacterial Serine-Threonine Kinases expands the functional diversity of the kinome View ORCID Profile Brady O’Boyle , Wayland Yeung , Jason D. Lu , Samiksha Katiyar , Tomer M. Yaron-Barir , View ORCID Profile Jared L. Johnson , Lewis C. Cantley , Natarajan Kannan doi: https://doi.org/10.1101/2025.01.12.632604 Brady O’Boyle 1 Department of Biochemistry & Molecular Biology, University of Georgia , Athens, GA 30602, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Brady O’Boyle Wayland Yeung 7 Institute of Bioinformatics, University of Georgia , Athens, GA 30602, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Jason D. Lu 1 Department of Biochemistry & Molecular Biology, University of Georgia , Athens, GA 30602, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Samiksha Katiyar 7 Institute of Bioinformatics, University of Georgia , Athens, GA 30602, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Tomer M. Yaron-Barir 2 Meyer Cancer Center, Weill Cornell Medicine , New York, NY 10021, USA 5 Englander Institute for Precision Medicine, Institute for Computational Biomedicine , Weill Cornell Medicine, New York, NY 10021, USA 6 Columbia University Vagelos College of Physicians and Surgeons , New York, NY 10032, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Jared L. Johnson 2 Meyer Cancer Center, Weill Cornell Medicine , New York, NY 10021, USA 3 Department of Cell Biology, Harvard Medical School , Boston, MA 02115, USA 4 Dana-Farber Cancer Institute, Harvard Medical School , Boston, MA 02215, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Jared L. Johnson Lewis C. Cantley 2 Meyer Cancer Center, Weill Cornell Medicine , New York, NY 10021, USA 3 Department of Cell Biology, Harvard Medical School , Boston, MA 02115, USA 4 Dana-Farber Cancer Institute, Harvard Medical School , Boston, MA 02215, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site Natarajan Kannan 1 Department of Biochemistry & Molecular Biology, University of Georgia , Athens, GA 30602, USA 7 Institute of Bioinformatics, University of Georgia , Athens, GA 30602, USA Find this author on Google Scholar Find this author on PubMed Search for this author on this site For correspondence: nkannan{at}uga.edu Abstract Full Text Info/History Metrics Data/Code Preview PDF Abstract Bacterial serine-threonine protein kinases (STKs) regulate diverse cellular processes associated with cell growth, virulence, and pathogenicity. They are evolutionarily related to the druggable eukaryotic STKs. However, an incomplete knowledge of how bacterial STKs differ from their eukaryotic counterparts and how they have diverged to regulate diverse bacterial signaling functions presents a bottleneck in targeting them for drug discovery efforts. Here, we classified over 300,000 bacterial STK sequences from the NCBI RefSeq non-redundant and UniProt protein databases into 35 canonical and seven non-canonical (pseudokinase) families based on the patterns of evolutionary constraints in the conserved catalytic domain and flanking regulatory domains. Through statistical comparisons, we identified distinguishing features of bacterial STKs, including a distinctive arginine residue in a regulatory helix (C-Helix) that dynamically couples ATP and substrate binding lobes of the kinase domain. Biochemical and peptide-library screens demonstrated that constrained residues contribute to substrate specificity and kinase activation in the Mycobacterium tuberculosis kinase PknB. Collectively, these findings open new avenues for investigating bacterial STK functions in cellular signaling and for the development of selective bacterial STK inhibitors. Introduction Hanks-type serine-threonine protein kinases, often referred to simply as STKs or protein kinases, are a large family of enzymes that play crucial roles in metabolism, cell signaling, protein regulation, cellular transport, secretory processes, and other cellular pathways ( 1 – 3 ). They accomplish this by catalyzing the transfer of a phosphate group - usually from ATP - to a serine or threonine residue in a target protein substrate, thereby regulating protein functions post translationally. Phosphorylation by serine-threonine protein kinases is a prevalent form of regulation found across all domains of life ( 4 – 8 ). The human genome encodes ∼450 STKs ( 1 ), and orthologs of these proteins have been mapped across diverse eukaryotic species ( 2 , 9 ). Further evolutionary classification of these sequences based on the patterns of conservation and variation in the commonly conserved catalytic domain has identified sequence and structural features contributing to the functional specialization of STK families ( 10 – 18 ) as well as in the development of selective STK inhibitors ( 19 – 23 ). Despite substantial progress in the evolutionary and functional characterization of eukaryotic serine-threonine protein Kinases (eSTKs), the STK complement of microbial genomes remains relatively understudied. One group of understudied Hanks-type protein kinases is the bacterial serine-threonine protein Kinase (bSTK) class, sometimes collectively referred to as PknB ( 24 , 25 ). bSTKs are unrelated to bacterial tyrosine kinases or histidine kinases ( 26 , 27 ), but share a high degree of sequence and structural similarity to eSTKs ( 28 ). Initially discovered in Myxococcus xanthus in 1991 ( 29 ), the number of STKs within bacterial genomes ranges from 1 in Escherichia coli to over 60 in some species of Actinobacteria ( 25 ). bSTKs are of particular interest because of their role in virulence ( 30 – 40 ), bacterial cellular development ( 30 – 32 , 35 , 41 – 50 ), and antibiotic resistance ( 30 , 51 – 56 ). A greater understanding of bSTKs and their integral role in bacterial cellular processes can shed light on their potential use as targets for antibacterial drugs ( 57 – 61 ), further evidenced in a study where a bSTK was targeted to successfully inhibit the growth of methicillin-resistant Staphylococcus aureus (MRSA), a bacterial strain that is resistant to many commonly used antibiotics ( 56 ). In particular, the extensive library of small molecule inhibitors developed for eSTKs can potentially be repurposed for targeting bSTKs involved in bacterial virulence and antibiotic resistance. However, an incomplete knowledge of the evolutionary divergence of bSTKs and eSTKs, and the lack of an evolutionary framework relating diverse bSTK families, has hindered drug discovery efforts and structural understanding of bSTK functional specialization. Previous efforts to identify and classify bSTK sequences have primarily focused on a subset of prokaryotic phyla ( 25 , 62 , 63 ). Although these studies have illuminated pieces of the diversity and evolution of bSTKs, there has yet to be any unified, systematic classification or evolutionary analysis of bSTKs to the degree seen with human protein kinases. Here, we classified nearly 300,000 bSTK protein sequences spanning nearly 26,000 strains into 42 distinct families comprising canonical kinase and noncanonical pseudokinase families, homologous to Pfam pkinase family (PF00069) ( 64 ). Furthermore, using a Bayesian statistical approach successfully employed in the functional classification of eSTKs ( 11 , 16 – 18 , 65 – 71 ), we delineated sequence constraints characteristic of various bSTK families. We analyzed them using available crystal structures and AlphaFold models. In addition to unique domain combinations and sequence indels, we identified co-conserved sequence patterns characteristic of various bSTK families. Biochemical and peptide-library-based characterization of a bSTK conserved RF motif in the C-Helix of the Mycobacterium tuberculosis kinase PknB revealed new insights into substrate recognition and allosteric control of catalytic activity. By revealing shared and unique regulatory mechanisms for bSTKs, our studies open new avenues for repurposing eSTK drugs for bacterial infections. Results 42 bSTK families identified through constraint-based clustering We identified bSTK families using constraint-based sequence clustering of aligned protein sequences from the UniProt ( https://www.uniprot.org ) and NCBI RefSeq non-redundant ( https://www.ncbi.nlm.nih.gov/refseq/about/nonredundantproteins/ ) protein sequence databases. To ensure an accurate sequence alignment of bSTK catalytic domains, we began by generating an alignment profile using 43 experimentally validated bSTKs (data file S1). We then utilized multiply-aligned profiles for global alignment of protein sequences (MAPGAPS) ( 72 ), a profile-based alignment tool, to identify, align and annotate bSTKs from the wealth of publicly available sequence data in the RefSeq Non-Redundant protein sequence database (NR) ( 73 ) and UniProtKB + UniRef protein sequence database ( 74 ). We then grouped aligned kinase domain sequences into hierarchical clusters based on the patterns of functionally conserved residues using the optimal multiple-category Bayesian Partitioning with Pattern Selection (omcBPPS) sampling algorithm ( 75 ) (see methods for details). In brief, omcBPPS samples the space of sequence partitions and associated sequence patterns to classify aligned protein sequences into multiple hierarchical categories. Sequences that share common co-conserved patterns, also referred to as constraints, are grouped into specific categories or families. The families identified using omcBPPS were then used to build family-specific alignment profiles to refine the classification of bSTK families further. We grouped bSTK sequences that did not fall into any identified families into the "Bac_Unique" category. We aligned approximately 300,000 bSTK sequences and classified ∼200,000 sequences into 42 newly defined bSTK families ( Fig. 1 , table S1, data file S2). Taxonomic analysis revealed that many STK families are specific to only one bacterial phylum. Actinobacteria exhibited the most diverse repertoire of STKs, encompassing 13 families and over 100,000 sequences unique to Actinobacterial species. Following this, Proteobacteria comprised 9 families with over 19,000 sequences. Firmicutes included 4 families with 7,000 sequences, Cyanobacteria had three families with 27,000 total sequences, and Myxococcota contained two families with 12,000 sequences. The most prominent bSTK family was KAPD, a gram-positive–specific family that consisted of over 55,000 unique sequences from mainly Actinobacteria and Firmicutes phyla, including one of the most well-studied bSTK proteins, M. tuberculosis PknB. Download figure Open in new tab Fig. 1. bSTK families identified through constraint-based sequence clustering analysis. Euler diagram of the 42 bSTK families identified using omcBPPS. Families are positioned along the x-axis based on the average Hanks-Type constraint score of the sequences within the family, with 0 representing sequences with no Hanks-Type constraints and 1 representing sequences with all Hanks-Type constraints. The sizes of the families are based on the number of sequences filtered at 98% sequence identity. Acronyms and abbreviations designating the families are defined in the Supplementary Materials (table S2). Evolutionarily conserved bacterial pseudokinase families The Hanks-type kinases are defined by key hallmark function motifs that include the catalytic HRD motif, metal-binding DFG motif, and the salt bridge (K 30 -E 49 , based on the bSTK alignment) connecting the β3 strand and αC-Helix ( 4 ). Many of the bSTK families scored very highly for the Hanks-type kinase constraints (fig. S1), suggesting that they retain many functionally important Hanks-type kinase motifs and residues. Some bSTK families, however, scored as low as 30% for Hanks-type kinase constraints. The substitution or absence of these constrained residues suggests divergent catalytic or regulatory mechanisms in these families. Visualization of the sequence patterns (using sequence logos) in these divergent families revealed that seven of the 42 bSTK families displayed variations in one or more catalytic triad residues essential for phosphotransferase activity ( Fig. 2A ), namely the ATP-binding VAIK-Lys, the catalytic HRD-Asp, and the metal-binding DFG-Asp, and therefore are annotated as pseudokinases ( 1 ). Substitution of the VAIK-Lys occurs in all seven of the pseudokinase families. 34% of CP1 members, 60% of DYD and all ActPs1, ActPs2, ActPs3, DLHK, and GLW family sequences lack the VAIK-Lys. Substitution of the HRD-Asp occurs in six of the pseudokinase families. 37% of CP1 family members, 97% of the ActPs3, and 99-100% of the ActPs1, ActPs2, DLHK, and GLW family members lack the HRD-Asp. Likewise, multiple bSTK families diverge in the DFG-Asp position. 17% of CP1 family members, 98% of ActPs3, and 100% of ActPs1, ActPs2, and GLW family members lack the DFG-Asp. AlphaFold3 models ( 76 ) further support the divergence of these families in the active site ( Fig. 2B ) In addition to the active site, we identified family-specific indels (insertions and deletions) in several pseudokinase families (fig. S2). About 60% of sequences belonging to the ActPs1 family had a deletion of about 20 residues between the F- and H-helices, resulting in the deletion of the G-helix. Similarly, at least 50% of sequences in the ActPs3 family had a 40-residue deletion of the activation loop. The crystal structure of the kinase domain of the MviN protein in M. tuberculosis , which falls into the ActPs3 family, further supports this finding by revealing an attenuated activation loop ( 77 ). ActPs2 sequences, on the other hand, display multiple insertions. The most notable insertions are a small insertion between the end of the activation loop and the F-helix, an insertion of about 30 residues between the β3-strand and the C-Helix, and a ∼200 residue insertion in the activation loop (fig. S2). CP1, DYD, DLHK, or GLW displayed no family-specific insertions. Download figure Open in new tab Fig. 2. Conserved bacterial pseudokinase families. ( A ) Sequence logos of the catalytic triad motifs in canonical STKs and in each of the bacterial pseudokinase families. ( B ) Comparison between the active site of canonical STKs and the active site of a representative from each bacterial pseudokinase family. The crystal structure of M. tuberculosis PknB (PDB: 1MRU) is used as the reference canonical STK. AlphaFold3 models ( 76 ) were generated for the kinase domain from a representative sequence of each pseudokinase families (NCBI accession numbers: DLHK WP_188258456.1; ActPs1 WP_093894422.1; GLW MBH9021688.1; ActPs2 WP_032763871.1; DYD WP_039364684.1; ActPs3 WP_046703973.1; CP1 WP_248060551.1). The VAIK motif is colored pink, the catalytic loop is colored green, and the DFG-motif is colored blue. Phylogenetic reconstruction of bSTK families After classifying bSTKs into families using constraint-based clustering, we wanted to validate these families and determine evolutionary relationships between them. To accomplish this, we performed maximum-likelihood phylogenetic reconstruction. Following a purge at 100% sequence identity, ∼200,000 protein sequences of bSTKs belonging to the 42 identified families were used in the analysis (data set S2). We found that the phylogenetic analysis corroborated our constraint-based clustering results, with bSTK sequences from the same family clustering together ( Fig. 3 , data files S3 to 5). Download figure Open in new tab Fig. 3. Representation of a maximum-likelihood phylogenetic analysis. The color of internal nodes denotes the branch support of major clades. Lineages belonging to each of the 4 major clades are distinguished by the color of the branches, with Clade 1, 2, 3, and 4 being colored light orange, green, blue, and pink, respectively. Leaf nodes have a pie chart representing the percentage of the canonical kinase (orange) and pseudokinase (purple). Our phylogenetic analysis reveals that 35 of the 42 bSTK families fall into four major clades Fig. 3 , data files S3 to 5): Clade 1, Clade 2, Clade 3, and Clade 4. We found that three of the four clades are taxonomic-specific. 5 families from a diverse array of bacterial phyla make up Clade 1. Clade 2 consists of almost entirely Actinobacteria-specific families, whereas Clade 3 is predominantly Cyanobacteria-specific and includes families from other lineages. Clade 4 is the largest of the four clades and is composed almost entirely of Proteobacteria and Firmicutes-specific families. 7 bSTK families did not fall into any of these four major clades. Of the 42 families, our phylogenetic analysis revealed that 35 families form monophyletic clades. 6 of the bSTK families are paraphyletic, including Act1, Act2, CCM1, FP1, Cyan1, and PTCK, whereas KAPD is polyphyletic. Act1, Act2, FP1, Cyan1, and PTCK are ancestral to a single other monophyletic STK family (Act1:ActPs1, Act2:ActPs2, FP1:Cyan2, Cyan1:YMGK, and PTCK:GLW). As for CCM1, the family is paraphyletic and split into two groups: ( 1 ) Chloroflexota and ( 2 ) Cyanobacteria and other phyla. This split is observed across multiple runs regardless of the sequences used, with bootstrap values above 75%. Domain and transmembrane analysis reveal family-specific features We performed domain and transmembrane analysis to obtain functional insights into bSTK families. The most common domain architecture among the bSTK families consisted of a kinase domain with a C-terminal transmembrane helix. We observe this domain organization in 25 bSTK families ( Fig. 4 ). KAPD, GN-NS1, and PTCK families are associated with a second protein domain, in addition to the single STK domain and the C-terminal transmembrane region. These data are consistent with previous domain analyses of bSTK-containing protein sequences that reported bSTKs are linked C-terminally to a transmembrane region ( 25 ). This contrasts with membrane-associated eukaryotic kinases, which typically have the transmembrane positioned N-terminal to the kinase domain—a domain organization found in only one of the 42 bSTK families, CCM1. Download figure Open in new tab Fig. 4. Conserved domain architecture for each of the bSTK families. Canonical STK domains are shown as purple blocks, and transmembrane regions are shown as orange circles. Pseudokinase domains are shown as gray blocks and conserved, non-STK domains are shown as white blocks. Domain architecture is shown for domains present in more than 20% of sequences in the bSTK family. For families containing members with variable domain structures, the different domain organizations are shown. Protein domain acronyms are defined in the Supplementary Materials (table S3). 6 of the bSTK families, CCM1, CP, PknK, Cyan2, Cyan3, Myxo1, Myxo2, Proteo1, and DLHK, are associated with more than one conserved domain architecture. CCM1 family members contain a transmembrane region or an FHA domain N-terminus of the kinase domain. A PQQ DH domain C-terminal of the kinase domain also characterizes a distinct CCM1 subfamily. Likewise, PknK and CP1 family members have multiple functional domains linked to the kinase domain. Cyan2, Myxo1, and Myxo2 families are similar in that they have two possible domain architectures: ones consisting of just a C-terminal transmembrane region and others such as Cyan2, Myxo1, and Myxo2 containing a C-terminal GUN4, TPR, and Peptidase_M14NE-CP-C, respectively. Proteo1 families are associated with three domain organizations: a C-terminal transmembrane region, an FGE-sulfatase, and a DUF4384 domain. DLHK family members generally have four other domains on the same polypeptide chain, all C-terminal to the kinase domain. 5 STK families, Strep1, PknG, Strep2, GN-NS1, and Myxo1, contain conserved TPR C-terminal to the kinase domain. Among all 42 bSTK families, this is the only protein domain that appears alongside multiple families. Structural features distinguishing bSTKs from eSTKs We generated sequence logos from profile-based sequence alignments to investigate the sequence and structural basis for bSTK functional divergence. bSTKs contain multiple unique insertions within the kinase domain, including a 4-residue insertion between the β3-strand and the αC-Helix, a 2-residue insertion in the activation loop, and an insertion of varying length within the F-G-H helical bundle (fig. S3). Overall, bSTK catalytic domain lengths are ∼10 amino acid residues longer than their eSTK counterparts. We also identified multiple conserved bSTK-specific motifs. These features are highlighted in the M. tuberculosis PknB crystal structure (PDB: 612P, Fig. 5A ). They include a distinctive methionine in the gatekeeper position ( Fig. 5B , fig. S3), a highly conserved methionine in the G-loop ( Fig. 5C , fig. S3), a conserved arginine and phenylalanine (RF) motif in the αC-Helix ( Fig. 5D , fig. S3), and a poly-proline motif in the loop between the G-helix and the H-helix ( Fig. 5E , fig. S3). Download figure Open in new tab Fig. 5. Conserved structural features unique to bSTKs. ( A ) A crystal structure of M. tuberculosis PknB bound to ATP and magnesium serves as the reference structure (PDB: 6I2P). ( B ) The gatekeeper-Met is shown in magenta in the reference structure. ( C ) The G-loop-Met is shown in pink in the reference structure, forming a hydrophobic interface with the αC-Helix. ( D ) The RF motif located within the αC-Helix is colored green. ( E ) The prolines of the poly-proline motif of the GH-loop are shown in cyan. One of the most distinguishing bSTK features is an RF motif in the αC-Helix ( Fig. 5D ). The RF-Phe mediates hydrophobic packing interactions with residues in the N-lobe, particularly a Met in the G-loop. The arginine (Arg 45 based on the bSTK alignment) is present in ∼50% of bSTKs ( Fig. 6A ) and highly conserved in 22 bSTK families (fig. S4). In contrast to the RF-Phe, the RF-Arg is quite dynamic and adopts multiple distinct conformations in available crystal structures and AlphaFold3 models ( Fig. 6B ). We group these conformations into five distinct states. In State 1, the C-Helix-Arg interacts with the phosphate groups of phosphorylated threonines in the activation loop ( Fig. 6C ), whereas in State 2 it forms a cation-pi interaction with a phenylalanine of the C-Helix ( Fig. 6D ). In State 3, the C-Helix-Arg forms a salt bridge with the highly conserved C-Helix-Glu ( Fig. 6E ), whereas in State 4 it hydrogen bonds to the backbone carbonyl of the DFG-Gly in the activation loop ( Fig. 6F ). In the substrate-bound structure of PknB, the C-Helix-Arg forms a salt bridge with a glutamate in the Glycogen accumulation regulator A (GarA) substrate ( Fig. 6G ). Download figure Open in new tab Fig. 6. Conservation and dynamic nature of the C-Helix-Arg in bSTKs ( A ) Sequence probability logo of the canonical bSTK and eSTK C-helices. The conserved, bacterial-specific C-Helix-Arg is annotated with a dotted red box. ( B ) AlphaFold3 model of the C-Helix-Arg, shown in light brown, without interactions. ( C ) AlphaFold3 model of C-Helix-Arg interaction with phosphorylated threonine residues in the activation loop. ( D ) Crystal structure (PDB: 3F69 Chain B) of the C-Helix-Arg forming a cation-pi interaction with a phenylalanine within the C-Helix. ( E ) Crystal structure (PDB: 3ORT) of the C-Helix-Arg forming a salt-bridge with the C-Helix-Glu. ( F ) Crystal structure (PDB: 6B2P) of the C-Helix-Arg forming a hydrogen bond with the backbone of a residue within the activation loop. ( G ) Crystal structure (PDB: 6I2P) of the C-Helix-Arg (Chain B) forming a salt-bridge with a co-crystalized substrate, GarA, shown in dark green. ( H ) Rate of in vitro autophosphorylation of His-tagged WT and R45M PknB at different time points (0, 10, 30, 120 minutes). The percent phosphorylation at each time point was determined based on the phosphorylated and unphosphorylated protein band densities quantified using a LICOR Odyssey M imager (fig. S5). Autophosphorylation assays were performed in triplicate and significance was calculated using an unpaired t-test for each time point (*, P <0.05). To evaluate if the C-Helix-Arg plays a role in modulating kinase activity, we mutated the M. tuberculosis PknB C-Helix-Arg 55 (referred to as Arg 45 for consistency) to a methionine (R45M), a variant observed on other bSTKs (fig. S4) and measured the impact of R45M mutation on kinase autophosphorylation activity. Autophosphorylation activity is seen almost immediately in both PknB variants following the addition of Mg-ATP ( Fig. 6H and fig. S5). However, after 10 minutes the R45M autophosphorylation rate was significantly faster than WT, with almost double the percent phosphorylation. The R45M autophosphorylation rate remained faster than WT for the first 30 minutes of the assay and only after 60 minutes did both the WT and R45M variants display comparable amounts of autophosphorylation. These results suggest a role for R45 in kinase regulation. Effects of constraint mutations on PknB substrate specificity motif To demonstrate that the bSTK constraints have biological relevance in addition to being hallmark features of their respective families, we mutated the M. tuberculosis PknB C-Helix-Arg 45 and a KAPD-specific constraint within the D-helix, Arg 101 (referred to as Arg 87 for consistency), to a methionine (R45M) and alanine (R87A), respectively. These amino acid variants are found in other bSTKs and were selected to preserve the activity and stability of the kinase. We then used a Positional Scanning Peptide Array (PSPA) analysis to generate a substrate specificity consensus motif for the Wild-Type PknB and the two mutants (data files S6 to S8). The wild-type (WT) PknB strongly prefers negatively charged residues and has a low tolerance for hydrophobic residues N-terminus of the phosphoacceptor site ( Fig. 7A , fig. S6). On the C-terminus of the phosphoacceptor site, the WT PknB generally prefers charged or polar residues, particularly at the +1 position, where the most highly preferred residue is glutamine. In contrast, the R45M mutation substantially altered peptide substrate preference. Although amino-acid preferences N-terminus of the phosphoaccetor site are comparable to WT ( Fig. 7B , fig. S7), consensus motifs in the C-terminus are substantially different, with preference for hydrophobic residues at the +2, +3 and +4 positions and some preference for a polar or charged amino acid at the +1 position. In the case of the R87A mutant, the substrate specificity consensus motif is drastically different from WT on both termini of the phosphoacceptor ( Fig. 7C , fig. S8). On the N-terminal side of the phosphorylation site, the amino-acid preference changes from acidic to basic or polar amino acids and demonstrates an increased tolerance for hydrophobic residues. Overall preference for specific residues N-terminus of the phosphorylation site is lower than WT. On the C-terminus of the phosphorylation site, however, R87A shows a strong preference for hydrophobic residues, particularly at the +2 and +3 positions, and a negative selection for acidic/charged residues and prolines. Download figure Open in new tab Fig. 7. Substrate specificity consensus motif of M. tuberculosis PknB mutants and their modifications to surface electrostatics. ( A ) PknB WT substrate specificity consensus motif and heatmap. The effect that an amino acid at a given position within the peptide has on substrate phosphorylation relative to other amino acids at the same position is noted with larger characters in the sequence logo indicating a more substantial effect on phosphorylation. Amino acids above the x-axis indicate a positive effect on the favorability of substrate phosphorylation relative to other amino acids, and amino acids below the x-axis indicate a negative effect on favorability. The heatmap provides the log-scale favorability values for each amino acid at each position within the peptide, with indicating positive favorability values and blue indicating negative favorability values. ( B and C ) substrate specificity consensus motifs and heatmaps for PknB R45M (B) and PknB R87A (C). ( D ) Surface electrostatic visualization of PknB WT bound to a modeled peptide (shown in cyan). N- and C-termini of the peptide are indicated with N and C, respectively. Red indicates a negative charge, blue indicates a positive charge, and gray indicates a neutral charge. ( E and F ) Comparison of the PknB WT surface electrostatics with those of PknB R45M (E) and PknB R87A (F). The dashed circles indicate the arginine side chain in the WT protein and its absence in the mutant proteins to highlight its effect on the local surface electrostatics. To obtain structural insights into the altered substrate specificity of the R45M and R87A mutants, we modeled a peptide into the substrate binding region of PknB and visualized the surface electrostatics ( Fig. 7D ). The R87A mutation creates a negatively charged surface patch surrounding the D-helix relative to WT PknB and a deeper groove for accommodating residues in the N-terminal region of the substrate peptide ( Fig. 7E ). In contrast, the R45M mutant creates a more neutral charge in a large pocket near the junction of the C-Helix and the activation loop, near where the C-terminus of the peptide binds ( Fig. 7F ). Together these structural changes provide a plausible explanation for the observed differences in the peptide substrate specificity profiles displayed by mutant and WT PknB. Discussion In this study, we report a comprehensive classification of bSTKs into 42 distinct families based on a comprehensive informatics analysis of over 300,000 bacterial kinase sequences. We demonstrate that bSTKs are a diverse class of enzymes with substantial variations in both primary sequence and 3D structures. The constraint patterns represent the defining residues for each bSTK family and serve as a quantitative metric for annotating sequences into one of the families. These constraints can be utilized to characterize family-specific regulatory and mechanistic traits at the molecular level. We demonstrated this in PknB, in which the mutation of KAPD-specific arginine (R 87 in reference to the bSTK alignment) in the D-helix results in a considerably different substrate specificity consensus motif compared to the WT PknB. Actinobacteria have the most diverse array of bSTK families. This phylum is one of the largest, most common, and most diverse bacterial phyla, with members of this taxonomic group represented in terrestrial and aquatic ecosystems ( 78 ). Previous studies have reported that in Actinobacteria, protein kinases are the predominant type of membrane-associated signaling component ( 79 ). The diversity of Actinobacterial STKs identified in our study further supports their proposed roles in diverse bacterial functions ( 78 , 80 ). Although the functions of most bSTKs are yet to be determined, our analysis of their domain architectures suggest important functional roles. For example, the KAPD family of STKs carry a conserved penicillin-binding and serine-threonine kinase–associated (PASTA) domain, C-terminal to the kinase domain and a transmembrane region. This architecture is well-documented in bSTK, with multiple PASTA domains in the same polypeptide chain ( 81 ). In Streptococcus pneumoniae and M. tuberculosis, the PASTA domains serve as extracellular sensors by binding peptidoglycans and subsequently activating their associated STK, which phosphorylates its substrate and begins a signaling cascade to regulate cell division or peptidoglycan synthesis ( 30 , 82 – 84 ). Given the widespread presence of membrane-associated bSTK families (28 of 42 bSTK families), many of the STK families may be involved in communicating extracellular signals to intracellular response in a manner analogous to receptor tyrosine kinases. Another domain of note is the TPR domain, which is present in multiple divergent bSTK families mapping to different clades in the phylogenetic tree. TPR domains function as protein scaffolding or interaction modules in many biological functions, including protein import, gene regulation, and mitosis ( 85 ). TPRs are also implicated in host cell adhesion, virulence factor transportation, and the survival of pathogenic organisms within a host ( 86 – 89 ). The crystal structure of PknG, a secreted STK from M. tuberculosis , suggests a role for TPR domain in protein dimerization ( 90 ). We predict that the TPR domain performs an analogous protein interaction role in the GN-NS1, Myxo1, Strep1 and Strep2 families identified in our study. Our study also maps and extends the pseudokinase complement of bSTKs. Conserved eukaryotic pseudokinase families perform important noncatalytic functions such as protein scaffolding, competitive inhibitors, molecular switches, and allosteric activators ( 25 , 91 , 92 ). And although their presence in bacteria is not as ubiquitous, the presence of pseudokinase STK families within bacteria and their unique constraint patterns not seen in eukaryotic kinases hint towards conserved, non-catalytic activity of these families, potentially performing bacterial-specific roles. In eukaryotes, some pseudokinase families also retain the ability to bind ATP or non-canonical small molecules ( 93 ) despite lacking the VAIK-Lys, such as the WNK family ( 94 ), ULK4 ( 18 ), or KSR1 ( 95 , 96 ). Given the conserved substitution of the VAIK-Lys to an arginine, ActPs2 sequences may have evolved non-canonical ligand binding mechanisms ( Fig. 2 ). In DLHK family members, the presence of the HRD-Asp, which is required for ATP hydrolysis, suggests that members of this family may retain the ability to hydrolyze ATP; however, the substitution of both the metal-binding DFG-Asp and HRDxxxxN-Asn would also suggest non-canonical nucleotide binding bSTKs display unique sequence and structural variations in the catalytic domain that provide clues for functional inference and drug development efforts. One of the most distinctive features distinguishing bSTKs from eSTKs is the RF motif in the regulatory C-Helix. The RF motif is rarely observed in eSTKs with the exception of some apicomplexan STKs, which conserve an arginine structurally analogous to the RF-Arg in bSTKs ( 97 ). In the apicomplexan kinase CpCDPK2 ( Cryptosporidium parvum Calcium Dependent Protein Kinase 2), the C-Helix-Arg coordinates with the phosphorylated residue in the activation loop similar to the phosphorylated PknB model proposed in our study ( Fig. 6C ). Furthermore, the multiple conformational states adopted by the RF-motif arginine in different crystal structures of PknB suggests an auto-regulatory role for this motif in bSTKs. Indeed, mutation of the RF-Arg to a methionine alters the rate of autophosphorylation, presumably by relieving the autoinhibitory interactions between the RF-Arg and the C-Helix-Glu that prevents the kinase from adopting an active conformation ( Fig. 6E ). In this regard, the bSTK-specific insert between the β3 strand and the C-Helix (fig. S3) may be relevant because this region is also known to modulate C-Helix movement in PknB and in eSTKs ( 98 ). Another striking feature of bSTKs is the divergence in the ATP binding gatekeeper residues and substrate binding GHI sub-domain. Most eSTKs have a hydrophobic residue or a threonine at the gatekeeper position (PKA Met 121 ), though it varies based on the family. Across bSTKs, however, there is a substantially lower amount of diversity at the gatekeeper position, with methionine being the predominant residues at the gatekeeper in bSTKs. This information can be leveraged to inform drug repurposing efforts aimed at regulating bSTK activity, as the properties of the gatekeeper residue dictate nucleotide binding and Type-1 kinase inhibitor selectivity ( 99 ). A methionine-selective Type-1 kinase inhibitor would serve as a conceptual starting point for bSTK-specific inhibitor design. Likewise, we identified a left-handed poly-proline type II (PPII) helix motif within the GHI-subdomain of some bSTKs, a feature that is not seen in eSTKs. PPI helices have been shown to serve as protein docking sites ( 100 ) and the GHI domain is known to play a role in protein-protein interactions and substrate binding for both bSTKs and eSTKs ( 98 , 101 ). With this information, one can identify potential bSTK substrates and binding partners, further characterizing the functions of bSTKs in cellular signaling pathogenicity and informing the development of bSTK targeting drugs. A structure of PknB cocrystalized with a substrate, GarA, also reveals the C-Helix-Arg plays a role in substrate specificity, which is further corroborated by our Positional Scanning Peptide Array analysis. An arginine to methionine mutation results in PknB preferring a substrate with hydrophobic residues C-terminal to the phosphorylation site. Our analysis also revealed that bSTKs bind peptide substrates in a canonical orientation and that the KAPD-specific constraint, Arg 87 , plays a role in substrate specificity, as previously suggested ( 102 ). Arg 87 , found within the D-Helix, may only require a single acidic residue N-terminal of the phosphorylation site, with the arginine side chain’s flexibility enabling it to interact with any residue at the five N-terminal positions. This would explain why there is such high tolerance for non-acidic residues at those positions within the peptide, and why a single substitution resulted in the loss of specificity towards acidic residues at all five N-terminal positions. Unlike the R45M mutation, however, the R87A not only affects local specificity on the N-terminal side of the phosphoacceptor site, but also the specificity of more distal residues C-terminus to the phosphoacceptor site. This degree of change in the substrate specificity consensus motif is substantial, especially for a single amino acid substitution. This includes an increase in the favorability for methionine at the +1 position over glutamine, which previously was suggested as a crucial residue for PknB substrate phosphorylation ( 49 ). The exact mechanism for how Arg 87 affects the specificity for distant residues of the peptide remains unclear, however, it further emphasizes the importance of these bSTK family constraints in the structure-function and specificity of bSTKs. bSTKs have been shown to play important regulatory roles in bacterial pathogens, making them attractive targets for anti-microbial therapeutics ( 30 , 57 , 103 , 104 ). Several studies have explored this avenue in an effort to combat antimicrobial drug resistance ( 105 – 109 ), however, there are currently no bSTK inhibitors approved for antimicrobial use ( 110 ) due to issues such as toxicity. Many pipelines and assays are already in place to develop therapeutics that target human STKs ( 111 – 114 ). Tailoring these to bSTKs would provide a robust framework for drug development using existing resources, and the constraints that define each of the bSTK families would provide clues for repurposing existing inhibitors to target bSTKs with a greater degree of specificity. The structure and regulatory features we have presented in this paper that are shared among bSTKs, such as bSTK-specific divergence in the gatekeep residues and ATP binding P-loop, could also be used to inform the development of broad spectrum bSTK targeting antimicrobial drugs. Materials and Methods Detection of bSTK sequences In order to align and annotate bSTK sequences from protein databases, 43 experimentally validated bSTK sequences (data file S1) were gathered and aligned using MAFFT v7.453 to create a Multiply-Aligned Profiles for Global Alignment of Protein Sequences (MAPGAPS) profile. Sequences from closely related kinase families identified in Kannan, 2007 ( 24 ) were also aligned and included in the MAPGAPS profile to prevent the misannotation of non-protein kinases as bSTKs. MAPGAPS version 2.1 was then used to annotate bSTKs by aligning protein sequences from the UniRef protein sequence database (obtained February 6, 2020) to the bSTK MAPGAPS profile, from which 45,359 bSTK sequences were annotated. Following an initial run of omcBPPS, protein sequences that fell into STK families identified through omcBPPS were used to build a hierarchical MAPGAPs profile in an effort to further refine protein sequence alignment and STK identification. The NCBI Non-Redundant protein sequence database (obtained June 14, 2022) was also aligned to later versions of the bSTK profile with a total of 500,935 bSTK sequences identified, 294,534 of which were annotated into one of the 42 bSTK families we identified. Bayesian statistical analyses and pattern-based classification of bSTK sequences Constraint-based sequence clustering was performed with the Optimal Multi-Category Bayesian Partitioning with Pattern Selection (omcBPPS) scheme and used to group STKs together into families of evolutionarily related proteins. All omcBPPS runs were run in triplicate. For the initial run, 45,359 bSTK sequences that were initially identified using the MAPGAPS algorithm were used as the input for omcBPPS. Sequences that contained constraint patterns identified from the omcBPPS run were used to build a MAPGAPS profile for their corresponding family. We aligned sequences from the aforementioned protein sequence databases using the MAPGAPS algorithm. The sequences that were annotated by MAPGAPS to belong to each bSTK constraint-cluster (family) were then purged at 95% sequence identity (42,543 sequences) and used as input for omcBPPS to further breakdown each constraint-cluster into unique families or subfamilies. bSTK sequences that did not belong to any of the constraint clusters were also purged at 95% sequence identity and used as an input for omcBPPS to sort them into newly classified bSTK families. This process was repeated multiple times, using HelperBunny to identify whether a constraint pattern matched a previously identified pattern or represented a previously undescribed pattern. We used a quantitative means of evaluating how well any given sequence fit into each of the clusters defined by our model, as previously performed in Yeung et al, 2021 ( 65 ). Each bSTK cluster was associated with a list of constraints that dictated which amino acid(s) were likely to be found at a given alignment position. Furthermore, each constraint was associated with a log-likelihood score which described how specific a constraint was to its respective cluster. To score a sequence against a cluster, we added the log-likelihoods of all the constraints which were true for the query sequence. In order to make this score comparable across clusters, we divided this number by the total log-likelihood of all the cluster’s constraints. This resulted in a range from 0 to 1. For example, a sequence which followed all of a given cluster’s constraints would have received a maximum score of 1 for that cluster, whereas a sequence which did not satisfy any of a given cluster’s constraints would have received a minimum score of 0 for that cluster. For the purposes of discrete classification, we defined a cut-off score for classifying a sequence into a cluster. Based on the distribution of scores from all possible sequence-cluster pairs across multiple test data sets, we defined the optimal cut-off at the global minimum of 0.7 (fig. S9). Comparative Sequence Analysis Comparative sequence analyses between bSTK families and EPKs were performed in Python3 using custom scripts (provided in our computational notebooks). Weblogos were generated using WebLogo 3.7.12, with the colors of the amino acids corresponding to their biochemical properties. Modeling protein structures Protein models for STKs that did not have protein structures available in the Protein Data Bank were predicted using AlphaFold version 3 ( 76 ). Structures were visualized in PyMOL version 2.3.0 ( 115 ). Constraints associated with the bSTK families were mapped to AlphaFold models or crystal structures using a custom Python3 script (provided in our computational notebooks). Substrate bound M. tuberculosis PknB structure was generated through homology modeling using SWISS-MODEL ( 116 ). PkA bound to PKI was used as the homology model template (PDB: 2GFC) and the canonical M. tuberculosis PknB kinase domain (UniProt: P9WI81 residues 11-273) was used as the query sequence. Phylogenetic reconstruction Phylogenetic reconstruction of aligned bSTK domains was performed to model STK evolution in bacteria. The phylogenies of larger datasets were inferred through maximum-likelihood using FastTree2.1 ( 117 ). All bSTK sequences from the NCBI sequence database belonging to the 42 identified families were first purged at 100% sequence identity using CD-HIT ( 118 ) and outlier sequences were removed (201,421 sequences total). FastTree2 was run using the LG model and Gamma20 likelihood was optimized following CAT (categories) approximation. Local support values were calculated using the Shimodaira-Hasegawa test ( 117 ). Phylogenetic analyses were performed on smaller datasets to validate the FastTree results. Phylogenies of datasets containing representatives from each of the bSTK families were inferred using IQ-TREE version 1.6.12 ( 119 ) with ModelFinder ( 120 ). bSTK families were first purged at 90% sequence identity and 15 representative sequences were randomly selected from each family. 5 EPK sequences were also included in the dataset to serve as an outgroup. The substitution model LG ( 121 ) was used with empirical amino acid frequencies and a FreeRate model with 10 categories ( 122 , 123 ). Branch support values were generated using ultrafast bootstrap with 1000 resamples ( 124 , 125 ). Results indicated that sequences from the same clusters consistently formed paraphyletic groups or monophyletic clades with high bootstrap support. Domain and transmembrane analysis Transmembrane regions were predicted by running full length protein sequences through TMHMM-2.0 ( 126 ). Additional domains for each bacterial protein sequence were identified using the bwrpsb api on NCBI with superfamily hits only against the CDD database ( 127 ) with an e-value threshold of 0.01 and with a maximum number of 500 hits. Kinase domains were annotated with our manually curated protein kinase profiles and any domains overlapping the kinase domain were removed. Protein expression and purification The PknB construct (11-288aa) was codon optimized for expression in Escherichia coli using the GeneSmart prediction software (Genscript). DNA sequence was cloned into a pET-28a(+) expression vector at cloning sites EcoRI/NotI. The plasmid containing N-terminal His-tagged PknB was expressed in E. coli BL21 (DE3) cells. Bacteria were cultured in LB media supplemented with 60 µg/mL kanamycin at 37°C. Upon reaching an optical density (OD) of 0.6, E. coli was induced with 1 mM IPTG (Isopropyl β-D-1-thiogalactopyranoside) for 16 hours at 15°C. Subsequently, the bacterial culture was centrifuged at 5000 rpm at 4°C for 15 minutes. The resulting bacterial pellet was then resuspended in a buffer consisting of 50 mM HEPES, 200 mM NaCl, 10% glycerol, and 1 mM PMSF (phenylmethylsulfonyl fluoride) at pH 7. The lysate was clarified through centrifugation at 15,000 rpm at 4°C for 1 hour. The resulting supernatant, containing solubilized PknB, was collected and vacuum filtered through a 0.45 µm filter unit (Fisher Scientific). The bacterial lysate was loaded onto a Cytiva HiTrap TALON crude 1 mL column and eluted across a 0-500 mM imidazole gradient in 1 mL fractions. Protein purity was assessed using SDS-PAGE with Coomassie stain. Fractions were collected and dialyzed against a buffer consisting of 50 mM HEPES, 200 mM NaCl, and 10% glycerol at pH 7 four times over 20 hours. Quantification of PknB was performed using the Bradford Assay (Bio-Rad), revealing a concentration of 0.85 mg/mL. Protein stability was assessed through Differential Scanning Fluorimetry (Applied Biosystems StepOnePlus Real-Time PCR System) for 2 hours with a step increase from 25°C to 95°C. Protein function was assessed using an autophosphorylation assay. The protein was then aliquoted, snap-frozen, and stored at −80°C. R81M (equivalent to R45M within the bSTK alignment and R55M within the M. tuberculosis PknB P9WI81 UniProt sequence entry) and R127A (equivalent to R87A within the bSTK alignment and R101A within the M. tuberculosis PknB P9WI81 UniProt sequence entry) mutations in the PknB kinase domain were introduced using the New England Biolabs Q5 site-directed mutagenesis kit following the manufacturer’s recommendations. Primers were designed using the online NEBaseChanger tool and were generated by Eurofins. Autophosphorylation Assay WT PknB and R45M PknB (both 0.8 mg/mL) were dephosphorylated by incubating with New England Biolabs Lambda Phosphatase, 10mM MnCl 2 , and 10x NEB buffer at room temperature for one hour. To separate the His-tagged kinase from the untagged phosphatase, Co-NTA agarose beads were added to the reaction tube and incubated at 4°C for 1 hour. The beads were washed three times with buffer (50mM HEPES, 200mM NaCl, and 10%, pH 7) and the bound proteins were eluted in wash buffer containing 300mM imidazole. Eluted protein was dialyzed in wash buffer to remove imidazole. Quantification of WT PknB and R45M PknB was performed using the Bradford Assay (Bio-Rad) and the final concentration for both variants was 0.5 mg/mL. For the autophosphorylation assay, 2x kinase buffer (50mM HEPES, 200mM NaCl, 10% glycerol buffer, 20mM MgCl 2 , pH 7) and 5mM ATP were added to a microcentrifuge tube containing either PknB WT or PknB R4M. Tubes were put in a 30°C water bath and samples were taken from the reaction tube at 0, 5, 10, 30, 60 and 120 minutes and the reaction was immediately quenched with 4x SDS reducing sample buffer and 5 minutes on a 95°C heat block. Samples were loaded on a 10% SDS-PAGE, run at 151V for 1 hour and stained with Coomassie blue. The density of the bands of phosphorylated and dephosphorylated protein were quantified using a LICOR Odyssey M instrument. Profiling kinase substrate specificity Recombinant M. tuberculosis PknB preferred substrate was identified using a Positional Scanning Peptide Array analysis, performed as outlined in Johnson et al., 2023 ( 14 ). PknB was added to a 384-well plate that contained a 50uM solution of peptide substrate library mixtures (Anaspec, AS-62017-1 and AS-62335). Assay conditions were as follows: 50 mM HEPES, 200 mM NaCl, and 10% glycerol at pH 7.3. The reaction was initiated with 100 uM of ATP (50 μCi ml−1 γ-32P-ATP, Perkin-Elmer), followed by a 90-minute incubation. After the reaction, solutions were spotted onto streptavidin-conjugated membranes (Promega, V2861), where the biotinylated C-terminal ends of the peptides were tightly associated. The membranes were rinsed, and peptide phosphorylation amounts were imaged using a Typhoon FLA 7000 phosphorimager (GE). Densitometry matrices were generated by quantifying the raw data (GEL file) using ImageQuant (GE). Supplementary Materials Figs. S1–S9. Tables S1–S3. Data files S1–S8. Funding National Institute of Health grant R35 GM139656. Author contributions Conceptualization: BMO, NK Data curation: BMO, WY Formal analysis: BMO, WY, JLJ, TMY Funding acquisition: NK Investigation: BMO, JDL, SK, JLJ Methodology: BMO, WY, JDL, SK, NK Project administration: NK Resources: NK LCC Supervision: NK, SK Validation: BMO, JDL, JLJ Visualization: BMO, TMY Writing – original draft: BMO, JDL, NK Writing – review & editing: BMO WY, JDL, JLJ, NK Competing interests L.C.C. is a founder and member of the board of directors of Agios Pharmaceuticals and is a founder and receives research support from Petra Pharmaceuticals; is listed as an inventor on a patent (WO2019232403A1, Weill Cornell Medicine) for combination therapy for PI3K-associated disease or disorder, and the identification of therapeutic interventions to improve response to PI3K inhibitors for cancer treatment; is a co-founder and shareholder in Faeth Therapeutics; has equity in and consults for Cell Signaling Technologies, Volastra, Larkspur and 1 Base Pharmaceuticals; and consults for Loxo-Lilly. T.M.Y. is a co-founder of DeStroke. J.L.J has received consulting fees from Scorpion Therapeutics and Volastra Therapeutics. W.Y. is currently employed by Tessera Therapeutics. The other authors declare that they have no competing interests. Data and materials availability Jupyter notebooks and full protein sequence datasets are available at the following github repository: https://github.com/boboyle/Atlas-of-Bacterial-Serine-Threonine-Kinome.git . All other data required to evaluate the conclusions in the paper are present in the paper or the Supplementary Materials. Acknowledgements Thank you to members of Dr. Natarajan Kannan’s laboratory, Dr. Patrick Eyers, Dr. Dominic Byrne, and Dr. Benjamin Turk for helpful discussions and valuable feedback. References and Notes 1. ↵ G. Manning , D. B. Whyte , R. Martinez , T. Hunter , S. Sudarsanam , The Protein Kinase Complement of the Human Genome . Science 298 , 1912 – 1934 ( 2002 ). OpenUrl Abstract / FREE Full Text 2. ↵ G. Manning , G. D. Plowman , T. Hunter , S. Sudarsanam , Evolution of protein kinase signaling from yeast to man . Trends Biochem Sci 27 , 514 – 520 ( 2002 ). OpenUrl CrossRef PubMed Web of Science 3. ↵ P. Cohen , Protein kinases--the major drug targets of the twenty-first century? Nat Rev Drug Discov 1 , 309 – 315 ( 2002 ). OpenUrl CrossRef PubMed Web of Science 4. ↵ S. K. Hanks , A. M. Quinn , T. Hunter , The protein kinase family: conserved features and deduced phylogeny of the catalytic domains . Science 241 , 42 – 52 ( 1988 ). OpenUrl Abstract / FREE Full Text 5. P. J. Kennelly , Protein kinases and protein phosphatases in prokaryotes: a genomic perspective . FEMS Microbiol Lett 206 , 1 – 8 ( 2002 ). OpenUrl CrossRef PubMed Web of Science 6. P. J. Kennelly , Archaeal protein kinases and protein phosphatases: insights from genomics and biochemistry . Biochem J 370 , 373 – 389 ( 2003 ). OpenUrl Abstract / FREE Full Text 7. G. A. Khoury , R. C. Baliban , C. A. Floudas , Proteome-wide post-translational modification statistics: frequency analysis and curation of the swiss-prot database . Sci Rep 1 , 90 , srep00090 ( 2011 ). OpenUrl CrossRef PubMed 8. ↵ S. Ramazi , J. Zahiri , Posttranslational modifications in proteins: resources, tools and prediction methods . Database (Oxford) 2021 , baab012 ( 2021 ). OpenUrl CrossRef PubMed 9. ↵ L.-C. Huang , R. Taujale , N. Gravel , A. Venkat , W. Yeung , D. P. Byrne , P. A. Eyers , N. Kannan , KinOrtho: a method for mapping human kinase orthologs across the tree of life and illuminating understudied kinases . BMC Bioinformatics 22 , 446 ( 2021 ). OpenUrl CrossRef PubMed 10. ↵ M. Varjosalo , S. Keskitalo , A. Van Drogen , H. Nurkkala , A. Vichalkovski , R. Aebersold , M. Gstaiger , The protein interaction landscape of the human CMGC kinase group . Cell Rep 3 , 1306 – 1320 ( 2013 ). OpenUrl CrossRef PubMed Web of Science 11. ↵ N. Kannan , A. F. Neuwald , Evolutionary constraints associated with functional specificity of the CMGC protein kinases MAPK, CDK, GSK, SRPK, DYRK, and CK2alpha . Protein Sci 13 , 2059 – 2077 ( 2004 ). OpenUrl CrossRef PubMed Web of Science 12. L. R. Pearce , D. Komander , D. R. Alessi , The nuts and bolts of AGC protein kinases . Nat Rev Mol Cell Biol 11 , 9 – 22 ( 2010 ). OpenUrl CrossRef PubMed Web of Science 13. J. M. Arencibia , D. Pastor-Flores , A. F. Bauer , J. O. Schulze , R. M. Biondi , AGC protein kinases: from structural mechanism of regulation to allosteric drug development for the treatment of human diseases . Biochim Biophys Acta 1834 , 1302 – 1321 ( 2013 ). OpenUrl CrossRef PubMed 14. ↵ J. L. Johnson , T. M. Yaron , E. M. Huntsman , A. Kerelsky , J. Song , A. Regev , T.-Y. Lin , K. Liberatore , D. M. Cizin , B. M. Cohen , N. Vasan , Y. Ma , K. Krismer , J. T. Robles , B. van de Kooij , A. E. van Vlimmeren , N. Andrée-Busch , N. F. Käufer , M. V. Dorovkov , A. G. Ryazanov , Y. Takagi , E. R. Kastenhuber , M. D. Goncalves , B. D. Hopkins , O. Elemento , D. J. Taatjes , A. Maucuer , A. Yamashita , A. Degterev , M. Uduman , J. Lu , S. D. Landry , B. Zhang , I. Cossentino , R. Linding , J. Blenis , P. V. Hornbeck , B. E. Turk , M. B. Yaffe , L. C. Cantley , An atlas of substrate specificities for the human serine/threonine kinome . Nature 613 , 759 – 766 ( 2023 ). OpenUrl CrossRef PubMed 15. R. Roskoski , ERK1/2 MAP kinases: structure, function, and regulation . Pharmacol Res 66 , 105 – 143 ( 2012 ). OpenUrl CrossRef PubMed 16. ↵ N. Kannan , N. Haste , S. S. Taylor , A. F. Neuwald , The hallmark of AGC kinase functional divergence is its C-terminal tail, a cis-acting regulatory module . Proc Natl Acad Sci U S A 104 , 1272 – 1277 ( 2007 ). OpenUrl Abstract / FREE Full Text 17. A. Venkat , G. Watterson , D. P. Byrne , B. O’Boyle , S. Shrestha , N. Gravel , E. E. Fairweather , L. A. Daly , C. Bunn , W. Yeung , I. Aggarwal , S. Katiyar , C. E. Eyers , P. A. Eyers , N. Kannan , Mechanistic and evolutionary insights into isoform-specific “supercharging” in DCLK family kinases . Elife 12 , RP87958 ( 2023 ). OpenUrl CrossRef PubMed 18. ↵ F. Preuss , D. Chatterjee , S. Mathea , S. Shrestha , J. St-Germain , M. Saha , N. Kannan , B. Raught , R. Rottapel , S. Knapp , Nucleotide Binding, Evolutionary Insights, and Interaction Partners of the Pseudokinase Unc-51-like Kinase 4 . Structure 28 , 1184 – 1196 .e6 ( 2020 ). OpenUrl CrossRef 19. ↵ M. W. Karaman , S. Herrgard , D. K. Treiber , P. Gallant , C. E. Atteridge , B. T. Campbell , K. W. Chan , P. Ciceri , M. I. Davis , P. T. Edeen , R. Faraoni , M. Floyd , J. P. Hunt , D. J. Lockhart , Z. V. Milanov , M. J. Morrison , G. Pallares , H. K. Patel , S. Pritchard , L. M. Wodicka , P. P. Zarrinkar , A quantitative analysis of kinase inhibitor selectivity . Nat Biotechnol 26 , 127 – 132 ( 2008 ). OpenUrl CrossRef PubMed Web of Science 20. M. I. Davis , J. P. Hunt , S. Herrgard , P. Ciceri , L. M. Wodicka , G. Pallares , M. Hocker , D. K. Treiber , P. P. Zarrinkar , Comprehensive analysis of kinase inhibitor selectivity . Nat Biotechnol 29 , 1046 – 1051 ( 2011 ). OpenUrl CrossRef PubMed 21. K. S. Bhullar , N. O. Lagarón , E. M. McGowan , I. Parmar , A. Jha , B. P. Hubbard , H. P. V. Rupasinghe , Kinase-targeted cancer therapies: progress, challenges and future directions . Mol Cancer 17 , 48 ( 2018 ). OpenUrl CrossRef PubMed 22. P. Cohen , D. Cross , P. A. Jänne , Kinase drug discovery 20 years after imatinib: progress and future directions . Nat Rev Drug Discov 20 , 551 – 569 ( 2021 ). OpenUrl CrossRef PubMed 23. ↵ F. M. Ferguson , N. S. Gray , Kinase inhibitors: the road ahead . Nat Rev Drug Discov 17 , 353 – 377 ( 2018 ). OpenUrl CrossRef PubMed 24. ↵ N. Kannan , S. S. Taylor , Y. Zhai , J. C. Venter , G. Manning , Structural and functional diversity of the microbial kinome . PLoS Biol 5 , e17 ( 2007 ). OpenUrl CrossRef PubMed 25. ↵ A. Kwon , S. Scott , R. Taujale , W. Yeung , K. J. Kochut , P. A. Eyers , N. Kannan , Tracing the origin and evolution of pseudokinases across the tree of life . Sci Signal 12 , eaav3810 ( 2019 ). OpenUrl Abstract / FREE Full Text 26. ↵ C. Grangeasse , S. Nessler , I. Mijakovic , Bacterial tyrosine kinases: evolution, biological function and structural insights . Phil. Trans. R. Soc. B 367 , 2640 – 2655 ( 2012 ). OpenUrl CrossRef PubMed 27. ↵ M. Foussard , S. Cabantous , J.-D. Pédelacq , V. Guillet , S. Tranier , L. Mourey , C. Birck , J.-P. Samama , The molecular puzzle of two-component signaling cascades . Microbes and Infection 3 , 417 – 424 ( 2001 ). OpenUrl CrossRef PubMed Web of Science 28. ↵ I. A. Stancik , M. S. Šestak , B. Ji , M. Axelson-Fisk , D. Franjevic , C. Jers , T. Domazet-Lošo , I. Mijakovic , Serine/Threonine Protein Kinases from Bacteria, Archaea and Eukarya Share a Common Evolutionary Origin Deeply Rooted in the Tree of Life . J Mol Biol 430 , 27 – 32 ( 2018 ). OpenUrl CrossRef PubMed 29. ↵ W. Zhang , J. Munoz-Dorado , M. Inouye , S. Inouye , Identification of a putative eukaryotic-like protein kinase family in the developmental bacterium Myxococcus xanthus . J Bacteriol 174 , 5450 – 5453 ( 1992 ). OpenUrl Abstract / FREE Full Text 30. ↵ S. N. Nagarajan , C. Lenoir , C. Grangeasse , Recent advances in bacterial signaling by serine/threonine protein kinases . Trends Microbiol 30 , 553 – 566 ( 2022 ). OpenUrl CrossRef PubMed 31. S. N. Nagarajan , S. Upadhyay , Y. Chawla , S. Khan , S. Naz , J. Subramanian , S. Gandotra , V. K. Nandicoori , Protein kinase A (PknA) of Mycobacterium tuberculosis is independently activated and is critical for growth in vitro and survival of the pathogen in the host . J Biol Chem 290 , 9626 – 9645 ( 2015 ). OpenUrl Abstract / FREE Full Text 32. ↵ Y. Chawla , S. Upadhyay , S. Khan , S. N. Nagarajan , F. Forti , V. K. Nandicoori , Protein kinase B (PknB) of Mycobacterium tuberculosis is essential for growth of the pathogen in vitro as well as for survival within the host . J Biol Chem 289 , 13858 – 13875 ( 2014 ). OpenUrl Abstract / FREE Full Text 33. D. A. Pensinger , A. J. Schaenzer , J.-D. Sauer , Do Shoot the Messenger: PASTA Kinases as Virulence Determinants and Antibiotic Targets . Trends Microbiol 26 , 56 – 69 ( 2018 ). OpenUrl CrossRef PubMed 34. N. Dhasmana , N. Kumar , A. Gangwal , C. C. Keshavam , L. K. Singh , N. Sangwan , P. Nashier , S. Biswas , A. P. Pomerantsev , S. H. Leppla , Y. Singh , M. Gupta , Bacillus anthracis chain length, a virulence determinant, is regulated by membrane localized serine/threonine protein kinase PrkC . J Bacteriol 203 , e00582 – 20 , JB.00582–20 ( 2021 ). OpenUrl PubMed 35. ↵ D. A. Pensinger , K. M. Boldon , G. Y. Chen , W. J. B. Vincent , K. Sherman , M. Xiong , A. J. Schaenzer , E. R. Forster , J. Coers , R. Striker , J.-D. Sauer , The Listeria monocytogenes PASTA Kinase PrkA and Its Substrate YvcK Are Required for Cell Wall Homeostasis, Metabolism, and Virulence . PLoS Pathog 12 , e1006001 ( 2016 ). OpenUrl CrossRef PubMed 36. B. Rieck , G. Degiacomi , M. Zimmermann , A. Cascioferro , F. Boldrin , N. R. Lazar-Adler , A. R. Bottrill , F. le Chevalier , W. Frigui , M. Bellinzoni , M.-N. Lisa , P. M. Alzari , L. Nguyen , R. Brosch , U. Sauer , R. Manganelli , H. M. O’Hare , PknG senses amino acid availability to control metabolism and virulence of Mycobacterium tuberculosis . PLoS Pathog 13 , e1006399 ( 2017 ). OpenUrl CrossRef PubMed 37. J. Ge , H. Xu , T. Li , Y. Zhou , Z. Zhang , S. Li , L. Liu , F. Shao , A Legionella type IV effector activates the NF-kappaB pathway by phosphorylating the IkappaB family of inhibitors . Proc Natl Acad Sci U S A 106 , 13725 – 13730 ( 2009 ). OpenUrl Abstract / FREE Full Text 38. C. Michard , D. Sperandio , N. Baïlo , J. Pizarro-Cerdá , L. LeClaire , E. Chadeau-Argaud , I. Pombo-Grégoire , E. Hervet , A. Vianney , C. Gilbert , M. Faure , P. Cossart , P. Doublet , The Legionella Kinase LegK2 Targets the ARP2/3 Complex To Inhibit Actin Nucleation on Phagosomes and Allow Bacterial Evasion of the Late Endocytic Pathway . mBio 6 , e00354 – 00315 ( 2015 ). OpenUrl CrossRef PubMed 39. P.-C. Lee , M. P. Machner , The Legionella Effector Kinase LegK7 Hijacks the Host Hippo Pathway to Promote Infection . Cell Host Microbe 24 , 429 – 438 .e6 ( 2018 ). OpenUrl CrossRef PubMed 40. ↵ S. M. Moss , I. R. Taylor , D. Ruggero , J. E. Gestwicki , K. M. Shokat , S. Mukherjee , A Legionella pneumophila Kinase Phosphorylates the Hsp70 Chaperone Family to Inhibit Eukaryotic Protein Synthesis . Cell Host Microbe 25 , 454 – 462 .e6 ( 2019 ). OpenUrl CrossRef PubMed 41. ↵ A. Fleurie , S. Manuse , C. Zhao , N. Campo , C. Cluzel , J.-P. Lavergne , C. Freton , C. Combet , S. Guiral , B. Soufi , B. Macek , E. Kuru , M. S. VanNieuwenhze , Y. V. Brun , A.-M. Di Guilmi , J.-P. Claverys , A. Galinier , C. Grangeasse , Interplay of the serine/threonine-kinase StkP and the paralogs DivIVA and GpsB in pneumococcal cell elongation and division . PLoS Genet 10 , e1004275 ( 2014 ). OpenUrl CrossRef PubMed 42. P. Kaur , M. Rausch , B. Malakar , U. Watson , N. P. Damle , Y. Chawla , S. Srinivasan , K. Sharma , T. Schneider , G. D. Jhingan , D. Saini , D. Mohanty , F. Grein , V. K. Nandicoori , LipidII interaction with specific residues of Mycobacterium tuberculosis PknB extracytoplasmic domain governs its optimal activation . Nat Commun 10 , 1231 ( 2019 ). OpenUrl CrossRef PubMed 43. L. Zucchini , C. Mercy , P. S. Garcia , C. Cluzel , V. Gueguen-Chaignon , F. Galisson , C. Freton , S. Guiral , C. Brochier-Armanet , P. Gouet , C. Grangeasse , PASTA repeats of the protein kinase StkP interconnect cell constriction and separation of Streptococcus pneumoniae . Nat Microbiol 3 , 197 – 209 ( 2018 ). OpenUrl PubMed 44. A. Fleurie , C. Lesterlin , S. Manuse , C. Zhao , C. Cluzel , J.-P. Lavergne , M. Franz-Wachtel , B. Macek , C. Combet , E. Kuru , M. S. VanNieuwenhze , Y. V. Brun , D. Sherratt , C. Grangeasse , MapZ marks the division sites and positions FtsZ rings in Streptococcus pneumoniae . Nature 516 , 259 – 262 ( 2014 ). OpenUrl CrossRef PubMed 45. N. Holečková , L. Doubravová , O. Massidda , V. Molle , K. Buriánková , O. Benada , O. Kofroňová , A. Ulrych , P. Branny , LocZ is a new cell division protein involved in proper septum placement in Streptococcus pneumoniae . mBio 6 , e01700 – 01714 ( 2014 ). OpenUrl CrossRef PubMed 46. A. Ulrych , N. Holečková , J. Goldová , L. Doubravová , O. Benada , O. Kofroňová , P. Halada , P. Branny , Characterization of pneumococcal Ser/Thr protein phosphatase phpP mutant and identification of a novel PhpP substrate, putative RNA binding protein Jag . BMC Microbiol 16 , 247 ( 2016 ). 47. J. J. Zheng , A. J. Perez , H.-C. T. Tsui , O. Massidda , M. E. Winkler , Absence of the KhpA and KhpB (JAG/EloR) RNA-binding proteins suppresses the requirement for PBP2b by overproduction of FtsA in Streptococcus pneumoniae D39 . Mol Microbiol 106 , 793 – 814 ( 2017 ). OpenUrl CrossRef PubMed 48. M. J. Bergé , C. Mercy , I. Mortier-Barrière , M. S. VanNieuwenhze , Y. V. Brun , C. Grangeasse , P. Polard , N. Campo , A programmed cell division delay preserves genome integrity during natural genetic transformation in Streptococcus pneumoniae . Nat Commun 8 , 1621 ( 2017 ). OpenUrl CrossRef PubMed 49. ↵ C.-M. Kang , D. W. Abbott , S. T. Park , C. C. Dascher , L. C. Cantley , R. N. Husson , The Mycobacterium tuberculosis serine/threonine kinases PknA and PknB: substrate identification and regulation of cell shape . Genes Dev 19 , 1692 – 1704 ( 2005 ). OpenUrl Abstract / FREE Full Text 50. ↵ M. Rausch , J. P. Deisinger , H. Ulm , A. Müller , W. Li , P. Hardt , X. Wang , X. Li , M. Sylvester , M. Engeser , W. Vollmer , C. E. Müller , H. G. Sahl , J. C. Lee , T. Schneider , Coordination of capsule assembly and cell wall biosynthesis in Staphylococcus aureus . Nat Commun 10 , 1404 ( 2019 ). OpenUrl CrossRef PubMed 51. ↵ C. J. Kristich , J. L. Little , C. L. Hall , J. S. Hoff , Reciprocal regulation of cephalosporin resistance in Enterococcus faecalis . mBio 2 , e00199 – 00111 ( 2011 ). OpenUrl CrossRef PubMed 52. E. Cuenot , T. Garcia-Garcia , T. Douche , O. Gorgette , P. Courtin , S. Denis-Quanquin , S. Hoys , Y. D. N. Tremblay , M. Matondo , M.-P. Chapot-Chartier , C. Janoir , B. Dupuy , T. Candela , I. Martin-Verstraete , The Ser/Thr Kinase PrkC Participates in Cell Wall Homeostasis and Antimicrobial Resistance in Clostridium difficile . Infect Immun 87 , e00005 – 19 ( 2019 ). OpenUrl PubMed 53. E. A. Libby , S. Reuveni , J. Dworkin , Multisite phosphorylation drives phenotypic variation in (p)ppGpp synthetase-dependent antibiotic tolerance . Nat Commun 10 , 5133 ( 2019 ). OpenUrl CrossRef PubMed 54. S. L. Kellogg , C. J. Kristich , Convergence of PASTA Kinase and Two-Component Signaling in Response to Cell Wall Stress in Enterococcus faecalis . J Bacteriol 200 , e00086 – 18 ( 2018 ). OpenUrl PubMed 55. A. Chatterjee , R. Poon , S. S. Chatterjee , Stp1 Loss of Function Promotes β-Lactam Resistance in Staphylococcus aureus That Is Independent of Classical Genes . Antimicrob Agents Chemother 64 , e02222 – 19 ( 2020 ). OpenUrl PubMed 56. ↵ S. Kant , S. Asthana , D. Missiakas , V. Pancholi , A novel STK1-targeted small-molecule as an “antibiotic resistance breaker” against multidrug-resistant Staphylococcus aureus . Sci Rep 7 , 5067 ( 2017 ). OpenUrl CrossRef PubMed 57. ↵ M. Z. Khan , P. Kaur , V. K. Nandicoori , Targeting the messengers: Serine/threonine protein kinases as potential targets for antimycobacterial drug development . IUBMB Life 70 , 889 – 904 ( 2018 ). OpenUrl CrossRef PubMed 58. J. V. V. B. Borba , A. C. Silva , M. N. N. Lima , S. S. Mendonca , N. Furnham , F. T. M. Costa , C. H. Andrade , Chemogenomics and bioinformatics approaches for prioritizing kinases as drug targets for neglected tropical diseases . Adv Protein Chem Struct Biol 124 , 187 – 223 ( 2021 ). OpenUrl CrossRef PubMed 59. A. King , M. S. Blackledge , Evaluation of small molecule kinase inhibitors as novel antimicrobial and antibiofilm agents . Chem Biol Drug Des 98 , 1038 – 1064 ( 2021 ). OpenUrl CrossRef PubMed 60. The next giant step for microbes . Nat Biotechnol 41 , 1 ( 2023 ). OpenUrl CrossRef PubMed 61. ↵ V. N. Danilenko , D. I. Osolodkin , S. A. Lakatosh , M. N. Preobrazhenskaya , A. A. Shtil , Bacterial eukaryotic type serine-threonine protein kinases: from structural biology to targeted anti-infective drug design . Curr Top Med Chem 11 , 1352 – 1369 ( 2011 ). OpenUrl CrossRef PubMed 62. ↵ N. Tyagi , K. Anamika , N. Srinivasan , A framework for classification of prokaryotic protein kinases . PLoS One 5 , e10608 ( 2010 ). OpenUrl CrossRef PubMed 63. ↵ A. Odelgard , E. Hägglund , L. Guy , S. G. E. Andersson , Phylogeny and Expansion of Serine/Threonine Kinases in Phagocytotic Bacteria in the Phylum Planctomycetota . Genome Biol Evol 16 , evae068 ( 2024 ). OpenUrl CrossRef PubMed 64. ↵ T. Paysan-Lafosse , A. Andreeva , M. Blum , S. R. Chuguransky , T. Grego , B. L. Pinto , G. A. Salazar , M. L. Bileschi , F. Llinares-López , L. Meng-Papaxanthos , L. J. Colwell , N. V. Grishin , R. D. Schaeffer , D. Clementel , S. C. E. Tosatto , E. Sonnhammer , V. Wood , A. Bateman , The Pfam protein families database: embracing AI/ML . Nucleic Acids Research 53 , D523 – D534 ( 2025 ). OpenUrl CrossRef PubMed 65. ↵ W. Yeung , A. Kwon , R. Taujale , C. Bunn , A. Venkat , N. Kannan , Evolution of Functional Diversity in the Holozoan Tyrosine Kinome . Mol Biol Evol 38 , 5625 – 5639 ( 2021 ). OpenUrl CrossRef PubMed 66. E. Talevich , N. Kannan , Structural and evolutionary adaptation of rhoptry kinases and pseudokinases, a family of coccidian virulence factors . BMC Evol Biol 13 , 117 ( 2013 ). OpenUrl CrossRef PubMed 67. P. A. Eyers , K. Keeshan , N. Kannan , Tribbles in the 21st Century: The Evolving Roles of Tribbles Pseudokinases in Biology and Disease . Trends Cell Biol 27 , 284 – 298 ( 2017 ). OpenUrl CrossRef PubMed 68. S. Shrestha , D. P. Byrne , J. A. Harris , N. Kannan , P. A. Eyers , Cataloguing the dead: breathing new life into pseudokinase research . FEBS J 287 , 4150 – 4169 ( 2020 ). OpenUrl CrossRef PubMed 69. C. Agnew , L. Liu , S. Liu , W. Xu , L. You , W. Yeung , N. Kannan , D. Jablons , N. Jura , The crystal structure of the protein kinase HIPK2 reveals a unique architecture of its CMGC-insert region . J Biol Chem 294 , 13545 – 13559 ( 2019 ). OpenUrl Abstract / FREE Full Text 70. N. Kannan , A. F. Neuwald , S. S. Taylor , Analogous regulatory sites within the alphaC-beta4 loop regions of ZAP-70 tyrosine kinase and AGC kinases . Biochim Biophys Acta 1784 , 27 – 32 ( 2008 ). OpenUrl CrossRef PubMed Web of Science 71. ↵ B. O’Boyle , S. Shrestha , K. Kochut , P. A. Eyers , N. Kannan , Computational tools and resources for pseudokinase research . Methods Enzymol 667 , 403 – 426 ( 2022 ). OpenUrl CrossRef PubMed 72. ↵ A. F. Neuwald , Rapid detection, classification and accurate alignment of up to a million or more related protein sequences . Bioinformatics 25 , 1869 – 1875 ( 2009 ). OpenUrl CrossRef PubMed Web of Science 73. ↵ N. A. O’Leary , M. W. Wright , J. R. Brister , S. Ciufo , D. Haddad , R. McVeigh , B. Rajput , B. Robbertse , B. Smith-White , D. Ako-Adjei , A. Astashyn , A. Badretdin , Y. Bao , O. Blinkova , V. Brover , V. Chetvernin , J. Choi , E. Cox , O. Ermolaeva , C. M. Farrell , T. Goldfarb , T. Gupta , D. Haft , E. Hatcher , W. Hlavina , V. S. Joardar , V. K. Kodali , W. Li , D. Maglott , P. Masterson , K. M. McGarvey , M. R. Murphy , K. O’Neill , S. Pujar , S. H. Rangwala , D. Rausch , L. D. Riddick , C. Schoch , A. Shkeda , S. S. Storz , H. Sun , F. Thibaud-Nissen , I. Tolstoy , R. E. Tully , A. R. Vatsan , C. Wallin , D. Webb , W. Wu , M. J. Landrum , A. Kimchi , T. Tatusova , M. DiCuccio , P. Kitts , T. D. Murphy , K. D. Pruitt , Reference sequence (RefSeq) database at NCBI: current status, taxonomic expansion, and functional annotation . Nucleic Acids Res 44 , D733 – 745 ( 2016 ). OpenUrl CrossRef PubMed 74. ↵ UniProt Consortium , UniProt: the Universal Protein Knowledgebase in 2023 . Nucleic Acids Res 51 , D523 – D531 ( 2023 ). OpenUrl CrossRef PubMed 75. ↵ A. F. Neuwald , A Bayesian Sampler for Optimization of Protein Domain Hierarchies . Journal of Computational Biology 21 , 269 – 286 ( 2014 ). OpenUrl CrossRef PubMed 76. ↵ J. Abramson , J. Adler , J. Dunger , R. Evans , T. Green , A. Pritzel , O. Ronneberger , L. Willmore , A. J. Ballard , J. Bambrick , S. W. Bodenstein , D. A. Evans , C.-C. Hung , M. O’Neill , D. Reiman , K. Tunyasuvunakool , Z. Wu , A. Žemgulytė , E. Arvaniti , C. Beattie , O. Bertolli , A. Bridgland , A. Cherepanov , M. Congreve , A. I. Cowen-Rivers , A. Cowie , M. Figurnov , F. B. Fuchs , H. Gladman , R. Jain , Y. A. Khan , C. M. R. Low , K. Perlin , A. Potapenko , P. Savy , S. Singh , A. Stecula , A. Thillaisundaram , C. Tong , S. Yakneen , E. D. Zhong , M. Zielinski , A. Žídek , V. Bapst , P. Kohli , M. Jaderberg , D. Hassabis , J. M. Jumper , Accurate structure prediction of biomolecular interactions with AlphaFold 3 . Nature 630 , 493 – 500 ( 2024 ). OpenUrl CrossRef PubMed 77. ↵ C. L. Gee , K. G. Papavinasasundaram , S. R. Blair , C. E. Baer , A. M. Falick , D. S. King , J. E. Griffin , H. Venghatakrishnan , A. Zukauskas , J.-R. Wei , R. K. Dhiman , D. C. Crick , E. J. Rubin , C. M. Sassetti , T. Alber , A phosphorylated pseudokinase complex controls cell wall synthesis in mycobacteria . Sci Signal 5 , ra7 ( 2012 ). OpenUrl Abstract / FREE Full Text 78. ↵ E. A. Barka , P. Vatsa , L. Sanchez , N. Gaveau-Vaillant , C. Jacquard , J. P. Meier-Kolthoff , H.-P. Klenk , C. Clément , Y. Ouhdouch , G. P. van Wezel , Taxonomy , Physiology , and Natural Products of Actinobacteria . Microbiol Mol Biol Rev 80 , 1 – 43 ( 2016 ). OpenUrl CrossRef PubMed 79. ↵ X. Huang , D. Pinto , G. Fritz , T. Mascher , Environmental Sensing in Actinobacteria: a Comprehensive Survey on the Signaling Capacity of This Phylum . J Bacteriol 197 , 2517 – 2535 ( 2015 ). OpenUrl Abstract / FREE Full Text 80. ↵ K. Flärdh , M. J. Buttner , Streptomyces morphogenetics: dissecting differentiation in a filamentous bacterium . Nat Rev Microbiol 7 , 36 – 49 ( 2009 ). OpenUrl CrossRef PubMed Web of Science 81. ↵ H. Ogawara , Distribution of PASTA domains in penicillin-binding proteins and serine/threonine kinases of Actinobacteria . J Antibiot (Tokyo ) 69 , 660 – 685 ( 2016 ). OpenUrl CrossRef PubMed 82. ↵ A. Ruggiero , P. De Simone , G. Smaldone , F. Squeglia , R. Berisio , Bacterial cell division regulation by Ser/Thr kinases: a structural perspective . Curr Protein Pept Sci 13 , 756 – 766 ( 2012 ). OpenUrl CrossRef PubMed 83. L. Nováková , S. Bezousková , P. Pompach , P. Spidlová , L. Sasková , J. Weiser , P. Branny , Identification of multiple substrates of the StkP Ser/Thr protein kinase in Streptococcus pneumoniae . J Bacteriol 192 , 3629 – 3638 ( 2010 ). OpenUrl Abstract / FREE Full Text 84. ↵ P. Barthe , G. V. Mukamolova , C. Roumestand , M. Cohen-Gonsaud , The structure of PknB extracellular PASTA domain from mycobacterium tuberculosis suggests a ligand-dependent kinase activation . Structure 18 , 606 – 615 ( 2010 ). OpenUrl CrossRef PubMed 85. ↵ L. D. D’Andrea , L. Regan , TPR proteins: the versatile helix . Trends Biochem Sci 28 , 655 – 662 ( 2003 ). OpenUrl CrossRef PubMed Web of Science 86. ↵ J. E. Bröms , P. J. Edqvist , A. Forsberg , M. S. Francis , Tetratricopeptide repeats are essential for PcrH chaperone function in Pseudomonas aeruginosa type III secretion . FEMS Microbiol Lett 256 , 57 – 66 ( 2006 ). OpenUrl CrossRef PubMed Web of Science 87. P. J. Edqvist , J. E. Bröms , H. J. Betts , A. Forsberg , M. J. Pallen , M. S. Francis , Tetratricopeptide repeats in the type III secretion chaperone, LcrH: their role in substrate binding and secretion . Mol Microbiol 59 , 31 – 44 ( 2006 ). OpenUrl CrossRef PubMed Web of Science 88. S. Chakraborty , M. Monfett , T. M. Maier , J. L. Benach , D. W. Frank , D. G. Thanassi , Type IV pili in Francisella tularensis: roles of pilF and pilT in fiber assembly, host cell adherence, and virulence . Infect Immun 76 , 2852 – 2861 ( 2008 ). OpenUrl Abstract / FREE Full Text 89. ↵ J. Chao , D. Wong , X. Zheng , V. Poirier , H. Bach , Z. Hmama , Y. Av-Gay , Protein kinase and phosphatase signaling in Mycobacterium tuberculosis physiology and pathogenesis . Biochim Biophys Acta 1804 , 620 – 627 ( 2010 ). OpenUrl CrossRef PubMed Web of Science 90. ↵ N. Scherr , S. Honnappa , G. Kunz , P. Mueller , R. Jayachandran , F. Winkler , J. Pieters , M. O. Steinmetz , Structural basis for the specific inhibition of protein kinase G, a virulence factor of Mycobacterium tuberculosis . Proc Natl Acad Sci U S A 104 , 12151 – 12156 ( 2007 ). OpenUrl Abstract / FREE Full Text 91. ↵ P. D. Mace , J. M. Murphy , There’s more to death than life: Noncatalytic functions in kinase and pseudokinase signaling . J Biol Chem 296 , 100705 ( 2021 ). OpenUrl CrossRef PubMed 92. ↵ J. B. Sheetz , M. A. Lemmon , Looking lively: emerging principles of pseudokinase signaling . Trends Biochem Sci 47 , 875 – 891 ( 2022 ). OpenUrl CrossRef PubMed 93. ↵ J. M. Murphy , Q. Zhang , S. N. Young , M. L. Reese , F. P. Bailey , P. A. Eyers , D. Ungureanu , H. Hammaren , O. Silvennoinen , L. N. Varghese , K. Chen , A. Tripaydonis , N. Jura , K. Fukuda , J. Qin , Z. Nimchuk , M. B. Mudgett , S. Elowe , C. L. Gee , L. Liu , R. J. Daly , G. Manning , J. J. Babon , I. S. Lucet , A robust methodology to subclassify pseudokinases based on their nucleotide-binding properties . Biochem J 457 , 323 – 334 ( 2014 ). OpenUrl Abstract / FREE Full Text 94. ↵ B. Xu , J. M. English , J. L. Wilsbacher , S. Stippec , E. J. Goldsmith , M. H. Cobb , WNK1, a novel mammalian serine/threonine protein kinase lacking the catalytic lysine in subdomain II . J Biol Chem 275 , 16795 – 16801 ( 2000 ). OpenUrl Abstract / FREE Full Text 95. ↵ D. F. Brennan , A. C. Dar , N. T. Hertz , W. C. H. Chao , A. L. Burlingame , K. M. Shokat , D. Barford , A Raf-induced allosteric transition of KSR stimulates phosphorylation of MEK . Nature 472 , 366 – 369 ( 2011 ). OpenUrl CrossRef PubMed Web of Science 96. ↵ J. Hu , H. Yu , A. P. Kornev , J. Zhao , E. L. Filbert , S. S. Taylor , A. S. Shaw , Mutation that blocks ATP binding creates a pseudokinase stabilizing the scaffolding function of kinase suppressor of Ras, CRAF and BRAF . Proc Natl Acad Sci U S A 108 , 6067 – 6072 ( 2011 ). OpenUrl Abstract / FREE Full Text 97. ↵ E. Talevich , A. Mirza , N. Kannan , Structural and evolutionary divergence of eukaryotic protein kinases in Apicomplexa . BMC Evol Biol 11 , 321 ( 2011 ). 98. ↵ S. S. Taylor , A. P. Kornev , Protein kinases: evolution of dynamic regulatory proteins . Trends Biochem Sci 36 , 65 – 77 ( 2011 ). OpenUrl CrossRef PubMed Web of Science 99. ↵ D. Fabbro , S. W. Cowan-Jacob , H. Moebitz , Ten things you should know about protein kinases: IUPHAR Review 14 . Br J Pharmacol 172 , 2675 – 2700 ( 2015 ). OpenUrl CrossRef PubMed 100. ↵ A. A. Adzhubei , M. J. E. Sternberg , A. A. Makarov , Polyproline-II helix in proteins: structure and function . J Mol Biol 425 , 2100 – 2132 ( 2013 ). OpenUrl CrossRef PubMed 101. ↵ S. F. F. Pereira , L. Goss , J. Dworkin , Eukaryote-like serine/threonine kinases and phosphatases in bacteria . Microbiol Mol Biol Rev 75 , 192 – 212 ( 2011 ). OpenUrl Abstract / FREE Full Text 102. ↵ S. Prisic , S. Dankwa , D. Schwartz , M. F. Chou , J. W. Locasale , C.-M. Kang , G. Bemis , G. M. Church , H. Steen , R. N. Husson , Extensive phosphorylation with overlapping specificity by Mycobacterium tuberculosis serine/threonine protein kinases . Proc Natl Acad Sci U S A 107 , 7521 – 7526 ( 2010 ). OpenUrl Abstract / FREE Full Text 103. ↵ S. Manuse , A. Fleurie , L. Zucchini , C. Lesterlin , C. Grangeasse , Role of eukaryotic-like serine/threonine kinases in bacterial cell division and morphogenesis . FEMS Microbiol Rev 40 , 41 – 56 ( 2016 ). OpenUrl CrossRef PubMed 104. ↵ D. Djorić , N. E. Minton , C. J. Kristich , The enterococcal PASTA kinase: A sentinel for cell envelope stress . Mol Oral Microbiol 36 , 132 – 144 ( 2021 ). OpenUrl CrossRef PubMed 105. ↵ P. Fernandez , B. Saint-Joanis , N. Barilone , M. Jackson , B. Gicquel , S. T. Cole , P. M. Alzari , The Ser/Thr protein kinase PknB is essential for sustaining mycobacterial growth . J Bacteriol 188 , 7778 – 7784 ( 2006 ). OpenUrl Abstract / FREE Full Text 106. A. Wehenkel , P. Fernandez , M. Bellinzoni , V. Catherinot , N. Barilone , G. Labesse , M. Jackson , P. M. Alzari , The structure of PknB in complex with mitoxantrone, an ATP-competitive inhibitor, suggests a mode of protein kinase regulation in mycobacteria . FEBS Lett 580 , 3018 – 3022 ( 2006 ). OpenUrl CrossRef PubMed 107. D. A. Maslov , A. V. Korotina , K. V. Shur , A. A. Vatlin , O. B. Bekker , S. G. Tolshchina , R. I. Ishmetova , N. K. Ignatenko , G. L. Rusinov , V. N. Charushin , V. N. Danilenko , Synthesis and antimycobacterial activity of imidazo[1,2-b][1,2,4,5]tetrazines . Eur J Med Chem 178 , 39 – 47 ( 2019 ). OpenUrl CrossRef PubMed 108. A. J. Schaenzer , N. Wlodarchak , D. H. Drewry , W. J. Zuercher , W. E. Rose , R. Striker , J.-D. Sauer , A screen for kinase inhibitors identifies antimicrobial imidazopyridine aminofurazans as specific inhibitors of the Listeria monocytogenes PASTA kinase PrkA . J Biol Chem 292 , 17037 – 17045 ( 2017 ). OpenUrl Abstract / FREE Full Text 109. ↵ H. Li , T. Li , Q. Hu , Z. Yao , L. Li , Q. Huang , R. Zhou , Inhibitors targeting the autophosphorylation of serine/threonine kinase of Streptococcus suis show potent antimicrobial activity . Front Microbiol 13 , 990091 ( 2022 ). OpenUrl CrossRef PubMed 110. ↵ R. Roskoski , Properties of FDA-approved small molecule protein kinase inhibitors: A 2021 update . Pharmacol Res 165 , 105463 ( 2021 ). 111. ↵ M. Zhang , Y. Liu , H. Jang , R. Nussinov , Strategy toward Kinase-Selective Drug Discovery . J Chem Theory Comput 19 , 1615 – 1628 ( 2023 ). OpenUrl CrossRef PubMed 112. Z. Gagic , D. Ruzic , N. Djokovic , T. Djikic , K. Nikolic , In silico Methods for Design of Kinase Inhibitors as Anticancer Drugs . Front Chem 7 , 873 ( 2019 ). OpenUrl PubMed 113. B. A. Haubrich , D. C. Swinney , Enzyme Activity Assays for Protein Kinases: Strategies to Identify Active Substrates . Curr Drug Discov Technol 13 , 2 – 15 ( 2016 ). OpenUrl CrossRef PubMed 114. ↵ F. Ferrè , A. Palmeri , M. Helmer-Citterich , Computational methods for analysis and inference of kinase/inhibitor relationships . Front Genet 5 , 196 ( 2014 ). OpenUrl PubMed 115. ↵ The PyMOL Molecular Graphics System, version 2.3.0, Schrödinger, LLC . 116. ↵ A. Waterhouse , M. Bertoni , S. Bienert , G. Studer , G. Tauriello , R. Gumienny , F. T. Heer , T. A. P. de Beer , C. Rempfer , L. Bordoli , R. Lepore , T. Schwede , SWISS-MODEL: homology modelling of protein structures and complexes . Nucleic Acids Res 46 , W296 – W303 ( 2018 ). OpenUrl CrossRef PubMed 117. ↵ M. N. Price , P. S. Dehal , A. P. Arkin , FastTree 2--approximately maximum-likelihood trees for large alignments . PLoS One 5 , e9490 ( 2010 ). OpenUrl CrossRef PubMed 118. ↵ W. Li , A. Godzik , Cd-hit: a fast program for clustering and comparing large sets of protein or nucleotide sequences . Bioinformatics 22 , 1658 – 1659 ( 2006 ). OpenUrl CrossRef PubMed Web of Science 119. ↵ L.-T. Nguyen , H. A. Schmidt , A. von Haeseler , B. Q. Minh , IQ-TREE: a fast and effective stochastic algorithm for estimating maximum-likelihood phylogenies . Mol Biol Evol 32 , 268 – 274 ( 2015 ). OpenUrl CrossRef PubMed 120. ↵ S. Kalyaanamoorthy , B. Q. Minh , T. K. F. Wong , A. von Haeseler , L. S. Jermiin , ModelFinder: fast model selection for accurate phylogenetic estimates . Nat Methods 14 , 587 – 589 ( 2017 ). OpenUrl CrossRef PubMed 121. ↵ S. Q. Le , O. Gascuel , An improved general amino acid replacement matrix . Mol Biol Evol 25 , 1307 – 1320 ( 2008 ). OpenUrl CrossRef PubMed Web of Science 122. ↵ Z. Yang , A space-time process model for the evolution of DNA sequences . Genetics 139 , 993 – 1005 ( 1995 ). OpenUrl Abstract / FREE Full Text 123. ↵ J. Soubrier , M. Steel , M. S. Y. Lee , C. Der Sarkissian , S. Guindon , S. Y. W. Ho , A. Cooper , The influence of rate heterogeneity among sites on the time dependence of molecular rates . Mol Biol Evol 29 , 3345 – 3358 ( 2012 ). OpenUrl CrossRef PubMed 124. ↵ B. Q. Minh , M. A. T. Nguyen , A. von Haeseler , Ultrafast approximation for phylogenetic bootstrap . Mol Biol Evol 30 , 1188 – 1195 ( 2013 ). OpenUrl CrossRef PubMed Web of Science 125. ↵ D. T. Hoang , O. Chernomor , A. von Haeseler , B. Q. Minh , L. S. Vinh , UFBoot2: Improving the Ultrafast Bootstrap Approximation . Mol Biol Evol 35 , 518 – 522 ( 2018 ). OpenUrl CrossRef PubMed 126. ↵ E. L. Sonnhammer , G. von Heijne , A. Krogh , A hidden Markov model for predicting transmembrane helices in protein sequences . Proc Int Conf Intell Syst Mol Biol 6 , 175 – 182 ( 1998 ). OpenUrl CrossRef PubMed 127. ↵ J. Wang , F. Chitsaz , M. K. Derbyshire , N. R. Gonzales , M. Gwadz , S. Lu , G. H. Marchler , J. S. Song , N. Thanki , R. A. Yamashita , M. Yang , D. Zhang , C. Zheng , C. J. Lanczycki , A. Marchler-Bauer , The conserved domain database in 2023 . Nucleic Acids Res 51 , D384 – D388 ( 2023 ). OpenUrl CrossRef PubMed View the discussion thread. Back to top Previous Next Posted January 15, 2025. Download PDF Data/Code Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following Atlas of the Bacterial Serine-Threonine Kinases expands the functional diversity of the kinome Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share Atlas of the Bacterial Serine-Threonine Kinases expands the functional diversity of the kinome Brady O’Boyle , Wayland Yeung , Jason D. Lu , Samiksha Katiyar , Tomer M. Yaron-Barir , Jared L. Johnson , Lewis C. Cantley , Natarajan Kannan bioRxiv 2025.01.12.632604; doi: https://doi.org/10.1101/2025.01.12.632604 Share This Article: Copy Citation Tools Atlas of the Bacterial Serine-Threonine Kinases expands the functional diversity of the kinome Brady O’Boyle , Wayland Yeung , Jason D. Lu , Samiksha Katiyar , Tomer M. Yaron-Barir , Jared L. Johnson , Lewis C. Cantley , Natarajan Kannan bioRxiv 2025.01.12.632604; doi: https://doi.org/10.1101/2025.01.12.632604 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Bioinformatics Subject Areas All Articles Animal Behavior and Cognition (7635) Biochemistry (17691) Bioengineering (13892) Bioinformatics (41937) Biophysics (21452) Cancer Biology (18589) Cell Biology (25504) Clinical Trials (138) Developmental Biology (13378) Ecology (19899) Epidemiology (2067) Evolutionary Biology (24320) Genetics (15609) Genomics (22506) Immunology (17736) Microbiology (40394) Molecular Biology (17181) Neuroscience (88605) Paleontology (666) Pathology (2832) Pharmacology and Toxicology (4824) Physiology (7641) Plant Biology (15156) Scientific Communication and Education (2045) Synthetic Biology (4294) Systems Biology (9825) Zoology (2271)
Text is read by the "Ask this paper" AI Q&A widget below.
Extraction quality varies by source — PMC NXML preserves structure
cleanly, OA-HTML may include some navigation residue, and OA-PDF can
have broken hyphenation. The publisher copy
(via DOI)
is the canonical version.