QuartPlotR: A quarternary phase diagram tool

preprint OA: closed
📄 Open PDF Full text JSON View at publisher
Full text 14,006 characters · extracted from preprint-html · click to expand
QuartPlotR: A quarternary phase diagram tool | bioRxiv /* */ /* */ <!-- <!-- /*! * yepnope1.5.4 * (c) WTFPL, GPLv2 */ (function(a,b,c){function d(a){return"[object Function]"==o.call(a)}function e(a){return"string"==typeof a}function f(){}function g(a){return!a||"loaded"==a||"complete"==a||"uninitialized"==a}function h(){var a=p.shift();q=1,a?a.t?m(function(){("c"==a.t?B.injectCss:B.injectJs)(a.s,0,a.a,a.x,a.e,1)},0):(a(),h()):q=0}function i(a,c,d,e,f,i,j){function k(b){if(!o&&g(l.readyState)&&(u.r=o=1,!q&&h(),l.onload=l.onreadystatechange=null,b)){"img"!=a&&m(function(){t.removeChild(l)},50);for(var d in y[c])y[c].hasOwnProperty(d)&&y[c][d].onload()}}var j=j||B.errorTimeout,l=b.createElement(a),o=0,r=0,u={t:d,s:c,e:f,a:i,x:j};1===y[c]&&(r=1,y[c]=[]),"object"==a?l.data=c:(l.src=c,l.type=a),l.width=l.height="0",l.onerror=l.onload=l.onreadystatechange=function(){k.call(this,r)},p.splice(e,0,u),"img"!=a&&(r||2===y[c]?(t.insertBefore(l,s?null:n),m(k,j)):y[c].push(l))}function j(a,b,c,d,f){return q=0,b=b||"j",e(a)?i("c"==b?v:u,a,b,this.i++,c,d,f):(p.splice(this.i++,0,a),1==p.length&&h()),this}function k(){var a=B;return a.loader={load:j,i:0},a}var l=b.documentElement,m=a.setTimeout,n=b.getElementsByTagName("script")[0],o={}.toString,p=[],q=0,r="MozAppearance"in l.style,s=r&&!!b.createRange().compareNode,t=s?l:n.parentNode,l=a.opera&&"[object Opera]"==o.call(a.opera),l=!!b.attachEvent&&!l,u=r?"object":l?"script":"img",v=l?"script":u,w=Array.isArray||function(a){return"[object Array]"==o.call(a)},x=[],y={},z={timeout:function(a,b){return b.length&&(a.timeout=b[0]),a}},A,B;B=function(a){function b(a){var a=a.split("!"),b=x.length,c=a.pop(),d=a.length,c={url:c,origUrl:c,prefixes:a},e,f,g;for(f=0;f<d;f++)g=a[f].split("="),(e=z[g.shift()])&&(c=e(c,g));for(f=0;f<b;f++)c=x[f](c);return c}function g(a,e,f,g,h){var i=b(a),j=i.autoCallback;i.url.split(".").pop().split("?").shift(),i.bypass||(e&&(e=d(e)?e:e[a]||e[g]||e[a.split("/").pop().split("?")[0]]),i.instead?i.instead(a,e,f,g,h):(y[i.url]?i.noexec=!0:y[i.url]=1,f.load(i.url,i.forceCSS||!i.forceJS&&"css"==i.url.split(".").pop().split("?").shift()?"c":c,i.noexec,i.attrs,i.timeout),(d(e)||d(j))&&f.load(function(){k(),e&&e(i.origUrl,h,g),j&&j(i.origUrl,h,g),y[i.url]=2})))}function h(a,b){function c(a,c){if(a){if(e(a))c||(j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}),g(a,j,b,0,h);else if(Object(a)===a)for(n in m=function(){var b=0,c;for(c in a)a.hasOwnProperty(c)&&b++;return b}(),a)a.hasOwnProperty(n)&&(!c&&!--m&&(d(j)?j=function(){var a=[].slice.call(arguments);k.apply(this,a),l()}:j[n]=function(a){return function(){var b=[].slice.call(arguments);a&&a.apply(this,b),l()}}(k[n])),g(a[n],j,b,n,h))}else!c&&l()}var h=!!a.test,i=a.load||a.both,j=a.callback||f,k=j,l=a.complete||f,m,n;c(h?a.yep:a.nope,!!i),i&&c(i)}var i,j,l=this.yepnope.loader;if(e(a))g(a,0,l,0);else if(w(a))for(i=0;i (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start':new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0];var j=d.createElement(s);var dl=l!='dataLayer'?'&l='+l:'';j.src='//www.googletagmanager.com/gtm.js?id='+i+dl;j.type='text/javascript';j.async=true;f.parentNode.insertBefore(j,f);})(window,document,'script','dataLayer','GTM-M677548'); Skip to main content Home About Submit ALERTS / RSS Search for this keyword Advanced Search New Results QuartPlotR: A quarternary phase diagram tool View ORCID Profile Alaguraj Veluchamy , Chris Bowler doi: https://doi.org/10.1101/2024.03.22.586216 Alaguraj Veluchamy 1 St. Jude Children’s Research Hospital, Department of Computational Biology , Memphis, TN USA 2 Institut de biologie de l’Ecole normale supérieure (IBENS), Ecole normale supérieure, CNRS, INSERM , PSL Université, 75005, Paris, France Find this author on Google Scholar Find this author on PubMed Search for this author on this site ORCID record for Alaguraj Veluchamy For correspondence: alaguraj.v{at}gmail.com Chris Bowler 2 Institut de biologie de l’Ecole normale supérieure (IBENS), Ecole normale supérieure, CNRS, INSERM , PSL Université, 75005, Paris, France Find this author on Google Scholar Find this author on PubMed Search for this author on this site Abstract Full Text Info/History Metrics Data/Code Preview PDF Abstract Motivation Large scale studies involving exploratory data analysis and important key discoveries require platform that provides comprehensive visualization. Density distribution analysis across multiple datasets is intuitive and summarization, visualization could reveal several biological information. Integration and visualization of sequence and annotation features in the context of composition of genomic mutation, microbiota, population are significantly challenging. Results We propose a simple, novel strategy of visualization of multidimensional datasets involving multiple layers of data distribution which are interconnected. Also, we have implemented this phase diagram in an easy-to-use tool QuartPlotR, a resource for plotting charts from different genomic datasets. A generic data access and plotting framework has been designed and this is implemented as an R package. Availability https://github.com/AlagurajVeluchamy/QuartPlotR . Contact alaguraj.veluchamy{at}stjude.org Supplementary information Supplementary data are available at Bioinformatics online. 1 Introduction About complexity of data: Increasing number of Big Data, data types and their complexity challenges computational biologists to create novel methods of both analysis and visualization. Data complexity is intrinsic to biological systems with multiple layers of interconnected data. For example, comparison of multiple quantitative data involves visualization by displaying relative abundance using bar charts or area plots or pie-charts. Visualization problem: Understanding of these multiple datasets from multiple different samples require both global and in-depth view. Insights-driven data visualization simplifies decision making for biologists by increasing degrees of abstraction and reducing the complexity parameter. Sample data visualization: DataVis (data visualization) is a subdiscipline of bioinformatics and provide scientific communities with plethora of choices of tools for dissemination of science visually ( O’Donoghue, 2021 ). Additionally, Big Data such as metagenomics data encompass attributes which are both quantitative and categorical in nature. Tools such as Krona provide charts which provides interactive visualization of multiple locations ( Ondov et al ., 2011 ). Genetic data visualization tools for health and diseases usually are landscape based on a particular region ( Jia et al ., 2020 ). Shortcomings from Linear layout in displaying large volume of genomic data were mitigated in CIRCOS in the form of circular layout ( Krzywinski et al ., 2009 ). Spatial visualization of scRNA data such as t-SNE from multiple cancer types involves classification and comparison of commonalities and differences of individual cells in a two-dimensional map ( Li et al ., 2017 ). What is lacking: However, these tools lack the features for displaying secondary variables that include comparing relationships between taxonomic and functional variation of multiple samples such as location of samples in metagenomic data, mutations in population with stroke or cancer. About Quarternary plot: Here, we present a novel method of visualization data which are of comparative level of complexity. We demonstrated the usability of this tool using both metagenome and mutation data. Our method, Quarternary plot is a graphical representation that provides comparative visualization of both taxonomic and functional hierarchies. This plotting system is coordinate based and presented in a spatial layout as opposed to the linear and circular layouts discussed earlier. Edges of the quadrilateral is the sample. This plotter is easy to use on multiple platforms. 2 Methods Phase diagram: Data points are represented as a spatial diagram in a polygon (quadrilateral). Four samples are defined as vertex of this quadrilateral. Initially, the quadrilateral is split into four triangles. For each data point, the data is represented as a centroid point, calculated from three sides of a triangle. where G(x1,y1) is the centroid of the triangle. P1, P2, P3 are values of individual samples. x1, y1 are co-ordinates for each triangle. Similarly, x2, y2, x3, y3, x4, y4 are calculated for four triangles (upper, lower, left and right triangles) in a quadrilateral. Hierarchical data abstraction: Four layers of abstraction can be visualized: Data points are distributed based on the above barometric calculation. Data points could be displayed as points or differential circles. Size of the circle is based on the quantitation. Pie chart for numerical proportion of data. Implementation in R: Lines connecting vertex of the polygon is drawn. A grid is drawn followed by labeling of the pie-chart is done. Data sources: Metagenome and mutation data: Metagenome data from four locations were taken and the data for tag assignment (MetaG) and metatranscriptome (MetaT) are used to plot ( de Vargas et al ., 2015 ). 3 Results QuartPlotR accurately describes a four-sided dataset. This tool enables scientists to have an intuitive pattern from large list of genes. Visualization properties such as data points could be either dot or pie-charts. The image attributes include: Four corners are represented as a vertex in the diamond shaped quadrilateral. Data points can be displayed either as Pie chart or dot plot. Size of pie represents one quantitative selection. Data points which are located towards the corner are barometric in nature. When all four parts are equally shared, the points are in the middle. The points will be on the line, if data points shared among two only vertex only. 3.1 Data Structure QuartPlotR requires a minimum of four column (tab delimited) text file (TXT). Data structure should be hierarchically defined. Each column could be either category or numerical. Minimum numerical value should be presented in all samples. 3.2 Illustration using metagenomics and mutation data Metagenomics data collected from ( de Vargas et al ., 2015 ). As described in ocean plankton distribution, the station22, has a very high proportion of plankton which is in the range of 20-80 micron ( Fig.1 ). Download figure Open in new tab Fig. 1. Quarternary diagram for a metatranscriptome. Using QuartPlotR to compare four metatranscriptomes tag assignment. The scale in the four quadrant refers to different station of sampling. ST122, ST123, ST124, ST125 refers to four different sampling locations. 3.3 Advantages and limitations Most combination of categorical andquantitative data can be optimally visualized. Limitations include Comparative visualization is limited to 4 sides only. Large number of overlapping data points could clutter pie charts, user need to adapt dot plot in that case. Atleast data from two sides should be shared, otherwise datafondsThe Funding This work has been supported by the CNRS. Conflict of Interest none declared. Footnotes https://github.com/AlagurajVeluchamy/QuartPlotR References ↵ Jia , W. et al. ( 2020 ) Oviz-Bio: a web-based platform for interactive cancer genomics data visualization . Nucleic Acids Res ., 48 , W415 – W426 . OpenUrl ↵ Krzywinski , M. et al. ( 2009 ) Circos: An information aesthetic for comparative genomics . Genome Res ., 19 , 1639 – 1645 . OpenUrl Abstract / FREE Full Text ↵ Li , W. et al. ( 2017 ) Application of t-SNE to human genetic data . J. Bioinform. Comput. Biol ., 15 , 1750017 . OpenUrl CrossRef PubMed ↵ O’Donoghue , S.I. ( 2021 ) Grand Challenges in Bioinformatics Data Visualization . Front. Bioinforma ., 1 , 13 . OpenUrl ↵ Ondov , B.D. et al. ( 2011 ) Interactive metagenomic visualization in a Web browser . BMC Bioinformatics , 12 , 385 . OpenUrl CrossRef PubMed ↵ de Vargas , C. et al. ( 2015 ) Ocean plankton . Eukaryotic plankton diversity in the sunlit ocean. Science , 348 , 1261605 . OpenUrl View the discussion thread. Back to top Previous Next Posted March 27, 2024. Download PDF Data/Code Email Thank you for your interest in spreading the word about bioRxiv. NOTE: Your email address is requested solely to identify you as the sender of this article. Your Email * Your Name * Send To * Enter multiple addresses on separate lines or separate them with commas. You are going to email the following QuartPlotR: A quarternary phase diagram tool Message Subject (Your Name) has forwarded a page to you from bioRxiv Message Body (Your Name) thought you would like to see this page from the bioRxiv website. Your Personal Message CAPTCHA This question is for testing whether or not you are a human visitor and to prevent automated spam submissions. Share QuartPlotR: A quarternary phase diagram tool Alaguraj Veluchamy , Chris Bowler bioRxiv 2024.03.22.586216; doi: https://doi.org/10.1101/2024.03.22.586216 Share This Article: Copy Citation Tools QuartPlotR: A quarternary phase diagram tool Alaguraj Veluchamy , Chris Bowler bioRxiv 2024.03.22.586216; doi: https://doi.org/10.1101/2024.03.22.586216 Citation Manager Formats BibTeX Bookends EasyBib EndNote (tagged) EndNote 8 (xml) Medlars Mendeley Papers RefWorks Tagged Ref Manager RIS Zotero Tweet Widget Facebook Like Google Plus One Subject Area Bioinformatics Subject Areas All Articles Animal Behavior and Cognition (7644) Biochemistry (17728) Bioengineering (13916) Bioinformatics (42037) Biophysics (21488) Cancer Biology (18636) Cell Biology (25552) Clinical Trials (138) Developmental Biology (13401) Ecology (19940) Epidemiology (2067) Evolutionary Biology (24367) Genetics (15621) Genomics (22545) Immunology (17764) Microbiology (40475) Molecular Biology (17208) Neuroscience (88744) Paleontology (667) Pathology (2842) Pharmacology and Toxicology (4834) Physiology (7659) Plant Biology (15175) Scientific Communication and Education (2047) Synthetic Biology (4304) Systems Biology (9834) Zoology (2272)

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

Ask this paper AI returns verbatim quotes from the full text · source: preprint-html

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2024) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc
last seen: 2026-05-20T01:45:00.602351+00:00