White paper: standards for handling and analyzing plant pan-genomes

doi:10.12688/f1000research.166538.2

White paper: standards for handling and analyzing plant pan-genomes

2025 · doi:10.12688/f1000research.166538.2

preprint OA: closed CC-BY-4.0

🔓 Open OA copy Full text JSON View at publisher

Full text 237,502 characters · extracted from preprint-html · click to expand

White paper: standards for handling and analyzing... | F1000Research "use strict";function _typeof(t){return(_typeof="function"==typeof Symbol&&"symbol"==typeof Symbol.iterator?function(t){return typeof t}:function(t){return t&&"function"==typeof Symbol&&t.constructor===Symbol&&t!==Symbol.prototype?"symbol":typeof t})(t)}!function(){var t=function(){var t,e,o=[],n=window,r=n;for(;r;){try{if(r.frames.__tcfapiLocator){t=r;break}}catch(t){}if(r===n.top)break;r=r.parent}t||(!function t(){var e=n.document,o=!!n.frames.__tcfapiLocator;if(!o)if(e.body){var r=e.createElement("iframe");r.style.cssText="display:none",r.name="__tcfapiLocator",e.body.appendChild(r)}else setTimeout(t,5);return!o}(),n.__tcfapi=function(){for(var t=arguments.length,n=new Array(t),r=0;r 3&&2===parseInt(n[1],10)&&"boolean"==typeof n[3]&&(e=n[3],"function"==typeof n[2]&&n[2]("set",!0)):"ping"===n[0]?"function"==typeof n[2]&&n[2]({gdprApplies:e,cmpLoaded:!1,cmpStatus:"stub"}):o.push(n)},n.addEventListener("message",(function(t){var e="string"==typeof t.data,o={};if(e)try{o=JSON.parse(t.data)}catch(t){}else o=t.data;var n="object"===_typeof(o)&&null!==o?o.__tcfapiCall:null;n&&window.__tcfapi(n.command,n.version,(function(o,r){var a={__tcfapiReturn:{returnValue:o,success:r,callId:n.callId}};t&&t.source&&t.source.postMessage&&t.source.postMessage(e?JSON.stringify(a):a,"*")}),n.parameter)}),!1))};"undefined"!=typeof module?module.exports=t:t()}(); dataLayer = dataLayer || []; // Standard GTM initialization - Google Consent Mode handles consent automatically (function(w,d,s,l,i){w[l]=w[l]||[];w[l].push({'gtm.start': new Date().getTime(),event:'gtm.js'});var f=d.getElementsByTagName(s)[0], j=d.createElement(s),dl=l!='dataLayer'?'&l='+l:'';j.async=true;j.src= 'https://www.googletagmanager.com/gtm.js?id='+i+dl+ '>m_auth=hzk0Vc3qFsQYhCrIoHz68A>m_preview=env-1>m_cookies_win=x';f.parentNode.insertBefore(j,f); })(window,document,'script','dataLayer','GTM-MWFK8L5J'); 
;window.NREUM||(NREUM={});NREUM.init={distributed_tracing:{enabled:true},privacy:{cookies_enabled:true},ajax:{deny_list:["bam.nr-data.net"]}}; ;NREUM.loader_config={accountID:"438030",trustKey:"438030",agentID:"772317073",licenseKey:"97f8f67f26",applicationID:"772317073"} ;NREUM.info={beacon:"bam.nr-data.net",errorBeacon:"bam.nr-data.net",licenseKey:"97f8f67f26",applicationID:"772317073",sa:1} ;/*! For license information please see nr-loader-spa-1.236.0.min.js.LICENSE.txt */ (()=>{"use strict";var e,t,r={5763:(e,t,r)=>{r.d(t,{P_:()=>l,Mt:()=>g,C5:()=>s,DL:()=>v,OP:()=>T,lF:()=>D,Yu:()=>y,Dg:()=>h,CX:()=>c,GE:()=>b,sU:()=>_});var n=r(8632),i=r(9567);const o={beacon:n.ce.beacon,errorBeacon:n.ce.errorBeacon,licenseKey:void 0,applicationID:void 0,sa:void 0,queueTime:void 0,applicationTime:void 0,ttGuid:void 0,user:void 0,account:void 0,product:void 0,extra:void 0,jsAttributes:{},userAttributes:void 0,atts:void 0,transactionName:void 0,tNamePlain:void 0},a={};function s(e){if(!e)throw new Error("All info objects require an agent identifier!");if(!a[e])throw new Error("Info for ".concat(e," was never set"));return a[e]}function c(e,t){if(!e)throw new Error("All info objects require an agent identifier!");a[e]=(0,i.D)(t,o),(0,n.Qy)(e,a[e],"info")}var u=r(7056);const d=()=>{const e={blockSelector:"[data-nr-block]",maskInputOptions:{password:!0}};return{allow_bfcache:!0,privacy:{cookies_enabled:!0},ajax:{deny_list:void 0,enabled:!0,harvestTimeSeconds:10},distributed_tracing:{enabled:void 0,exclude_newrelic_header:void 0,cors_use_newrelic_header:void 0,cors_use_tracecontext_headers:void 0,allowed_origins:void 0},session:{domain:void 0,expiresMs:u.oD,inactiveMs:u.Hb},ssl:void 0,obfuscate:void 
0,jserrors:{enabled:!0,harvestTimeSeconds:10},metrics:{enabled:!0},page_action:{enabled:!0,harvestTimeSeconds:30},page_view_event:{enabled:!0},page_view_timing:{enabled:!0,harvestTimeSeconds:30,long_task:!1},session_trace:{enabled:!0,harvestTimeSeconds:10},harvest:{tooManyRequestsDelay:60},session_replay:{enabled:!1,harvestTimeSeconds:60,sampleRate:.1,errorSampleRate:.1,maskTextSelector:"*",maskAllInputs:!0,get blockClass(){return"nr-block"},get ignoreClass(){return"nr-ignore"},get maskTextClass(){return"nr-mask"},get blockSelector(){return e.blockSelector},set blockSelector(t){e.blockSelector+=",".concat(t)},get maskInputOptions(){return e.maskInputOptions},set maskInputOptions(t){e.maskInputOptions={...t,password:!0}}},spa:{enabled:!0,harvestTimeSeconds:10}}},f={};function l(e){if(!e)throw new Error("All configuration objects require an agent identifier!");if(!f[e])throw new Error("Configuration for ".concat(e," was never set"));return f[e]}function h(e,t){if(!e)throw new Error("All configuration objects require an agent identifier!");f[e]=(0,i.D)(t,d()),(0,n.Qy)(e,f[e],"config")}function g(e,t){if(!e)throw new Error("All configuration objects require an agent identifier!");var r=l(e);if(r){for(var n=t.split("."),i=0;i {r.d(t,{D:()=>i});var n=r(50);function i(e,t){try{if(!e||"object"!=typeof e)return(0,n.Z)("Setting a Configurable requires an object as input");if(!t||"object"!=typeof t)return(0,n.Z)("Setting a Configurable requires a model to set its initial properties");const r=Object.create(Object.getPrototypeOf(t),Object.getOwnPropertyDescriptors(t)),o=0===Object.keys(r).length?e:r;for(let a in o)if(void 0!==e[a])try{"object"==typeof e[a]&&"object"==typeof t[a]?r[a]=i(e[a],t[a]):r[a]=e[a]}catch(e){(0,n.Z)("An error occurred while setting a property of a Configurable",e)}return r}catch(e){(0,n.Z)("An error occured while setting a Configurable",e)}}},6818:(e,t,r)=>{r.d(t,{Re:()=>i,gF:()=>o,q4:()=>n});const 
n="1.236.0",i="PROD",o="CDN"},385:(e,t,r)=>{r.d(t,{FN:()=>a,IF:()=>u,Nk:()=>f,Tt:()=>s,_A:()=>o,il:()=>n,pL:()=>c,v6:()=>i,w1:()=>d});const n="undefined"!=typeof window&&!!window.document,i="undefined"!=typeof WorkerGlobalScope&&("undefined"!=typeof self&&self instanceof WorkerGlobalScope&&self.navigator instanceof WorkerNavigator||"undefined"!=typeof globalThis&&globalThis instanceof WorkerGlobalScope&&globalThis.navigator instanceof WorkerNavigator),o=n?window:"undefined"!=typeof WorkerGlobalScope&&("undefined"!=typeof self&&self instanceof WorkerGlobalScope&&self||"undefined"!=typeof globalThis&&globalThis instanceof WorkerGlobalScope&&globalThis),a=""+o?.location,s=/iPad|iPhone|iPod/.test(navigator.userAgent),c=s&&"undefined"==typeof SharedWorker,u=(()=>{const e=navigator.userAgent.match(/Firefox[/\s](\d+\.\d+)/);return Array.isArray(e)&&e.length>=2?+e[1]:0})(),d=Boolean(n&&window.document.documentMode),f=!!navigator.sendBeacon},1117:(e,t,r)=>{r.d(t,{w:()=>o});var n=r(50);const i={agentIdentifier:"",ee:void 0};class o{constructor(e){try{if("object"!=typeof e)return(0,n.Z)("shared context requires an object as input");this.sharedContext={},Object.assign(this.sharedContext,i),Object.entries(e).forEach((e=>{let[t,r]=e;Object.keys(i).includes(t)&&(this.sharedContext[t]=r)}))}catch(e){(0,n.Z)("An error occured while setting SharedContext",e)}}}},8e3:(e,t,r)=>{r.d(t,{L:()=>d,R:()=>c});var n=r(2177),i=r(1284),o=r(4322),a=r(3325);const s={};function c(e,t){const r={staged:!1,priority:a.p[t]||0};u(e),s[e].get(t)||s[e].set(t,r)}function u(e){e&&(s[e]||(s[e]=new Map))}function d(){let e=arguments.length>0&&void 0!==arguments[0]?arguments[0]:"",t=arguments.length>1&&void 0!==arguments[1]?arguments[1]:"feature";if(u(e),!e||!s[e].get(t))return a(t);s[e].get(t).staged=!0;const r=[...s[e]];function a(t){const r=e?n.ee.get(e):n.ee,a=o.X.handlers;if(r.backlog&&a){var s=r.backlog[t],c=a[t];if(c){for(var u=0;s&&u {let[t,r]=e;return 
r.staged}))&&(r.sort(((e,t)=>e[1].priority-t[1].priority)),r.forEach((e=>{let[t]=e;a(t)})))}function f(e,t){var r=e[1];(0,i.D)(t[r],(function(t,r){var n=e[0];if(r[0]===n){var i=r[1],o=e[3],a=e[2];i.apply(o,a)}}))}},2177:(e,t,r)=>{r.d(t,{c:()=>f,ee:()=>u});var n=r(8632),i=r(2210),o=r(1284),a=r(5763),s="nr@context";let c=(0,n.fP)();var u;function d(){}function f(e){return(0,i.X)(e,s,l)}function l(){return new d}function h(){u.aborted=!0,u.backlog={}}c.ee?u=c.ee:(u=function e(t,r){var n={},c={},f={},g=!1;try{g=16===r.length&&(0,a.OP)(r).isolatedBacklog}catch(e){}var p={on:b,addEventListener:b,removeEventListener:y,emit:v,get:x,listeners:w,context:m,buffer:A,abort:h,aborted:!1,isBuffering:E,debugId:r,backlog:g?{}:t&&"object"==typeof t.backlog?t.backlog:{}};return p;function m(e){return e&&e instanceof d?e:e?(0,i.X)(e,s,l):l()}function v(e,r,n,i,o){if(!1!==o&&(o=!0),!u.aborted||i){t&&o&&t.emit(e,r,n);for(var a=m(n),s=w(e),d=s.length,f=0;fn,p:()=>i});var n=r(2177).ee.get("handle");function i(e,t,r,i,o){o?(o.buffer([e],i),o.emit(e,t,r)):(n.buffer([e],i),n.emit(e,t,r))}},4322:(e,t,r)=>{r.d(t,{X:()=>o});var n=r(5546);o.on=a;var i=o.handlers={};function o(e,t,r,o){a(o||n.E,i,e,t,r)}function a(e,t,r,i,o){o||(o="feature"),e||(e=n.E);var a=t[o]=t[o]||{};(a[r]=a[r]||[]).push([e,i])}},3239:(e,t,r)=>{r.d(t,{bP:()=>s,iz:()=>c,m$:()=>a});var n=r(385);let i=!1,o=!1;try{const e={get passive(){return i=!0,!1},get signal(){return o=!0,!1}};n._A.addEventListener("test",null,e),n._A.removeEventListener("test",null,e)}catch(e){}function a(e,t){return i||o?{capture:!!e,passive:i,signal:t}:!!e}function s(e,t){let r=arguments.length>2&&void 0!==arguments[2]&&arguments[2],n=arguments.length>3?arguments[3]:void 0;window.addEventListener(e,t,a(r,n))}function c(e,t){let r=arguments.length>2&&void 0!==arguments[2]&&arguments[2],n=arguments.length>3?arguments[3]:void 0;document.addEventListener(e,t,a(r,n))}},4402:(e,t,r)=>{r.d(t,{Ht:()=>u,M:()=>c,Rl:()=>a,ky:()=>s});var n=r(385);const 
i="xxxxxxxx-xxxx-4xxx-yxxx-xxxxxxxxxxxx";function o(e,t){return e?15&e[t]:16*Math.random()|0}function a(){const e=n._A?.crypto||n._A?.msCrypto;let t,r=0;return e&&e.getRandomValues&&(t=e.getRandomValues(new Uint8Array(31))),i.split("").map((e=>"x"===e?o(t,++r).toString(16):"y"===e?(3&o()|8).toString(16):e)).join("")}function s(e){const t=n._A?.crypto||n._A?.msCrypto;let r,i=0;t&&t.getRandomValues&&(r=t.getRandomValues(new Uint8Array(31)));const a=[];for(var s=0;s {r.d(t,{Bq:()=>n,Hb:()=>o,oD:()=>i});const n="NRBA",i=144e5,o=18e5},7894:(e,t,r)=>{function n(){return Math.round(performance.now())}r.d(t,{z:()=>n})},7243:(e,t,r)=>{r.d(t,{e:()=>o});var n=r(385),i={};function o(e){if(e in i)return i[e];if(0===(e||"").indexOf("data:"))return{protocol:"data"};let t;var r=n._A?.location,o={};if(n.il)t=document.createElement("a"),t.href=e;else try{t=new URL(e,r.href)}catch(e){return o}o.port=t.port;var a=t.href.split("://");!o.port&&a[1]&&(o.port=a[1].split("/")[0].split("@").pop().split(":")[1]),o.port&&"0"!==o.port||(o.port="https"===a[0]?"443":"80"),o.hostname=t.hostname||r.hostname,o.pathname=t.pathname,o.protocol=a[0],"/"!==o.pathname.charAt(0)&&(o.pathname="/"+o.pathname);var s=!t.protocol||":"===t.protocol||t.protocol===r.protocol,c=t.hostname===r.hostname&&t.port===r.port;return o.sameOrigin=s&&(!t.hostname||c),"/"===o.pathname&&(i[e]=o),o}},50:(e,t,r)=>{function n(e,t){"function"==typeof console.warn&&(console.warn("New Relic: ".concat(e)),t&&console.warn(t))}r.d(t,{Z:()=>n})},2587:(e,t,r)=>{r.d(t,{N:()=>c,T:()=>u});var n=r(2177),i=r(5546),o=r(8e3),a=r(3325);const s={stn:[a.D.sessionTrace],err:[a.D.jserrors,a.D.metrics],ins:[a.D.pageAction],spa:[a.D.spa],sr:[a.D.sessionReplay,a.D.sessionTrace]};function c(e,t){const r=n.ee.get(t);e&&"object"==typeof e&&(Object.entries(e).forEach((e=>{let[t,n]=e;void 0===u[t]&&(s[t]?s[t].forEach((e=>{n?(0,i.p)("feat-"+t,[],void 0,e,r):(0,i.p)("block-"+t,[],void 0,e,r),(0,i.p)("rumresp-"+t,[Boolean(n)],void 
0,e,r)})):n&&(0,i.p)("feat-"+t,[],void 0,void 0,r),u[t]=Boolean(n))})),Object.keys(s).forEach((e=>{void 0===u[e]&&(s[e]?.forEach((t=>(0,i.p)("rumresp-"+e,[!1],void 0,t,r))),u[e]=!1)})),(0,o.L)(t,a.D.pageViewEvent))}const u={}},2210:(e,t,r)=>{r.d(t,{X:()=>i});var n=Object.prototype.hasOwnProperty;function i(e,t,r){if(n.call(e,t))return e[t];var i=r();if(Object.defineProperty&&Object.keys)try{return Object.defineProperty(e,t,{value:i,writable:!0,enumerable:!1}),i}catch(e){}return e[t]=i,i}},1284:(e,t,r)=>{r.d(t,{D:()=>n});const n=(e,t)=>Object.entries(e||{}).map((e=>{let[r,n]=e;return t(r,n)}))},4351:(e,t,r)=>{r.d(t,{P:()=>o});var n=r(2177);const i=()=>{const e=new WeakSet;return(t,r)=>{if("object"==typeof r&&null!==r){if(e.has(r))return;e.add(r)}return r}};function o(e){try{return JSON.stringify(e,i())}catch(e){try{n.ee.emit("internal-error",[e])}catch(e){}}}},3960:(e,t,r)=>{r.d(t,{K:()=>a,b:()=>o});var n=r(3239);function i(){return"undefined"==typeof document||"complete"===document.readyState}function o(e,t){if(i())return e();(0,n.bP)("load",e,t)}function a(e){if(i())return e();(0,n.iz)("DOMContentLoaded",e)}},8632:(e,t,r)=>{r.d(t,{EZ:()=>u,Qy:()=>c,ce:()=>o,fP:()=>a,gG:()=>d,mF:()=>s});var n=r(7894),i=r(385);const o={beacon:"bam.nr-data.net",errorBeacon:"bam.nr-data.net"};function a(){return i._A.NREUM||(i._A.NREUM={}),void 0===i._A.newrelic&&(i._A.newrelic=i._A.NREUM),i._A.NREUM}function s(){let e=a();return e.o||(e.o={ST:i._A.setTimeout,SI:i._A.setImmediate,CT:i._A.clearTimeout,XHR:i._A.XMLHttpRequest,REQ:i._A.Request,EV:i._A.Event,PR:i._A.Promise,MO:i._A.MutationObserver,FETCH:i._A.fetch}),e}function c(e,t,r){let i=a();const o=i.initializedAgents||{},s=o[e]||{};return Object.keys(s).length||(s.initializedAt={ms:(0,n.z)(),date:new Date}),i.initializedAgents={...o,[e]:{...s,[r]:t}},i}function u(e,t){a()[e]=t}function d(){return function(){let e=a();const t=e.info||{};e.info={beacon:o.beacon,errorBeacon:o.errorBeacon,...t}}(),function(){let e=a();const 
t=e.init||{};e.init={...t}}(),s(),function(){let e=a();const t=e.loader_config||{};e.loader_config={...t}}(),a()}},7956:(e,t,r)=>{r.d(t,{N:()=>i});var n=r(3239);function i(e){let t=arguments.length>1&&void 0!==arguments[1]&&arguments[1],r=arguments.length>2?arguments[2]:void 0,i=arguments.length>3?arguments[3]:void 0;return void(0,n.iz)("visibilitychange",(function(){if(t)return void("hidden"==document.visibilityState&&e());e(document.visibilityState)}),r,i)}},1214:(e,t,r)=>{r.d(t,{em:()=>v,u5:()=>N,QU:()=>S,_L:()=>I,Gm:()=>L,Lg:()=>M,gy:()=>U,BV:()=>Q,Kf:()=>ee});var n=r(2177);const i="nr@original";var o=Object.prototype.hasOwnProperty,a=!1;function s(e,t){return e||(e=n.ee),r.inPlace=function(e,t,n,i,o){n||(n="");var a,s,c,u="-"===n.charAt(0);for(c=0;c 2?n-2:0),o=2;o {r(A[T],e,w),r(E[T],e,w)})),r(l._A,"fetch",y),t.on(y+"end",(function(e,r){var n=this;if(r){var i=r.headers.get("content-length");null!==i&&(n.rxSize=i),t.emit(y+"done",[null,r],n)}else t.emit(y+"done",[e],n)})),t}const O={},j=["pushState","replaceState"];function S(e){const t=function(e){return(e||n.ee).get("history")}(e);return!l.il||O[t.debugId]++||(O[t.debugId]=1,s(t).inPlace(window.history,j,"-")),t}var P=r(3239);const C={},R=["appendChild","insertBefore","replaceChild"];function I(e){const t=function(e){return(e||n.ee).get("jsonp")}(e);if(!l.il||C[t.debugId])return t;C[t.debugId]=!0;var r=s(t),i=/[?&](?:callback|cb)=([^&#]+)/,o=/(.*)\.([^.]+)/,a=/^(\w+)(\.|$)(.*)$/;function c(e,t){var r=e.match(a),n=r[1],i=r[3];return i?c(i,t[n]):t[n]}return r.inPlace(Node.prototype,R,"dom-"),t.on("dom-start",(function(e){!function(e){if(!e||"string"!=typeof e.nodeName||"script"!==e.nodeName.toLowerCase())return;if("function"!=typeof e.addEventListener)return;var n=(a=e.src,s=a.match(i),s?s[1]:null);var a,s;if(!n)return;var u=function(e){var t=e.match(o);if(t&&t.length>=3)return{key:t[2],parent:c(t[1],window)};return{key:e,parent:window}}(n);if("function"!=typeof u.parent[u.key])return;var d={};function 
f(){t.emit("jsonp-end",[],d),e.removeEventListener("load",f,(0,P.m$)(!1)),e.removeEventListener("error",l,(0,P.m$)(!1))}function l(){t.emit("jsonp-error",[],d),t.emit("jsonp-end",[],d),e.removeEventListener("load",f,(0,P.m$)(!1)),e.removeEventListener("error",l,(0,P.m$)(!1))}r.inPlace(u.parent,[u.key],"cb-",d),e.addEventListener("load",f,(0,P.m$)(!1)),e.addEventListener("error",l,(0,P.m$)(!1)),t.emit("new-jsonp",[e.src],d)}(e[0])})),t}var k=r(5763);const H={};function L(e){const t=function(e){return(e||n.ee).get("mutation")}(e);if(!l.il||H[t.debugId])return t;H[t.debugId]=!0;var r=s(t),i=k.Yu.MO;return i&&(window.MutationObserver=function(e){return this instanceof i?new i(r(e,"fn-")):i.apply(this,arguments)},MutationObserver.prototype=i.prototype),t}const z={};function M(e){const t=function(e){return(e||n.ee).get("promise")}(e);if(z[t.debugId])return t;z[t.debugId]=!0;var r=n.c,o=s(t),a=k.Yu.PR;return a&&function(){function e(r){var n=t.context(),i=o(r,"executor-",n,null,!1);const s=Reflect.construct(a,[i],e);return t.context(s).getCtx=function(){return n},s}l._A.Promise=e,Object.defineProperty(e,"name",{value:"Promise"}),e.toString=function(){return a.toString()},Object.setPrototypeOf(e,a),["all","race"].forEach((function(r){const n=a[r];e[r]=function(e){let i=!1;[...e||[]].forEach((e=>{this.resolve(e).then(a("all"===r),a(!1))}));const o=n.apply(this,arguments);return o;function a(e){return function(){t.emit("propagate",[null,!i],o,!1,!1),i=i||!e}}}})),["resolve","reject"].forEach((function(r){const n=a[r];e[r]=function(e){const r=n.apply(this,arguments);return e!==r&&t.emit("propagate",[e,!0],r,!1,!1),r}})),e.prototype=a.prototype;const n=a.prototype.then;a.prototype.then=function(){var e=this,i=r(e);i.promise=e;for(var a=arguments.length,s=new Array(a),c=0;c e())),t};function m(e,t){i.inPlace(t,["onreadystatechange"],"fn-",E)}function b(){var 
e=this,t=r.context(e);e.readyState>3&&!t.resolved&&(t.resolved=!0,r.emit("xhr-resolved",[],e)),i.inPlace(e,f,"fn-",E)}if(function(e,t){for(var r in e)t[r]=e[r]}(o,p),p.prototype=o.prototype,i.inPlace(p.prototype,J,"-xhr-",E),r.on("send-xhr-start",(function(e,t){m(e,t),function(e){h.push(e),a&&(y?y.then(A):u?u(A):(w=-w,x.data=w))}(t)})),r.on("open-xhr-start",m),a){var y=c&&c.resolve();if(!u&&!c){var w=1,x=document.createTextNode(w);new a(A).observe(x,{characterData:!0})}}else t.on("fn-end",(function(e){e[0]&&e[0].type===d||A()}));function A(){for(var e=0;e {r.d(t,{t:()=>n});const n=r(3325).D.ajax},6660:(e,t,r)=>{r.d(t,{A:()=>i,t:()=>n});const n=r(3325).D.jserrors,i="nr@seenError"},3081:(e,t,r)=>{r.d(t,{gF:()=>o,mY:()=>i,t9:()=>n,vz:()=>s,xS:()=>a});const n=r(3325).D.metrics,i="sm",o="cm",a="storeSupportabilityMetrics",s="storeEventMetrics"},4649:(e,t,r)=>{r.d(t,{t:()=>n});const n=r(3325).D.pageAction},7633:(e,t,r)=>{r.d(t,{Dz:()=>i,OJ:()=>a,qw:()=>o,t9:()=>n});const n=r(3325).D.pageViewEvent,i="firstbyte",o="domcontent",a="windowload"},9251:(e,t,r)=>{r.d(t,{t:()=>n});const n=r(3325).D.pageViewTiming},3614:(e,t,r)=>{r.d(t,{BST_RESOURCE:()=>i,END:()=>s,FEATURE_NAME:()=>n,FN_END:()=>u,FN_START:()=>c,PUSH_STATE:()=>d,RESOURCE:()=>o,START:()=>a});const n=r(3325).D.sessionTrace,i="bstResource",o="resource",a="-start",s="-end",c="fn"+a,u="fn"+s,d="pushState"},7836:(e,t,r)=>{r.d(t,{BODY:()=>A,CB_END:()=>E,CB_START:()=>u,END:()=>x,FEATURE_NAME:()=>i,FETCH:()=>_,FETCH_BODY:()=>v,FETCH_DONE:()=>m,FETCH_START:()=>p,FN_END:()=>c,FN_START:()=>s,INTERACTION:()=>l,INTERACTION_API:()=>d,INTERACTION_EVENTS:()=>o,JSONP_END:()=>b,JSONP_NODE:()=>g,JS_TIME:()=>T,MAX_TIMER_BUDGET:()=>a,REMAINING:()=>f,SPA_NODE:()=>h,START:()=>w,originalSetTimeout:()=>y});var n=r(5763);const 
i=r(3325).D.spa,o=["click","submit","keypress","keydown","keyup","change"],a=999,s="fn-start",c="fn-end",u="cb-start",d="api-ixn-",f="remaining",l="interaction",h="spaNode",g="jsonpNode",p="fetch-start",m="fetch-done",v="fetch-body-",b="jsonp-end",y=n.Yu.ST,w="-start",x="-end",A="-body",E="cb"+x,T="jsTime",_="fetch"},5938:(e,t,r)=>{r.d(t,{W:()=>o});var n=r(5763),i=r(2177);class o{constructor(e,t,r){this.agentIdentifier=e,this.aggregator=t,this.ee=i.ee.get(e,(0,n.OP)(this.agentIdentifier).isolatedBacklog),this.featureName=r,this.blocked=!1}}},9144:(e,t,r)=>{r.d(t,{j:()=>m});var n=r(3325),i=r(5763),o=r(5546),a=r(2177),s=r(7894),c=r(8e3),u=r(3960),d=r(385),f=r(50),l=r(3081),h=r(8632);function g(){const e=(0,h.gG)();["setErrorHandler","finished","addToTrace","inlineHit","addRelease","addPageAction","setCurrentRouteName","setPageViewName","setCustomAttribute","interaction","noticeError","setUserId"].forEach((t=>{e[t]=function(){for(var r=arguments.length,n=new Array(r),i=0;i 1?r-1:0),i=1;i {e.exposed&&e.api[t]&&o.push(e.api[t](...n))})),o.length>1?o:o[0]}(t,...n)}}))}var p=r(2587);function m(e){let t=arguments.length>1&&void 0!==arguments[1]?arguments[1]:{},m=arguments.length>2?arguments[2]:void 0,v=arguments.length>3?arguments[3]:void 0,{init:b,info:y,loader_config:w,runtime:x={loaderType:m},exposed:A=!0}=t;const E=(0,h.gG)();y||(b=E.init,y=E.info,w=E.loader_config),(0,i.Dg)(e,b||{}),(0,i.GE)(e,w||{}),(0,i.sU)(e,x),y.jsAttributes??={},d.v6&&(y.jsAttributes.isWorker=!0),(0,i.CX)(e,y),g();const T=function(e,t){t||(0,c.R)(e,"api");const h={};var g=a.ee.get(e),p=g.get("tracer"),m="api-",v=m+"ixn-";function b(t,r,n,o){const a=(0,i.C5)(e);return null===r?delete a.jsAttributes[t]:(0,i.CX)(e,{...a,jsAttributes:{...a.jsAttributes,[t]:r}}),x(m,n,!0,o||null===r?"session":void 0)(t,r)}function 
y(){}["setErrorHandler","finished","addToTrace","inlineHit","addRelease"].forEach((e=>h[e]=x(m,e,!0,"api"))),h.addPageAction=x(m,"addPageAction",!0,n.D.pageAction),h.setCurrentRouteName=x(m,"routeName",!0,n.D.spa),h.setPageViewName=function(t,r){if("string"==typeof t)return"/"!==t.charAt(0)&&(t="/"+t),(0,i.OP)(e).customTransaction=(r||"http://custom.transaction")+t,x(m,"setPageViewName",!0)()},h.setCustomAttribute=function(e,t){let r=arguments.length>2&&void 0!==arguments[2]&&arguments[2];if("string"==typeof e){if(["string","number"].includes(typeof t)||null===t)return b(e,t,"setCustomAttribute",r);(0,f.Z)("Failed to execute setCustomAttribute.\nNon-null value must be a string or number type, but a type of was provided."))}else(0,f.Z)("Failed to execute setCustomAttribute.\nName must be a string type, but a type of was provided."))},h.setUserId=function(e){if("string"==typeof e||null===e)return b("enduser.id",e,"setUserId",!0);(0,f.Z)("Failed to execute setUserId.\nNon-null value must be a string type, but a type of was provided."))},h.interaction=function(){return(new y).get()};var w=y.prototype={createTracer:function(e,t){var r={},i=this,a="function"==typeof t;return(0,o.p)(v+"tracer",[(0,s.z)(),e,r],i,n.D.spa,g),function(){if(p.emit((a?"":"no-")+"fn-start",[(0,s.z)(),i,a],r),a)try{return t.apply(this,arguments)}catch(e){throw p.emit("fn-err",[arguments,this,"string"==typeof e?new Error(e):e],r),e}finally{p.emit("fn-end",[(0,s.z)()],r)}}}};function x(e,t,r,i){return function(){return(0,o.p)(l.xS,["API/"+t+"/called"],void 0,n.D.metrics,g),i&&(0,o.p)(e+t,[(0,s.z)(),...arguments],r?null:this,i,g),r?void 0:this}}function A(){r.e(439).then(r.bind(r,7438)).then((t=>{let{setAPI:r}=t;r(e),(0,c.L)(e,"api")})).catch((()=>(0,f.Z)("Downloading runtime APIs failed...")))}return["actionText","setName","setAttribute","save","ignore","onEnd","getContext","end","get"].forEach((e=>{w[e]=x(v,e,void 0,n.D.spa)})),h.noticeError=function(e,t){"string"==typeof e&&(e=new 
Error(e)),(0,o.p)(l.xS,["API/noticeError/called"],void 0,n.D.metrics,g),(0,o.p)("err",[e,(0,s.z)(),!1,t],void 0,n.D.jserrors,g)},d.il?(0,u.b)((()=>A()),!0):A(),h}(e,v);return(0,h.Qy)(e,T,"api"),(0,h.Qy)(e,A,"exposed"),(0,h.EZ)("activatedFeatures",p.T),T}},3325:(e,t,r)=>{r.d(t,{D:()=>n,p:()=>i});const n={ajax:"ajax",jserrors:"jserrors",metrics:"metrics",pageAction:"page_action",pageViewEvent:"page_view_event",pageViewTiming:"page_view_timing",sessionReplay:"session_replay",sessionTrace:"session_trace",spa:"spa"},i={[n.pageViewEvent]:1,[n.pageViewTiming]:2,[n.metrics]:3,[n.jserrors]:4,[n.ajax]:5,[n.sessionTrace]:6,[n.pageAction]:7,[n.spa]:8,[n.sessionReplay]:9}}},n={};function i(e){var t=n[e];if(void 0!==t)return t.exports;var o=n[e]={exports:{}};return r[e](o,o.exports,i),o.exports}i.m=r,i.d=(e,t)=>{for(var r in t)i.o(t,r)&&!i.o(e,r)&&Object.defineProperty(e,r,{enumerable:!0,get:t[r]})},i.f={},i.e=e=>Promise.all(Object.keys(i.f).reduce(((t,r)=>(i.f[r](e,t),t)),[])),i.u=e=>(({78:"page_action-aggregate",147:"metrics-aggregate",242:"session-manager",317:"jserrors-aggregate",348:"page_view_timing-aggregate",412:"lazy-feature-loader",439:"async-api",538:"recorder",590:"session_replay-aggregate",675:"compressor",733:"session_trace-aggregate",786:"page_view_event-aggregate",873:"spa-aggregate",898:"ajax-aggregate"}[e]||e)+"."+{78:"ac76d497",147:"3dc53903",148:"1a20d5fe",242:"2a64278a",317:"49e41428",348:"bd6de33a",412:"2f55ce66",439:"30bd804e",538:"1b18459f",590:"cf0efb30",675:"ae9f91a8",733:"83105561",786:"06482edd",860:"03a8b7a5",873:"e6b09d52",898:"998ef92b"}[e]+"-1.236.0.min.js"),i.o=(e,t)=>Object.prototype.hasOwnProperty.call(e,t),e={},t="NRBA:",i.l=(r,n,o,a)=>{if(e[r])e[r].push(n);else{var s,c;if(void 0!==o)for(var u=document.getElementsByTagName("script"),d=0;d {s.onerror=s.onload=null,clearTimeout(h);var i=e[r];if(delete e[r],s.parentNode&&s.parentNode.removeChild(s),i&&i.forEach((e=>e(n))),t)return t(n)},h=setTimeout(l.bind(null,void 
0,{type:"timeout",target:s}),12e4);s.onerror=l.bind(null,s.onerror),s.onload=l.bind(null,s.onload),c&&document.head.appendChild(s)}},i.r=e=>{"undefined"!=typeof Symbol&&Symbol.toStringTag&&Object.defineProperty(e,Symbol.toStringTag,{value:"Module"}),Object.defineProperty(e,"__esModule",{value:!0})},i.j=364,i.p="https://js-agent.newrelic.com/",(()=>{var e={364:0,953:0};i.f.j=(t,r)=>{var n=i.o(e,t)?e[t]:void 0;if(0!==n)if(n)r.push(n[2]);else{var o=new Promise(((r,i)=>n=e[t]=[r,i]));r.push(n[2]=o);var a=i.p+i.u(t),s=new Error;i.l(a,(r=>{if(i.o(e,t)&&(0!==(n=e[t])&&(e[t]=void 0),n)){var o=r&&("load"===r.type?"missing":r.type),a=r&&r.target&&r.target.src;s.message="Loading chunk "+t+" failed.\n("+o+": "+a+")",s.name="ChunkLoadError",s.type=o,s.request=a,n[1](s)}}),"chunk-"+t,t)}};var t=(t,r)=>{var n,o,[a,s,c]=r,u=0;if(a.some((t=>0!==e[t]))){for(n in s)i.o(s,n)&&(i.m[n]=s[n]);if(c)c(i)}for(t&&t(r);u {i.r(o);var e=i(3325),t=i(5763);const r=Object.values(e.D);function n(e){const n={};return r.forEach((r=>{n[r]=function(e,r){return!1!==(0,t.Mt)(r,"".concat(e,".enabled"))}(r,e)})),n}var a=i(9144);var s=i(5546),c=i(385),u=i(8e3),d=i(5938),f=i(3960),l=i(50);class h extends d.W{constructor(e,t,r){let n=!(arguments.length>3&&void 0!==arguments[3])||arguments[3];super(e,t,r),this.auto=n,this.abortHandler,this.featAggregate,this.onAggregateImported,n&&(0,u.R)(e,r)}importAggregator(){let e=arguments.length>0&&void 0!==arguments[0]?arguments[0]:{};if(this.featAggregate||!this.auto)return;const r=c.il&&!0===(0,t.Mt)(this.agentIdentifier,"privacy.cookies_enabled");let n;this.onAggregateImported=new Promise((e=>{n=e}));const o=async()=>{let t;try{if(r){const{setupAgentSession:e}=await Promise.all([i.e(860),i.e(242)]).then(i.bind(i,3228));t=e(this.agentIdentifier)}}catch(e){(0,l.Z)("A problem occurred when starting up session manager. 
This page will not start or extend any session.",e)}try{if(!this.shouldImportAgg(this.featureName,t))return void(0,u.L)(this.agentIdentifier,this.featureName);const{lazyFeatureLoader:r}=await i.e(412).then(i.bind(i,8582)),{Aggregate:o}=await r(this.featureName,"aggregate");this.featAggregate=new o(this.agentIdentifier,this.aggregator,e),n(!0)}catch(e){(0,l.Z)("Downloading and initializing ".concat(this.featureName," failed..."),e),this.abortHandler?.(),n(!1)}};c.il?(0,f.b)((()=>o()),!0):o()}shouldImportAgg(r,n){return r!==e.D.sessionReplay||!1!==(0,t.Mt)(this.agentIdentifier,"session_trace.enabled")&&(!!n?.isNew||!!n?.state.sessionReplay)}}var g=i(7633),p=i(7894);class m extends h{static featureName=g.t9;constructor(r,n){let i=!(arguments.length>2&&void 0!==arguments[2])||arguments[2];if(super(r,n,g.t9,i),("undefined"==typeof PerformanceNavigationTiming||c.Tt)&&"undefined"!=typeof PerformanceTiming){const n=(0,t.OP)(r);n[g.Dz]=Math.max(Date.now()-n.offset,0),(0,f.K)((()=>n[g.qw]=Math.max((0,p.z)()-n[g.Dz],0))),(0,f.b)((()=>{const t=(0,p.z)();n[g.OJ]=Math.max(t-n[g.Dz],0),(0,s.p)("timing",["load",t],void 0,e.D.pageViewTiming,this.ee)}))}this.importAggregator()}}var v=i(1117),b=i(1284);class y extends v.w{constructor(e){super(e),this.aggregatedData={}}store(e,t,r,n,i){var o=this.getBucket(e,t,r,i);return o.metrics=function(e,t){t||(t={count:0});return t.count+=1,(0,b.D)(e,(function(e,r){t[e]=w(r,t[e])})),t}(n,o.metrics),o}merge(e,t,r,n,i){var o=this.getBucket(e,t,n,i);if(o.metrics){var a=o.metrics;a.count+=r.count,(0,b.D)(r,(function(e,t){if("count"!==e){var n=a[e],i=r[e];i&&!i.c?a[e]=w(i.t,n):a[e]=function(e,t){if(!t)return e;t.c||(t=x(t.t));return t.min=Math.min(e.min,t.min),t.max=Math.max(e.max,t.max),t.t+=e.t,t.sos+=e.sos,t.c+=e.c,t}(i,a[e])}}))}else o.metrics=r}storeMetric(e,t,r,n){var i=this.getBucket(e,t,r);return i.stats=w(n,i.stats),i}getBucket(e,t,r,n){this.aggregatedData[e]||(this.aggregatedData[e]={});var i=this.aggregatedData[e][t];return 
i||(i=this.aggregatedData[e][t]={params:r||{}},n&&(i.custom=n)),i}get(e,t){return t?this.aggregatedData[e]&&this.aggregatedData[e][t]:this.aggregatedData[e]}take(e){for(var t={},r="",n=!1,i=0;i t.max&&(t.max=e),e 2&&void 0!==arguments[2])||arguments[2];super(e,r,j.t,n),c.il&&((0,t.OP)(e).initHidden=Boolean("hidden"===document.visibilityState),(0,N.N)((()=>(0,s.p)("docHidden",[(0,p.z)()],void 0,j.t,this.ee)),!0),(0,O.bP)("pagehide",(()=>(0,s.p)("winPagehide",[(0,p.z)()],void 0,j.t,this.ee))),this.importAggregator())}}var P=i(3081);class C extends h{static featureName=P.t9;constructor(e,t){let r=!(arguments.length>2&&void 0!==arguments[2])||arguments[2];super(e,t,P.t9,r),this.importAggregator()}}var R,I=i(2210),k=i(1214),H=i(2177),L={};try{R=localStorage.getItem("__nr_flags").split(","),console&&"function"==typeof console.log&&(L.console=!0,-1!==R.indexOf("dev")&&(L.dev=!0),-1!==R.indexOf("nr_dev")&&(L.nrDev=!0))}catch(e){}function z(e){try{L.console&&z(e)}catch(e){}}L.nrDev&&H.ee.on("internal-error",(function(e){z(e.stack)})),L.dev&&H.ee.on("fn-err",(function(e,t,r){z(r.stack)})),L.dev&&(z("NR AGENT IN DEVELOPMENT MODE"),z("flags: "+(0,b.D)(L,(function(e,t){return e})).join(", ")));var M=i(6660);class B extends h{static featureName=M.t;constructor(r,n){let i=!(arguments.length>2&&void 0!==arguments[2])||arguments[2];super(r,n,M.t,i),this.skipNext=0;try{this.removeOnAbort=new AbortController}catch(e){}const o=this;o.ee.on("fn-start",(function(e,t,r){o.abortHandler&&(o.skipNext+=1)})),o.ee.on("fn-err",(function(t,r,n){o.abortHandler&&!n[M.A]&&((0,I.X)(n,M.A,(function(){return!0})),this.thrown=!0,(0,s.p)("err",[n,(0,p.z)()],void 0,e.D.jserrors,o.ee))})),o.ee.on("fn-end",(function(){o.abortHandler&&!this.thrown&&o.skipNext>0&&(o.skipNext-=1)})),o.ee.on("internal-error",(function(t){(0,s.p)("ierr",[t,(0,p.z)(),!0],void 0,e.D.jserrors,o.ee)})),this.origOnerror=c._A.onerror,c._A.onerror=this.onerrorHandler.bind(this),c._A.addEventListener("unhandledrejection",(t=>{const 
r=function(e){let t="Unhandled Promise Rejection: ";if(e instanceof Error)try{return e.message=t+e.message,e}catch(t){return e}if(void 0===e)return new Error(t);try{return new Error(t+(0,D.P)(e))}catch(e){return new Error(t)}}(t.reason);(0,s.p)("err",[r,(0,p.z)(),!1,{unhandledPromiseRejection:1}],void 0,e.D.jserrors,this.ee)}),(0,O.m$)(!1,this.removeOnAbort?.signal)),(0,k.gy)(this.ee),(0,k.BV)(this.ee),(0,k.em)(this.ee),(0,t.OP)(r).xhrWrappable&&(0,k.Kf)(this.ee),this.abortHandler=this.#e,this.importAggregator()}#e(){this.removeOnAbort?.abort(),this.abortHandler=void 0}onerrorHandler(t,r,n,i,o){"function"==typeof this.origOnerror&&this.origOnerror(...arguments);try{this.skipNext?this.skipNext-=1:(0,s.p)("err",[o||new F(t,r,n),(0,p.z)()],void 0,e.D.jserrors,this.ee)}catch(t){try{(0,s.p)("ierr",[t,(0,p.z)(),!0],void 0,e.D.jserrors,this.ee)}catch(e){}}return!1}}function F(e,t,r){this.message=e||"Uncaught error with no additional information",this.sourceURL=t,this.line=r}let U=1;const q="nr@id";function G(e){const t=typeof e;return!e||"object"!==t&&"function"!==t?-1:e===c._A?0:(0,I.X)(e,q,(function(){return U++}))}function V(e){if("string"==typeof e&&e.length)return e.length;if("object"==typeof e){if("undefined"!=typeof ArrayBuffer&&e instanceof ArrayBuffer&&e.byteLength)return e.byteLength;if("undefined"!=typeof Blob&&e instanceof Blob&&e.size)return e.size;if(!("undefined"!=typeof FormData&&e instanceof FormData))try{return(0,D.P)(e).length}catch(e){return}}}var X=i(7243);class W{constructor(e){this.agentIdentifier=e,this.generateTracePayload=this.generateTracePayload.bind(this),this.shouldGenerateTrace=this.shouldGenerateTrace.bind(this)}generateTracePayload(e){if(!this.shouldGenerateTrace(e))return null;var r=(0,t.DL)(this.agentIdentifier);if(!r)return null;var n=(r.accountID||"").toString()||null,i=(r.agentID||"").toString()||null,o=(r.trustKey||"").toString()||null;if(!n||!i)return null;var 
a=(0,_.M)(),s=(0,_.Ht)(),c=Date.now(),u={spanId:a,traceId:s,timestamp:c};return(e.sameOrigin||this.isAllowedOrigin(e)&&this.useTraceContextHeadersForCors())&&(u.traceContextParentHeader=this.generateTraceContextParentHeader(a,s),u.traceContextStateHeader=this.generateTraceContextStateHeader(a,c,n,i,o)),(e.sameOrigin&&!this.excludeNewrelicHeader()||!e.sameOrigin&&this.isAllowedOrigin(e)&&this.useNewrelicHeaderForCors())&&(u.newrelicHeader=this.generateTraceHeader(a,s,c,n,i,o)),u}generateTraceContextParentHeader(e,t){return"00-"+t+"-"+e+"-01"}generateTraceContextStateHeader(e,t,r,n,i){return i+"@nr=0-1-"+r+"-"+n+"-"+e+"----"+t}generateTraceHeader(e,t,r,n,i,o){if(!("function"==typeof c._A?.btoa))return null;var a={v:[0,1],d:{ty:"Browser",ac:n,ap:i,id:e,tr:t,ti:r}};return o&&n!==o&&(a.d.tk=o),btoa((0,D.P)(a))}shouldGenerateTrace(e){return this.isDtEnabled()&&this.isAllowedOrigin(e)}isAllowedOrigin(e){var r=!1,n={};if((0,t.Mt)(this.agentIdentifier,"distributed_tracing")&&(n=(0,t.P_)(this.agentIdentifier).distributed_tracing),e.sameOrigin)r=!0;else if(n.allowed_origins instanceof Array)for(var i=0;i 2&&void 0!==arguments[2])||arguments[2];super(r,n,Z.t,i),(0,t.OP)(r).xhrWrappable&&(this.dt=new W(r),this.handler=(e,t,r,n)=>(0,s.p)(e,t,r,n,this.ee),(0,k.u5)(this.ee),(0,k.Kf)(this.ee),function(r,n,i,o){function a(e){var t=this;t.totalCbs=0,t.called=0,t.cbTime=0,t.end=E,t.ended=!1,t.xhrGuids={},t.lastSize=null,t.loadCaptureCalled=!1,t.params=this.params||{},t.metrics=this.metrics||{},e.addEventListener("load",(function(r){_(t,e)}),(0,O.m$)(!1)),c.IF||e.addEventListener("progress",(function(e){t.lastSize=e.loaded}),(0,O.m$)(!1))}function s(e){this.params={method:e[0]},T(this,e[1]),this.metrics={}}function u(e,n){var i=(0,t.DL)(r);i.xpid&&this.sameOrigin&&n.setRequestHeader("X-NewRelic-ID",i.xpid);var a=o.generateTracePayload(this.parsedOrigin);if(a){var 
s=!1;a.newrelicHeader&&(n.setRequestHeader("newrelic",a.newrelicHeader),s=!0),a.traceContextParentHeader&&(n.setRequestHeader("traceparent",a.traceContextParentHeader),a.traceContextStateHeader&&n.setRequestHeader("tracestate",a.traceContextStateHeader),s=!0),s&&(this.dt=a)}}function d(e,t){var r=this.metrics,i=e[0],o=this;if(r&&i){var a=V(i);a&&(r.txSize=a)}this.startTime=(0,p.z)(),this.listener=function(e){try{"abort"!==e.type||o.loadCaptureCalled||(o.params.aborted=!0),("load"!==e.type||o.called===o.totalCbs&&(o.onloadCalled||"function"!=typeof t.onload)&&"function"==typeof o.end)&&o.end(t)}catch(e){try{n.emit("internal-error",[e])}catch(e){}}};for(var s=0;s 1?e[1]=i:e.push(i)}else e[0]&&e[0].headers&&s(e[0].headers,n)&&(this.dt=n);function s(e,t){var r=!1;return t.newrelicHeader&&(e.set("newrelic",t.newrelicHeader),r=!0),t.traceContextParentHeader&&(e.set("traceparent",t.traceContextParentHeader),t.traceContextStateHeader&&e.set("tracestate",t.traceContextStateHeader),r=!0),r}}function x(e,t){this.params={},this.metrics={},this.startTime=(0,p.z)(),this.dt=t,e.length>=1&&(this.target=e[0]),e.length>=2&&(this.opts=e[1]);var r,n=this.opts||{},i=this.target;"string"==typeof i?r=i:"object"==typeof i&&i instanceof Y?r=i.url:c._A?.URL&&"object"==typeof i&&i instanceof URL&&(r=i.href),T(this,r);var o=(""+(i&&i instanceof Y&&i.method||n.method||"GET")).toUpperCase();this.params.method=o,this.txSize=V(n.body)||0}function A(t,r){var n;this.endTime=(0,p.z)(),this.params||(this.params={}),this.params.status=r?r.status:0,"string"==typeof this.rxSize&&this.rxSize.length>0&&(n=+this.rxSize);var o={txSize:this.txSize,rxSize:n,duration:(0,p.z)()-this.startTime};i("xhr",[this.params,o,this.startTime,this.endTime,"fetch"],this,e.D.ajax)}function E(t){var r=this.params,n=this.metrics;if(!this.ended){this.ended=!0;for(var o=0;o 2&&void 0!==arguments[2])||arguments[2];super(e,t,we.t,r),this.importAggregator()}}new class{constructor(e){let t=arguments.length>1&&void 
0!==arguments[1]?arguments[1]:(0,_.ky)(16);c._A?(this.agentIdentifier=t,this.sharedAggregator=new y({agentIdentifier:this.agentIdentifier}),this.features={},this.desiredFeatures=new Set(e.features||[]),this.desiredFeatures.add(m),Object.assign(this,(0,a.j)(this.agentIdentifier,e,e.loaderType||"agent")),this.start()):(0,l.Z)("Failed to initial the agent. Could not determine the runtime environment.")}get config(){return{info:(0,t.C5)(this.agentIdentifier),init:(0,t.P_)(this.agentIdentifier),loader_config:(0,t.DL)(this.agentIdentifier),runtime:(0,t.OP)(this.agentIdentifier)}}start(){const t="features";try{const r=n(this.agentIdentifier),i=[...this.desiredFeatures];i.sort(((t,r)=>e.p[t.featureName]-e.p[r.featureName])),i.forEach((t=>{if(r[t.featureName]||t.featureName===e.D.pageViewEvent){const n=function(t){switch(t){case e.D.ajax:return[e.D.jserrors];case e.D.sessionTrace:return[e.D.ajax,e.D.pageViewEvent];case e.D.sessionReplay:return[e.D.sessionTrace];case e.D.pageViewTiming:return[e.D.pageViewEvent];default:return[]}}(t.featureName);n.every((e=>r[e]))||(0,l.Z)("".concat(t.featureName," is enabled but one or more dependent features has been disabled (").concat((0,D.P)(n),"). 
This may cause unintended consequences or missing data...")),this.features[t.featureName]=new t(this.agentIdentifier,this.sharedAggregator)}})),(0,T.Qy)(this.agentIdentifier,this.features,t)}catch(e){(0,l.Z)("Failed to initialize all enabled instrument classes (agent aborted) -",e);for(const e in this.features)this.features[e].abortHandler?.();const r=(0,T.fP)();return delete r.initializedAgents[this.agentIdentifier]?.api,delete r.initializedAgents[this.agentIdentifier]?.[t],delete this.sharedAggregator,r.ee?.abort(),delete r.ee?.get(this.agentIdentifier),!1}}}({features:[J,m,S,class extends h{static featureName=oe;constructor(t,r){if(super(t,r,oe,!(arguments.length>2&&void 0!==arguments[2])||arguments[2]),!c.il)return;const n=this.ee;let i;(0,k.QU)(n),this.eventsEE=(0,k.em)(n),this.eventsEE.on(se,(function(e,t){this.bstStart=(0,p.z)()})),this.eventsEE.on(ae,(function(t,r){(0,s.p)("bst",[t[0],r,this.bstStart,(0,p.z)()],void 0,e.D.sessionTrace,n)})),n.on(ce+ne,(function(e){this.time=(0,p.z)(),this.startPath=location.pathname+location.hash})),n.on(ce+ie,(function(t){(0,s.p)("bstHist",[location.pathname+location.hash,this.startPath,this.time],void 0,e.D.sessionTrace,n)}));try{i=new PerformanceObserver((t=>{const r=t.getEntries();(0,s.p)(te,[r],void 0,e.D.sessionTrace,n)})),i.observe({type:re,buffered:!0})}catch(e){}this.importAggregator({resourceObserver:i})}},C,xe,B,class extends h{static featureName=de;constructor(e,r){if(super(e,r,de,!(arguments.length>2&&void 0!==arguments[2])||arguments[2]),!c.il)return;if(!(0,t.OP)(e).xhrWrappable)return;try{this.removeOnAbort=new AbortController}catch(e){}let n,i=0;const o=this.ee.get("tracer"),a=(0,k._L)(this.ee),s=(0,k.Lg)(this.ee),u=(0,k.BV)(this.ee),d=(0,k.Kf)(this.ee),f=this.ee.get("events"),l=(0,k.u5)(this.ee),h=(0,k.QU)(this.ee),g=(0,k.Gm)(this.ee);function m(e,t){h.emit("newURL",[""+window.location,t])}function v(){i++,n=window.location.hash,this[ve]=(0,p.z)()}function b(){i--,window.location.hash!==n&&m(0,!0);var 
e=(0,p.z)();this[pe]=~~this[pe]+e-this[ve],this[ye]=e}function y(e,t){e.on(t,(function(){this[t]=(0,p.z)()}))}this.ee.on(ve,v),s.on(be,v),a.on(be,v),this.ee.on(ye,b),s.on(ge,b),a.on(ge,b),this.ee.buffer([ve,ye,"xhr-resolved"],this.featureName),f.buffer([ve],this.featureName),u.buffer(["setTimeout"+le,"clearTimeout"+fe,ve],this.featureName),d.buffer([ve,"new-xhr","send-xhr"+fe],this.featureName),l.buffer([me+fe,me+"-done",me+he+fe,me+he+le],this.featureName),h.buffer(["newURL"],this.featureName),g.buffer([ve],this.featureName),s.buffer(["propagate",be,ge,"executor-err","resolve"+fe],this.featureName),o.buffer([ve,"no-"+ve],this.featureName),a.buffer(["new-jsonp","cb-start","jsonp-error","jsonp-end"],this.featureName),y(l,me+fe),y(l,me+"-done"),y(a,"new-jsonp"),y(a,"jsonp-end"),y(a,"cb-start"),h.on("pushState-end",m),h.on("replaceState-end",m),window.addEventListener("hashchange",m,(0,O.m$)(!0,this.removeOnAbort?.signal)),window.addEventListener("load",m,(0,O.m$)(!0,this.removeOnAbort?.signal)),window.addEventListener("popstate",(function(){m(0,i>1)}),(0,O.m$)(!0,this.removeOnAbort?.signal)),this.abortHandler=this.#e,this.importAggregator()}#e(){this.removeOnAbort?.abort(),this.abortHandler=void 0}}],loaderType:"spa"})})(),window.NRBA=o})(); window.jQuery || document.write(' ') CKEDITOR_BASEPATH='https://f1000research.com/js/vendor/ckeditor/' window.reactTheme = 'research'; window.MathJax = { CommonHTML: { linebreaks: { automatic: true } }, 'HTML-CSS': { linebreaks: { automatic: true } }, SVG: { linebreaks: { automatic: true } }, AuthorInit: function() { MathJax.Hub.Register.MessageHook('End Process', function () { let timeout = false; // holder for timeout id const delay = 250; // delay after event is "complete" to run callback const reflowMath = function() { const dispFormulas = document.querySelectorAll('.disp-formula.panel'); if (!dispFormulas) { return; } for (const dispFormula of dispFormulas) { const child = 
dispFormula.querySelector('.MathJax_Preview').nextSibling.firstChild; const isMultiline = MathJax.Hub.getAllJax(dispFormula)[0].root.isMultiline; if (dispFormula.offsetWidth < child.offsetWidth || isMultiline) { MathJax.Hub.Queue(['Rerender', MathJax.Hub, dispFormula]); } } }; window.addEventListener('resize', function() { clearTimeout(timeout); // clear the timeout timeout = setTimeout(reflowMath, delay); // start timing for event "completion" }); }); }, }; if (window.location.hash == '#_=_'){ window.location = window.location.href.split('#')[0] } !function(f,b,e,v,n,t,s){if(f.fbq)return;n=f.fbq=function() {n.callMethod? n.callMethod.apply(n,arguments):n.queue.push(arguments)} ;if(!f._fbq)f._fbq=n; n.push=n;n.loaded=!0;n.version='2.0';n.queue=[];t=b.createElement(e);t.async=!0; t.src=v;s=b.getElementsByTagName(e)[0];s.parentNode.insertBefore(t,s)}(window, document,'script','https://connect.facebook.net/en_US/fbevents.js'); fbq('init', '1641728616063202'); fbq('track', "PixelInitialized", {}); (function(h,o,t,j,a,r){ h.hj=h.hj||function(){(h.hj.q=h.hj.q||[]).push(arguments)}; h._hjSettings={hjid:2318163,hjsv:6}; a=o.getElementsByTagName('head')[0]; r=o.createElement('script');r.async=1; r.src=t+h._hjSettings.hjid+j+h._hjSettings.hjsv; a.appendChild(r); })(window,document,'https://static.hotjar.com/c/hotjar-','.js?sv='); search file_upload Submit your research search menu close search Browse Gateways & Collections How to Publish Submit your Research My Submissions Article Guidelines Article Guidelines (New Versions) Open Data, Software and Code Guidelines Open Data and Accessible Source Materials Guidelines (HSS) Open Data, Software and Code Guidelines (PSE) Prepublication Checks Production Process Posters and Slides Guidelines Document Guidelines Article Processing Charges Peer Review Finding Article Reviewers About How it Works For Reviewers Our Advisors Policies Glossary FAQs For Developers Newsroom Contact My Research Submissions Content and Tracking Alerts My 
Details Sign In file_upload Submit your research { "@context": "https://schema.org", "@type": "ScholarlyArticle", "mainEntityOfPage": { "@type": "WebPage", "@id": "https://f1000research.com/articles/14-739" }, "headline": "White paper: standards for handling and analyzing plant pan-genomes", "datePublished": "2025-07-28T14:43:17", "dateModified": "2026-05-07T07:43:20", "author": [ { "@type": "Person", "name": "Marc C. Heuermann" }, { "@type": "Person", "name": "Pedro Barros" }, { "@type": "Person", "name": "Sebastian Beier" }, { "@type": "Person", "name": "Heidrun Gundlach" }, { "@type": "Person", "name": "Jorge Alvarez-Jarreta" }, { "@type": "Person", "name": "Keywan Hassani-Pak" }, { "@type": "Person", "name": "Patrick König" }, { "@type": "Person", "name": "Anne Fiebig" }, { "@type": "Person", "name": "Tim Godec" }, { "@type": "Person", "name": "Kristina Gruden" }, { "@type": "Person", "name": "Nadja Nolte" }, { "@type": "Person", "name": "Marko Petek" }, { "@type": "Person", "name": "Uwe Scholz" }, { "@type": "Person", "name": "Maja Zagorščak" }, { "@type": "Person", "name": "Klaas Vandepoele" }, { "@type": "Person", "name": "Michiel Van Bel" } ], "publisher": { "@type": "Organization", "name": "F1000Research", "logo": { "@type": "ImageObject", "url": "https://f1000research.com/img/AMP/F1000Research_image.png", "height": 480, "width": 60 } }, "image": { "@type": "ImageObject", "url": "https://f1000research.com/img/AMP/F1000Research_image.png", "height": 1200, "width": 150 }, "description": "Plant pan-genomes, which aggregate genomic sequences and annotations from multiple individuals of a species, have emerged as transformative tools for understanding genetic diversity, adaptation, and evolutionary dynamics. Super-pan-genomes, extending across species boundaries, further enable comparative analyses of clades or genera, bridging breeding applications with evolutionary insights (Shang et al., 2022; Li et al., 2023a). 
However, the absence of standardized practices for data generation, analysis, and sharing hinders reproducibility and interoperability. This white paper presents a harmonized framework developed by the ELIXIR E-PAN consortium, addressing nomenclature, quality control (QC), data formats, visualization, and community practices. By adopting these guidelines, researchers can enhance FAIR (Findable, Accessible, Interoperable, Reusable) compliance, foster collaboration, and accelerate translational applications in crop improvement and evolutionary biology." } { "@context": "http://schema.org", "@type": "BreadcrumbList", "itemListElement": [ { "@type": "ListItem", "position": "1", "item": { "@id": "https://f1000research.com/", "name": "Home" } }, { "@type": "ListItem", "position": "2", "item": { "@id": "https://f1000research.com/browse/articles", "name": "Browse" } }, { "@type": "ListItem", "position": "3", "item": { "@id": "https://f1000research.com/articles/14-739/v2", "name": "White paper: standards for handling and analyzing plant pan-genomes" } } ] } Home Browse White paper: standards for handling and analyzing plant pan-genomes ALL Metrics - Views Downloads Get PDF Get XML Cite How to cite this article Heuermann MC, Barros P, Beier S et al. White paper: standards for handling and analyzing plant pan-genomes [version 2; peer review: 2 approved, 2 approved with reservations] . F1000Research 2025, 14 :739 ( https://doi.org/10.12688/f1000research.166538.2 ) NOTE: If applicable, it is important to ensure the information in square brackets after the title is included in all citations of this article. Close Copy Citation Details Export Export Citation Sciwheel EndNote Ref. Manager Bibtex ProCite Sente EXPORT Select a format first Track Share ▬ ✚ Review Revised White paper: standards for handling and analyzing plant pan-genomes [version 2; peer review: 2 approved, 2 approved with reservations] Marc C. 
Heuermann 1 , Pedro Barros https://orcid.org/0000-0001-5626-0619 2 , Sebastian Beier https://orcid.org/0000-0002-2177-8781 3 , [...] Heidrun Gundlach https://orcid.org/0000-0002-6757-0943 4 , Jorge Alvarez-Jarreta https://orcid.org/0000-0002-0946-0957 5 , Keywan Hassani-Pak https://orcid.org/0000-0001-9625-0511 6 , Patrick König https://orcid.org/0000-0002-8948-6793 1 , Anne Fiebig https://orcid.org/0000-0003-3159-3593 1 , Tim Godec https://orcid.org/0000-0002-1719-3107 7 , Kristina Gruden 7 , Nadja Nolte 7 , Marko Petek https://orcid.org/0000-0003-3644-7827 7 , Uwe Scholz https://orcid.org/0000-0001-6113-3518 1 , Maja Zagorščak 7 , Klaas Vandepoele 8 , Michiel Van Bel 8 Marc C. Heuermann 1 , Pedro Barros https://orcid.org/0000-0001-5626-0619 2 , [...] Sebastian Beier https://orcid.org/0000-0002-2177-8781 3 , Heidrun Gundlach https://orcid.org/0000-0002-6757-0943 4 , Jorge Alvarez-Jarreta https://orcid.org/0000-0002-0946-0957 5 , Keywan Hassani-Pak https://orcid.org/0000-0001-9625-0511 6 , Patrick König https://orcid.org/0000-0002-8948-6793 1 , Anne Fiebig https://orcid.org/0000-0003-3159-3593 1 , Tim Godec https://orcid.org/0000-0002-1719-3107 7 , Kristina Gruden 7 , Nadja Nolte 7 , Marko Petek https://orcid.org/0000-0003-3644-7827 7 , Uwe Scholz https://orcid.org/0000-0001-6113-3518 1 , Maja Zagorščak 7 , Klaas Vandepoele 8 , Michiel Van Bel 8 PUBLISHED 18 Nov 2025 Author details Author details 1 Leibniz Institute of Plant Genetics and Crop Plant Research (IPK), Seeland, Saxony-Anhalt, 06466, Germany 2 Universidade Nova de Lisboa Instituto de Tecnologia Quimica e Biologica, Oeiras, Lisbon, Portugal 3 Forschungszentrum Jülich GmbH Institute of Bio- and Geosciences, Jülich, North Rhine-Westphalia, 52425, Germany 4 Helmholtz Zentrum München, Neuherberg, 85764, Germany 5 European Molecular Biology Laboratory, European Bioinformatics Institute, Wellcome Genome Campus, Hinxton, Cambridge, CB10 1SD, UK 6 Rothamsted Research, Harpenden, England, AL52JQ, UK 7 National 
Institute of Biology, Večna pot 111, Ljubljana, 1000, Slovenia 8 Department of Plant Biotechnology and Bioinformatics, Ghent University, Technologiepark 71, Ghent, 9052, Belgium Marc C. Heuermann Roles: Conceptualization, Writing – Original Draft Preparation, Writing – Review & Editing Pedro Barros Roles: Writing – Review & Editing Sebastian Beier Roles: Writing – Review & Editing Heidrun Gundlach Roles: Writing – Review & Editing Jorge Alvarez-Jarreta Roles: Writing – Review & Editing Keywan Hassani-Pak Roles: Writing – Review & Editing Patrick König Roles: Writing – Review & Editing Anne Fiebig Roles: Writing – Review & Editing Tim Godec Roles: Writing – Review & Editing Kristina Gruden Roles: Writing – Review & Editing Nadja Nolte Roles: Writing – Review & Editing Marko Petek Roles: Writing – Review & Editing Uwe Scholz Roles: Writing – Review & Editing Maja Zagorščak Roles: Writing – Review & Editing Klaas Vandepoele Roles: Project Administration, Writing – Review & Editing Michiel Van Bel Roles: Project Administration, Writing – Review & Editing OPEN PEER REVIEW DETAILS REVIEWER STATUS This article is included in the ELIXIR gateway. This article is included in the Plant Science gateway. This article is included in the Genomics and Genetics gateway. Abstract Plant pan-genomes, which aggregate genomic sequences and annotations from multiple individuals of a species, have emerged as transformative tools for understanding genetic diversity, adaptation, and evolutionary dynamics. Super-pan-genomes, extending across species boundaries, further enable comparative analyses of clades or genera, bridging breeding applications with evolutionary insights (Shang et al., 2022; Li et al., 2023a). However, the absence of standardized practices for data generation, analysis, and sharing hinders reproducibility and interoperability. 
This white paper presents a harmonized framework developed by the ELIXIR E-PAN consortium, addressing nomenclature, quality control (QC), data formats, visualization, and community practices. By adopting these guidelines, researchers can enhance FAIR (Findable, Accessible, Interoperable, Reusable) compliance, foster collaboration, and accelerate translational applications in crop improvement and evolutionary biology. READ ALL READ LESS Keywords plant pan-genome, white paper, standards, quality control Corresponding Author(s) Marc C. Heuermann ( [email protected] ) Close Corresponding author: Marc C. Heuermann Competing interests: No competing interests were disclosed. Grant information: This study has received funding from ELIXIR under the call for proposals on Biodiversity, Food Safety and Pathogens (2024-SCIENCE-BFSP) as part of WP2 E-PAN: Enhancing pan-genome analysis in plants. MCH received funding from ELIXIR-DE, which was supported by the Federal Ministry of Education and Research BMBF within the framework of de.NBI/ELIXIR-DE (W-de.NBI-009). The funders had no role in study design, data collection and analysis, decision to publish, or preparation of the manuscript. Copyright: © 2025 Heuermann MC et al . This is an open access article distributed under the terms of the Creative Commons Attribution License , which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited. How to cite: Heuermann MC, Barros P, Beier S et al. White paper: standards for handling and analyzing plant pan-genomes [version 2; peer review: 2 approved, 2 approved with reservations] . 
F1000Research 2025, 14 :739 ( https://doi.org/10.12688/f1000research.166538.2 ) First published: 28 Jul 2025, 14 :739 ( https://doi.org/10.12688/f1000research.166538.1 ) Latest published: 07 May 2026, 14 :739 ( https://doi.org/10.12688/f1000research.166538.3 ) Revised Amendments from Version 1 The reviewers’ comments have helped us significantly refine the white paper. The new figure provides readers with a clear, visualized, and summarized overview of the essential steps required to successfully conduct a pan-genome analysis. These steps encompass quality control, annotation, pan-genome construction and analysis, and visualization throughout a pan-genome project, with exemplary tools highlighted for each stage. Furthermore, we have substantially expanded the scope of the chapters on quality control standards, data formats and sharing, visualization and analysis guidelines, and case studies. The reviewers’ comments have helped us significantly refine the white paper. The new figure provides readers with a clear, visualized, and summarized overview of the essential steps required to successfully conduct a pan-genome analysis. These steps encompass quality control, annotation, pan-genome construction and analysis, and visualization throughout a pan-genome project, with exemplary tools highlighted for each stage. Furthermore, we have substantially expanded the scope of the chapters on quality control standards, data formats and sharing, visualization and analysis guidelines, and case studies. See the authors' detailed response to the review by Jianping Xu See the authors' detailed response to the review by Rutwik Barmukh See the authors' detailed response to the review by Sunil Kumar Sahu See the authors' detailed response to the review by Xiaoming Xie READ REVIEWER RESPONSES  There is a newer version of this article available. Suppress this message for one day. 1. 
Introduction Pan-genomes capture both core genomic elements (shared across individuals) and accessory components (variable or unique to subsets), offering unprecedented resolution for studying traits such as disease resistance, environmental adaptation, and domestication ( Qin et al., 2021 ; Zhou et al., 2022 ). Super-pan-genomes, which span multiple species, provide evolutionary context for gene family dynamics and speciation events, as demonstrated in clades like Brassicaceae ( Jiao & Schneeberger, 2020 ) and Solanaceae ( Alonge et al., 2022 ). In plant genomics, pan-genomes are vital for understanding genetic diversity, adaptation, and evolutionary dynamics, particularly given the extensive variation observed in plant species ( Schreiber et al., 2024 ). Despite their potential, inconsistencies in data management—such as ad hoc naming conventions, variable QC practices, and fragmented repository use—limit cross-study comparisons and data reuse. The ELIXIR E-PAN consortium synthesizes insights from foundational studies on barley ( Hordeum vulgare ), rice ( Oryza sativa ), tomato ( Solanum lycopersicum ), and Arabidopsis ( Arabidopsis thaliana ) to propose actionable standards. These guidelines aim to unify the plant genomics community, ensuring robust, interoperable resources for breeding and evolutionary research. 2. Naming conventions and ontologies 2.1 Accession and assembly identifiers Accession naming should adhere to MIAPPE (Minimum Information About Plant Phenotyping Experiments) standards. The Biological Material ID should incorporate institutional identifiers, followed by the accession number from germplasm catalogue or common name of the plant source/variety (e.g., IPK-Gatersleben:HOR_13170 for barley accession “Barke”) to ensure traceability (MIAPPE v1.1, Papoutsoglou et al., 2020 ). When complementary data regarding a specific accession is also available at external sources (e.g. 
BioSamples), a link to a Biological material external ID should be provided in the metadata. Genome assembly identifiers should contain at least four fields (species, variety/line, project group, and assembly version) separated by periods (‘.’), with an optional fifth field for additional information ( Cannon et al., 2025 ). For example, drOrySati.Nipponbare.RicePan.1.0 refers to the assembly of Oryza sativa , Nipponbare cultivar, RicePan project, version 1.0 (ToLID identifier, https://id.tol.sanger.ac.uk/ , Darwin Tree of Life Consortium, 2023 ). 2.2 Gene identifiers Gene identifiers must balance stability with biological relevance, as outlined by Cannon et al. (2025) , keeping track of the annotation version, chromosome and gene ID. Their framework proposes human- and machine-readable identifiers, including the assembly names (e.g. drOrySati.Nipponbare.RicePan.1.0) with the addition of gene models like drOrySati.Nipponbare.RicePan.1.0.1.01.g000100 (assembly version 1.0, annotation version 1, chromosome 01, gene 100). To enhance this for pan-genomics, the “group” field can denote pan-genome projects (e.g., RicePan), linking multiple assemblies, while optional fields like “Hap1” or metadata tags distinguish haplotypes or accession types (e.g., wild vs. cultivated). Pangenes, representing orthologous gene clusters, can be assigned identifiers like drOrySati.RicePan.pan00001, with metadata linking to specific gene models across assemblies. Cannon et al. (2025) advocate preserving legacy identifiers via cross-references to ensure stability, avoiding disruptive renaming as new accessions are added. 2.3 Metadata and ontologies A core metadata schema is critical for interoperability. Required fields to properly annotate pan-genome studies include species details such as name (TaxonID), pedigree, geographic origin, ploidy and chromosome number, as well as sequencing technology used (e.g.
PacBio HiFi, Oxford Nanopore, Hi-C, Illumina), assembly pipelines (e.g., Flye ( Kolmogorov et al., 2020 ), hifiasm ( Cheng et al., 2024 ), Canu ( Koren et al., 2017 ), …), and assembly QC metrics (e.g., BUSCO scores ( Manni et al., 2021 )). Existing ontologies such as the Sequence Ontology (SO) should be extended to include pan-genome-specific terms that describe the layouts and structures of pan-genomes ( Eilbeck et al., 2005 ). Such terms include the core, shell, and cloud gene categories, although the assignment of genes to these categories may depend on the number of genomes and genotypes selected ( Jayakodi et al., 2024 ). Any downstream comparative analysis requires open and transparent reporting on the thresholds used, so these thresholds must be included in the metadata. Collaboration with the AgBioData Nomenclature Working Group and the Genomic Standards Consortium ( https://www.gensc.org/ ) ensures alignment with broader genomic standards ( Cannon et al., 2025 ). 2.4 Generalized feature identification As pan-genome graphs grow to encompass not just core and variable genes but a full spectrum of genomic elements, we need a unified identification system. Current annotation often focuses on genes, leaving features like transposable elements, SSRs, non-coding RNAs, and regulatory motifs with inconsistent or tool-specific labels. We propose the development of a generalized feature identifier (GFI). This system would provide a stable, queryable, and standardized format for any annotated feature, independent of its type or the discovery tool used. A GFI would be important for pan-genome-scale association studies and for functionally characterizing the entire “dark matter” of the genome, ensuring that a SNP in a long terminal repeat or a copy number variation in a novel ncRNA can be cataloged and compared with the same rigor as one in a protein-coding gene. 3.
Quality Control (QC) standards 3.1 Sequencing and assembly QC Quality control in genome assembly workflows begins with sequencing QC, where tools like FastQC assess raw read integrity, including base quality, GC content, and adapter contamination ( Figure 1A ). K-mer plots, generated via Jellyfish ( Marçais et al., 2011 ) paired with GenomeScope 2 ( Ranallo-Benavidez et al., 2020 ), provide insights into genome complexity, such as ploidy, heterozygosity, and repetitive element profiles ( Figure 1A ). For individual assembly QC, QUAST ( Mikheenko et al., 2023 ) is recommended for evaluating contiguity metrics (e.g., N50, L50) and is particularly effective for comparing multiple assemblies of diploid genomes, while CRAQ ( Li et al., 2023 ) excels in assessing consensus accuracy and structural errors in polyploid genomes due to its sensitivity to haplotype-specific misassemblies ( Figure 1A ). When results from QUAST and CRAQ conflict (e.g., differing contig counts due to haplotype collapsing), users should prioritize CRAQ for polyploid assemblies and cross-validate with raw read alignments (e.g., using Minimap2) to resolve discrepancies. Merqury ( Rhie et al., 2020 ) further validates haplotype resolution in polyploid or heterozygous genomes (e.g., wheat, potato) by comparing k-mer spectra between raw reads and assemblies, offering a robust check for completeness and phasing errors ( Figure 1A ). For repeat quality control, the LTR Assembly Index (LAI; Ou et al., 2018 ) assesses the completeness of long terminal repeat retrotransposons, while tidk ( Brown et al., 2025 ) detects telomeric motifs to evaluate chromosomal end-to-end integrity ( Figure 1A ). When results from these tools conflict, LAI generally provides a more reliable indicator of assembly quality. Even in high-quality plant genomes assembled from long reads, some chromosome ends may still lack detectable telomeric repeats. Figure 1.
Overview of quality control, annotation, pan-genome analysis, and visualization steps across a pan-genome project, with example tools highlighted. A , Sequencing and assembly QC. Raw DNA reads are screened for base quality, adapter contamination, and k-mer composition using FastQC , GenomeScope 2 , and Jellyfish . Individual assemblies are evaluated for contiguity, completeness, and consensus accuracy with QUAST and CRAQ ; haplotype resolution in polyploids with Merqury ; repeat content and assembly of long terminal repeat retrotransposons with LTR Assembly Index ; and telomere identification with tidk . B , Annotation QC. Gene models are generated and refined with BRAKER3 , MAKER2 , Helixer , and PASA , and can be transferred between assemblies using Liftoff. Validation incorporates RNA-seq support and summary metrics including gene set completeness with BUSCO , gene family classification with Mercator4 , structural annotation validation with PSAURON , and contamination detection with OMArk . C , Pan-genome–specific QC and discovery. Across multiple genomes, analyses include gene accumulation and saturation behavior, detection of structural variants with Sniffles2 and SVIM , assessment of presence–absence variation with Panaroo , and tests for gene family expansion or contraction with CAFE5 and OrthoFinder . D , Visualization and comparative analysis. Linear genome browsers support side-by-side inspection of assemblies and annotations ( JBrowse 2 , IGV ). Graph-based frameworks represent shared and alternative haplotypes and enable mapping and variant interrogation across many genomes ( VG toolkit , PGGB , PanTools , wfmash ), complemented by network and assembly graph viewers ( Cytoscape , Bandage ). E , Pre-rendered web portals. Project-specific portals provide searchable tracks and summary plots for community access, exemplified by PanBARLEX ( https://panbarlex.ipk-gatersleben.de/#seqcluster/BarleyCDS90_02985 ).
F , Presence absence variation (PAV) relations shown in knowledge graphs produced by KnetMiner . Dashed boxes delineate workflow stages; icons are schematic. The listed software represents commonly used options and is not exhaustive. Abbreviations: QC, quality control; RNA-seq, RNA sequencing; PAV, presence–absence variation. 3.2 Annotation QC Annotation pipelines must be documented alongside assembly strategies. These may include gene model integration pipelines like MAKER2 ( Holt & Yandell, 2011 ), PASA ( Haas et al., 2003 ) or BRAKER3 ( Gabriel et al., 2024 ), while Helixer ( Stiehler et al., 2020 ) is recommended for ab initio prediction in non-model organisms due to its deep learning-based approach ( Figure 1B ). Liftoff ( Shumate & Salzberg, 2021 ) is ideal for annotation transfer between closely related species and should be part of a standard annotation pipeline ( Figure 1B ). Use versioned workflows (e.g., Snakemake ( Köster & Rahmann, 2012 ), or Nextflow ( Di Tommaso et al., 2017 )) to ensure reproducibility, provenance tracking, and portability. Transcriptomic data (RNA-Seq) from multiple tissues (e.g., roots, shoots) and stress conditions (e.g., drought, disease) with sufficient read coverage validates gene models, especially for accessory genes lacking orthologs ( Qin et al., 2021 ). Long-read RNA sequencing technologies are recommended to recover full-length transcripts and accurately characterize alternative isoforms. For structural annotation QC, BUSCO ( Manni et al., 2021 ) assesses gene space completeness using lineage-specific datasets that can be adjusted for polyploid genomes ( Figure 1B ). Mercator4 ( Bolger et al., 2021 ) assigns functional categories based on the MapMan bin system and is useful for identifying missing functions in a single genome ( Figure 1B ). PSAURON ( Sommer et al., 2025 ) validates structural annotations, and OMArk ( Nevers et al., 2025 ) detects contamination via evolutionary consistency checks ( Figure 1B ). 
In cases where evaluation tools disagree (e.g., BUSCO reports missing genes but PSAURON suggests completeness), integrating RNA-Seq support and orthology evidence provides a more reliable basis for resolving such discrepancies. 3.3 Pan-genome-specific QC Pan-genome completeness requires saturation analysis, where gene accumulation curves assess whether additional accessions contribute novel genes ( Tettelin et al., 2005 ). For species with varying ploidy levels (e.g., diploid vs. polyploid barley), a minimum of 10–20 accessions is typically required for diploid species to approach saturation, while polyploid species may need 30–50 accessions due to increased gene content complexity ( Jayakodi et al., 2024 ). Users should plot accumulation curves using tools like Panaroo and evaluate saturation by fitting models (e.g., Heaps’ law) to confirm diminishing returns in gene discovery ( Figure 1C ). For species like barley, benchmark datasets of 100+ conserved genes enable orthology tool validation ( Jayakodi et al., 2024 ). OrthoFinder ( Emms & Kelly, 2019 ) and CAFE5 ( Mendes et al., 2020 ) facilitate gene family expansion and contraction analyses, providing insights into evolutionary dynamics ( Figure 1C ). Structural variant detection from long-read alignments, using Sniffles2 ( Smolka et al., 2024 ) or SVIM ( Heller & Vingron, 2019 ), quantifies indels and inversions ( Qin et al., 2021 ) ( Figure 1C ). When tools like Sniffles2 and SVIM yield conflicting variant calls, users should integrate multi-platform data (e.g., combining long- and short-read alignments) and prioritize calls supported by higher read depth or mapping quality. Presence-absence variation (PAV) detection via Panaroo or PAV-specific pipelines is critical for identifying variable gene content tied to phenotypic diversity ( Tonkin-Hill et al., 2020 ). 4. 
Data formats and sharing 4.1 File formats • Raw data : Assemblies must be submitted in FASTA format with headers containing unique sequence identifiers (e.g., >chr01, >chr02). Annotations must be provided in GFF3 or GTF format (compliant with Sequence Ontology), with the sequence IDs in the first column exactly matching the sequence identifiers used in the FASTA headers. • Derived data : Structural variants in VCF/BCF, orthogroups in TSV (cluster ID + member gene), and graph-based representations (GFA format) for complex pan-genomes ( Li et al., 2020 ). 4.2 Repositories Centralized repositories would archive versioned datasets (e.g., Barley v2, Rice v1.5) with DOI-based identifiers (DataCite). Public deposition in INSDC (raw reads and assembly, https://www.insdc.org/ ) and Ensembl (annotations, see documentation of Ensembl, 2025, https://beta.ensembl.org/ ) ensures global accessibility (ENA Documentation, 2025). 4.3 Metadata requirements Mandatory metadata fields include sequencing technology and coverage (e.g., PacBio HiFi, Oxford Nanopore), assembly method (e.g., Flye, Hifiasm), accession provenance (BioSample IDs), and software versioning of all software and pipelines used. Missing metadata, as observed in early barley submissions, must be addressed via enforced submission guidelines ( Jayakodi et al., 2024 ). For pangenome datasets, additional metadata fields are critical to ensure traceability and interoperability across studies. These should include the species name and NCBI Taxonomy ID, pangenome version and build date, and a complete list of constituent genomes with corresponding assembly accessions, strain names, and versions. Furthermore, metadata should describe the methods and parameters used to construct the pangenome. 
Capturing this information in structured formats such as JSON-LD or RO-Crate ( Peroni et al., 2022 ) would align pangenome submissions with broader FAIR data principles and facilitate integration with knowledge graphs and comparative genomics resources. 5. Visualization and analysis guidelines 5.1 Visualization tools Plant pan-genomes capture a species’ full genomic diversity, constructed using either linear-based or graph-based methods, each with distinct strengths and limitations. To provide a clearer comparison, linear-based approaches are divided into two distinct categories: sequence-based and gene-based analyses. Sequence-based linear analysis involves aligning multiple genomes to a single reference or consensus sequence to identify sequence-level variations, such as single-nucleotide polymorphisms (SNPs) and insertions/deletions (indels). This process typically employs variant callers like GATK ( McKenna et al., 2010 ) or freebayes ( Garrison & Marth, 2012 ) to detect SNPs and indels from whole-genome alignments. These methods are computationally efficient and compatible with visualization tools like JBrowse2 ( Diesh et al., 2023 ) or IGV ( Robinson et al., 2023 ) for synteny and variant visualization ( Figure 1D ). Web-portals such as PanBARLEX ( PanBARLEX - Barley Pangenome Explorer ) enable pan-genome research by providing searchable and pre-rendered visualizations ( Figure 1E ). However, reference bias in sequence-based linear approaches can limit their ability to capture complex structural variations, particularly in repetitive or polyploid plant genomes. Gene-based linear analysis focuses on inferring orthology and identifying gene-level presence/absence variations (PAVs) using tools like OrthoFinder ( Emms & Kelly, 2019 ) or Ensembl Compara ( Dyer et al., 2025 ). These tools analyze annotated gene sets to determine the pan-gene repertoire, identifying core and accessory genes across a species. 
While effective for gene-level PAV detection, these methods do not directly address sequence-level variations like SNPs or indels, requiring separate workflows for comprehensive analysis. Orthology inference tools must be benchmarked using inflation value sweeps to minimize false positives ( Emms & Kelly, 2019 ). Visualization of gene-level PAVs can be achieved through UpSet plots or as presence/absence relationships in KnetMiner knowledge graphs ( Hassani-Pak et al., 2021 ) ( Figure 1F ). In contrast, graph-based approaches model genomes as interconnected nodes (shared regions) and edges (SNPs, indels, and structural variants) using tools like VG Toolkit ( Hickey et al., 2020 ), PGGB ( Garrison et al., 2024 ), PanTools ( Jonkheer et al., 2022 ), or wfmash ( Guarracino et al., 2021 ) ( Figure 1D ). These methods integrate both sequence-level and structural variations in a single framework, offering an unbiased, comprehensive view of genomic diversity. They are particularly suited for complex genomes, such as tomato ( Zhou et al., 2022 ). Visualization tools like Bandage ( Wick et al., 2015 ) or Cytoscape ( Shannon et al., 2003 ) are used to represent structural complexity, though these approaches are computationally intensive and require specialized expertise ( Figure 1D ). In summary, sequence-based linear methods excel in rapid SNP and indel detection but are limited by reference bias, while gene-based linear methods are ideal for pan-gene analysis but require separate homology-based workflows. Graph-based approaches unify both gene-level and structural variation analyses, offering greater flexibility for complex genomes despite higher computational demands. As computational resources and tools advance, graph-based methods are becoming more accessible, enhancing plant pan-genome studies as demonstrated in rice ( Qin et al., 2021 ). 
5.2 Integrative analysis best practices The integration of pangenomic information into crop improvement remains challenging, despite its potential to illuminate the genetic basis of agronomic traits. Pangenomes reveal extensive structural polymorphisms and gene content diversity across accessions, yet these findings often remain siloed from other key data sources such as GWAS and QTL mappings, gene expression profiles, gene regulation, functional annotations, and published literature. Without coherent integration, researchers face difficulties in linking genomic variation to phenotype and in distinguishing biologically meaningful signals from background noise. Bridging these data types requires frameworks capable of harmonizing heterogeneous evidence, tracking provenance, and enabling transparent reasoning across molecular, phenotypic, and bibliographic domains. Platforms such as KnetMiner ( Hassani-Pak et al., 2021 , https://knetminer.com ) address these challenges by synthesizing pangenomic, association, omics, and literature-derived evidence within a unified knowledge graph. This integrative approach allows relationships among genes, traits, and pathways to be explored in context, supporting AI-assisted hypothesis generation and candidate gene prioritization. By providing explainable connections between diverse evidence sources, KnetMiner exemplifies how knowledge graph technologies can transform FAIR yet fragmented genomic data into a coherent foundation for evidence-based crop breeding. 6. Case studies Barley Pan-genome ( Jayakodi et al., 2024 ): The IPK barley pan-genome, encompassing 76 accessions, faced significant challenges in diploid genome assembly due to the crop’s complex genetic structure. The adoption of automated quality control (QC) pipelines implemented via Snakemake ( Köster & Rahmann, 2012 ), alongside validation gene sets, was critical to ensuring reproducibility and accuracy. 
These standardized tools mitigated errors from manual curation, which previously led to inconsistent gene annotations across accessions. By streamlining QC processes, the project achieved robust assembly outcomes, enabling reliable downstream analyses for barley breeding programs. Without such standards, the project risked fragmented datasets, highlighting the necessity of automation for handling complexity. Rice Pan-genome ( Qin et al., 2021 ): Analysis of 31 rice accessions using Sniffles revealed hidden structural variations critical for understanding genetic diversity. However, the absence of standardized QC metrics initially led to discrepancies in variant calling, complicating comparisons across accessions. The project’s success in identifying novel variations was enhanced by post-hoc implementation of rigorous QC protocols, which improved variant validation and reproducibility. This case underscores the need for predefined, community-wide QC standards to ensure consistency in pan-genome analyses, as their absence delayed insights into rice diversity and potential breeding applications. Tomato Super-Pan-genome ( Zhou et al., 2022 ): The tomato super-pan-genome, comprising 838 genomes, utilized a graph-based representation to resolve complex structural variants, directly informing breeding strategies for disease resistance. The adoption of standardized graph-based assembly tools ensured accurate representation of genetic diversity, overcoming limitations of linear reference genomes. This standardized approach facilitated the identification of novel resistance genes, significantly advancing breeding outcomes. Without such standards, the project could have faced misassembled variants, reducing its utility for applied breeding. This case exemplifies how standardized frameworks enhance the resolution of complex genomic data for practical applications. 
Arabidopsis ( Jiao & Schneeberger 2020 ; Zhong et al., 2025 ): Annotation gene naming and transfer across Arabidopsis MAGIC founders using Liftoff achieved cross-accession consistency. The use of standardized annotation pipelines ensured accurate gene mapping, enabling robust multi-omic and pan-genomic comparisons. This standardization was pivotal in identifying functional genomic variations within the population, supporting downstream genetic studies. In contrast, earlier Arabidopsis pan-genome efforts lacking such standardized tools faced annotation inconsistencies, which hindered comparative analyses. This case highlights how standardized naming conventions and annotation transfer tools like Liftoff are essential for ensuring reliable and reproducible pan-genomic insights. 7. Future directions • Artificial Intelligence : Tools like DeepVariant ( Poplin et al., 2018 ) will enhance variant calling in polyploid genomes. Detection of other genomic features, such as repeat elements, regulatory elements, and binding sites, will be enabled and refined using foundational models, as demonstrated in recent high-impact studies. For instance, BigRNA predicts tissue-specific RNA expression and identifies regulatory elements like microRNA and protein binding sites with high accuracy ( Celaj et al., 2023 ). Similarly, Evo 2 detects transcription factor binding sites and exon-intron boundaries across diverse genomes ( Brixi et al., 2025 ), while models like DNABERT ( Ji et al., 2021 ) and Enformer ( Avsec et al., 2021 ) excel in promoter prediction and variant effect analysis ( Li et al., 2024 ). These advancements highlight the transformative potential of foundational models in refining genomic feature detection, particularly for complex polyploid genomes. • Cross-species standards : Develop clade-wide frameworks (e.g., Brassicaceae) to unify super-pan-genome analyses. 
• Community engagement : ELIXIR hackathons will refine workflows and ontology terms, ensuring adaptability to technological advances. 8. Conclusion This white paper establishes a community-driven framework for plant pan-genome research. By adopting these guidelines, researchers can ensure data interoperability, reproducibility, and translational impact. The E-PAN consortium calls for global collaboration to iteratively refine these standards, fostering innovation in plant genomics and breeding. Endorsed by ELIXIR Nodes : DE, BE, PT, SI, UK. Contact : [email protected] Data availability No data is associated with this article. Acknowledgments The E-PAN consortium acknowledges contributions from researchers at ELIXIR nodes and foundational studies in rice, barley, tomato, and Arabidopsis. AI tools (DeepSeek R1, Qwen QwQ 32B) hosted on https://chat-ai.academiccloud.de helped create the draft from multiple meeting notes, with thorough human oversight ensuring scientific accuracy. For updates, visit the ELIXIR Plant Sciences Community Portal . References Alonge M, et al. : Major impacts of widespread structural variation on gene expression and crop improvement in tomato. Nature. 2022; 606 : 527–534. PubMed Abstract | Publisher Full Text | Free Full Text Avsec Ž, et al. : Effective gene expression prediction from sequence by integrating long-range interactions. Nat. Methods. 2021; 18 : 1196–1203. PubMed Abstract | Publisher Full Text | Free Full Text Bolger M, et al. : MapMan Visualization of RNA-Seq Data Using Mercator4 Functional Annotations. Dobnik D, Gruden K, Ramšak Ž, et al. , editors. Solanum tuberosum. Methods in Molecular Biology. New York, NY: Humana; 2021; vol. 2354 . . Publisher Full Text Brixi G, et al. : Genome modeling and design across all domains of life with Evo 2. bioRxiv. 2025. Publisher Full Text Brown MR, et al. : tidk: a toolkit to rapidly identify telomeric repeats from genomic datasets Open Access. Bioinformatics. February 2025; 41 (2): btaf049. 
PubMed Abstract | Publisher Full Text | Free Full Text Cannon EKS, et al. : Guidelines for gene and genome assembly nomenclature. Genetics. 2025; 229 (3). PubMed Abstract | Publisher Full Text | Free Full Text Celaj A, et al. : An RNA foundation model enables discovery of disease mechanisms and candidate therapeutics. bioRxiv. 2023. Publisher Full Text Cheng H, et al. : Scalable telomere-to-telomere assembly for diploid and polyploid genomes with double graph. Nat. Methods. 2024; 21 : 967–970. PubMed Abstract | Publisher Full Text | Free Full Text Darwin Tree of Life Consortium: The Darwin Tree of Life project: Sequencing all life in Britain and Ireland.2023. Reference Source Diesh C, et al. : JBrowse2: A modular genome browser with next-generation data support. Genome Biol. 2023; 24 (74): 74. PubMed Abstract | Publisher Full Text | Free Full Text Di Tommaso P, et al. : Nextflow enables reproducible computational workflows. Nat. Biotechnol. 2017; 35 : 316–319. PubMed Abstract | Publisher Full Text Dyer S, et al. : Ensembl 2025. Nucleic Acids Res. 6 January 2025; 53 (D1): D948–D957. PubMed Abstract | Publisher Full Text | Free Full Text Eilbeck K, et al. : The Sequence Ontology: A tool for the unification of genome annotations. Genome Biol. 2005; 6 (R44): R44. PubMed Abstract | Publisher Full Text | Free Full Text Emms DM, Kelly S: OrthoFinder: Phylogenetic orthology inference for comparative genomics. Genome Biol. 2019; 20 (238): 238. PubMed Abstract | Publisher Full Text | Free Full Text Gabriel L, et al. : BRAKER3: Fully automated genome annotation using RNA-seq and protein evidence with GeneMark-ETP, AUGUSTUS, and TSEBRA. Genome Res. 2024; 34 (34): 769–777. PubMed Abstract | Publisher Full Text | Free Full Text Garrison E, et al. : Building pangenome graphs. Nat. Methods. 2024; 21 : 2008–2012. PubMed Abstract | Publisher Full Text Garrison E, Marth G: Haplotype-based variant detection from short-read sequencing. arXiv preprint arXiv:1207.3907 [q-bio.GN] 2012. 
Publisher Full Text Guarracino A, et al. : wfmash: whole-chromosome pairwise alignment using the hierarchical wavefront algorithm. GitHub; 2021. Reference Source Haas B-J, et al. : Improving the Arabidopsis genome annotation using maximal transcript alignment assemblies. Nucleic Acids Res. 1 October 2003; 31 (19): 5654–5666. PubMed Abstract | Publisher Full Text | Free Full Text Hassani-Pak K, et al. : KnetMiner: a comprehensive approach for supporting evidence-based gene discovery and complex trait analysis across species. Plant Biotechnol. J. 2021; 19 : 1670–1678. PubMed Abstract | Publisher Full Text | Free Full Text Heller D, Vingron M: SVIM: structural variant identification using mapped long reads. Bioinformatics. September 2019; 35 (17): 2907–2915. PubMed Abstract | Publisher Full Text | Free Full Text Hickey G, et al. : Genotyping structural variants in pangenome graphs using the vg toolkit. Genome Biol. 2020; 21 : 35. PubMed Abstract | Publisher Full Text | Free Full Text Holt C, Yandell M: MAKER2: an annotation pipeline and genome-database management tool for second-generation genome projects. BMC Bioinformatics. 2011; 12 : Article number: 491. PubMed Abstract | Publisher Full Text | Free Full Text Jayakodi M, et al. : The barley pan-genome reveals genomic diversity across wild and cultivated accessions. Nature. 2024; 636 : 654–662. PubMed Abstract | Publisher Full Text | Free Full Text Ji Y, et al. : DNABERT: pre-trained Bidirectional Encoder Representations from Transformers model for DNA-language in genome. Bioinformatics. August 2021; 37 (15): 2112–2120. PubMed Abstract | Publisher Full Text | Free Full Text Jiao W-B, Schneeberger K: Chromosome-level assemblies of multiple Arabidopsis genomes reveal hotspots of rearrangements with altered evolutionary dynamics. Nat. Commun. 2020; 11 (989): 989. PubMed Abstract | Publisher Full Text | Free Full Text Jonkheer EM, et al. : PanTools v3: Functional analysis of prokaryotic pangenomes. 
Bioinformatics. 2022; 38 (18): 4403–4405. PubMed Abstract | Publisher Full Text | Free Full Text Kolmogorov M, et al. : metaFlye: scalable long-read metagenome assembly using repeat graphs. Nat. Methods. 2020; 17 : 1103–1110. PubMed Abstract | Publisher Full Text | Free Full Text Koren S, et al. : Canu: scalable and accurate long-read assembly via adaptive k-mer weighting and repeat separation. Genome Res. 2017; 27 : 722–736. PubMed Abstract | Publisher Full Text | Free Full Text Köster J, Rahmann S: Snakemake—A scalable bioinformatics workflow engine. Bioinformatics. 2012; 28 (19): 2520–2522. PubMed Abstract | Publisher Full Text Li H, et al. : The design and construction of reference pangenome graphs. Genome Biol. 2020; 21 (265): 265. PubMed Abstract | Publisher Full Text | Free Full Text Li N, et al. : Super-pangenome analyses highlight genomic diversity and structural variation across wild and cultivated tomato species. Nat. Genet. 2023a; 55 (8): 852–860. PubMed Abstract | Publisher Full Text | Free Full Text Li K, et al. : Identification of errors in draft genome assemblies at single-nucleotide resolution for quality assessment and improvement. Nat. Commun. 2023b; 14 : 6556. PubMed Abstract | Publisher Full Text | Free Full Text Li Q, et al. : Progress and opportunities of foundation models in bioinformatics. Brief. Bioinform. 2024; 25 (6). PubMed Abstract | Publisher Full Text | Free Full Text Manni M, et al. : BUSCO: Assessing genome assembly and annotation completeness. Current Protocols. 2021; 1 (7): e323. PubMed Abstract | Publisher Full Text Marçais G, et al. : A fast, lock-free approach for efficient parallel counting of occurrences of k-mers Free. Bioinformatics. March 2011; 27 (6): 764–770. PubMed Abstract | Publisher Full Text | Free Full Text McKenna A, et al. : The Genome Analysis Toolkit: a MapReduce framework for analyzing next-generation DNA sequencing data. Genome Res. 2010; 20 : 1297–1303. 
PubMed Abstract | Publisher Full Text | Free Full Text Mendes FK, et al. : CAFE 5 models variation in evolutionary rates among gene families. Bioinformatics. December 2020; 36 (22-23): 5516–5518. PubMed Abstract | Publisher Full Text Mikheenko A, et al. : WebQUAST: online evaluation of genome assemblies Open Access. Nucleic Acids Res. 5 July 2023; 51 (W1): W601–W606. Publisher Full Text Naithani S, et al. : Exploring Pan-Genomes: An Overview of Resources and Tools for Unraveling Structure, Function, and Evolution of Crop Genes and Genomes. Biomolecules. 2023 Sep 17; 13 (9): 1403. PubMed Abstract | Publisher Full Text | Free Full Text Nevers Y, et al. : OMArk: Genome assembly quality assessment using evolutionary signals. Nat. Biotechnol. 2025; 43 : 124–133. PubMed Abstract | Publisher Full Text | Free Full Text Papoutsoglou EA, et al. : Enabling reusability of plant phenomic datasets with MIAPPE 1.1. New Phytol. 2020; 227 : 260–273. PubMed Abstract | Publisher Full Text | Free Full Text Peroni S, et al. : Packaging research artefacts with RO-Crate. Data Sci. 2022; 5 (2): 97–138. Publisher Full Text Poplin R, et al. : A universal SNP and small-indel variant caller using deep neural networks. Nat. Biotechnol. 2018; 36 (10): 983–987. PubMed Abstract | Publisher Full Text Qin P, et al. : Pan-genome analysis of 33 genetically diverse rice accessions reveals hidden genomic variations. Cell. 2021; 184 (13): 3542–3558.e16. PubMed Abstract | Publisher Full Text Ranallo-Benavidez TR, et al. : GenomeScope 2.0 and Smudgeplot for reference-free profiling of polyploid genomes. Nat. Commun. 2020; 11 : 1432. PubMed Abstract | Publisher Full Text | Free Full Text Rhie A, et al. : Merqury: Reference-free quality assessment of genome assemblies. Genome Biol. 2020; 21 (245): 245. PubMed Abstract | Publisher Full Text | Free Full Text Robinson J-T, et al. : igv.js: an embeddable JavaScript implementation of the Integrative Genomics Viewer (IGV). Bioinformatics. 
January 2023; 39 (1): btac830. PubMed Abstract | Publisher Full Text | Free Full Text Schreiber M, et al. : Plant pangenomes for crop improvement, biodiversity and evolution. Nat. Rev. Genet. 2024; 25 : 563–577. PubMed Abstract | Publisher Full Text | Free Full Text Shang L, et al. : A super pan-genomic landscape of rice. Cell Res. 2022; 32 : 878–896. PubMed Abstract | Publisher Full Text | Free Full Text Shannon P, et al. : Cytoscape: A software environment for integrated models of biomolecular interaction networks. Genome Res. 2003; 13 (11): 2498–2504. PubMed Abstract | Publisher Full Text | Free Full Text Shumate A, Salzberg SL: Liftoff: Accurate alignment-based annotation transfer in phylogenomics. Bioinformatics. 2021; 37 (12): 1639–1643. PubMed Abstract | Publisher Full Text | Free Full Text Smolka M, et al. : Detection of mosaic and population-level structural variants with Sniffles2. Nat. Biotechnol. 2024; 42 : 1571–1580. PubMed Abstract | Publisher Full Text | Free Full Text Sommer MJ, et al. : PSAURON: A tool for structural annotation quality assessment. NAR Genomics and Bioinformatics. 2025; 7 (1). PubMed Abstract | Publisher Full Text | Free Full Text Stiehler F, et al. : Helixer: Cross-species gene annotation with deep learning. Bioinformatics. 2020; 36 (22-23): 5291–5298. PubMed Abstract | Publisher Full Text | Free Full Text Tettelin H, et al. : Genome analysis of multiple pathogenic isolates of Streptococcus agalactiae. Proc. Natl. Acad. Sci. 2005; 102 (39): 13950–13955. PubMed Abstract | Publisher Full Text | Free Full Text Tonkin-Hill G, et al. : Panaroo: Pangenome analysis pipeline for microbial genomes. Genome Biol. 2020; 21 (180): 180. PubMed Abstract | Publisher Full Text | Free Full Text Ou S, et al. : Assessing genome assembly quality using the LTR Assembly Index (LAI). Nucleic Acids Res. 30 November 2018; 46 (21): e126. PubMed Abstract | Publisher Full Text | Free Full Text Wick RR, et al. 
: Bandage: Interactive visualization of de novo genome assemblies. Bioinformatics. 2015; 31 (20): 3350–3352. PubMed Abstract | Publisher Full Text | Free Full Text Zhong Z, et al. : The distinct roles of genome, methylation, transcription, and translation on protein expression in Arabidopsis thaliana resolve the Central Dogma’s information flow. Genome Biol. 2025; 26 (1): 319. PubMed Abstract | Publisher Full Text | Free Full Text Zhou Y, et al. : Graph pangenome captures missing heritability and empowers tomato breeding. Nature. 2022; 606 : 527–534. PubMed Abstract | Publisher Full Text | Free Full Text Additional Resources AgBioData Nomenclature Working Group: GitHub repository.2025. Reference Source ENA Metadata Standards: European Nucleotide Archive.2025. Reference Source ENSEMBL: Genome data & annotation.2025. Reference Source FAIR Cookbook: ELIXIR Europe.2025. Reference Source INSDC: The International Nucleotide Sequence Database Collaboration.2025. Reference Source Merqury Documentation: GitHub.2020. Reference Source PanBARLEX: 2025. Reference Source Comments on this article Comments (0) Version 3 VERSION 3 PUBLISHED 28 Jul 2025 ADD YOUR COMMENT Comment Author details Author details 1 Leibniz Institute of Plant Genetics and Crop Plant Research (IPK), Seeland, Saxony-Anhalt, 06466, Germany 2 Universidade Nova de Lisboa Instituto de Tecnologia Quimica e Biologica, Oeiras, Lisbon, Portugal 3 Forschungszentrum Jülich GmbH Institute of Bio- and Geosciences, Jülich, North Rhine-Westphalia, 52425, Germany 4 Helmholtz Zentrum München, Neuherberg, 85764, Germany 5 European Molecular Biology Laboratory, European Bioinformatics Institute, Wellcome Genome Campus, Hinxton, Cambridge, CB10 1SD, UK 6 Rothamsted Research, Harpenden, England, AL52JQ, UK 7 National Institute of Biology, Večna pot 111, Ljubljana, 1000, Slovenia 8 Department of Plant Biotechnology and Bioinformatics, Ghent University, Technologiepark 71, Ghent, 9052, Belgium Marc C. 
Heuermann Roles: Conceptualization, Writing – Original Draft Preparation, Writing – Review & Editing Pedro Barros Roles: Writing – Review & Editing Sebastian Beier Roles: Writing – Review & Editing Heidrun Gundlach Roles: Writing – Review & Editing Jorge Alvarez-Jarreta Roles: Writing – Review & Editing Keywan Hassani-Pak Roles: Writing – Review & Editing Patrick König Roles: Writing – Review & Editing Anne Fiebig Roles: Writing – Review & Editing Tim Godec Roles: Writing – Review & Editing Kristina Gruden Roles: Writing – Review & Editing Nadja Nolte Roles: Writing – Review & Editing Marko Petek Roles: Writing – Review & Editing Uwe Scholz Roles: Writing – Review & Editing Maja Zagorščak Roles: Writing – Review & Editing Klaas Vandepoele Roles: Project Administration, Writing – Review & Editing Michiel Van Bel Roles: Project Administration, Writing – Review & Editing Competing interests No competing interests were disclosed. Grant information This study has received funding from ELIXIR under the call for proposals on Biodiversity, Food Safety and Pathogens (2024-SCIENCE-BFSP) as part of WP2 E-PAN: Enhancing pan-genome analysis in plants. MCH received funding from ELIXIR-DE, which was supported by the Federal Ministry of Education and Research BMBF within the framework of de.NBI/ELIXIR-DE (W-de.NBI-009). The funders had no role in study design, data collection and analysis, decision to publish, or preparation of the manuscript. Article Versions (3) version 3 Revised Published: 07 May 2026, 14:739 https://doi.org/10.12688/f1000research.166538.3 version 2 Revised Published: 18 Nov 2025, 14:739 https://doi.org/10.12688/f1000research.166538.2 version 1 Published: 28 Jul 2025, 14:739 https://doi.org/10.12688/f1000research.166538.1 Copyright © 2025 Heuermann MC et al . 
This is an open access article distributed under the terms of the Creative Commons Attribution License , which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited. Download Export To Sciwheel Bibtex EndNote ProCite Ref. Manager (RIS) Sente metrics Views Downloads F1000Research - - PubMed Central info_outline Data from PMC are received and updated monthly. - - Citations open_in_new 0 open_in_new 0 open_in_new SEE MORE DETAILS CITE how to cite this article Heuermann MC, Barros P, Beier S et al. White paper: standards for handling and analyzing plant pan-genomes [version 2; peer review: 2 approved, 2 approved with reservations] . F1000Research 2025, 14 :739 ( https://doi.org/10.12688/f1000research.166538.2 ) NOTE: If applicable, it is important to ensure the information in square brackets after the title is included in all citations of this article. COPY CITATION DETAILS track receive updates on this article Track an article to receive email alerts on any updates to this article. TRACK THIS ARTICLE Share Open Peer Review Current Reviewer Status: ? Key to Reviewer Statuses VIEW HIDE Approved The paper is scientifically sound in its current form and only minor, if any, improvements are suggested Approved with reservations A number of small changes, sometimes more significant revisions are required to address specific details and improve the papers academic merit. Not approved Fundamental flaws in the paper seriously undermine the findings and conclusions Version 2 VERSION 2 PUBLISHED 18 Nov 2025 Revised Views 0 Cite How to cite this report: Xu J. Reviewer Report For: White paper: standards for handling and analyzing plant pan-genomes [version 2; peer review: 2 approved, 2 approved with reservations] . 
F1000Research 2025, 14 :739 ( https://doi.org/10.5256/f1000research.191128.r436510 ) The direct URL for this report is: https://f1000research.com/articles/14-739/v2#referee-response-436510 NOTE: it is important to ensure the information in square brackets after the title is included in this citation. Close Copy Citation Details Reviewer Report 30 Dec 2025 Jianping Xu , Department of Biology, McMaster University, Hamilton, Canada Approved with Reservations VIEWS 0 https://doi.org/10.5256/f1000research.191128.r436510 This is an excellent set of recommendations for handling and analyzing plant pan-genomes. I have only three minor comments/questions for authors' considerations. 1. Should there be a clearly stated minimum standard for a genome to be included in plant ... Continue reading READ ALL This is an excellent set of recommendations for handling and analyzing plant pan-genomes. I have only three minor comments/questions for authors' considerations. 1. Should there be a clearly stated minimum standard for a genome to be included in plant pan-genome analyses? In the examples/case studies provided, what were the inclusion criteria and is there an emerging consensus? 2. Even though the abstract included "Super-pan-genomes", aside from the tomato case study example at the very end, very little attention was paid to this topic in the main text. Should there be additional criteria for super-pan-genome studies on top of what's recommended for pan-genome analyses? 3. This White Paper listed INSDC and Ensembl as the suggested data repositories. Given the increasing importance of genomic and pan-genomic data from China and the depositions of such data in the Chinese National Genomic Data Center (https://ngdc.cncb.ac.cn/), I think it's important to include that database as a suggested repository for pan-genome datasets. A minor editorial comment: two citations were included in the abstract of this paper. Can the abstract in this journal include citations? 
Is the topic of the review discussed comprehensively in the context of the current literature? Yes Are all factual statements correct and adequately supported by citations? Yes Is the review written in accessible language? Yes Are the conclusions drawn appropriate in the context of the current research literature? Yes Competing Interests: No competing interests were disclosed. Reviewer Expertise: population genetics and genomics, with a focus on fungi I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard, however I have significant reservations, as outlined above. Close READ LESS CITE CITE HOW TO CITE THIS REPORT Xu J. Reviewer Report For: White paper: standards for handling and analyzing plant pan-genomes [version 2; peer review: 2 approved, 2 approved with reservations] . F1000Research 2025, 14 :739 ( https://doi.org/10.5256/f1000research.191128.r436510 ) The direct URL for this report is: https://f1000research.com/articles/14-739/v2#referee-response-436510 NOTE: it is important to ensure the information in square brackets after the title is included in all citations of this article. COPY CITATION DETAILS Report a concern Author Response 27 Apr 2026 Marc Christian Heuermann , $usrAffiliation 27 Apr 2026 Author Response 1. Should there be a clearly stated minimum standard for a genome to be included in plant pan-genome analyses? In the examples/case studies provided, what were the inclusion criteria and ... Continue reading 1. Should there be a clearly stated minimum standard for a genome to be included in plant pan-genome analyses? In the examples/case studies provided, what were the inclusion criteria and is there an emerging consensus? Answer: Thank you for your suggestions. 
We added a sentence in Chapter 3.1, referred to a publication by Wang & Wang 2023, and provided a summary of their proposed framework for quality control in genome assembly, which also contains threshold recommendations. 2. Even though the abstract included "Super-pan-genomes", aside from the tomato case study example at the very end, very little attention was paid to this topic in the main text. Should there be additional criteria for super-pan-genome studies on top of what's recommended for pan-genome analyses? Answer: In the “Case studies” section, we have discussed in greater detail the difference between intra-species pan-genomes and inter-species super-pan-genomes, as well as their complementary nature. In addition, we have included a new Section 3.4 to explain in more detail the differences in quality control when analyzing an inter-species super-pan-genome. 3. This White Paper listed INSDC and Ensembl as the suggested data repositories. Given the increasing importance of genomic and pan-genomic data from China and the depositions of such data in the Chinese National Genomic Data Center (https://ngdc.cncb.ac.cn/), I think it's important to include that database as a suggested repository for pan-genome datasets. Answer: Thank you very much for pointing that out. This would indeed improve the overall visibility and reliability of data storage, which is why we have included this in the manuscript. A minor editorial comment: two citations were included in the abstract of this paper. Can the abstract in this journal include citations? Answer: Indeed, according to the guidelines, this is not permitted. We moved the whole sentence with citation into the introduction section. 1. Should there be a clearly stated minimum standard for a genome to be included in plant pan-genome analyses? In the examples/case studies provided, what were the inclusion criteria and is there an emerging consensus? Answer: Thank you for your suggestions. 
We added a sentence in Chapter 3.1, referred to a publication by Wang & Wang 2023, and provided a summary of their proposed framework for quality control in genome assembly, which also contains threshold recommendations. 2. Even though the abstract included "Super-pan-genomes", aside from the tomato case study example at the very end, very little attention was paid to this topic in the main text. Should there be additional criteria for super-pan-genome studies on top of what's recommended for pan-genome analyses? Answer: In the “Case studies” section, we have discussed in greater detail the difference between intra-species pan-genomes and inter-species super-pan-genomes, as well as their complementary nature. In addition, we have included a new Section 3.4 to explain in more detail the differences in quality control when analyzing an inter-species super-pan-genome. 3. This White Paper listed INSDC and Ensembl as the suggested data repositories. Given the increasing importance of genomic and pan-genomic data from China and the depositions of such data in the Chinese National Genomic Data Center (https://ngdc.cncb.ac.cn/), I think it's important to include that database as a suggested repository for pan-genome datasets. Answer: Thank you very much for pointing that out. This would indeed improve the overall visibility and reliability of data storage, which is why we have included this in the manuscript. A minor editorial comment: two citations were included in the abstract of this paper. Can the abstract in this journal include citations? Answer: Indeed, according to the guidelines, this is not permitted. We moved the whole sentence with citation into the introduction section. Competing Interests: no competing interests Close Report a concern Respond or Comment COMMENTS ON THIS REPORT Author Response 27 Apr 2026 Marc Christian Heuermann , $usrAffiliation 27 Apr 2026 Author Response 1. 
Should there be a clearly stated minimum standard for a genome to be included in plant pan-genome analyses? In the examples/case studies provided, what were the inclusion criteria and ... Continue reading 1. Should there be a clearly stated minimum standard for a genome to be included in plant pan-genome analyses? In the examples/case studies provided, what were the inclusion criteria and is there an emerging consensus? Answer: Thank you for your suggestions. We added a sentence in Chapter 3.1, referred to a publication by Wang & Wang 2023, and provided a summary of their proposed framework for quality control in genome assembly, which also contains threshold recommendations. 2. Even though the abstract included "Super-pan-genomes", aside from the tomato case study example at the very end, very little attention was paid to this topic in the main text. Should there be additional criteria for super-pan-genome studies on top of what's recommended for pan-genome analyses? Answer: In the “Case studies” section, we have discussed in greater detail the difference between intra-species pan-genomes and inter-species super-pan-genomes, as well as their complementary nature. In addition, we have included a new Section 3.4 to explain in more detail the differences in quality control when analyzing an inter-species super-pan-genome. 3. This White Paper listed INSDC and Ensembl as the suggested data repositories. Given the increasing importance of genomic and pan-genomic data from China and the depositions of such data in the Chinese National Genomic Data Center (https://ngdc.cncb.ac.cn/), I think it's important to include that database as a suggested repository for pan-genome datasets. Answer: Thank you very much for pointing that out. This would indeed improve the overall visibility and reliability of data storage, which is why we have included this in the manuscript. A minor editorial comment: two citations were included in the abstract of this paper. 
Can the abstract in this journal include citations? Answer: Indeed, according to the guidelines, this is not permitted. We moved the whole sentence with citation into the introduction section. 1. Should there be a clearly stated minimum standard for a genome to be included in plant pan-genome analyses? In the examples/case studies provided, what were the inclusion criteria and is there an emerging consensus? Answer: Thank you for your suggestions. We added a sentence in Chapter 3.1, referred to a publication by Wang & Wang 2023, and provided a summary of their proposed framework for quality control in genome assembly, which also contains threshold recommendations. 2. Even though the abstract included "Super-pan-genomes", aside from the tomato case study example at the very end, very little attention was paid to this topic in the main text. Should there be additional criteria for super-pan-genome studies on top of what's recommended for pan-genome analyses? Answer: In the “Case studies” section, we have discussed in greater detail the difference between intra-species pan-genomes and inter-species super-pan-genomes, as well as their complementary nature. In addition, we have included a new Section 3.4 to explain in more detail the differences in quality control when analyzing an inter-species super-pan-genome. 3. This White Paper listed INSDC and Ensembl as the suggested data repositories. Given the increasing importance of genomic and pan-genomic data from China and the depositions of such data in the Chinese National Genomic Data Center (https://ngdc.cncb.ac.cn/), I think it's important to include that database as a suggested repository for pan-genome datasets. Answer: Thank you very much for pointing that out. This would indeed improve the overall visibility and reliability of data storage, which is why we have included this in the manuscript. A minor editorial comment: two citations were included in the abstract of this paper. 
Can the abstract in this journal include citations? Answer: Indeed, according to the guidelines, this is not permitted. We moved the whole sentence with citation into the introduction section. Competing Interests: no competing interests Close Report a concern COMMENT ON THIS REPORT Views 0 Cite How to cite this report: Barmukh R. Reviewer Report For: White paper: standards for handling and analyzing plant pan-genomes [version 2; peer review: 2 approved, 2 approved with reservations] . F1000Research 2025, 14 :739 ( https://doi.org/10.5256/f1000research.191128.r434365 ) The direct URL for this report is: https://f1000research.com/articles/14-739/v2#referee-response-434365 NOTE: it is important to ensure the information in square brackets after the title is included in this citation. Close Copy Citation Details Reviewer Report 30 Dec 2025 Rutwik Barmukh , Centre for Crop and Food Innovation, Murdoch University, Murdoch, Western Australia, Australia Approved with Reservations VIEWS 0 https://doi.org/10.5256/f1000research.191128.r434365 This white paper makes an impressive effort to harmonize methodological practices for plant pan-genome construction, analysis, and sharing, as pan-genomic resources are rapidly increasing across different crop species. The manuscript is highly relevant and addresses a clear need within the ... Continue reading READ ALL This white paper makes an impressive effort to harmonize methodological practices for plant pan-genome construction, analysis, and sharing, as pan-genomic resources are rapidly increasing across different crop species. The manuscript is highly relevant and addresses a clear need within the plant genomics community. However, to function effectively as a widely adopted standards document, the manuscript would benefit from stronger justification of recommended practices and better consideration of downstream use cases and implementation challenges. 
The manuscript’s clarity, usability, and long-term impact will significantly improve after addressing some issues highlighted below. 1. Although the manuscript highlights the importance of the proposed standards for improving FAIR compliance, the practical aspects of implementing these standards in real-world scenarios can be explored further. For instance, challenges related to community-wide adoption, such as maintaining consistent metadata across projects and the limited support for certain recommended formats (e.g. GFA, JSON-LD) in existing repositories, deserve more explicit discussion. In addition, suggestions for handling legacy datasets that lack complete or standardized metadata would be beneficial. Providing concrete examples of common pitfalls (e.g., interoperability failures caused by inconsistent metadata) along with potential mitigation approaches would further strengthen the paper. 2. While the manuscript precisely captures genomic and computational standards, it currently lacks guidance on how pan-genome outputs should interface with downstream applications that are most relevant to plant breeders and geneticists (e.g., GWAS, QTL mapping, selection decisions, etc.). A subsection linking pan-genome data to common downstream analyses can be added. Also, example schemas or pipelines showing how standardized pan-genome representations improve trait mapping or selection decisions in practice can be included. 3. The Case Studies section highlights several key projects, but it reads as descriptive rather than analytical. It would be more convincing if this section contained quantitative comparisons showing how applying the proposed standards increased reproducibility, efficiency, or interpretability over previous, unstandardized approaches. Is the topic of the review discussed comprehensively in the context of the current literature? Yes Are all factual statements correct and adequately supported by citations? 
Yes Is the review written in accessible language? Partly Are the conclusions drawn appropriate in the context of the current research literature? Yes Competing Interests: No competing interests were disclosed. Reviewer Expertise: Crop genomics, bioinformatics, molecular breeding I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard, however I have significant reservations, as outlined above. Close READ LESS CITE CITE HOW TO CITE THIS REPORT Barmukh R. Reviewer Report For: White paper: standards for handling and analyzing plant pan-genomes [version 2; peer review: 2 approved, 2 approved with reservations] . F1000Research 2025, 14 :739 ( https://doi.org/10.5256/f1000research.191128.r434365 ) The direct URL for this report is: https://f1000research.com/articles/14-739/v2#referee-response-434365 NOTE: it is important to ensure the information in square brackets after the title is included in all citations of this article. COPY CITATION DETAILS Report a concern Author Response 27 Apr 2026 Marc Christian Heuermann , $usrAffiliation 27 Apr 2026 Author Response 1. Although the manuscript highlights the importance of the proposed standards for improving FAIR compliance, the practical aspects of implementing these standards in real-world scenarios can be explored further. For ... Continue reading 1. Although the manuscript highlights the importance of the proposed standards for improving FAIR compliance, the practical aspects of implementing these standards in real-world scenarios can be explored further. For instance, challenges related to community-wide adoption, such as maintaining consistent metadata across projects and the limited support for certain recommended formats (e.g. GFA, JSON-LD) in existing repositories, deserve more explicit discussion. In addition, suggestions for handling legacy datasets that lack complete or standardized metadata would be beneficial. 
Providing concrete examples of common pitfalls (e.g., interoperability failures caused by inconsistent metadata) along with potential mitigation approaches would further strengthen the paper. Answer: Thank you for your suggestions. We have added a new subsection 4.4 (“Practical implementation challenges and best practices for community adoption”) to Section 4. This subsection explicitly discusses challenges such as maintaining consistent metadata across independent projects, the current limited native support for GFA and JSON-LD/RO-Crate formats in major repositories (INSDC and Ensembl), and the difficulties posed by legacy datasets that pre-date these standards. 2. While the manuscript precisely captures genomic and computational standards, it currently lacks guidance on how pan-genome outputs should interface with downstream applications that are most relevant to plant breeders and geneticists (e.g., GWAS, QTL mapping, selection decisions, etc.). A subsection linking pan-genome data to common downstream analyses can be added. Also, example schemas or pipelines showing how standardized pan-genome representations improve trait mapping or selection decisions in practice can be included. Answer: We have added discussions and background information to the “Case studies” section to use them as examples of how pan-genome analyses can contribute to downstream analyses. 3. The Case Studies section highlights several key projects, but it reads as descriptive rather than analytical. It would be more convincing if this section contained quantitative comparisons showing how applying the proposed standards increased reproducibility, efficiency, or interpretability over previous, unstandardized approaches. Answer: We have expanded the “Case studies” section to provide more background information and explanations regarding how pan-genome analysis has significantly improved and contributed to the downstream analyses. 
However, providing quantitative comparisons is, in our opinion, out of scope for this review paper. 1. Although the manuscript highlights the importance of the proposed standards for improving FAIR compliance, the practical aspects of implementing these standards in real-world scenarios can be explored further. For instance, challenges related to community-wide adoption, such as maintaining consistent metadata across projects and the limited support for certain recommended formats (e.g. GFA, JSON-LD) in existing repositories, deserve more explicit discussion. In addition, suggestions for handling legacy datasets that lack complete or standardized metadata would be beneficial. Providing concrete examples of common pitfalls (e.g., interoperability failures caused by inconsistent metadata) along with potential mitigation approaches would further strengthen the paper. Answer: Thank you for your suggestions. We have added a new subsection 4.4 (“Practical implementation challenges and best practices for community adoption”) to Section 4. This subsection explicitly discusses challenges such as maintaining consistent metadata across independent projects, the current limited native support for GFA and JSON-LD/RO-Crate formats in major repositories (INSDC and Ensembl), and the difficulties posed by legacy datasets that pre-date these standards. 2. While the manuscript precisely captures genomic and computational standards, it currently lacks guidance on how pan-genome outputs should interface with downstream applications that are most relevant to plant breeders and geneticists (e.g., GWAS, QTL mapping, selection decisions, etc.). A subsection linking pan-genome data to common downstream analyses can be added. Also, example schemas or pipelines showing how standardized pan-genome representations improve trait mapping or selection decisions in practice can be included. 
Answer: We have added discussions and background information to the “Case studies” section to use them as examples of how pan-genome analyses can contribute to downstream analyses. 3. The Case Studies section highlights several key projects, but it reads as descriptive rather than analytical. It would be more convincing if this section contained quantitative comparisons showing how applying the proposed standards increased reproducibility, efficiency, or interpretability over previous, unstandardized approaches. Answer: We have expanded the “Case studies” section to provide more background information and explanations regarding how pan-genome analysis has significantly improved and contributed to the downstream analyses. However, providing quantitative comparisons is, in our opinion, out of scope for this review paper. Competing Interests: no competing interests Close Report a concern Respond or Comment COMMENTS ON THIS REPORT Author Response 27 Apr 2026 Marc Christian Heuermann , $usrAffiliation 27 Apr 2026 Author Response 1. Although the manuscript highlights the importance of the proposed standards for improving FAIR compliance, the practical aspects of implementing these standards in real-world scenarios can be explored further. For ... Continue reading 1. Although the manuscript highlights the importance of the proposed standards for improving FAIR compliance, the practical aspects of implementing these standards in real-world scenarios can be explored further. For instance, challenges related to community-wide adoption, such as maintaining consistent metadata across projects and the limited support for certain recommended formats (e.g. GFA, JSON-LD) in existing repositories, deserve more explicit discussion. In addition, suggestions for handling legacy datasets that lack complete or standardized metadata would be beneficial. 
Providing concrete examples of common pitfalls (e.g., interoperability failures caused by inconsistent metadata) along with potential mitigation approaches would further strengthen the paper. Answer: Thank you for your suggestions. We have added a new subsection 4.4 (“Practical implementation challenges and best practices for community adoption”) to Section 4. This subsection explicitly discusses challenges such as maintaining consistent metadata across independent projects, the current limited native support for GFA and JSON-LD/RO-Crate formats in major repositories (INSDC and Ensembl), and the difficulties posed by legacy datasets that pre-date these standards. 2. While the manuscript precisely captures genomic and computational standards, it currently lacks guidance on how pan-genome outputs should interface with downstream applications that are most relevant to plant breeders and geneticists (e.g., GWAS, QTL mapping, selection decisions, etc.). A subsection linking pan-genome data to common downstream analyses can be added. Also, example schemas or pipelines showing how standardized pan-genome representations improve trait mapping or selection decisions in practice can be included. Answer: We have added discussions and background information to the “Case studies” section to use them as examples of how pan-genome analyses can contribute to downstream analyses. 3. The Case Studies section highlights several key projects, but it reads as descriptive rather than analytical. It would be more convincing if this section contained quantitative comparisons showing how applying the proposed standards increased reproducibility, efficiency, or interpretability over previous, unstandardized approaches. Answer: We have expanded the “Case studies” section to provide more background information and explanations regarding how pan-genome analysis has significantly improved and contributed to the downstream analyses. 
However, providing quantitative comparisons is, in our opinion, out of scope for this review paper. 1. Although the manuscript highlights the importance of the proposed standards for improving FAIR compliance, the practical aspects of implementing these standards in real-world scenarios can be explored further. For instance, challenges related to community-wide adoption, such as maintaining consistent metadata across projects and the limited support for certain recommended formats (e.g. GFA, JSON-LD) in existing repositories, deserve more explicit discussion. In addition, suggestions for handling legacy datasets that lack complete or standardized metadata would be beneficial. Providing concrete examples of common pitfalls (e.g., interoperability failures caused by inconsistent metadata) along with potential mitigation approaches would further strengthen the paper. Answer: Thank you for your suggestions. We have added a new subsection 4.4 (“Practical implementation challenges and best practices for community adoption”) to Section 4. This subsection explicitly discusses challenges such as maintaining consistent metadata across independent projects, the current limited native support for GFA and JSON-LD/RO-Crate formats in major repositories (INSDC and Ensembl), and the difficulties posed by legacy datasets that pre-date these standards. 2. While the manuscript precisely captures genomic and computational standards, it currently lacks guidance on how pan-genome outputs should interface with downstream applications that are most relevant to plant breeders and geneticists (e.g., GWAS, QTL mapping, selection decisions, etc.). A subsection linking pan-genome data to common downstream analyses can be added. Also, example schemas or pipelines showing how standardized pan-genome representations improve trait mapping or selection decisions in practice can be included. 
Answer: We have added discussions and background information to the “Case studies” section to use them as examples of how pan-genome analyses can contribute to downstream analyses. 3. The Case Studies section highlights several key projects, but it reads as descriptive rather than analytical. It would be more convincing if this section contained quantitative comparisons showing how applying the proposed standards increased reproducibility, efficiency, or interpretability over previous, unstandardized approaches. Answer: We have expanded the “Case studies” section to provide more background information and explanations regarding how pan-genome analysis has significantly improved and contributed to the downstream analyses. However, providing quantitative comparisons is, in our opinion, out of scope for this review paper. Competing Interests: no competing interests Close Report a concern COMMENT ON THIS REPORT Views 0 Cite How to cite this report: Xie X. Reviewer Report For: White paper: standards for handling and analyzing plant pan-genomes [version 2; peer review: 2 approved, 2 approved with reservations] . F1000Research 2025, 14 :739 ( https://doi.org/10.5256/f1000research.191128.r433712 ) The direct URL for this report is: https://f1000research.com/articles/14-739/v2#referee-response-433712 NOTE: it is important to ensure the information in square brackets after the title is included in this citation. Close Copy Citation Details Reviewer Report 24 Dec 2025 Xiaoming Xie , Wheat Genetics and Genomics Center, China Agricultural University College of Agronomy and Biotechnology (Ringgold ID: 200630), Beijing, Beijing, China Approved VIEWS 0 https://doi.org/10.5256/f1000research.191128.r433712 I have no further ... Continue reading READ ALL I have no further comments to make. Competing Interests: No competing interests were disclosed. 
Reviewer Expertise: wheat pangenome, gene-based pangenome, comparative genomics I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard. Close READ LESS CITE CITE HOW TO CITE THIS REPORT Xie X. Reviewer Report For: White paper: standards for handling and analyzing plant pan-genomes [version 2; peer review: 2 approved, 2 approved with reservations] . F1000Research 2025, 14 :739 ( https://doi.org/10.5256/f1000research.191128.r433712 ) The direct URL for this report is: https://f1000research.com/articles/14-739/v2#referee-response-433712 NOTE: it is important to ensure the information in square brackets after the title is included in all citations of this article. COPY CITATION DETAILS Report a concern Respond or Comment COMMENT ON THIS REPORT Views 0 Cite How to cite this report: Sahu SK. Reviewer Report For: White paper: standards for handling and analyzing plant pan-genomes [version 2; peer review: 2 approved, 2 approved with reservations] . F1000Research 2025, 14 :739 ( https://doi.org/10.5256/f1000research.191128.r433713 ) The direct URL for this report is: https://f1000research.com/articles/14-739/v2#referee-response-433713 NOTE: it is important to ensure the information in square brackets after the title is included in this citation. Close Copy Citation Details Reviewer Report 25 Nov 2025 Sunil Kumar Sahu , State Key Laboratory of Genome and Multi-omics Technologies, BGI Research, Shenzhen, China Approved VIEWS 0 https://doi.org/10.5256/f1000research.191128.r433713 I am happy with the authors' thorough revision ... Continue reading READ ALL I am happy with the authors' thorough revision and detailed response. I have no further comments. Competing Interests: No competing interests were disclosed. 
Reviewer Expertise: Plant genomics and evolution I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard. Close READ LESS CITE CITE HOW TO CITE THIS REPORT Sahu SK. Reviewer Report For: White paper: standards for handling and analyzing plant pan-genomes [version 2; peer review: 2 approved, 2 approved with reservations] . F1000Research 2025, 14 :739 ( https://doi.org/10.5256/f1000research.191128.r433713 ) The direct URL for this report is: https://f1000research.com/articles/14-739/v2#referee-response-433713 NOTE: it is important to ensure the information in square brackets after the title is included in all citations of this article. COPY CITATION DETAILS Report a concern Respond or Comment COMMENT ON THIS REPORT Version 1 VERSION 1 PUBLISHED 28 Jul 2025 Views 0 Cite How to cite this report: Xie X. Reviewer Report For: White paper: standards for handling and analyzing plant pan-genomes [version 2; peer review: 2 approved, 2 approved with reservations] . F1000Research 2025, 14 :739 ( https://doi.org/10.5256/f1000research.183537.r404154 ) The direct URL for this report is: https://f1000research.com/articles/14-739/v1#referee-response-404154 NOTE: it is important to ensure the information in square brackets after the title is included in this citation. Close Copy Citation Details Reviewer Report 04 Sep 2025 Xiaoming Xie , Wheat Genetics and Genomics Center, China Agricultural University College of Agronomy and Biotechnology (Ringgold ID: 200630), Beijing, Beijing, China Approved with Reservations VIEWS 0 https://doi.org/10.5256/f1000research.183537.r404154 This white paper by Heuermann et al. presents a timely and comprehensive framework aiming to establish community-wide standards for plant pan-genome analysis. The authors cover critical aspects from nomenclature and quality control to data sharing and visualization. This work represents ... 
Continue reading READ ALL This white paper by Heuermann et al. presents a timely and comprehensive framework aiming to establish community-wide standards for plant pan-genome analysis. The authors cover critical aspects from nomenclature and quality control to data sharing and visualization. This work represents a valuable and necessary initiative to promote FAIR principles in a rapidly evolving field. However, several major revisions are required to enhance its practical utility, scientific rigor, and overall impact before it can be endorsed as a foundational guide for the community. Major comments 1. Lack of Practical Guidance and Actionable Workflows. While the paper provides an exhaustive list of tools and standards, it currently functions more as a catalogue than a practical guide. A researcher new to the field would struggle to navigate the options and select the most appropriate methodology for their specific project. To address this, the authors should incorporate one or more decision-tree figures or summary tables that guide users based on their specific research context (e.g., species ploidy, data type, biological question). Such a resource would transform this document from a simple list into an indispensable, actionable guide. 2. Understated Importance of the Generalized Feature Identifier (GFI) Concept. The proposal of a 'Generalized Feature Identifier' (GFI) in the 'Future Directions' section is a highly innovative and critical idea. It elegantly addresses a major bottleneck in functionally annotating the non-genic 'dark matter' of pan-genomes, which is often overlooked. However, its placement as a future thought diminishes its significance. This concept should be introduced much earlier in the manuscript, possibly in the nomenclature section, and framed as a core recommendation of this white paper to highlight its forward-thinking contribution. 3. Imprecise Comparison of Linear- vs. Graph-Based Approaches. 
The distinction between linear- and graph-based pan-genomes in Section 5.1 is crucial, but the current description of linear approaches could be refined for greater accuracy and clarity. The manuscript conflates two distinct types of 'linear-based' analyses. It states that these approaches identify sequence-level variations (SNPs, indels) as well as gene-level presence/absence variations (PAVs). However, the tools cited as examples, such as OrthoFinder and Ensembl Compara, are primarily used for inferring orthology and identifying gene-level PAVs. They are not the primary tools for calling SNPs and small indels from whole-genome alignments (which typically involves a separate workflow with variant callers like GATK against a linear reference). This conflation creates an imprecise comparison with graph-based approaches, which are fundamentally designed to model sequence-level variation directly. To improve this section, we recommend the authors explicitly distinguish between: (a) Sequence-based linear analysis: Aligning multiple genomes to a single linear reference to call SNPs and indels. (b) Gene-based linear analysis: Using orthology inference tools on annotated gene sets to determine the pan-gene repertoire and gene-level PAVs. By separating these two concepts, the manuscript can provide a more accurate and nuanced comparison, highlighting how graph-based pan-genomes aim to integrate both types of variation in a way that requires distinct workflows in a traditional linear framework. Minor comments 1. The authors should adopt a more authoritative tone appropriate for a standards paper. Phrases like "probably more suited" (Section 2.3) should be replaced with definitive recommendations (e.g., "we recommend the use of...") to provide clear guidance. 2. In Section 4.3 (Metadata requirements), the list of mandatory fields should be expanded to include the specific versions of all software and pipelines used. 
This is essential for ensuring full reproducibility of the analyses. 3. The case studies in Section 6 are too brief to be impactful. Each case should be slightly expanded to illustrate how the application (or lack thereof) of the proposed standards directly impacted the project's outcomes, challenges, or successes. This would provide concrete evidence for the importance of the proposed standards. 4. Regarding the classification of genes into "core, shell, and cloud" (Section 2.3), it is crucial to state that the specific percentage thresholds used for these definitions must be explicitly reported in the metadata, as they can significantly impact downstream comparative analyses. Is the topic of the review discussed comprehensively in the context of the current literature? Yes Are all factual statements correct and adequately supported by citations? Yes Is the review written in accessible language? Partly Are the conclusions drawn appropriate in the context of the current research literature? Yes Competing Interests: No competing interests were disclosed. Reviewer Expertise: wheat pangenome, gene-based pangenome, comparative genomics I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard, however I have significant reservations, as outlined above. Close READ LESS CITE CITE HOW TO CITE THIS REPORT Xie X. Reviewer Report For: White paper: standards for handling and analyzing plant pan-genomes [version 2; peer review: 2 approved, 2 approved with reservations] . F1000Research 2025, 14 :739 ( https://doi.org/10.5256/f1000research.183537.r404154 ) The direct URL for this report is: https://f1000research.com/articles/14-739/v1#referee-response-404154 NOTE: it is important to ensure the information in square brackets after the title is included in all citations of this article. 
COPY CITATION DETAILS Report a concern Author Response 24 Nov 2025 Marc Christian Heuermann, 24 Nov 2025 Author Response Reviewer 2 Xiaoming Xie ( https://orcid.org/0000-0002-7925-4964 ), Wheat Genetics and Genomics Center, China Agricultural University College of Agronomy and Biotechnology (Ringgold ID: 200630), Beijing, Beijing, China Approved with Reservations This white ... Continue reading Reviewer 2 Xiaoming Xie ( https://orcid.org/0000-0002-7925-4964 ), Wheat Genetics and Genomics Center, China Agricultural University College of Agronomy and Biotechnology (Ringgold ID: 200630), Beijing, Beijing, China Approved with Reservations This white paper by Heuermann et al. presents a timely and comprehensive framework aiming to establish community-wide standards for plant pan-genome analysis. The authors cover critical aspects from nomenclature and quality control to data sharing and visualization. This work represents a valuable and necessary initiative to promote FAIR principles in a rapidly evolving field. However, several major revisions are required to enhance its practical utility, scientific rigor, and overall impact before it can be endorsed as a foundational guide for the community. Major comments 1. Lack of Practical Guidance and Actionable Workflows. While the paper provides an exhaustive list of tools and standards, it currently functions more as a catalogue than a practical guide. A researcher new to the field would struggle to navigate the options and select the most appropriate methodology for their specific project. To address this, the authors should incorporate one or more decision-tree figures or summary tables that guide users based on their specific research context (e.g., species ploidy, data type, biological question). Such a resource would transform this document from a simple list into an indispensable, actionable guide. Answer: Thank you for your insightful comments. 
Both reviewers raised this point, prompting us to create Figure 1, which clearly illustrates how each tool fits into the pan-genome analysis workflow. We have now cross-referenced the figure in both Section 3 and Section 5. 2. Understated Importance of the Generalized Feature Identifier (GFI) Concept. The proposal of a 'Generalized Feature Identifier' (GFI) in the 'Future Directions' section is a highly innovative and critical idea. It elegantly addresses a major bottleneck in functionally annotating the non-genic 'dark matter' of pan-genomes, which is often overlooked. However, its placement as a future thought diminishes its significance. This concept should be introduced much earlier in the manuscript, possibly in the nomenclature section, and framed as a core recommendation of this white paper to highlight its forward-thinking contribution. Answer: We agree with this assessment and have now placed the GFI concept in Section 2.4. 3. Imprecise Comparison of Linear- vs. Graph-Based Approaches. The distinction between linear- and graph-based pan-genomes in Section 5.1 is crucial, but the current description of linear approaches could be refined for greater accuracy and clarity. The manuscript conflates two distinct types of 'linear-based' analyses. It states that these approaches identify sequence-level variations (SNPs, indels) as well as gene-level presence/absence variations (PAVs). However, the tools cited as examples, such as OrthoFinder and Ensembl Compara, are primarily used for inferring orthology and identifying gene-level PAVs. They are not the primary tools for calling SNPs and small indels from whole-genome alignments (which typically involves a separate workflow with variant callers like GATK against a linear reference). This conflation creates an imprecise comparison with graph-based approaches, which are fundamentally designed to model sequence-level variation directly. 
To improve this section, we recommend the authors explicitly distinguish between: (a) Sequence-based linear analysis: Aligning multiple genomes to a single linear reference to call SNPs and indels. (b) Gene-based linear analysis: Using orthology inference tools on annotated gene sets to determine the pan-gene repertoire and gene-level PAVs. By separating these two concepts, the manuscript can provide a more accurate and nuanced comparison, highlighting how graph-based pan-genomes aim to integrate both types of variation in a way that requires distinct workflows in a traditional linear framework. Answer: Thank you for this specific and helpful comment. We have reworked and updated our paragraph 5 accordingly. Minor comments 1. The authors should adopt a more authoritative tone appropriate for a standards paper. Phrases like "probably more suited" (Section 2.3) should be replaced with definitive recommendations (e.g., "we recommend the use of...") to provide clear guidance. Answer: Thank you for the suggestion. We rephrased the paragraph. 2. In Section 4.3 (Metadata requirements), the list of mandatory fields should be expanded to include the specific versions of all software and pipelines used. This is essential for ensuring full reproducibility of the analyses. Answer: Thanks, we have now addressed this important point and extended the paragraph to elaborate more on the importance of metadata requirements. 3. The case studies in Section 6 are too brief to be impactful. Each case should be slightly expanded to illustrate how the application (or lack thereof) of the proposed standards directly impacted the project's outcomes, challenges, or successes. This would provide concrete evidence for the importance of the proposed standards. Answer: Agreed. We updated the paragraph and extended the description of the case studies and their relevance. 4. 
Regarding the classification of genes into "core, shell, and cloud" (Section 2.3), it is crucial to state that the specific percentage thresholds used for these definitions must be explicitly reported in the metadata, as they can significantly impact downstream comparative analyses. Answer: We added a sentence to be more precise regarding this point. Is the topic of the review discussed comprehensively in the context of the current literature? Yes Are all factual statements correct and adequately supported by citations? Yes Is the review written in accessible language? Partly Are the conclusions drawn appropriate in the context of the current research literature? Yes Reviewer 2 Xiaoming Xie ( https://orcid.org/0000-0002-7925-4964 ), Wheat Genetics and Genomics Center, China Agricultural University College of Agronomy and Biotechnology (Ringgold ID: 200630), Beijing, Beijing, China Approved with Reservations This white paper by Heuermann et al. presents a timely and comprehensive framework aiming to establish community-wide standards for plant pan-genome analysis. The authors cover critical aspects from nomenclature and quality control to data sharing and visualization. This work represents a valuable and necessary initiative to promote FAIR principles in a rapidly evolving field. However, several major revisions are required to enhance its practical utility, scientific rigor, and overall impact before it can be endorsed as a foundational guide for the community. Major comments 1. Lack of Practical Guidance and Actionable Workflows. While the paper provides an exhaustive list of tools and standards, it currently functions more as a catalogue than a practical guide. A researcher new to the field would struggle to navigate the options and select the most appropriate methodology for their specific project. 
To address this, the authors should incorporate one or more decision-tree figures or summary tables that guide users based on their specific research context (e.g., species ploidy, data type, biological question). Such a resource would transform this document from a simple list into an indispensable, actionable guide. Answer: Thank you for your insightful comments. Both reviewers raised this point, prompting us to create Figure 1, which clearly illustrates how each tool fits into the pan-genome analysis workflow. We have now cross-referenced the figure in both Section 3 and Section 5. 2. Understated Importance of the Generalized Feature Identifier (GFI) Concept. The proposal of a 'Generalized Feature Identifier' (GFI) in the 'Future Directions' section is a highly innovative and critical idea. It elegantly addresses a major bottleneck in functionally annotating the non-genic 'dark matter' of pan-genomes, which is often overlooked. However, its placement as a future thought diminishes its significance. This concept should be introduced much earlier in the manuscript, possibly in the nomenclature section, and framed as a core recommendation of this white paper to highlight its forward-thinking contribution. Answer: We do agree with the assessment and positioned the GFI concept now as paragraph 2.4. 3. Imprecise Comparison of Linear- vs. Graph-Based Approaches. The distinction between linear- and graph-based pan-genomes in Section 5.1 is crucial, but the current description of linear approaches could be refined for greater accuracy and clarity. The manuscript conflates two distinct types of 'linear-based' analyses. It states that these approaches identify sequence-level variations (SNPs, indels) as well as gene-level presence/absence variations (PAVs). However, the tools cited as examples, such as OrthoFinder and Ensembl Compara, are primarily used for inferring orthology and identifying gene-level PAVs. 
They are not the primary tools for calling SNPs and small indels from whole-genome alignments (which typically involves a separate workflow with variant callers like GATK against a linear reference). This conflation creates an imprecise comparison with graph-based approaches, which are fundamentally designed to model sequence-level variation directly. To improve this section, we recommend the authors explicitly distinguish between: (a) Sequence-based linear analysis: Aligning multiple genomes to a single linear reference to call SNPs and indels. (b) Gene-based linear analysis: Using orthology inference tools on annotated gene sets to determine the pan-gene repertoire and gene-level PAVs. By separating these two concepts, the manuscript can provide a more accurate and nuanced comparison, highlighting how graph-based pan-genomes aim to integrate both types of variation in a way that requires distinct workflows in a traditional linear framework. Answer: Thank you for this specific and helpful comment. We have reworked and updated our paragraph 5 accordingly. Minor comments 1. The authors should adopt a more authoritative tone appropriate for a standards paper. Phrases like "probably more suited" (Section 2.3) should be replaced with definitive recommendations (e.g., "we recommend the use of...") to provide clear guidance. Answer: Thank you for the suggestion. We rephrased the paragraph. 2. In Section 4.3 (Metadata requirements), the list of mandatory fields should be expanded to include the specific versions of all software and pipelines used. This is essential for ensuring full reproducibility of the analyses. Answer: Thanks, we have now addressed this important point and extended the paragraph to elaborate more on the importance of metadata requirements. 3. The case studies in Section 6 are too brief to be impactful. 
Each case should be slightly expanded to illustrate how the application (or lack thereof) of the proposed standards directly impacted the project's outcomes, challenges, or successes. This would provide concrete evidence for the importance of the proposed standards. Answer: Agreed. We updated the paragraph and extended the description of the case studies and their relevance. 4. Regarding the classification of genes into "core, shell, and cloud" (Section 2.3), it is crucial to state that the specific percentage thresholds used for these definitions must be explicitly reported in the metadata, as they can significantly impact downstream comparative analyses. Answer: We added a sentence to be more precise regarding this point. Is the topic of the review discussed comprehensively in the context of the current literature? Yes Are all factual statements correct and adequately supported by citations? Yes Is the review written in accessible language? Partly Are the conclusions drawn appropriate in the context of the current research literature? Yes Competing Interests: No competing interests. Close Report a concern Respond or Comment COMMENTS ON THIS REPORT Author Response 24 Nov 2025 Marc Christian Heuermann, 24 Nov 2025 Author Response Reviewer 2 Xiaoming Xie ( https://orcid.org/0000-0002-7925-4964 ), Wheat Genetics and Genomics Center, China Agricultural University College of Agronomy and Biotechnology (Ringgold ID: 200630), Beijing, Beijing, China Approved with Reservations This white ... Continue reading Reviewer 2 Xiaoming Xie ( https://orcid.org/0000-0002-7925-4964 ), Wheat Genetics and Genomics Center, China Agricultural University College of Agronomy and Biotechnology (Ringgold ID: 200630), Beijing, Beijing, China Approved with Reservations This white paper by Heuermann et al. presents a timely and comprehensive framework aiming to establish community-wide standards for plant pan-genome analysis. 
The authors cover critical aspects from nomenclature and quality control to data sharing and visualization. This work represents a valuable and necessary initiative to promote FAIR principles in a rapidly evolving field. However, several major revisions are required to enhance its practical utility, scientific rigor, and overall impact before it can be endorsed as a foundational guide for the community. Major comments 1. Lack of Practical Guidance and Actionable Workflows. While the paper provides an exhaustive list of tools and standards, it currently functions more as a catalogue than a practical guide. A researcher new to the field would struggle to navigate the options and select the most appropriate methodology for their specific project. To address this, the authors should incorporate one or more decision-tree figures or summary tables that guide users based on their specific research context (e.g., species ploidy, data type, biological question). Such a resource would transform this document from a simple list into an indispensable, actionable guide. Answer: Thank you for your insightful comments. Both reviewers raised this point, prompting us to create Figure 1, which clearly illustrates how each tool fits into the pan-genome analysis workflow. We have now cross-referenced the figure in both Section 3 and Section 5. 2. Understated Importance of the Generalized Feature Identifier (GFI) Concept. The proposal of a 'Generalized Feature Identifier' (GFI) in the 'Future Directions' section is a highly innovative and critical idea. It elegantly addresses a major bottleneck in functionally annotating the non-genic 'dark matter' of pan-genomes, which is often overlooked. However, its placement as a future thought diminishes its significance. This concept should be introduced much earlier in the manuscript, possibly in the nomenclature section, and framed as a core recommendation of this white paper to highlight its forward-thinking contribution. 
Answer: We agree with this assessment and have now placed the GFI concept in Section 2.4. 3. Imprecise Comparison of Linear- vs. Graph-Based Approaches. The distinction between linear- and graph-based pan-genomes in Section 5.1 is crucial, but the current description of linear approaches could be refined for greater accuracy and clarity. The manuscript conflates two distinct types of 'linear-based' analyses. It states that these approaches identify sequence-level variations (SNPs, indels) as well as gene-level presence/absence variations (PAVs). However, the tools cited as examples, such as OrthoFinder and Ensembl Compara, are primarily used for inferring orthology and identifying gene-level PAVs. They are not the primary tools for calling SNPs and small indels from whole-genome alignments (which typically involves a separate workflow with variant callers like GATK against a linear reference). This conflation creates an imprecise comparison with graph-based approaches, which are fundamentally designed to model sequence-level variation directly. To improve this section, we recommend the authors explicitly distinguish between: (a) Sequence-based linear analysis: Aligning multiple genomes to a single linear reference to call SNPs and indels. (b) Gene-based linear analysis: Using orthology inference tools on annotated gene sets to determine the pan-gene repertoire and gene-level PAVs. By separating these two concepts, the manuscript can provide a more accurate and nuanced comparison, highlighting how graph-based pan-genomes aim to integrate both types of variation in a way that requires distinct workflows in a traditional linear framework. Answer: Thank you for this specific and helpful comment. We have reworked and updated Section 5 accordingly. Minor comments 1. The authors should adopt a more authoritative tone appropriate for a standards paper. 
Phrases like "probably more suited" (Section 2.3) should be replaced with definitive recommendations (e.g., "we recommend the use of...") to provide clear guidance. Answer: Thank you for the suggestion. We rephrased the paragraph. 2. In Section 4.3 (Metadata requirements), the list of mandatory fields should be expanded to include the specific versions of all software and pipelines used. This is essential for ensuring full reproducibility of the analyses. Answer: Thanks, we have now addressed this important point and extended the paragraph to elaborate more on the importance of metadata requirements. 3. The case studies in Section 6 are too brief to be impactful. Each case should be slightly expanded to illustrate how the application (or lack thereof) of the proposed standards directly impacted the project's outcomes, challenges, or successes. This would provide concrete evidence for the importance of the proposed standards. Answer: Agreed. We updated the paragraph and extended the description of the case studies and their relevance. 4. Regarding the classification of genes into "core, shell, and cloud" (Section 2.3), it is crucial to state that the specific percentage thresholds used for these definitions must be explicitly reported in the metadata, as they can significantly impact downstream comparative analyses. Answer: We added a sentence to be more precise regarding this point. Is the topic of the review discussed comprehensively in the context of the current literature? Yes Are all factual statements correct and adequately supported by citations? Yes Is the review written in accessible language? Partly Are the conclusions drawn appropriate in the context of the current research literature? 
Yes Reviewer 2 Xiaoming Xie ( https://orcid.org/0000-0002-7925-4964 ), Wheat Genetics and Genomics Center, China Agricultural University College of Agronomy and Biotechnology (Ringgold ID: 200630), Beijing, Beijing, China Approved with Reservations This white paper by Heuermann et al. presents a timely and comprehensive framework aiming to establish community-wide standards for plant pan-genome analysis. The authors cover critical aspects from nomenclature and quality control to data sharing and visualization. This work represents a valuable and necessary initiative to promote FAIR principles in a rapidly evolving field. However, several major revisions are required to enhance its practical utility, scientific rigor, and overall impact before it can be endorsed as a foundational guide for the community. Major comments 1. Lack of Practical Guidance and Actionable Workflows. While the paper provides an exhaustive list of tools and standards, it currently functions more as a catalogue than a practical guide. A researcher new to the field would struggle to navigate the options and select the most appropriate methodology for their specific project. To address this, the authors should incorporate one or more decision-tree figures or summary tables that guide users based on their specific research context (e.g., species ploidy, data type, biological question). Such a resource would transform this document from a simple list into an indispensable, actionable guide. Answer: Thank you for your insightful comments. Both reviewers raised this point, prompting us to create Figure 1, which clearly illustrates how each tool fits into the pan-genome analysis workflow. We have now cross-referenced the figure in both Section 3 and Section 5. 2. Understated Importance of the Generalized Feature Identifier (GFI) Concept. The proposal of a 'Generalized Feature Identifier' (GFI) in the 'Future Directions' section is a highly innovative and critical idea. 
It elegantly addresses a major bottleneck in functionally annotating the non-genic 'dark matter' of pan-genomes, which is often overlooked. However, its placement as a future thought diminishes its significance. This concept should be introduced much earlier in the manuscript, possibly in the nomenclature section, and framed as a core recommendation of this white paper to highlight its forward-thinking contribution. Answer: We do agree with the assessment and positioned the GFI concept now as paragraph 2.4. 3. Imprecise Comparison of Linear- vs. Graph-Based Approaches. The distinction between linear- and graph-based pan-genomes in Section 5.1 is crucial, but the current description of linear approaches could be refined for greater accuracy and clarity. The manuscript conflates two distinct types of 'linear-based' analyses. It states that these approaches identify sequence-level variations (SNPs, indels) as well as gene-level presence/absence variations (PAVs). However, the tools cited as examples, such as OrthoFinder and Ensembl Compara, are primarily used for inferring orthology and identifying gene-level PAVs. They are not the primary tools for calling SNPs and small indels from whole-genome alignments (which typically involves a separate workflow with variant callers like GATK against a linear reference). This conflation creates an imprecise comparison with graph-based approaches, which are fundamentally designed to model sequence-level variation directly. To improve this section, we recommend the authors explicitly distinguish between: (a) Sequence-based linear analysis: Aligning multiple genomes to a single linear reference to call SNPs and indels. (b) Gene-based linear analysis: Using orthology inference tools on annotated gene sets to determine the pan-gene repertoire and gene-level PAVs. 
By separating these two concepts, the manuscript can provide a more accurate and nuanced comparison, highlighting how graph-based pan-genomes aim to integrate both types of variation in a way that requires distinct workflows in a traditional linear framework. Answer: Thank you for this specific and helpful comment. We have reworked and updated our paragraph 5 accordingly. Minor comments 1. The authors should adopt a more authoritative tone appropriate for a standards paper. Phrases like "probably more suited" (Section 2.3) should be replaced with definitive recommendations (e.g., "we recommend the use of...") to provide clear guidance. Answer: Thank you for the suggestion. We rephrased the paragraph. 2. In Section 4.3 (Metadata requirements), the list of mandatory fields should be expanded to include the specific versions of all software and pipelines used. This is essential for ensuring full reproducibility of the analyses. Answer: Thanks, we have now addressed this important point and extended the paragraph to elaborate more on the importance of metadata requirements. 3. The case studies in Section 6 are too brief to be impactful. Each case should be slightly expanded to illustrate how the application (or lack thereof) of the proposed standards directly impacted the project's outcomes, challenges, or successes. This would provide concrete evidence for the importance of the proposed standards. Answer: Agreed. We updated the paragraph and extended the description of the case studies and their relevance. 4. Regarding the classification of genes into "core, shell, and cloud" (Section 2.3), it is crucial to state that the specific percentage thresholds used for these definitions must be explicitly reported in the metadata, as they can significantly impact downstream comparative analyses. Answer: We added a sentence to be more precise regarding this point. Is the topic of the review discussed comprehensively in the context of the current literature? 
Yes Are all factual statements correct and adequately supported by citations? Yes Is the review written in accessible language? Partly Are the conclusions drawn appropriate in the context of the current research literature? Yes Competing Interests: No competing interests. Close Report a concern COMMENT ON THIS REPORT Views 0 Cite How to cite this report: Sahu SK. Reviewer Report For: White paper: standards for handling and analyzing plant pan-genomes [version 2; peer review: 2 approved, 2 approved with reservations] . F1000Research 2025, 14 :739 ( https://doi.org/10.5256/f1000research.183537.r404153 ) The direct URL for this report is: https://f1000research.com/articles/14-739/v1#referee-response-404153 NOTE: it is important to ensure the information in square brackets after the title is included in this citation. Close Copy Citation Details Reviewer Report 03 Sep 2025 Sunil Kumar Sahu , State Key Laboratory of Genome and Multi-omics Technologies, BGI Research, Shenzhen, China Approved with Reservations VIEWS 0 https://doi.org/10.5256/f1000research.183537.r404153 This article presents a very comprehensive and thoughtful set of recommendations, covering a wide spectrum from naming conventions to quality control and data sharing. I enjoyed reading it and have a few suggestions that I believe could strengthen its impact ... Continue reading READ ALL This article presents a very comprehensive and thoughtful set of recommendations, covering a wide spectrum from naming conventions to quality control and data sharing. I enjoyed reading it and have a few suggestions that I believe could strengthen its impact and practicality for the community. My main thought is that the sheer breadth of recommendations, while excellent, might feel daunting for some labs, especially those with limited resources. 
To make the framework more accessible, it would be incredibly helpful if the authors could more clearly distinguish between what they consider essential "minimum standards" and what are "aspirational best practices." For instance, while the framework is well-described, I found myself wishing for a more concrete, practical roadmap. The QC section, for example, lists many excellent tools (FastQC, GenomeScope, QUAST, etc.), but a visual workflow diagram would be immensely valuable. A figure illustrating the step-by-step process from raw data QC, through assembly and annotation QC, to pan-genome QC would really help readers visualize how to integrate these tools into their own standardized processes. Finally, on the topic of quality control, the article does a great job listing the available tools but could go further in guiding users on how to apply them. For example, some guidance on tool selection would be useful, such as which aspects of QUAST or CRAQ are best for evaluating polyploid assemblies. It would also be helpful to address how to interpret conflicting results from different tools or databases. Furthermore, in the pan-genome section, the concept of "saturation analysis" is mentioned. It would strengthen this part to include some discussion on the sample size required to confidently claim saturation, particularly for species with different ploidy levels. These are all meant as constructive feedback to enhance what is already a very valuable and needed framework. I hope my comments are helpful. Is the topic of the review discussed comprehensively in the context of the current literature? Yes Are all factual statements correct and adequately supported by citations? Yes Is the review written in accessible language? Yes Are the conclusions drawn appropriate in the context of the current research literature? Yes Competing Interests: No competing interests were disclosed. 
Reviewer Expertise: Plant genomics and evolution I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard, however I have significant reservations, as outlined above. Close READ LESS CITE CITE HOW TO CITE THIS REPORT Sahu SK. Reviewer Report For: White paper: standards for handling and analyzing plant pan-genomes [version 2; peer review: 2 approved, 2 approved with reservations] . F1000Research 2025, 14 :739 ( https://doi.org/10.5256/f1000research.183537.r404153 ) The direct URL for this report is: https://f1000research.com/articles/14-739/v1#referee-response-404153 NOTE: it is important to ensure the information in square brackets after the title is included in all citations of this article. COPY CITATION DETAILS Report a concern Author Response 24 Nov 2025 Marc Christian Heuermann 24 Nov 2025 Author Response Reviewer 1 Sunil Kumar Sahu ( https://orcid.org/0000-0002-4742-9870 ), State Key Laboratory of Genome and Multi-omics Technologies, BGI Research, Shenzhen, China Approved with Reservations This article presents a very comprehensive and thoughtful ... Continue reading Reviewer 1 Sunil Kumar Sahu ( https://orcid.org/0000-0002-4742-9870 ), State Key Laboratory of Genome and Multi-omics Technologies, BGI Research, Shenzhen, China Approved with Reservations This article presents a very comprehensive and thoughtful set of recommendations, covering a wide spectrum from naming conventions to quality control and data sharing. I enjoyed reading it and have a few suggestions that I believe could strengthen its impact and practicality for the community. My main thought is that the sheer breadth of recommendations, while excellent, might feel daunting for some labs, especially those with limited resources. 
To make the framework more accessible, it would be incredibly helpful if the authors could more clearly distinguish between what they consider essential "minimum standards" and what are "aspirational best practices." For instance, while the framework is well-described, I found myself wishing for a more concrete, practical roadmap. The QC section, for example, lists many excellent tools (FastQC, GenomeScope, QUAST, etc.), but a visual workflow diagram would be immensely valuable. A figure illustrating the step-by-step process from raw data QC, through assembly and annotation QC, to pan-genome QC would really help readers visualize how to integrate these tools into their own standardized processes. Answer: Thank you for your constructive feedback. We have added Figure 1 to the manuscript to clearly illustrate the recommended tools for each step of the pan-genome analysis workflow. The figure is now cross-referenced in both Section 3 and Section 5 for better integration with the discussed content. Finally, on the topic of quality control, the article does a great job listing the available tools but could go further in guiding users on how to apply them. For example, some guidance on tool selection would be useful, such as which aspects of QUAST or CRAQ are best for evaluating polyploid assemblies. It would also be helpful to address how to interpret conflicting results from different tools or databases. Furthermore, in the pan-genome section, the concept of "saturation analysis" is mentioned. It would strengthen this part to include some discussion on the sample size required to confidently claim saturation, particularly for species with different ploidy levels. These are all meant as constructive feedback to enhance what is already a very valuable and needed framework. I hope my comments are helpful. Answer: We have revised section 3. Quality Control (QC) Standards to fully incorporate your suggestions. 
Is the topic of the review discussed comprehensively in the context of the current literature? Yes Are all factual statements correct and adequately supported by citations? Yes Is the review written in accessible language? Yes Are the conclusions drawn appropriate in the context of the current research literature? Yes Reviewer 1 Sunil Kumar Sahu ( https://orcid.org/0000-0002-4742-9870 ), State Key Laboratory of Genome and Multi-omics Technologies, BGI Research, Shenzhen, China Approved with Reservations This article presents a very comprehensive and thoughtful set of recommendations, covering a wide spectrum from naming conventions to quality control and data sharing. I enjoyed reading it and have a few suggestions that I believe could strengthen its impact and practicality for the community. My main thought is that the sheer breadth of recommendations, while excellent, might feel daunting for some labs, especially those with limited resources. To make the framework more accessible, it would be incredibly helpful if the authors could more clearly distinguish between what they consider essential "minimum standards" and what are "aspirational best practices." For instance, while the framework is well-described, I found myself wishing for a more concrete, practical roadmap. The QC section, for example, lists many excellent tools (FastQC, GenomeScope, QUAST, etc.), but a visual workflow diagram would be immensely valuable. A figure illustrating the step-by-step process from raw data QC, through assembly and annotation QC, to pan-genome QC would really help readers visualize how to integrate these tools into their own standardized processes. Answer: Thank you for your constructive feedback. We have added Figure 1 to the manuscript to clearly illustrate the recommended tools for each step of the pan-genome analysis workflow. The figure is now cross-referenced in both Section 3 and Section 5 for better integration with the discussed content. 
Finally, on the topic of quality control, the article does a great job listing the available tools but could go further in guiding users on how to apply them. For example, some guidance on tool selection would be useful, such as which aspects of QUAST or CRAQ are best for evaluating polyploid assemblies. It would also be helpful to address how to interpret conflicting results from different tools or databases. Furthermore, in the pan-genome section, the concept of "saturation analysis" is mentioned. It would strengthen this part to include some discussion on the sample size required to confidently claim saturation, particularly for species with different ploidy levels. These are all meant as constructive feedback to enhance what is already a very valuable and needed framework. I hope my comments are helpful. Answer: We have revised section 3. Quality Control (QC) Standards to fully incorporate your suggestions. Is the topic of the review discussed comprehensively in the context of the current literature? Yes Are all factual statements correct and adequately supported by citations? Yes Is the review written in accessible language? Yes Are the conclusions drawn appropriate in the context of the current research literature? Yes Competing Interests: No competing interests. Close Report a concern Respond or Comment COMMENTS ON THIS REPORT Author Response 24 Nov 2025 Marc Christian Heuermann 24 Nov 2025 Author Response Reviewer 1 Sunil Kumar Sahu ( https://orcid.org/0000-0002-4742-9870 ), State Key Laboratory of Genome and Multi-omics Technologies, BGI Research, Shenzhen, China Approved with Reservations This article presents a very comprehensive and thoughtful ... 
Continue reading Reviewer 1 Sunil Kumar Sahu ( https://orcid.org/0000-0002-4742-9870 ), State Key Laboratory of Genome and Multi-omics Technologies, BGI Research, Shenzhen, China Approved with Reservations This article presents a very comprehensive and thoughtful set of recommendations, covering a wide spectrum from naming conventions to quality control and data sharing. I enjoyed reading it and have a few suggestions that I believe could strengthen its impact and practicality for the community. My main thought is that the sheer breadth of recommendations, while excellent, might feel daunting for some labs, especially those with limited resources. To make the framework more accessible, it would be incredibly helpful if the authors could more clearly distinguish between what they consider essential "minimum standards" and what are "aspirational best practices." For instance, while the framework is well-described, I found myself wishing for a more concrete, practical roadmap. The QC section, for example, lists many excellent tools (FastQC, GenomeScope, QUAST, etc.), but a visual workflow diagram would be immensely valuable. A figure illustrating the step-by-step process from raw data QC, through assembly and annotation QC, to pan-genome QC would really help readers visualize how to integrate these tools into their own standardized processes. Answer: Thank you for your constructive feedback. We have added Figure 1 to the manuscript to clearly illustrate the recommended tools for each step of the pan-genome analysis workflow. The figure is now cross-referenced in both Section 3 and Section 5 for better integration with the discussed content. Finally, on the topic of quality control, the article does a great job listing the available tools but could go further in guiding users on how to apply them. For example, some guidance on tool selection would be useful, such as which aspects of QUAST or CRAQ are best for evaluating polyploid assemblies. 
It would also be helpful to address how to interpret conflicting results from different tools or databases. Furthermore, in the pan-genome section, the concept of "saturation analysis" is mentioned. It would strengthen this part to include some discussion on the sample size required to confidently claim saturation, particularly for species with different ploidy levels. These are all meant as constructive feedback to enhance what is already a very valuable and needed framework. I hope my comments are helpful. Answer: We have revised section 3. Quality Control (QC) Standards to fully incorporate your suggestions. Is the topic of the review discussed comprehensively in the context of the current literature? Yes Are all factual statements correct and adequately supported by citations? Yes Is the review written in accessible language? Yes Are the conclusions drawn appropriate in the context of the current research literature? Yes Reviewer 1 Sunil Kumar Sahu ( https://orcid.org/0000-0002-4742-9870 ), State Key Laboratory of Genome and Multi-omics Technologies, BGI Research, Shenzhen, China Approved with Reservations This article presents a very comprehensive and thoughtful set of recommendations, covering a wide spectrum from naming conventions to quality control and data sharing. I enjoyed reading it and have a few suggestions that I believe could strengthen its impact and practicality for the community. My main thought is that the sheer breadth of recommendations, while excellent, might feel daunting for some labs, especially those with limited resources. To make the framework more accessible, it would be incredibly helpful if the authors could more clearly distinguish between what they consider essential "minimum standards" and what are "aspirational best practices." For instance, while the framework is well-described, I found myself wishing for a more concrete, practical roadmap. 
The QC section, for example, lists many excellent tools (FastQC, GenomeScope, QUAST, etc.), but a visual workflow diagram would be immensely valuable. A figure illustrating the step-by-step process from raw data QC, through assembly and annotation QC, to pan-genome QC would really help readers visualize how to integrate these tools into their own standardized processes. Answer: Thank you for your constructive feedback. We have added Figure 1 to the manuscript to clearly illustrate the recommended tools for each step of the pan-genome analysis workflow. The figure is now cross-referenced in both Section 3 and Section 5 for better integration with the discussed content. Finally, on the topic of quality control, the article does a great job listing the available tools but could go further in guiding users on how to apply them. For example, some guidance on tool selection would be useful, such as which aspects of QUAST or CRAQ are best for evaluating polyploid assemblies. It would also be helpful to address how to interpret conflicting results from different tools or databases. Furthermore, in the pan-genome section, the concept of "saturation analysis" is mentioned. It would strengthen this part to include some discussion on the sample size required to confidently claim saturation, particularly for species with different ploidy levels. These are all meant as constructive feedback to enhance what is already a very valuable and needed framework. I hope my comments are helpful. Answer: We have revised section 3. Quality Control (QC) Standards to fully incorporate your suggestions. Is the topic of the review discussed comprehensively in the context of the current literature? Yes Are all factual statements correct and adequately supported by citations? Yes Is the review written in accessible language? Yes Are the conclusions drawn appropriate in the context of the current research literature? Yes Competing Interests: No competing interests. 
Close Report a concern COMMENT ON THIS REPORT Comments on this article Comments (0) Version 3 VERSION 3 PUBLISHED 28 Jul 2025 ADD YOUR COMMENT Comment keyboard_arrow_left keyboard_arrow_right Open Peer Review Reviewer Status info_outline Alongside their report, reviewers assign a status to the article: Approved The paper is scientifically sound in its current form and only minor, if any, improvements are suggested Approved with reservations A number of small changes, sometimes more significant revisions are required to address specific details and improve the papers academic merit. Not approved Fundamental flaws in the paper seriously undermine the findings and conclusions Reviewer Reports Invited Reviewers 1 2 3 4 Version 3 (revision) 07 May 26 read Version 2 (revision) 18 Nov 25 read read read read Version 1 28 Jul 25 read read Sunil Kumar Sahu , State Key Laboratory of Genome and Multi-omics Technologies, BGI Research, Shenzhen, China Xiaoming Xie , China Agricultural University College of Agronomy and Biotechnology (Ringgold ID: 200630), Beijing, China Rutwik Barmukh , Murdoch University, Murdoch, Australia Jianping Xu , McMaster University, Hamilton, Canada Comments on this article All Comments (0) Add a comment Sign up for content alerts Sign Up You are now signed up to receive this alert Browse by related subjects keyboard_arrow_left Back to all reports Reviewer Report 0 Views copyright © 2026 Xu J. This is an open access peer review report distributed under the terms of the Creative Commons Attribution License , which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited. 08 May 2026 | for Version 3 Jianping Xu , Department of Biology, McMaster University, Hamilton, Canada 0 Views copyright © 2026 Xu J. 
This is an open access peer review report distributed under the terms of the Creative Commons Attribution License , which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited. format_quote Cite this report speaker_notes Responses (0) Approved info_outline Alongside their report, reviewers assign a status to the article: Approved The paper is scientifically sound in its current form and only minor, if any, improvements are suggested Approved with reservations A number of small changes, sometimes more significant revisions are required to address specific details and improve the papers academic merit. Not approved Fundamental flaws in the paper seriously undermine the findings and conclusions I'm very happy to endorse the newly revised version for indexing. Competing Interests No competing interests were disclosed. Reviewer Expertise population genetics and genomics, with a focus on fungi I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard. reply Respond to this report Responses (0) Xu J. Peer Review Report For: White paper: standards for handling and analyzing plant pan-genomes [version 2; peer review: 2 approved, 2 approved with reservations] . F1000Research 2025, 14 :739 ( https://doi.org/10.5256/f1000research.200310.r482397) NOTE: it is important to ensure the information in square brackets after the title is included in this citation. The direct URL for this report is: https://f1000research.com/articles/14-739/v3#referee-response-482397 keyboard_arrow_left Back to all reports Reviewer Report 0 Views copyright © 2026 Xu J. This is an open access peer review report distributed under the terms of the Creative Commons Attribution License , which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited. 
30 Dec 2025 | for Version 2 Jianping Xu , Department of Biology, McMaster University, Hamilton, Canada 0 Views copyright © 2026 Xu J. This is an open access peer review report distributed under the terms of the Creative Commons Attribution License , which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited. format_quote Cite this report speaker_notes Responses (1) Approved With Reservations info_outline Alongside their report, reviewers assign a status to the article: Approved The paper is scientifically sound in its current form and only minor, if any, improvements are suggested Approved with reservations A number of small changes, sometimes more significant revisions are required to address specific details and improve the papers academic merit. Not approved Fundamental flaws in the paper seriously undermine the findings and conclusions This is an excellent set of recommendations for handling and analyzing plant pan-genomes. I have only three minor comments/questions for authors' considerations. 1. Should there be a clearly stated minimum standard for a genome to be included in plant pan-genome analyses? In the examples/case studies provided, what were the inclusion criteria and is there an emerging consensus? 2. Even though the abstract included "Super-pan-genomes", aside from the tomato case study example at the very end, very little attention was paid to this topic in the main text. Should there be additional criteria for super-pan-genome studies on top of what's recommended for pan-genome analyses? 3. This White Paper listed INSDC and Ensembl as the suggested data repositories. Given the increasing importance of genomic and pan-genomic data from China and the depositions of such data in the Chinese National Genomic Data Center (https://ngdc.cncb.ac.cn/), I think it's important to include that database as a suggested repository for pan-genome datasets. 
A minor editorial comment: two citations were included in the abstract of this paper. Can the abstract in this journal include citations? Is the topic of the review discussed comprehensively in the context of the current literature? Yes Are all factual statements correct and adequately supported by citations? Yes Is the review written in accessible language? Yes Are the conclusions drawn appropriate in the context of the current research literature? Yes Competing Interests No competing interests were disclosed. Reviewer Expertise population genetics and genomics, with a focus on fungi I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard, however I have significant reservations, as outlined above. reply Respond to this report Responses (1) Author Response 27 Apr 2026 Marc Christian Heuermann, 1. Should there be a clearly stated minimum standard for a genome to be included in plant pan-genome analyses? In the examples/case studies provided, what were the inclusion criteria and is there an emerging consensus? Answer: Thank you for your suggestions. We added a sentence in Chapter 3.1, referred to a publication by Wang & Wang 2023, and provided a summary of their proposed framework for quality control in genome assembly, which also contains threshold recommendations. 2. Even though the abstract included "Super-pan-genomes", aside from the tomato case study example at the very end, very little attention was paid to this topic in the main text. Should there be additional criteria for super-pan-genome studies on top of what's recommended for pan-genome analyses? Answer: In the “Case studies” section, we have discussed in greater detail the difference between intra-species pan-genomes and inter-species super-pan-genomes, as well as their complementary nature. 
In addition, we have included a new Section 3.4 to explain in more detail the differences in quality control when analyzing an inter-species super-pan-genome. 3. This White Paper listed INSDC and Ensembl as the suggested data repositories. Given the increasing importance of genomic and pan-genomic data from China and the depositions of such data in the Chinese National Genomic Data Center (https://ngdc.cncb.ac.cn/), I think it's important to include that database as a suggested repository for pan-genome datasets. Answer: Thank you very much for pointing that out. This would indeed improve the overall visibility and reliability of data storage, which is why we have included this in the manuscript. A minor editorial comment: two citations were included in the abstract of this paper. Can the abstract in this journal include citations? Answer: Indeed, according to the guidelines, this is not permitted. We moved the whole sentence with citation into the introduction section. View more View less Competing Interests no competing interests reply Respond Report a concern Xu J. Peer Review Report For: White paper: standards for handling and analyzing plant pan-genomes [version 2; peer review: 2 approved, 2 approved with reservations] . F1000Research 2025, 14 :739 ( https://doi.org/10.5256/f1000research.191128.r436510) NOTE: it is important to ensure the information in square brackets after the title is included in this citation. The direct URL for this report is: https://f1000research.com/articles/14-739/v2#referee-response-436510 keyboard_arrow_left Back to all reports Reviewer Report 0 Views copyright © 2026 Barmukh R. This is an open access peer review report distributed under the terms of the Creative Commons Attribution License , which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited. 
30 Dec 2025 | for Version 2 Rutwik Barmukh , Centre for Crop and Food Innovation, Murdoch University, Murdoch, Western Australia, Australia 0 Views copyright © 2026 Barmukh R. This is an open access peer review report distributed under the terms of the Creative Commons Attribution License , which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited. format_quote Cite this report speaker_notes Responses (1) Approved With Reservations info_outline Alongside their report, reviewers assign a status to the article: Approved The paper is scientifically sound in its current form and only minor, if any, improvements are suggested Approved with reservations A number of small changes, sometimes more significant revisions are required to address specific details and improve the papers academic merit. Not approved Fundamental flaws in the paper seriously undermine the findings and conclusions This white paper makes an impressive effort to harmonize methodological practices for plant pan-genome construction, analysis, and sharing, as pan-genomic resources are rapidly increasing across different crop species. The manuscript is highly relevant and addresses a clear need within the plant genomics community. However, to function effectively as a widely adopted standards document, the manuscript would benefit from stronger justification of recommended practices and better consideration of downstream use cases and implementation challenges. The manuscript’s clarity, usability, and long-term impact will significantly improve after addressing some issues highlighted below. 1. Although the manuscript highlights the importance of the proposed standards for improving FAIR compliance, the practical aspects of implementing these standards in real-world scenarios can be explored further. 
For instance, challenges related to community-wide adoption, such as maintaining consistent metadata across projects and the limited support for certain recommended formats (e.g. GFA, JSON-LD) in existing repositories, deserve more explicit discussion. In addition, suggestions for handling legacy datasets that lack complete or standardized metadata would be beneficial. Providing concrete examples of common pitfalls (e.g., interoperability failures caused by inconsistent metadata) along with potential mitigation approaches would further strengthen the paper. 2. While the manuscript precisely captures genomic and computational standards, it currently lacks guidance on how pan-genome outputs should interface with downstream applications that are most relevant to plant breeders and geneticists (e.g., GWAS, QTL mapping, selection decisions, etc.). A subsection linking pan-genome data to common downstream analyses can be added. Also, example schemas or pipelines showing how standardized pan-genome representations improve trait mapping or selection decisions in practice can be included. 3. The Case Studies section highlights several key projects, but it reads as descriptive rather than analytical. It would be more convincing if this section contained quantitative comparisons showing how applying the proposed standards increased reproducibility, efficiency, or interpretability over previous, unstandardized approaches. Is the topic of the review discussed comprehensively in the context of the current literature? Yes Are all factual statements correct and adequately supported by citations? Yes Is the review written in accessible language? Partly Are the conclusions drawn appropriate in the context of the current research literature? Yes Competing Interests No competing interests were disclosed. 
Reviewer Expertise Crop genomics, bioinformatics, molecular breeding I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard, however I have significant reservations, as outlined above. reply Respond to this report Responses (1) Author Response 27 Apr 2026 Marc Christian Heuermann, 1. Although the manuscript highlights the importance of the proposed standards for improving FAIR compliance, the practical aspects of implementing these standards in real-world scenarios can be explored further. For instance, challenges related to community-wide adoption, such as maintaining consistent metadata across projects and the limited support for certain recommended formats (e.g. GFA, JSON-LD) in existing repositories, deserve more explicit discussion. In addition, suggestions for handling legacy datasets that lack complete or standardized metadata would be beneficial. Providing concrete examples of common pitfalls (e.g., interoperability failures caused by inconsistent metadata) along with potential mitigation approaches would further strengthen the paper. Answer: Thank you for your suggestions. We have added a new subsection 4.4 (“Practical implementation challenges and best practices for community adoption”) to Section 4. This subsection explicitly discusses challenges such as maintaining consistent metadata across independent projects, the current limited native support for GFA and JSON-LD/RO-Crate formats in major repositories (INSDC and Ensembl), and the difficulties posed by legacy datasets that pre-date these standards. 2. While the manuscript precisely captures genomic and computational standards, it currently lacks guidance on how pan-genome outputs should interface with downstream applications that are most relevant to plant breeders and geneticists (e.g., GWAS, QTL mapping, selection decisions, etc.). 
A subsection linking pan-genome data to common downstream analyses can be added. Also, example schemas or pipelines showing how standardized pan-genome representations improve trait mapping or selection decisions in practice can be included. Answer: We have added discussions and background information to the “Case studies” section to use them as examples of how pan-genome analyses can contribute to downstream analyses. 3. The Case Studies section highlights several key projects, but it reads as descriptive rather than analytical. It would be more convincing if this section contained quantitative comparisons showing how applying the proposed standards increased reproducibility, efficiency, or interpretability over previous, unstandardized approaches. Answer: We have expanded the “Case studies” section to provide more background information and explanations regarding how pan-genome analysis has significantly improved and contributed to the downstream analyses. However, providing quantitative comparisons is, in our opinion, out of scope for this review paper. View more View less Competing Interests no competing interests reply Respond Report a concern Barmukh R. Peer Review Report For: White paper: standards for handling and analyzing plant pan-genomes [version 2; peer review: 2 approved, 2 approved with reservations] . F1000Research 2025, 14 :739 ( https://doi.org/10.5256/f1000research.191128.r434365) NOTE: it is important to ensure the information in square brackets after the title is included in this citation. The direct URL for this report is: https://f1000research.com/articles/14-739/v2#referee-response-434365 keyboard_arrow_left Back to all reports Reviewer Report 0 Views copyright © 2025 Xie X. This is an open access peer review report distributed under the terms of the Creative Commons Attribution License , which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited. 
24 Dec 2025 | for Version 2 Xiaoming Xie , Wheat Genetics and Genomics Center, China Agricultural University College of Agronomy and Biotechnology (Ringgold ID: 200630), Beijing, Beijing, China 0 Views copyright © 2025 Xie X. This is an open access peer review report distributed under the terms of the Creative Commons Attribution License , which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited. format_quote Cite this report speaker_notes Responses (0) Approved info_outline Alongside their report, reviewers assign a status to the article: Approved The paper is scientifically sound in its current form and only minor, if any, improvements are suggested Approved with reservations A number of small changes, sometimes more significant revisions are required to address specific details and improve the papers academic merit. Not approved Fundamental flaws in the paper seriously undermine the findings and conclusions I have no further comments to make. Competing Interests No competing interests were disclosed. Reviewer Expertise wheat pangenome, gene-based pangenome, comparative genomics I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard. reply Respond to this report Responses (0) Xie X. Peer Review Report For: White paper: standards for handling and analyzing plant pan-genomes [version 2; peer review: 2 approved, 2 approved with reservations] . F1000Research 2025, 14 :739 ( https://doi.org/10.5256/f1000research.191128.r433712) NOTE: it is important to ensure the information in square brackets after the title is included in this citation. The direct URL for this report is: https://f1000research.com/articles/14-739/v2#referee-response-433712 keyboard_arrow_left Back to all reports Reviewer Report 0 Views copyright © 2025 Sahu S. 
This is an open access peer review report distributed under the terms of the Creative Commons Attribution License , which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited. 25 Nov 2025 | for Version 2 Sunil Kumar Sahu , State Key Laboratory of Genome and Multi-omics Technologies, BGI Research, Shenzhen, China 0 Views copyright © 2025 Sahu S. This is an open access peer review report distributed under the terms of the Creative Commons Attribution License , which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited. format_quote Cite this report speaker_notes Responses (0) Approved info_outline Alongside their report, reviewers assign a status to the article: Approved The paper is scientifically sound in its current form and only minor, if any, improvements are suggested Approved with reservations A number of small changes, sometimes more significant revisions, are required to address specific details and improve the paper's academic merit. Not approved Fundamental flaws in the paper seriously undermine the findings and conclusions I am happy with the authors' thorough revision and detailed response. I have no further comments. Competing Interests No competing interests were disclosed. Reviewer Expertise Plant genomics and evolution I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard. reply Respond to this report Responses (0) Sahu SK. Peer Review Report For: White paper: standards for handling and analyzing plant pan-genomes [version 2; peer review: 2 approved, 2 approved with reservations] . F1000Research 2025, 14 :739 ( https://doi.org/10.5256/f1000research.191128.r433713) NOTE: it is important to ensure the information in square brackets after the title is included in this citation. 
The direct URL for this report is: https://f1000research.com/articles/14-739/v2#referee-response-433713 keyboard_arrow_left Back to all reports Reviewer Report 0 Views copyright © 2025 Xie X. This is an open access peer review report distributed under the terms of the Creative Commons Attribution License , which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited. 04 Sep 2025 | for Version 1 Xiaoming Xie , Wheat Genetics and Genomics Center, China Agricultural University College of Agronomy and Biotechnology (Ringgold ID: 200630), Beijing, Beijing, China 0 Views copyright © 2025 Xie X. This is an open access peer review report distributed under the terms of the Creative Commons Attribution License , which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited. format_quote Cite this report speaker_notes Responses (1) Approved With Reservations info_outline Alongside their report, reviewers assign a status to the article: Approved The paper is scientifically sound in its current form and only minor, if any, improvements are suggested Approved with reservations A number of small changes, sometimes more significant revisions, are required to address specific details and improve the paper's academic merit. Not approved Fundamental flaws in the paper seriously undermine the findings and conclusions This white paper by Heuermann et al. presents a timely and comprehensive framework aiming to establish community-wide standards for plant pan-genome analysis. The authors cover critical aspects from nomenclature and quality control to data sharing and visualization. This work represents a valuable and necessary initiative to promote FAIR principles in a rapidly evolving field. 
However, several major revisions are required to enhance its practical utility, scientific rigor, and overall impact before it can be endorsed as a foundational guide for the community. Major comments 1. Lack of Practical Guidance and Actionable Workflows. While the paper provides an exhaustive list of tools and standards, it currently functions more as a catalogue than a practical guide. A researcher new to the field would struggle to navigate the options and select the most appropriate methodology for their specific project. To address this, the authors should incorporate one or more decision-tree figures or summary tables that guide users based on their specific research context (e.g., species ploidy, data type, biological question). Such a resource would transform this document from a simple list into an indispensable, actionable guide. 2. Understated Importance of the Generalized Feature Identifier (GFI) Concept. The proposal of a 'Generalized Feature Identifier' (GFI) in the 'Future Directions' section is a highly innovative and critical idea. It elegantly addresses a major bottleneck in functionally annotating the non-genic 'dark matter' of pan-genomes, which is often overlooked. However, its placement as a future thought diminishes its significance. This concept should be introduced much earlier in the manuscript, possibly in the nomenclature section, and framed as a core recommendation of this white paper to highlight its forward-thinking contribution. 3. Imprecise Comparison of Linear- vs. Graph-Based Approaches. The distinction between linear- and graph-based pan-genomes in Section 5.1 is crucial, but the current description of linear approaches could be refined for greater accuracy and clarity. The manuscript conflates two distinct types of 'linear-based' analyses. It states that these approaches identify sequence-level variations (SNPs, indels) as well as gene-level presence/absence variations (PAVs). 
However, the tools cited as examples, such as OrthoFinder and Ensembl Compara, are primarily used for inferring orthology and identifying gene-level PAVs. They are not the primary tools for calling SNPs and small indels from whole-genome alignments (which typically involves a separate workflow with variant callers like GATK against a linear reference). This conflation creates an imprecise comparison with graph-based approaches, which are fundamentally designed to model sequence-level variation directly. To improve this section, we recommend the authors explicitly distinguish between: (a) Sequence-based linear analysis: Aligning multiple genomes to a single linear reference to call SNPs and indels. (b) Gene-based linear analysis: Using orthology inference tools on annotated gene sets to determine the pan-gene repertoire and gene-level PAVs. By separating these two concepts, the manuscript can provide a more accurate and nuanced comparison, highlighting how graph-based pan-genomes aim to integrate both types of variation in a way that requires distinct workflows in a traditional linear framework. Minor comments 1. The authors should adopt a more authoritative tone appropriate for a standards paper. Phrases like "probably more suited" (Section 2.3) should be replaced with definitive recommendations (e.g., "we recommend the use of...") to provide clear guidance. 2. In Section 4.3 (Metadata requirements), the list of mandatory fields should be expanded to include the specific versions of all software and pipelines used. This is essential for ensuring full reproducibility of the analyses. 3. The case studies in Section 6 are too brief to be impactful. Each case should be slightly expanded to illustrate how the application (or lack thereof) of the proposed standards directly impacted the project's outcomes, challenges, or successes. This would provide concrete evidence for the importance of the proposed standards. 4. 
Regarding the classification of genes into "core, shell, and cloud" (Section 2.3), it is crucial to state that the specific percentage thresholds used for these definitions must be explicitly reported in the metadata, as they can significantly impact downstream comparative analyses. Is the topic of the review discussed comprehensively in the context of the current literature? Yes Are all factual statements correct and adequately supported by citations? Yes Is the review written in accessible language? Partly Are the conclusions drawn appropriate in the context of the current research literature? Yes Competing Interests No competing interests were disclosed. Reviewer Expertise wheat pangenome, gene-based pangenome, comparative genomics I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard, however I have significant reservations, as outlined above. reply Respond to this report Responses (1) Author Response 24 Nov 2025 Marc Christian Heuermann, Reviewer 2 Xiaoming Xie ( https://orcid.org/0000-0002-7925-4964 ), Wheat Genetics and Genomics Center, China Agricultural University College of Agronomy and Biotechnology (Ringgold ID: 200630), Beijing, Beijing, China Approved with Reservations This white paper by Heuermann et al. presents a timely and comprehensive framework aiming to establish community-wide standards for plant pan-genome analysis. The authors cover critical aspects from nomenclature and quality control to data sharing and visualization. This work represents a valuable and necessary initiative to promote FAIR principles in a rapidly evolving field. However, several major revisions are required to enhance its practical utility, scientific rigor, and overall impact before it can be endorsed as a foundational guide for the community. Major comments 1. Lack of Practical Guidance and Actionable Workflows. 
While the paper provides an exhaustive list of tools and standards, it currently functions more as a catalogue than a practical guide. A researcher new to the field would struggle to navigate the options and select the most appropriate methodology for their specific project. To address this, the authors should incorporate one or more decision-tree figures or summary tables that guide users based on their specific research context (e.g., species ploidy, data type, biological question). Such a resource would transform this document from a simple list into an indispensable, actionable guide. Answer: Thank you for your insightful comments. Both reviewers raised this point, prompting us to create Figure 1, which clearly illustrates how each tool fits into the pan-genome analysis workflow. We have now cross-referenced the figure in both Section 3 and Section 5. 2. Understated Importance of the Generalized Feature Identifier (GFI) Concept. The proposal of a 'Generalized Feature Identifier' (GFI) in the 'Future Directions' section is a highly innovative and critical idea. It elegantly addresses a major bottleneck in functionally annotating the non-genic 'dark matter' of pan-genomes, which is often overlooked. However, its placement as a future thought diminishes its significance. This concept should be introduced much earlier in the manuscript, possibly in the nomenclature section, and framed as a core recommendation of this white paper to highlight its forward-thinking contribution. Answer: We agree with the assessment and have now positioned the GFI concept as paragraph 2.4. 3. Imprecise Comparison of Linear- vs. Graph-Based Approaches. The distinction between linear- and graph-based pan-genomes in Section 5.1 is crucial, but the current description of linear approaches could be refined for greater accuracy and clarity. The manuscript conflates two distinct types of 'linear-based' analyses. 
It states that these approaches identify sequence-level variations (SNPs, indels) as well as gene-level presence/absence variations (PAVs). However, the tools cited as examples, such as OrthoFinder and Ensembl Compara, are primarily used for inferring orthology and identifying gene-level PAVs. They are not the primary tools for calling SNPs and small indels from whole-genome alignments (which typically involves a separate workflow with variant callers like GATK against a linear reference). This conflation creates an imprecise comparison with graph-based approaches, which are fundamentally designed to model sequence-level variation directly. To improve this section, we recommend the authors explicitly distinguish between: (a) Sequence-based linear analysis: Aligning multiple genomes to a single linear reference to call SNPs and indels. (b) Gene-based linear analysis: Using orthology inference tools on annotated gene sets to determine the pan-gene repertoire and gene-level PAVs. By separating these two concepts, the manuscript can provide a more accurate and nuanced comparison, highlighting how graph-based pan-genomes aim to integrate both types of variation in a way that requires distinct workflows in a traditional linear framework. Answer: Thank you for this specific and helpful comment. We have reworked and updated our paragraph 5 accordingly. Minor comments 1. The authors should adopt a more authoritative tone appropriate for a standards paper. Phrases like "probably more suited" (Section 2.3) should be replaced with definitive recommendations (e.g., "we recommend the use of...") to provide clear guidance. Answer: Thank you for the suggestion. We rephrased the paragraph. 2. In Section 4.3 (Metadata requirements), the list of mandatory fields should be expanded to include the specific versions of all software and pipelines used. This is essential for ensuring full reproducibility of the analyses. 
Answer: Thanks, we have now addressed this important point and extended the paragraph to elaborate more on the importance of metadata requirements. 3. The case studies in Section 6 are too brief to be impactful. Each case should be slightly expanded to illustrate how the application (or lack thereof) of the proposed standards directly impacted the project's outcomes, challenges, or successes. This would provide concrete evidence for the importance of the proposed standards. Answer: Agreed. We updated the paragraph and extended the description of the case studies and their relevance. 4. Regarding the classification of genes into "core, shell, and cloud" (Section 2.3), it is crucial to state that the specific percentage thresholds used for these definitions must be explicitly reported in the metadata, as they can significantly impact downstream comparative analyses. Answer: We added a sentence to be more precise regarding this point. Is the topic of the review discussed comprehensively in the context of the current literature? Yes Are all factual statements correct and adequately supported by citations? Yes Is the review written in accessible language? Partly Are the conclusions drawn appropriate in the context of the current research literature? Yes View more View less Competing Interests No competing interests. reply Respond Report a concern Xie X. Peer Review Report For: White paper: standards for handling and analyzing plant pan-genomes [version 2; peer review: 2 approved, 2 approved with reservations] . F1000Research 2025, 14 :739 ( https://doi.org/10.5256/f1000research.183537.r404154) NOTE: it is important to ensure the information in square brackets after the title is included in this citation. The direct URL for this report is: https://f1000research.com/articles/14-739/v1#referee-response-404154 keyboard_arrow_left Back to all reports Reviewer Report 0 Views copyright © 2025 Sahu S. 
This is an open access peer review report distributed under the terms of the Creative Commons Attribution License , which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited. 03 Sep 2025 | for Version 1 Sunil Kumar Sahu , State Key Laboratory of Genome and Multi-omics Technologies, BGI Research, Shenzhen, China 0 Views copyright © 2025 Sahu S. This is an open access peer review report distributed under the terms of the Creative Commons Attribution License , which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited. format_quote Cite this report speaker_notes Responses (1) Approved With Reservations info_outline Alongside their report, reviewers assign a status to the article: Approved The paper is scientifically sound in its current form and only minor, if any, improvements are suggested Approved with reservations A number of small changes, sometimes more significant revisions are required to address specific details and improve the papers academic merit. Not approved Fundamental flaws in the paper seriously undermine the findings and conclusions This article presents a very comprehensive and thoughtful set of recommendations, covering a wide spectrum from naming conventions to quality control and data sharing. I enjoyed reading it and have a few suggestions that I believe could strengthen its impact and practicality for the community. My main thought is that the sheer breadth of recommendations, while excellent, might feel daunting for some labs, especially those with limited resources. To make the framework more accessible, it would be incredibly helpful if the authors could more clearly distinguish between what they consider essential "minimum standards" and what are "aspirational best practices." For instance, while the framework is well-described, I found myself wishing for a more concrete, practical roadmap. 
The QC section, for example, lists many excellent tools (FastQC, GenomeScope, QUAST, etc.), but a visual workflow diagram would be immensely valuable. A figure illustrating the step-by-step process from raw data QC, through assembly and annotation QC, to pan-genome QC would really help readers visualize how to integrate these tools into their own standardized processes. Finally, on the topic of quality control, the article does a great job listing the available tools but could go further in guiding users on how to apply them. For example, some guidance on tool selection would be useful, such as which aspects of QUAST or CRAQ are best for evaluating polyploid assemblies. It would also be helpful to address how to interpret conflicting results from different tools or databases. Furthermore, in the pan-genome section, the concept of "saturation analysis" is mentioned. It would strengthen this part to include some discussion on the sample size required to confidently claim saturation, particularly for species with different ploidy levels. These are all meant as constructive feedback to enhance what is already a very valuable and needed framework. I hope my comments are helpful. Is the topic of the review discussed comprehensively in the context of the current literature? Yes Are all factual statements correct and adequately supported by citations? Yes Is the review written in accessible language? Yes Are the conclusions drawn appropriate in the context of the current research literature? Yes Competing Interests No competing interests were disclosed. Reviewer Expertise Plant genomics and evolution I confirm that I have read this submission and believe that I have an appropriate level of expertise to confirm that it is of an acceptable scientific standard, however I have significant reservations, as outlined above. 
reply Respond to this report Responses (1) Author Response 24 Nov 2025 Marc Christian Heuermann, Reviewer 1 Sunil Kumar Sahu ( https://orcid.org/0000-0002-4742-9870 ), State Key Laboratory of Genome and Multi-omics Technologies, BGI Research, Shenzhen, China Approved with Reservations This article presents a very comprehensive and thoughtful set of recommendations, covering a wide spectrum from naming conventions to quality control and data sharing. I enjoyed reading it and have a few suggestions that I believe could strengthen its impact and practicality for the community. My main thought is that the sheer breadth of recommendations, while excellent, might feel daunting for some labs, especially those with limited resources. To make the framework more accessible, it would be incredibly helpful if the authors could more clearly distinguish between what they consider essential "minimum standards" and what are "aspirational best practices." For instance, while the framework is well-described, I found myself wishing for a more concrete, practical roadmap. The QC section, for example, lists many excellent tools (FastQC, GenomeScope, QUAST, etc.), but a visual workflow diagram would be immensely valuable. A figure illustrating the step-by-step process from raw data QC, through assembly and annotation QC, to pan-genome QC would really help readers visualize how to integrate these tools into their own standardized processes. Answer: Thank you for your constructive feedback. We have added Figure 1 to the manuscript to clearly illustrate the recommended tools for each step of the pan-genome analysis workflow. The figure is now cross-referenced in both Section 3 and Section 5 for better integration with the discussed content. Finally, on the topic of quality control, the article does a great job listing the available tools but could go further in guiding users on how to apply them. 
For example, some guidance on tool selection would be useful, such as which aspects of QUAST or CRAQ are best for evaluating polyploid assemblies. It would also be helpful to address how to interpret conflicting results from different tools or databases. Furthermore, in the pan-genome section, the concept of "saturation analysis" is mentioned. It would strengthen this part to include some discussion on the sample size required to confidently claim saturation, particularly for species with different ploidy levels. These are all meant as constructive feedback to enhance what is already a very valuable and needed framework. I hope my comments are helpful. Answer: We have revised section 3. Quality Control (QC) Standards to fully incorporate your suggestions. Is the topic of the review discussed comprehensively in the context of the current literature? Yes Are all factual statements correct and adequately supported by citations? Yes Is the review written in accessible language? Yes Are the conclusions drawn appropriate in the context of the current research literature? Yes View more View less Competing Interests No competing interests. reply Respond Report a concern Sahu SK. Peer Review Report For: White paper: standards for handling and analyzing plant pan-genomes [version 2; peer review: 2 approved, 2 approved with reservations] . F1000Research 2025, 14 :739 ( https://doi.org/10.5256/f1000research.183537.r404153) NOTE: it is important to ensure the information in square brackets after the title is included in this citation. 
The direct URL for this report is: https://f1000research.com/articles/14-739/v1#referee-response-404153 Alongside their report, reviewers assign a status to the article: Approved - the paper is scientifically sound in its current form and only minor, if any, improvements are suggested Approved with reservations - A number of small changes, sometimes more significant revisions are required to address specific details and improve the papers academic merit. Not approved - fundamental flaws in the paper seriously undermine the findings and conclusions Adjust parameters to alter display View on desktop for interactive features Includes Interactive Elements View on desktop for interactive features Competing Interests Policy Provide sufficient details of any financial or non-financial competing interests to enable users to assess whether your comments might lead a reasonable person to question your impartiality. Consider the following examples, but note that this is not an exhaustive list: Examples of 'Non-Financial Competing Interests' Within the past 4 years, you have held joint grants, published or collaborated with any of the authors of the selected paper. You have a close personal relationship (e.g. parent, spouse, sibling, or domestic partner) with any of the authors. You are a close professional associate of any of the authors (e.g. scientific mentor, recent student). You work at the same institute as any of the authors. You hope/expect to benefit (e.g. favour or employment) as a result of your submission. You are an Editor for the journal in which the article is published. Examples of 'Financial Competing Interests' You expect to receive, or in the past 4 years have received, any of the following from any commercial organisation that may gain financially from your submission: a salary, fees, funding, reimbursements. You expect to receive, or in the past 4 years have received, shared grant support or other funding with any of the authors. 
You hold, or are currently applying for, any patents or significant stocks/shares relating to the subject matter of the paper you are commenting on. Stay Updated Sign up for content alerts and receive a weekly or monthly email with all newly published articles Register with F1000Research Already registered? Sign in Not now, thanks close PLEASE NOTE If you are an AUTHOR of this article, please check that you signed in with the account associated with this article otherwise we cannot automatically identify your role as an author and your comment will be labelled as a “User Comment”. If you are a REVIEWER of this article, please check that you have signed in with the account associated with this article and then go to your account to submit your report, please do not post your review here. If you do not have access to your original account, please contact us . All commenters must hold a formal affiliation as per our Policies . The information that you give us will be displayed next to your comment. User comments must be in English, comprehensible and relevant to the article under discussion. We reserve the right to remove any comments that we consider to be inappropriate, offensive or otherwise in breach of the User Comment Terms and Conditions . Commenters must not use a comment for personal attacks. When criticisms of the article are based on unpublished data, the data should be made available. I accept the User Comment Terms and Conditions Please confirm that you accept the User Comment Terms and Conditions. Affiliation ✕ refresh Please enter your institution. Note: To add your institution or organisation, start typing the name and then select the correct name from the list. Where applicable, the name will appear in both the original language and in English. Do not paste in the name. If the name does not appear in the drop-down list, we will display the information you have entered. 
✕ refresh Country/Region * USA UK Canada China France Germany Afghanistan Aland Islands Albania Algeria American Samoa Andorra Angola Anguilla Antarctica Antigua and Barbuda Argentina Armenia Aruba Australia Austria Azerbaijan Bahamas Bahrain Bangladesh Barbados Belarus Belgium Belize Benin Bermuda Bhutan Bolivia Bosnia and Herzegovina Botswana Bouvet Island Brazil British Indian Ocean Territory British Virgin Islands Brunei Bulgaria Burkina Faso Burundi Cambodia Cameroon Canada Cape Verde Cayman Islands Central African Republic Chad Chile China Christmas Island Cocos (Keeling) Islands Colombia Comoros Congo Cook Islands Costa Rica Cote d'Ivoire Croatia Cuba Cyprus Czech Republic Democratic Republic of the Congo Denmark Djibouti Dominica Dominican Republic Ecuador Egypt El Salvador Equatorial Guinea Eritrea Estonia Ethiopia Falkland Islands Faroe Islands Federated States of Micronesia Fiji Finland France French Guiana French Polynesia French Southern Territories Gabon Georgia Germany Ghana Gibraltar Greece Greenland Grenada Guadeloupe Guam Guatemala Guernsey Guinea Guinea-Bissau Guyana Haiti Heard Island and Mcdonald Islands Holy See (Vatican City State) Honduras Hong Kong Hungary Iceland India Indonesia Iran Iraq Ireland Israel Italy Jamaica Japan Jersey Jordan Kazakhstan Kenya Kiribati Kosovo (Serbia and Montenegro) Kuwait Kyrgyzstan Lao People's Democratic Republic Latvia Lebanon Lesotho Liberia Libya Liechtenstein Lithuania Luxembourg Macao Madagascar Malawi Malaysia Maldives Mali Malta Marshall Islands Martinique Mauritania Mauritius Mayotte Mexico Minor Outlying Islands of the United States Moldova Monaco Mongolia Montenegro Montserrat Morocco Mozambique Myanmar Namibia Nauru Nepal Netherlands Antilles New Caledonia New Zealand Nicaragua Niger Nigeria Niue Norfolk Island North Korea North Macedonia Northern Mariana Islands Norway Oman Pakistan Palau Palestinian Territory Panama Papua New Guinea Paraguay Peru Philippines Pitcairn Poland Portugal Puerto Rico 
Qatar Reunion Romania Russian Federation Rwanda Saint Helena Saint Kitts and Nevis Saint Lucia Saint Pierre and Miquelon Saint Vincent and the Grenadines Samoa San Marino Sao Tome and Principe Saudi Arabia Senegal Serbia Seychelles Sierra Leone Singapore Slovakia Slovenia Solomon Islands Somalia South Africa South Georgia and the South Sandwich Is South Korea South Sudan Spain Sri Lanka Sudan Suriname Svalbard and Jan Mayen Swaziland Sweden Switzerland Syria Taiwan Tajikistan Tanzania Thailand The Gambia The Netherlands Timor-Leste Togo Tokelau Tonga Trinidad and Tobago Tunisia Turkey Turkmenistan Turks and Caicos Islands Tuvalu UK USA Uganda Ukraine United Arab Emirates United States Virgin Islands Uruguay Uzbekistan Vanuatu Venezuela Vietnam Wallis and Futuna West Bank and Gaza Strip Western Sahara Yemen Zambia Zimbabwe Please select your country/region. You must enter a comment. Competing Interests Please disclose any competing interests that might be construed to influence your judgment of the article's or peer review report's validity or importance. Competing Interests Policy Provide sufficient details of any financial or non-financial competing interests to enable users to assess whether your comments might lead a reasonable person to question your impartiality. Consider the following examples, but note that this is not an exhaustive list: Examples of 'Non-Financial Competing Interests' Within the past 4 years, you have held joint grants, published or collaborated with any of the authors of the selected paper. You have a close personal relationship (e.g. parent, spouse, sibling, or domestic partner) with any of the authors. You are a close professional associate of any of the authors (e.g. scientific mentor, recent student). You work at the same institute as any of the authors. You hope/expect to benefit (e.g. favour or employment) as a result of your submission. You are an Editor for the journal in which the article is published. 
Examples of 'Financial Competing Interests' You expect to receive, or in the past 4 years have received, any of the following from any commercial organisation that may gain financially from your submission: a salary, fees, funding, reimbursements. You expect to receive, or in the past 4 years have received, shared grant support or other funding with any of the authors. You hold, or are currently applying for, any patents or significant stocks/shares relating to the subject matter of the paper you are commenting on. Please state your competing interests The comment has been saved. An error has occurred. Please try again. Cancel Post var lTitle = "White paper: standards for handling and analyzing...".replace("'", ''); var linkedInUrl = "http://www.linkedin.com/shareArticle?url=https://f1000research.com/articles/14-739/v2" + "&title=" + encodeURIComponent(lTitle) + "&summary=" + encodeURIComponent('Read the article by '); var deliciousUrl = "https://del.icio.us/post?url=https://f1000research.com/articles/14-739/v2&title=" + encodeURIComponent(lTitle); var redditUrl = "http://reddit.com/submit?url=https://f1000research.com/articles/14-739/v2" + "&title=" + encodeURIComponent(lTitle); linkedInUrl += encodeURIComponent('Heuermann MC et al.'); var offsetTop = /chrome/i.test( navigator.userAgent ) ? 
4 : -10; var addthis_config = { ui_offset_top: offsetTop, services_compact : "facebook,twitter,www.linkedin.com,www.mendeley.com,reddit.com", services_expanded : "facebook,twitter,www.linkedin.com,www.mendeley.com,reddit.com", services_custom : [ { name: "LinkedIn", url: linkedInUrl, icon:"/img/icon/at_linkedin.svg" }, { name: "Mendeley", url: "http://www.mendeley.com/import/?url=https://f1000research.com/articles/14-739/v2/mendeley", icon:"/img/icon/at_mendeley.svg" }, { name: "Reddit", url: redditUrl, icon:"/img/icon/at_reddit.svg" }, ] }; var addthis_share = { url: "https://f1000research.com/articles/14-739", templates : { twitter : "White paper: standards for handling and analyzing plant pan-genomes. Heuermann MC et al., published by " + "@F1000Research" + ", https://f1000research.com/articles/14-739/v2" } }; if (typeof(addthis) != "undefined"){ addthis.addEventListener('addthis.ready', checkCount); addthis.addEventListener('addthis.menu.share', checkCount); } $(".f1r-shares-twitter").attr("href", "https://twitter.com/intent/tweet?text=" + addthis_share.templates.twitter); $(".f1r-shares-facebook").attr("href", "https://www.facebook.com/sharer/sharer.php?u=" + addthis_share.url); $(".f1r-shares-linkedin").attr("href", addthis_config.services_custom[0].url); $(".f1r-shares-reddit").attr("href", addthis_config.services_custom[2].url); $(".f1r-shares-mendelay").attr("href", addthis_config.services_custom[1].url); function checkCount(){ setTimeout(function(){ $(".addthis_button_expanded").each(function(){ var count = $(this).text(); if (count !== "" && count != "0") $(this).removeClass("is-hidden"); else $(this).addClass("is-hidden"); }); }, 1000); } close How to cite this report {{reportCitation}} Cancel Copy Citation Details $(function(){R.ui.buttonDropdowns('.dropdown-for-downloads');}); $(function(){R.ui.toolbarDropdowns('.toolbar-dropdown-for-downloads');}); $.get("/articles/acj/166538/191128") new F1000.Clipboard(); new F1000.ThesaurusTermsDisplay("articles", 
"article", "191128"); $(document).ready(function() { $( "#frame1" ).on('load', function() { var mydiv = $(this).contents().find("div"); var h = mydiv.height(); console.log(h) }); var tooltipLivingFigure = jQuery(".interactive-living-figure-label .icon-more-info"), titleLivingFigure = tooltipLivingFigure.attr("title"); tooltipLivingFigure.simpletip({ fixed: true, position: ["-115", "30"], baseClass: 'small-tooltip', content:titleLivingFigure + " " }); tooltipLivingFigure.removeAttr("title"); $("body").on("click", ".cite-living-figure", function(e) { e.preventDefault(); var ref = $(this).attr("data-ref"); $(this).closest(".living-figure-list-container").find("#" + ref).fadeIn(200); }); $("body").on("click", ".close-cite-living-figure", function(e) { e.preventDefault(); $(this).closest(".popup-window-wrapper").fadeOut(200); }); $(document).on("mouseup", function(e) { var metricsContainer = $(".article-metrics-popover-wrapper"); if (!metricsContainer.is(e.target) && metricsContainer.has(e.target).length === 0) { $(".article-metrics-close-button").click(); } }); var articleId = $('#articleId').val(); if($("#main-article-count-box").attachArticleMetrics) { $("#main-article-count-box").attachArticleMetrics(articleId, { articleMetricsView: true }); } }); var figshareWidget = $(".new_figshare_widget"); if (figshareWidget.length > 0) { window.figshare.load("f1000", function(Widget) { // Select a tag/tags defined in your page. In this tag we will place the widget. _.map(figshareWidget, function(el){ var widget = new Widget({ articleId: $(el).attr("figshare_articleId") //height:300 // this is the height of the viewer part. [Default: 550] }); widget.initialize(); // initialize the widget widget.mount(el); // mount it in a tag that's on your page // this will save the widget on the global scope for later use from // your JS scripts. This line is optional. 
//window.widget = widget; }); }); } close Error Close Add Reset F1000.MICROSERVICES.AFFILIATION = ''; $(document).ready(function () { $('.js-affiliations-form').each((index, form) => { new AffiliationForm({ formId: form.id, institutionErrorSelector: '.comment-enter-institution', departmentErrorSelector: '.comment-enter-department', placeSelector: '.js-add-comment-place', stateSelector: '.js-add-comment-state', zipCodeSelector: '.js-add-comment-zipcode', countrySelector: '.js-add-comment-country', countryErrorSelector: '.comment-enter-country', }); }); }); $(document).ready(function () { var reportIds = { "436510": 22, "436511": 0, "436508": 0, "482397": 5, "436509": 0, "482396": 0, "436506": 0, "482395": 0, "436507": 0, "482394": 0, "436504": 0, "436505": 0, "436512": 0, "436513": 0, "401966": 0, "401967": 0, "401964": 0, "401965": 0, "401963": 0, "434358": 0, "404150": 0, "434359": 0, "404151": 0, "401972": 0, "404148": 0, "404149": 0, "401970": 0, "401971": 0, "433712": 14, "401968": 0, "433713": 22, "401969": 0, "434366": 0, "434367": 0, "434364": 0, "404156": 0, "434365": 23, "404157": 0, "434362": 0, "404154": 34, "434363": 0, "404155": 0, "434360": 0, "404152": 0, "434361": 0, "404153": 43, }; $(".referee-response-container,.js-referee-report").each(function(index, el) { var reportId = $(el).attr("data-reportid"), reportCount = reportIds[reportId] || 0; $(el).find(".comments-count-container,.js-referee-report-views").html(reportCount); }); var uuidInput = $("#article_uuid"), oldUUId = uuidInput.val(), newUUId = "397895c9-8913-4297-baf9-d4a7313e4036"; uuidInput.val(newUUId); $("a[href*='article_uuid=']").each(function(index, el) { var newHref = $(el).attr("href").replace(oldUUId, newUUId); $(el).attr("href", newHref); }); }); An innovative open access publishing platform offering rapid publication and open peer review, whilst supporting data deposition and sharing. 
Browse Gateways Collections How it Works Contact For Developers Cookie Notice Privacy Notice RSS Submit Your Research Follow us © 2012-2026 F1000 Research Ltd. ISSN 2046-1402 | Legal | Partner of Research4Life • CrossRef • ORCID • FAIRSharing R.templateTests.simpleTemplate = R.template(' $text $text $text $text $text '); R.templateTests.runTests(); var F1000platform = new F1000.Platform({ name: "f1000research", displayName: "F1000Research", hostName: "f1000research.com", id: "1", editorialEmail: "[email protected]", infoEmail: "[email protected]", usePmcStats: true }); $(function(){R.ui.dropdowns('.dropdown-for-authors, .dropdown-for-about, .dropdown-for-myresearch');}); // $(function(){R.ui.dropdowns('.dropdown-for-referees');}); $(document).ready(function () { if ($(".cookie-warning").is(":visible")) { $(".sticky").css("margin-bottom", "35px"); $(".devices").addClass("devices-and-cookie-warning"); } $(".cookie-warning .close-button").click(function (e) { $(".devices").removeClass("devices-and-cookie-warning"); $(".sticky").css("margin-bottom", "0"); }); $("#tweeter-feed .tweet-message").each(function (i, message) { var self = $(message); self.html(linkify(self.html())); }); $(".partner").on("mouseenter mouseleave", function() { $(this).find(".gray-scale, .colour").toggleClass("is-hidden"); }); }); Sign In Remember me Forgotten your password? Sign In Cancel Email or password not correct. Please try again Please wait... $(function(){ // Note: All the setup needs to run against a name attribute and *not* the id due the clonish // nature of facebox... 
$("a[id=googleSignInButton]").click(function(event){ event.preventDefault(); $("input[id=oAuthSystem]").val("GOOGLE"); $("form[id=oAuthForm]").submit(); }); $("a[id=facebookSignInButton]").click(function(event){ event.preventDefault(); $("input[id=oAuthSystem]").val("FACEBOOK"); $("form[id=oAuthForm]").submit(); }); $("a[id=orcidSignInButton]").click(function(event){ event.preventDefault(); $("input[id=oAuthSystem]").val("ORCID"); $("form[id=oAuthForm]").submit(); }); }); If you've forgotten your password, please enter your email address below and we'll send you instructions on how to reset your password. The email address should be the one you originally registered with F1000. Email address not valid, please try again You registered with F1000 via Google, so we cannot reset your password. To sign in, please click here . If you still need help with your Google account password, please click here . You registered with F1000 via Facebook, so we cannot reset your password. To sign in, please click here . If you still need help with your Facebook account password, please click here . Code not correct, please try again Reset password Cancel Email us for further assistance. Server error, please try again. If your email address is registered with us, we will email you instructions to reset your password. If you think you should have received this email but it has not arrived, please check your spam filters and/or contact for further assistance. Please wait... Register $(document).ready(function () { signIn.createSignInAsRow($("#sign-in-form-gfb-popup")); $(".target-field").each(function () { var uris = $(this).val().split("/"); if (uris.pop() === "login") { $(this).val(uris.toString().replace(",","/")); } }); });

Text is read by the "Ask this paper" AI Q&A widget below. Extraction quality varies by source — PMC NXML preserves structure cleanly, OA-HTML may include some navigation residue, and OA-PDF can have broken hyphenation. The publisher copy (via DOI) is the canonical version.

My notes (saved in your browser only)

⚙ Ask this paper AI returns verbatim quotes from the full text · source: preprint-html ⓘ

Answers must be backed by verbatim quotes from this paper's full text. Hallucinated quotes are dropped automatically; if no verbatim passage answers the question, we say so. How this works

Citation neighborhood (no data yet)

We don't have any in-corpus citations linked to this paper yet. This is a recent paper (2025) — citers typically take a year or two to land, and the OpenAlex reference graph may still be filling in.

Source provenance

europepmc: last seen: 2026-05-20T01:45:00.602351+00:00
unpaywall: last seen: 2026-05-23T02:00:01.238055+00:00

License: CC-BY-4.0