<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.1 20151215//EN" "http://jats.nlm.nih.gov/publishing/1.1/JATS-journalpublishing1.dtd">
<article xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:mml="http://www.w3.org/1998/Math/MathML" xml:lang="en" article-type="research-article" dtd-version="1.1">
  <front>
    <journal-meta>
      <journal-id journal-id-type="pmc">Phyton</journal-id>
      <journal-id journal-id-type="nlm-ta">Phyton</journal-id>
      <journal-id journal-id-type="publisher-id">Phyton</journal-id>
      <journal-title-group>
        <journal-title>Phyton-International Journal of Experimental Botany</journal-title>
      </journal-title-group>
      <issn pub-type="epub">1851-5657</issn>
      <issn pub-type="ppub">0031-9457</issn>
      <publisher>
        <publisher-name>Tech Science Press</publisher-name>
        <publisher-loc>USA</publisher-loc>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="publisher-id">73509</article-id>
      <article-id pub-id-type="doi">10.32604/phyton.2026.073509</article-id>
      <article-categories>
        <subj-group subj-group-type="heading">
          <subject>Article</subject>
        </subj-group>
      </article-categories>
      <title-group>
        <article-title>A Comprehensive Expression Atlas of <italic>Nicotiana tabacum</italic>: Revealing Specificity Expression Patterns and Regulatory Variants</article-title>
        <alt-title alt-title-type="left-running-head">A Comprehensive Expression Atlas of <italic>Nicotiana tabacum</italic>: Revealing Specificity Expression Patterns and Regulatory Variants</alt-title>
        <alt-title alt-title-type="right-running-head">A Comprehensive Expression Atlas of <italic>Nicotiana tabacum</italic>: Revealing Specificity Expression Patterns and Regulatory Variants</alt-title>
      </title-group>
      <contrib-group>
        <contrib id="author-1" contrib-type="author">
          <name name-style="western">
            <surname>Yu</surname>
            <given-names>Shizhou</given-names>
          </name>
          <xref ref-type="aff" rid="aff-1">1</xref>
          <xref ref-type="aff" rid="aff-2">2</xref>
        </contrib>
        <contrib id="author-2" contrib-type="author">
          <name name-style="western">
            <surname>Zhang</surname>
            <given-names>Jie</given-names>
          </name>
          <xref ref-type="aff" rid="aff-1">1</xref>
        </contrib>
        <contrib id="author-3" contrib-type="author">
          <name name-style="western">
            <surname>Cao</surname>
            <given-names>Linggai</given-names>
          </name>
          <xref ref-type="aff" rid="aff-1">1</xref>
        </contrib>
        <contrib id="author-4" contrib-type="author">
          <name name-style="western">
            <surname>Liu</surname>
            <given-names>Jie</given-names>
          </name>
          <xref ref-type="aff" rid="aff-1">1</xref>
        </contrib>
        <contrib id="author-5" contrib-type="author">
          <name name-style="western">
            <surname>Lu</surname>
            <given-names>Peng</given-names>
          </name>
          <xref ref-type="aff" rid="aff-3">3</xref>
        </contrib>
        <contrib id="author-6" contrib-type="author">
          <name name-style="western">
            <surname>Tao</surname>
            <given-names>Jiemeng</given-names>
          </name>
          <xref ref-type="aff" rid="aff-3">3</xref>
        </contrib>
        <contrib id="author-7" contrib-type="author">
          <name name-style="western">
            <surname>Ren</surname>
            <given-names>Xueliang</given-names>
          </name>
          <xref ref-type="aff" rid="aff-1">1</xref>
        </contrib>
        <contrib id="author-8" contrib-type="author" corresp="yes">
          <name name-style="western">
            <surname>Yang</surname>
            <given-names>Zhixiao</given-names>
          </name>
          <xref ref-type="aff" rid="aff-1">1</xref>
          <xref ref-type="aff" rid="aff-2">2</xref>
          <email>linyingxian2006@126.com</email>
        </contrib>
        <aff id="aff-1">
          <label>1</label>
          <institution>Molecular Genetics Key Laboratory of China Tobacco, Guizhou Academy of Tobacco Science</institution>, <addr-line>Guiyang</addr-line>, <country>China</country>
        </aff>
        <aff id="aff-2">
          <label>2</label>
          <institution>Guizhou Provincial Key Laboratory for Tobacco Quality Improvement and Efficiency Enhancement</institution>, <addr-line>Guiyang</addr-line>, <country>China</country>
        </aff>
        <aff id="aff-3">
          <label>3</label>
          <institution>China Tobacco Gene Research Center, Zhengzhou Tobacco Research Institute of CNTC</institution>, <addr-line>Zhengzhou</addr-line>, <country>China</country>
        </aff>
      </contrib-group>
      <author-notes>
        <corresp id="cor1"><label>*</label>Corresponding Author: Zhixiao Yang. Email: <email>linyingxian2006@126.com</email></corresp>
      </author-notes>
      <pub-date date-type="collection" publication-format="electronic">
        <year>2026</year>
      </pub-date>
      <pub-date date-type="pub" publication-format="electronic">
        <day>28</day>
        <month>2</month>
        <year>2026</year>
      </pub-date>
      <volume>95</volume>
      <issue>2</issue>
      <elocation-id>6</elocation-id>
      <history>
        <date date-type="received">
          <day>19</day>
          <month>9</month>
          <year>2025</year>
        </date>
        <date date-type="accepted">
          <day>08</day>
          <month>1</month>
          <year>2026</year>
        </date>
      </history>
      <permissions>
        <copyright-statement>&#xA9; 2026 The Authors. Published by Tech Science Press.</copyright-statement>
        <copyright-year>2026</copyright-year>
        <copyright-holder>The Authors</copyright-holder>
        <license xlink:href="https://creativecommons.org/licenses/by/4.0/">
          <license-p>This work is licensed under a <ext-link ext-link-type="uri" xlink:type="simple" xlink:href="https://creativecommons.org/licenses/by/4.0/">Creative Commons Attribution 4.0 International License</ext-link>, which permits unrestricted use, distribution, and reproduction in any medium, provided the original work is properly cited.</license-p>
        </license>
      </permissions>
      <self-uri content-type="pdf" xlink:href="Phyton-95-73509.pdf"/>
      <abstract>
        <p>Tobacco (<italic>Nicotiana tabacum</italic>, 2n = 48) is a key non-food economic crop, yet its stress response and gene regulatory mechanisms remain poorly understood. By analyzing 603 transcriptome datasets, this study identified 1405 tissue-specific genes, revealing tissue-specific synthesis of terpenoids and other ecologically important secondary metabolites in sepals and other tissues. Comparative stress-response analysis highlighted distinct gene expression patterns in leaves and roots under biotic and abiotic stresses. Additionally, 28,396 expression quantitative trait loci (eQTLs) were mapped in leaves, offering valuable genetic regulatory markers. These findings provide crucial insights into tobacco&#x2019;s gene expression characteristics and their functional implications, serving as a foundation for future research. </p>
      </abstract>
      <kwd-group kwd-group-type="author">
        <kwd>Tobacco</kwd>
        <kwd>eQTLs</kwd>
        <kwd>regulatory loci</kwd>
        <kwd>transcriptional atlas</kwd>
      </kwd-group>
      <funding-group>
        <award-group id="awg1">
          <funding-source>Guizhou Provincial Basic Research Program (Natural Science)</funding-source>
          <award-id>(2024) 648</award-id>
        </award-group>
		<award-group id="awg2">
          <funding-source>Program of China National Tobacco Corporation</funding-source>
          <award-id>110202101032(JY-09)</award-id>
		  <award-id>110202201003(JY-03)</award-id>
        </award-group>
		<award-group id="awg3">
          <funding-source>Program of Guizhou Branch of China National Tobacco Corporation</funding-source>
          <award-id>2023XM02</award-id>
		  <award-id>2022XM05</award-id>
		  <award-id>2024XM01</award-id>
        </award-group>
		<award-group id="awg4">
          <funding-source>Qiankehe Platform Project</funding-source>
          <award-id>ZSYS [2025] 028</award-id>
        </award-group>
		<award-group id="awg5">
          <funding-source>Program of China National Tobacco Corporation</funding-source>
          <award-id>110202102034</award-id>
        </award-group>
      </funding-group>
    </article-meta>
  </front>
  <body>
    <sec id="s1">
      <label>1</label>
      <title>Introduction</title>
      <p>Plant development is a continuous process, and with the continuous generation and development of new organs, gene expression and regulation undergo constant changes, forming a complex network [<xref ref-type="bibr" rid="ref-1">1</xref>]. In such processes, studying gene expression patterns contributes to understanding the mechanisms of development and regulation. The utilization of spatiotemporal transcriptome sequencing is an important approach to elucidate such regulatory networks, and detailed transcriptional atlases of many important plants have already been outlined [<xref ref-type="bibr" rid="ref-2">2</xref>,<xref ref-type="bibr" rid="ref-3">3</xref>]. In addition, several tools have also been developed for the analysis of expression atlases [<xref ref-type="bibr" rid="ref-4">4</xref>,<xref ref-type="bibr" rid="ref-5">5</xref>]. However, in comparison to research on animals, studies on plant transcriptional atlases often lack sufficient sampling across different organs and over time; for example, a transcriptional atlas of pigs was constructed using samples from 31 pig organs and 2 pig cell lines [<xref ref-type="bibr" rid="ref-6">6</xref>]. This extensive sampling is crucial for understanding the complex transcriptional landscape and its variations. Similarly, to gain a comprehensive understanding of the plant transcriptome, sampling across various organs and developmental stages, as well as different environmental conditions, is essential.</p>
      <p>Constructing a large-scale transcriptional atlas is costly, so another approach to understanding certain features of plant development is through unified reanalysis by integrating different datasets. For example, in soybean research, a study gathered over 5000 RNA-seq datasets for analysis and constructed a transcriptional atlas database for soybeans [<xref ref-type="bibr" rid="ref-7">7</xref>]. For species with limited database resources, research has provided insights into the transcriptional characteristics of individual species through plant cultivation and transcriptome sequencing analysis. For example, Xanthopoulou et al. collected samples of seeds, sprouts, stem leaves, tender and mature leaves, male and female flowers, fruits at seven developmental stages, and primary and lateral roots and constructed a comprehensive gene expression atlas for Cucurbita pepo [<xref ref-type="bibr" rid="ref-8">8</xref>]. However, data obtained from individual organisms lack population-level insights. When studying temporal and spatial transcriptional features, research on the regulation of gene expression should not be overlooked. Two impressive large-sample analysis studies focusing on the transcriptional atlas of pigs and cattle not only revealed the tissue-specific expression characteristics of genes in pigs and cattle but also importantly identified numerous regulatory loci in the genome [<xref ref-type="bibr" rid="ref-9">9</xref>,<xref ref-type="bibr" rid="ref-10">10</xref>].</p>
      <p>Tobacco, an important economic crop, faces various biotic and abiotic stresses during its growth, which significantly impact tobacco growth and the tobacco industry. Transcriptome sequencing analysis is commonly employed to study stress response mechanisms in tobacco. For example, cadmium can inhibit tobacco growth and reduce leaf quality, and its presence in tobacco smoke affects the health of both smokers and the surrounding environment. Hence, studies have elucidated the mechanisms of cadmium accumulation and tolerance in tobacco leaves through transcriptome sequencing and analysis [<xref ref-type="bibr" rid="ref-11">11</xref>]. By comparing the transcriptomes of plants with differential cold tolerance between two tobacco cultivars, important candidate genes for cold stress resistance, such as NtCBF2, have been identified [<xref ref-type="bibr" rid="ref-12">12</xref>]. The accumulation of transcriptome analysis data provides possibilities for conducting tobacco transcriptomic studies through data collection methods.</p>
      <p>This study manually collected and screened RNA-seq data originating from 35 independent research projects involving various tobacco tissues and treatments. Through comprehensive analysis, genes exhibiting tissue-specific expression patterns and the similarities and differences in tobacco responses to different stresses were identified. Single-nucleotide polymorphism (SNP) calling based on RNA-seq and identification of eQTLs provide rich genetic regulatory loci for tobacco gene expression. This study presents a comprehensive analysis of tobacco transcriptome levels and features, which provides valuable assistance in accelerating tobacco research.</p>
    </sec>
    <sec id="s2">
      <label>2</label>
      <title>Materials and Methods</title>
      <sec id="s2_1">
        <label>2.1</label>
        <title>Data Sources</title>
        <p>We retrieved RNA-seq data for 35 BioProjects from National Center for Biotechnology Information (NCBI) through literature mining, encompassing 603 samples across 13 tissues (<xref ref-type="sec" rid="supplementary-materials">Supplementary Table S1</xref>). Genomic data pertinent to tobacco were obtained from the Sol Genomics Network database (<ext-link ext-link-type="uri" xlink:href="https://solgenomics.net/">https://solgenomics.net/</ext-link>). The genome published by Edwards et al. [<xref ref-type="bibr" rid="ref-13">13</xref>] was used as a reference.</p>
      </sec>
      <sec id="s2_2">
        <label>2.2</label>
        <title>Gene Expression Analysis</title>
        <p>The original data were converted to fastq format using fastq-dump from the SRA Toolkit v3.0.5 (<ext-link ext-link-type="uri" xlink:href="https://github.com/ncbi/sra-tools">https://github.com/ncbi/sra-tools</ext-link>). Subsequently, adapter sequences and low-quality sequences in the fastq were removed using fastp with default parameters [<xref ref-type="bibr" rid="ref-14">14</xref>]. After obtaining clean data, the transcriptome data were mapped to the reference genome using STAR (v2.7.10a) [<xref ref-type="bibr" rid="ref-15">15</xref>]. Subsequently, StringTie (v2.1.7) [<xref ref-type="bibr" rid="ref-16">16</xref>] with default parameters was used in conjunction with the annotation of the reference genome to quantify gene expression levels. The gene expression levels were subjected to t-distributed stochastic neighbour embedding (tSNE) clustering using the R package Rtsne (v0.16) [<xref ref-type="bibr" rid="ref-17">17</xref>], and the umap (v0.2.10.0) package was utilized for uniform manifold approximation and projection (UMAP) clustering of gene expression [<xref ref-type="bibr" rid="ref-18">18</xref>].</p>
      </sec>
      <sec id="s2_3">
        <label>2.3</label>
        <title>Analysis of Tissue-Specific Genes in Tobacco</title>
        <p>We utilized the median transcripts per million (TPM) values of genes in each tissue (calculated with R function media) for calculation of the tissue-specific index (TSI). Genes with a median expression level less than 0.1 TPM were assigned a value of 0. TPM values were then log2 transformed (TPM + 1). Subsequently, all genes or transcripts with accumulated expression values less than 0.1 were excluded from the analysis to filter out genes with low expression or transcripts with low expression [<xref ref-type="bibr" rid="ref-19">19</xref>].</p>
        <p>The formula for calculating the TSI is as follows:
        <disp-formula id="eqn-1">
          <mml:math id="mml-eqn-1" display="block">
            <mml:mrow>
              <mml:mi>T</mml:mi>
              <mml:mi>S</mml:mi>
              <mml:mi>I</mml:mi>
              <mml:mo>=</mml:mo>
              <mml:mfrac>
                <mml:mrow>
                  <mml:mrow>
                    <mml:munderover>
                      <mml:mo stretchy="false">&#x2211;</mml:mo>
                      <mml:mrow>
                        <mml:mi>i</mml:mi>
                        <mml:mo>=</mml:mo>
                        <mml:mn>1</mml:mn>
                      </mml:mrow>
                      <mml:mrow>
                        <mml:mi>n</mml:mi>
                      </mml:mrow>
                    </mml:munderover>
                    <mml:mrow>
                      <mml:mfenced separators="|">
                        <mml:mrow>
                          <mml:mn>1</mml:mn>
                          <mml:mo>&#x2212;</mml:mo>
                          <mml:mfrac>
                            <mml:mrow>
                              <mml:msub>
                                <mml:mrow>
                                  <mml:mi>x</mml:mi>
                                </mml:mrow>
                                <mml:mrow>
                                  <mml:mi>i</mml:mi>
                                </mml:mrow>
                              </mml:msub>
                            </mml:mrow>
                            <mml:mrow>
                              
                                <mml:mrow>
                                  <mml:mrow>
                                    <mml:mrow>
                                      <mml:munder>
                                        <mml:mrow>
                                          <mml:mi mathvariant="normal">max</mml:mi>
                                        </mml:mrow>
                                        <mml:mrow>
                                          <mml:mn>1</mml:mn>
                                          <mml:mo>&#x2264;</mml:mo>
                                          <mml:mi>i</mml:mi>
                                          <mml:mo>&#x2264;</mml:mo>
                                          <mml:mi>n</mml:mi>
                                        </mml:mrow>
                                      </mml:munder>
									  </mml:mrow>
									  <mml:msub>
                                    <mml:mrow>
                                      <mml:mi>x</mml:mi>
                                    </mml:mrow>
									 <mml:mrow>
                                  <mml:mi>i</mml:mi>
                                </mml:mrow>
								 </mml:msub>
                                  </mml:mrow>
                                </mml:mrow>
                            </mml:mrow>
                          </mml:mfrac>
                        </mml:mrow>
                      </mml:mfenced>
                    </mml:mrow>
                  </mml:mrow>
                </mml:mrow>
                <mml:mrow>
                  <mml:mi>n</mml:mi>
                  <mml:mo>&#x2212;</mml:mo>
                  <mml:mn>1</mml:mn>
                </mml:mrow>
              </mml:mfrac>
            </mml:mrow>
          </mml:math>
        </disp-formula>
        where <italic>n</italic> is the number of tissues, <italic>x</italic> is the median gene expression in the sample group, and <italic>i</italic> is the sample group. This study identified tissue-specific genes for which the TSI was greater than 0.85. The functional annotation of protein sequences was performed using eggNOG-mapper software [<xref ref-type="bibr" rid="ref-20">20</xref>]. Enrichment analysis of tissue-specific genes was conducted using the R package clusterProfiler (v4.6.2) [<xref ref-type="bibr" rid="ref-21">21</xref>]. The enrichment results of tissue-specific genes in sepal tissue were visualized using CirGO (v1.0) [<xref ref-type="bibr" rid="ref-22">22</xref>]. Transcription Factor (TF) identification of tobacco was carried out using the Plant Transcription Factor Database (PlantTFDB) database [<xref ref-type="bibr" rid="ref-23">23</xref>] (<ext-link ext-link-type="uri" xlink:href="https://planttfdb.gao-lab.org/">https://planttfdb.gao-lab.org/</ext-link>).</p>
      </sec>
      <sec id="s2_4">
        <label>2.4</label>
        <title>Analysis of Gene Expression Patterns in Response to Tobacco Stress</title>
        <p>From 603 transcriptome datasets, 29 stress groups including roots, leaves, axillary shoots, and other tissues, were selected. We used featureCounts (v2.0.1) [<xref ref-type="bibr" rid="ref-24">24</xref>] to calculate the read counts of genes in the samples. Gene differential expression analysis was conducted using the R package DESeq2 (v1.38.3) [<xref ref-type="bibr" rid="ref-25">25</xref>]. Genes with a |log2FoldChange| &gt; 1 and an adjusted <italic>p</italic> value &lt; 0.05 were identified as differentially expressed genes (DEGs). Genes with accumulated TPM expression values less than 0.1 in all samples were filtered out, and the remaining genes were considered to have stable expression. The R package corrplot (v0.92) was used to create the correlograms with log2FoldChange in each group [<xref ref-type="bibr" rid="ref-26">26</xref>]. Functional enrichment analysis of the DEGs was conducted using the R package clusterProfiler [<xref ref-type="bibr" rid="ref-27">27</xref>].</p>
        <p>To construct the regulatory network of TFs and genes, we first downloaded the plant TF protein files from PlantTFDB (<ext-link ext-link-type="uri" xlink:href="https://planttfdb.gao-lab.org/">https://planttfdb.gao-lab.org/</ext-link>). Next, we used BLASTP to align the tobacco proteins with the plant TF protein sequences, using an E-value cut-off of 1E&#x2212;5. Genes that passed the threshold were identified as tobacco TFs. Subsequently, we calculated the Pearson correlation coefficients (PCCs) between the tobacco TFs and the DEGs shared across all the stress treatments. TF and DEG pairs with a PCC greater than 0.9 and q-values less than 0.01 were considered coexpressed. We utilized HOMER (v4.11) (<ext-link ext-link-type="uri" xlink:href="http://homer.ucsd.edu/homer/">http://homer.ucsd.edu/homer/</ext-link>) [<xref ref-type="bibr" rid="ref-28">28</xref>] to identify common stable motifs in the upstream 2 kb of DEGs shared across all the stress treatments. First, we used the loadGenome.pl subroutine of HOMER to load the tobacco genome file; next, we used the findMotifsGenome.pl subroutine to identify motifs in the 2 kb upstream promoter regions of the DEGs. As a background, we randomly selected the 2 kb upstream regions of 5000 genes across the entire tobacco genome, repeated the sampling 50 times, and selected motifs that consistently appeared in each sampling as the final identified motifs. We constructed a coexpression network of TFs that could bind to these motifs and were coexpressed with the DEGs shared across all the stress treatments with the coexpression PCC threshold set to 0.8. The coexpression network was visualized using Cytoscape (v3.10.2) software [<xref ref-type="bibr" rid="ref-29">29</xref>].</p>
      </sec>
      <sec id="s2_5">
        <label>2.5</label>
        <title>Identification of SNPs in Tobacco Leaves</title>
        <p>RNA-seq alignment results were sorted using SAMtools (v1.8) software with default parameters [<xref ref-type="bibr" rid="ref-30">30</xref>], and duplicated reads within the BAM files were marked using Picard (<ext-link ext-link-type="uri" xlink:href="https://github.com/broadinstitute/picard">https://github.com/broadinstitute/picard</ext-link>). The GATK tool SplitNCigarReads was used to filter the BAM files obtained in the previous step [<xref ref-type="bibr" rid="ref-31">31</xref>]. Subsequently, SNP calling and variant filtration were performed using the HaplotypeCaller tool from the GATK toolkit, filtering candidate SNPs with Fisher strand (FS) values &lt; 30.0 and quality depth (QD) values &gt; 2.0. Further filtering was conducted to retain only biallelic SNPs. VCFtools (0.1.16) software [<xref ref-type="bibr" rid="ref-32">32</xref>] was then utilized with the parameters&#x2014;max-missing 0.9 and&#x2014;maf 0.05 to filter SNPs in the population with missing rates exceeding 10% and minor allele frequencies greater than 5%, respectively.</p>
      </sec>
      <sec id="s2_6">
        <label>2.6</label>
        <title>Identification of eQTLs</title>
        <p>Gene expression data were filtered first, and genes with a median TPM greater than 0 were selected for eQTL analysis. The filtered expression data were subjected to confounding factor identification using the PEER (v1.0) package, and the top 10 confounding factors for covariance in eQTL analysis were selected. FastQTL (v2.0) [<xref ref-type="bibr" rid="ref-33">33</xref>] was used to identify cis-eQTLs in tobacco leaves. The size of the cis window was set to 1000000, and the &#x2018;normal&#x2019; parameter was used for the transformation of phenotypes. EMMAX [<xref ref-type="bibr" rid="ref-34">34</xref>] was used to identify SNPs associated with the expression of each gene. The pvalues obtained from FastQTL were adjusted using the Bonferroni method to derive adjusted pvalues (p.adjust), with a significance threshold set at p.adjust &lt; 0.05 in cis-eQTL analysis. Genetic Type I error calculator (GEC) software [<xref ref-type="bibr" rid="ref-32">32</xref>] was utilized to determine the effective number of SNPs (Me), and a threshold of 1.43 &#xD7; 10<sup>&#x2212;7</sup> (0.05/Me) was adopted as the threshold for determining the significance of trans-eQTLs, adjusted by the Bonferroni method. PLINK (1.90b6.21) software [<xref ref-type="bibr" rid="ref-35">35</xref>] was used with the &#x2018;clump&#x2019; parameter to merge linkage blocks of related SNPs, with a maximum block length of 500 kb. The SNP with the smallest pvalue in each linkage block containing at least three significant SNPs was selected as the lead SNP. Enrichment analysis was performed for cis- and trans-eGenes, and visualization was carried out using CirGO software.</p>
      </sec>
    </sec>
    <sec id="s3">
      <label>3</label>
      <title>Results</title>
      <sec id="s3_1">
        <label>3.1</label>
        <title>Sample Statistics and Cluster Analysis of Tobacco Transcription Data</title>
        <p>Tobacco is an important economic crop, and transcriptomic studies of this species have generated a large amount of sequencing data. In this study, we collected 603 available tobacco transcriptome datasets from 13 tissues or organs, including leaves, roots, seedlings, stems, trichomes, petals, and sepals, from the NCBI database and published research (<xref ref-type="fig" rid="fig-1">Fig. 1</xref>A). Notably, the samples from leaf and root tissues were the most numerous, with 329 and 146 samples, respectively. These RNA-seq samples were derived from 35 distinct NCBI BioProjects, which is indicative of their diverse origins. This aggregation reflects the inclusion of samples from various laboratories potentially harbouring rich genetic polymorphisms, thereby laying a foundation for the exploration of regulatory loci influencing tobacco gene expression. Among these studies, 10 Bioprojects were related to stress studies in tobacco, providing a foundation for cross-stress analysis of tobacco stress response mechanisms.</p>
        <p>After RNA-seq data were downloaded from the NCBI SRA database, a unified analysis pipeline was used to perform data cleaning, alignment, and quantification on all datasets. After quantifying the expression levels of all genes in the samples (<xref ref-type="sec" rid="supplementary-materials">Supplementary File</xref> <ext-link ext-link-type="uri" xlink:href="https://doi.org/10.6084/m9.figshare.29666060">https://doi.org/10.6084/m9.figshare.29666060</ext-link>), clustering was performed using tSNE. The results revealed that some samples clustered together based on tissue relationships (<xref ref-type="fig" rid="fig-1">Fig. 1</xref>B). However, the clustering analysis could not completely differentiate certain tissues, possibly due to anatomical proximity. For example, petals and sepals are parts of flowers, whereas the blade, lamina, and midrib are constituents of leaves. However, flowers are considered a morphological modification of leaves, leading to an inability for complete discrimination. Notably, there was a clear separation between leaves from the seedling and nonseedling stages in the clustering results, indicating differences in gene expression patterns between tobacco seedling leaves and mature leaves and validating the feasibility of categorizing them into two distinct tissues. From the perspective of treatments, samples under different treatments showed a clear clustering trend, indicating that both treatment conditions and growth environments can influence the clustering results (<xref ref-type="sec" rid="supplementary-materials">Supplementary Fig. S1</xref>). Similar patterns have been observed in transcriptome clustering analyses of poplar and soybean, suggesting that tissue type and environmental factors are major determinants of clustering [<xref ref-type="bibr" rid="ref-36">36</xref>,<xref ref-type="bibr" rid="ref-37">37</xref>].</p>
        <fig id="fig-1">
          <label>Figure 1</label>
          <caption>
            <p>The number and types of RNA-seq samples utilized in this study. (<bold>A</bold>) Sample quantity statistics for each tissue. &#x201C;Flower&#x201D; denotes immature flowers. (<bold>B</bold>) tSNE clustering results based on sample expression levels.</p>
          </caption>
          <graphic mimetype="image" mime-subtype="tif" xlink:href="Phyton-95-73509-f001.tif"/>
        </fig>
      </sec>
      <sec id="s3_2">
        <label>3.2</label>
        <title>Analysis of Tobacco Tissue-Specific Genes</title>
        <p>The above results indicate that tSNE analysis can effectively distinguish most tissues, suggesting relatively high expression similarity among samples within the same tissue. This finding implies that identifying genes with tissue-specific expression can further elucidate the relationship between gene expression and tissue function. The samples collected in this study covered a total of 13 tissues, and the TSI of each gene was calculated as the median expression level across tissues (<xref ref-type="sec" rid="supplementary-materials">Supplementary Table S2</xref>). Additionally, genes were categorized into four groups (null, weak, broad, and tissue-specific) based on their median expression across tissues (<xref ref-type="sec" rid="supplementary-materials">Supplementary Table S3</xref>) [<xref ref-type="bibr" rid="ref-7">7</xref>]. The results revealed that 28.9% of the genes were classified as null genes (TPM &lt;1 in all tissues; n = 10,272), 9.9% were classified as weakly expressed genes (TPM &lt;5 in all tissues; n = 3529), over 57% were classified as broadly expressed genes (TPM &#x2265; 5 in all tissues, TSI &lt; 0.85; n = 20,313), and only a small fraction were classified as tissue-specific genes (TPM &#x2265; 5 in all tissues, TSI &#x2265; 0.85; n = 1405) (<xref ref-type="sec" rid="supplementary-materials">Supplementary Table S4</xref>) (<xref ref-type="fig" rid="fig-2">Fig. 2</xref>A).</p>
        <p>The number of tissue-specific genes was the greatest in the immature flower, petal, sepal, and root tissues, with 308, 642, 63, and 303 genes, respectively (<xref ref-type="fig" rid="fig-2">Fig. 2</xref>B). Although most tissue-specific genes are unique to individual tissues, there are also a few genes that exhibit specific expression in multiple tissues. Notably, a subset of genes exhibited very high tissue-specific expression in both tobacco flowers and petals (<xref ref-type="fig" rid="fig-2">Fig. 2</xref>C). The greater number of tissue-specific genes and high expression levels in tissues or organs related to reproduction may be associated with their unique functions. To further understand the functions of these tissue-specific genes, this study conducted gene ontology (GO) enrichment analysis using all genes as background. The genes that were specifically expressed in nine tissues&#x2014;axillary shoot, blade, young leaf, midrib, petal, sepal, immature flower, root, and stem&#x2014;were collectively enriched in 341 GO terms (<xref ref-type="sec" rid="supplementary-materials">Supplementary Table S5, Supplementary Fig. S2</xref>). For example, genes specifically expressed in the axillary shoot were enriched in genes related to anatomical structure formation involved in morphogenesis, plant organ formation, regulation of development, heterochrony, anatomical structure formation involved in morphogenesis, regulation of plant organ formation, monooxygenase activity, and other genes related to plant organ formation. Genes specifically expressed in petals and flowers were enriched in a series of GO terms related to floral organ development such as floral whorl development, floral organ development, androecium development, gynoecium development, and carpel development. Particularly in sepals, a large number of tissue-specific genes related to terpenoid biosynthesis processes, sesquiterpenoid biosynthesis processes, terpene synthase activity, and other terpenoid synthesis-related processes were identified (<xref ref-type="fig" rid="fig-2">Fig. 2</xref>D). The top four enriched terms of tissue-specific genes in sepals were sesquiterpene biosynthetic process, sesquiterpene metabolic process, terpene biosynthetic process, and terpene metabolic process, and other biological processes were also predominantly associated with terpenoid synthesis. Several studies have revealed the involvement of terpenoids in processes such as attracting insects for pollination [<xref ref-type="bibr" rid="ref-38">38</xref>,<xref ref-type="bibr" rid="ref-39">39</xref>], indicating that the secondary metabolites synthesized in tobacco sepals also play similar important roles.</p>
        <p>Given the crucial regulatory roles of TFs, this study aimed to identify the TFs contained within the abovementioned tissue-specific genes. Among the genes showing tissue-specific expression in petals, flowers, and roots, there was a relatively greater abundance of TFs such as MYB and MYB_related (<xref ref-type="fig" rid="fig-2">Fig. 2</xref>E). Furthermore, ERFs were exclusively found in reproductive-related tissues such as petals, sepals, and flowers. These TFs most likely play important regulatory roles in growth, development, and secondary metabolite synthesis in their corresponding tissues.</p>
        <fig id="fig-2">
          <label>Figure 2</label>
          <caption>
            <p>Specific expression patterns of genes across 13 tobacco tissues. (<bold>A</bold>) Numbers of genes in four groups: null, weak, broad, and tissue specific. (<bold>B</bold>) Quantity and intersection relationships of tissue-specific genes across various tissues. The left bar plot of the UpSet plot represents the number of tissue-specific genes for each tissue, whereas the top bar plot shows the number of tissue-specific genes shared between different tissues. The dots and lines in the figure represent shared tissue-specific genes among these tissues. (<bold>C</bold>) Heatmap of the median TPM of tissue-specific genes in each tissue. (<bold>D</bold>) GO biological process (BP) enrichment terms for genes specifically expressed in sepals. (<bold>E</bold>) Identification of tissue-specific TFs in tissues.</p>
          </caption>
          <graphic mimetype="image" mime-subtype="tif" xlink:href="Phyton-95-73509-f002.tif"/>
        </fig>
      </sec>
      <sec id="s3_3">
        <label>3.3</label>
        <title>Cross-Stress Gene Expression Patterns</title>
        <p>As sessile organisms, plants face numerous biotic and abiotic stresses, so they have evolved a wide range of mechanisms to respond to and minimize these stresses. The transcriptome data collected in this study, including data from 29 biotic and abiotic stresses in roots, leaves, and axillary shoots, were manually curated (<xref ref-type="sec" rid="supplementary-materials">Supplementary Table S6</xref>). This provides an opportunity to identify various stress-responsive genes and outline relationships between these genes that single-stress studies cannot reveal. The stress studies conducted on leaves primarily involved investigations into resistance mechanisms against drought stress induced by salicylic acid (SA), melatonin (MEL), and abscisic acid (ABA) as well as resistance to cold and salt stress. The stress studies conducted on root tissues mainly involved investigations into resistance to <italic>Phytophthora nicotianae</italic> and high and low concentrations of nitrate (N), whereas axillary shoot studies have primarily focused on stresses associated with topping treatments.</p>
        <p>Transcriptomic analysis comparing various stress treatment groups with the control group revealed significant differences in the number of genes responsive to different external stresses in tobacco (<xref ref-type="sec" rid="supplementary-materials">Supplementary Table S7</xref>). The quantity of DEGs shows a gradual increase in response gene numbers with increasing duration or intensity of the same type of stress. In particular, when tobacco leaves were subjected to 4&#xB0;C environmental treatment for 0.5, 1, 2, 4, or 8 h, the number of DEGs gradually increased (<xref ref-type="fig" rid="fig-3">Fig. 3</xref>A). In this study, the number of upregulated and downregulated DEGs between the stress treatment groups and control group samples generally ranged from 1 to 7-fold. Taking <italic>Phytophthora nicotianae</italic> infection as an example, as the stress increased, the log2FoldChange also increased accordingly (<xref ref-type="fig" rid="fig-3">Fig. 3</xref>B). GO enrichment analysis was performed separately for genes under various stresses (<xref ref-type="sec" rid="supplementary-materials">Supplementary Figs. S3 and S4, Supplementary Table S8</xref>), revealing that many upregulated genes under adverse stress conditions were enriched in stress-related GO terms such as those related to drought response and auxin response. For example, under drought stress, the differentially expressed genes were enriched in the response to water category, including a histone deacetylase (<italic>Nitab4.5_0001922g0030</italic>), a gene widely known to participate in drought tolerance across plant species [<xref ref-type="bibr" rid="ref-40">40</xref>]. Under biotic stress treatments, the differentially expressed genes were enriched in GO terms such as response to bacterium, defense response to bacterium, and response to karrikin. Notably, these categories contained a shared gene, NB-LRR (<italic>Nitab4.5_0000068g0290</italic>), which encodes a key immune protein broadly involved in plant defense [<xref ref-type="bibr" rid="ref-41">41</xref>].</p>
        <p>Genes with TPM expression levels less than 0.1 in all samples were filtered out, and the similarity of gene response patterns between different treatments was assessed based on the log2FoldChange. In the roots, regardless of the N concentration, there was a strong positive correlation between the different treatments based on the log2FoldChange (<xref ref-type="fig" rid="fig-3">Fig. 3</xref>C). Based on the number of DEGs and their log2FoldChange, although there were differences in the number of DEGs under varying concentrations and durations of nitrate treatment, the direction of the gene response (upregulation or downregulation) and the log2FoldChange were similar (<xref ref-type="fig" rid="fig-3">Fig. 3</xref>A,B). Moreover, in tobacco roots infected by <italic>Phytophthora nicotianae</italic>, the direction and magnitude of gene responses were strongly correlated with those after nitrate treatment. This suggests that although nitrate is a nonbiological stress and <italic>Phytophthora nicotianae</italic> infection is a biotic stress, they may stimulate some common response mechanisms. However, in the case of the root treatments under the shoot topping treatment, the direction and log2FoldChange of stress-responsive genes were negatively correlated with those under the N and <italic>Phytophthora nicotianae</italic> treatments, reflecting differences in gene response patterns between the different stresses.</p>
        <fig id="fig-3">
          <label>Figure 3</label>
          <caption>
            <p>Analysis of response patterns of genes under multiple stress treatments. Abbreviations for the labels on the horizontal axis are shown in <xref ref-type="sec" rid="supplementary-materials">Supplementary Table S6</xref>. (<bold>A</bold>) The variation of genes under treatments in different tissues. &#x201C;Down&#x201D; represents downregulated genes, &#x201C;Up&#x201D; represents upregulated genes, and &#x201C;None&#x201D; represents genes whose expression did not significantly change. The <italic>y</italic>-axis represents the gene counts. (<bold>B</bold>) Log2FoldChange in gene expression in different tissues and treatments. The <italic>x</italic>-axis represents the groups of different treatments for different tissues, and the y-axis represents the absolute values of the log2FoldChange of the DEGs belonging to this group. The whiskers represent the range from the first quartile to the minimum value of the dataset and from the third quartile to the maximum value of the dataset. (<bold>C</bold>) Correlation analysis of changes in gene expression levels under multiple stress treatments.</p>
          </caption>
          <graphic mimetype="image" mime-subtype="tif" xlink:href="Phyton-95-73509-f003.tif"/>
        </fig>
        <p>The response to shoot topping treatment in roots was not only negatively correlated with the response of genes under other stresses in roots but also negatively correlated with the response of genes under various stresses in tobacco leaves, such as those induced by cold stress. Additionally, in leaves, there was a correlation between samples subjected to drought stress alone and those treated with MEL and SA, but the correlation between gene expression under drought stress after ABA treatment and drought stress alone was weaker, possibly because ABA can enhance the drought resistance of plants. In summary, understanding the response mechanisms of genes to different stresses plays a crucial role in enhancing the stress tolerance of tobacco plants.</p>
      </sec>
      <sec id="s3_4">
        <label>3.4</label>
        <title>TF Regulatory Network in Tobacco Roots and Leaves</title>
        <p>TFs play pivotal roles in the regulation processes of tobacco. In this study, we analysed tobacco gene expression under various stress conditions. Initially, 1865 TFs were identified in the tobacco genome using the PlantTFDBdatabase. The number of differentially expressed TFs varied with the type of stress treatment. There were more differentially expressed TFs in the roots under N treatment and topping treatment, and in the leaves under drought treatment and 4-h and 8-h freezing treatments (<xref ref-type="fig" rid="fig-4">Fig. 4</xref>A,B). The distribution of differentially expressed TFs was similar to the overall distribution trends of DEGs, with an increase in the number of differentially expressed TFs with increasing stress (<xref ref-type="fig" rid="fig-3">Fig. 3</xref>A and <xref ref-type="fig" rid="fig-4">Fig. 4</xref>A). Notably, in the drought stress treatment of leaves, the application of hormones resulted in a decrease in the number of differentially expressed TFs compared with those in the drought treatment without hormones, suggesting that these TFs with altered expression levels may be involved in the hormone response. Additionally, both the roots and leaves exhibited abundant common responsive genes among the different stress treatments (<xref ref-type="sec" rid="supplementary-materials">Supplementary Figs. S5 and S6</xref>).</p>
        <p>Based on the aforementioned research findings, our study focused on genes that exhibit shared responses to stress in both roots and leaves. In leaves, the ABA_D1 and S treatments resulted in fewer DEGs (376 and 493, respectively), indicating that these stresses were not sufficiently intense to fully activate defence mechanisms. Furthermore, MEL is not a stress. Similarly, the T1 and T2 treatments resulted in a low number of DEGs in the roots, and these treatments resulted in root stress. Therefore, data from these conditions were excluded. There were 338 and 24 DEGs shared among the root and leaf tissues under the various stress treatments. To understand the regulatory mechanisms of genes responding to multiple stresses, this study calculated the PCC of TFs and the DEGs shared by roots and leaves under different treatments. Gene pairs with a PCC greater than or equal to 0.9 were considered coexpressed; i.e., the TFs within the gene pairs may regulate the DEGs (<xref ref-type="sec" rid="supplementary-materials">Supplementary Tables S9 and S10</xref>). In the roots, we identified 285 TFs regulating 132 DEGs, including more than 40 different families of TFs such as WRKY, MYB, and bHLH (<xref ref-type="fig" rid="fig-4">Fig. 4</xref>C). This suggests the presence of a complex stress resistance regulatory network in tobacco roots. Numerous response genes are shared between biotic and abiotic stressors, and these genes are also commonly regulated by various TFs. In the leaves, 25 TFs, including WRKY, MYB, and ERF, regulated the expression of 4 stress-responsive genes (<xref ref-type="fig" rid="fig-4">Fig. 4</xref>D). These genes encode proteins such as F-box PP2-A13-like and G-type lectin S-receptor-like serine threonine-protein kinase, which are considered important stress resistance candidate genes in plant leaves, according to many studies [<xref ref-type="bibr" rid="ref-42">42</xref>,<xref ref-type="bibr" rid="ref-43">43</xref>]. Additionally, we predicted common stable motifs in the 2 kb upstream region of the DEGs. Due to the stringent coexpression PCC threshold of 0.9, which resulted in a very small number of TFs that could bind to these common stable motifs in the DEGs, we relaxed the threshold to 0.8. Combined with the coexpression results, we identified 26 TFs in leaves and 21 in roots that can bind to these common stable motifs among the DEGs (<xref ref-type="sec" rid="supplementary-materials">Supplementary Figs. S7 and S8, Supplementary Table S11</xref>). This result provides valuable resources for analysing gene regulation in response to stress. In summary, these results provide an opportunity for a more comprehensive understanding of the functions of TFs in stress responses.</p>
        <fig id="fig-4">
          <label>Figure 4</label>
          <caption>
            <p>The expression patterns of TFs under various stress conditions. Abbreviations for the labels on the horizontal axis are shown in <xref ref-type="sec" rid="supplementary-materials">Supplementary Table S6</xref>. (<bold>A</bold>) The variations in TFs in different tissues under different treatments. &#x201C;Up&#x201D; represents upregulated TFs, &#x201C;Down&#x201D; represents downregulated TFs, and &#x201C;None&#x201D; represents TFs with no significant change in expression. (<bold>B</bold>) Heatmap of TF expression patterns under different stress conditions. (<bold>C</bold>) The network of TF-regulated stress response genes in roots. The hexagons represent DEGs, and the circles represent TFs. The coexpression threshold was set to 0.9. (<bold>D</bold>) The network of TF-regulated stress response genes in leaves. The hexagons represent DEGs, and the circles represent TFs. The coexpression threshold was set to 0.9.</p>
          </caption>
          <graphic mimetype="image" mime-subtype="tif" xlink:href="Phyton-95-73509-f004.tif"/>
        </fig>
		</sec>
		
		<sec id="s3_5">
        <label>3.5</label>
		<title>eQTL Analysis of Tobacco</title>
        <p>Tobacco leaves are key organs used in cigarette processing, and the availability of 379 leaf samples enabled a population-level analysis of the relationship between gene expression and genetic polymorphisms. From the RNA-seq data, a total of 598,293 high-quality SNPs were identified across the tobacco genome. Their chromosomal distribution revealed clear regional enrichment on chromosomes 2, 4, 12, 14, and 19 (<xref ref-type="fig" rid="fig-5">Fig. 5</xref>A), suggesting that SNP density varies among chromosomes, likely reflecting differences in structural features and evolutionary histories.</p>
        <p>To dissect how these genetic variants influence transcriptional regulation, we performed eQTL mapping using leaf tissues and identified 28,396 eQTLs (<xref ref-type="sec" rid="supplementary-materials">Supplementary Table S12</xref>). Based on their physical proximity to associated genes, these loci were classified as cis- or trans-eQTLs. The cis-eQTLs displayed a strong diagonal pattern, whereas trans-eQTLs were widely dispersed and formed several distinct regulatory bands (<xref ref-type="fig" rid="fig-5">Fig. 5</xref>B), highlighting clear differences in regulatory architecture. In total, 14,559 genes (41% of all expressed genes) were regulated by at least one eQTL, indicating that genetic variation extensively shapes gene expression in tobacco leaves. Among these eGenes, 53% were regulated exclusively by cis-eQTLs, 21% only by trans-eQTLs, and 26% by both (<xref ref-type="fig" rid="fig-5">Fig. 5</xref>C). On average, each gene was associated with 4.6 eQTLs, and only 5771 genes were influenced by a single locus (<xref ref-type="fig" rid="fig-5">Fig. 5</xref>D), underscoring the complexity of regulatory interactions involving both local and distal genetic effects.</p>
        <p>To further characterize the biological roles of these eGenes, we conducted functional enrichment analyses. Trans-regulated eGenes showed strong overrepresentation in biological process categories, with limited enrichment in molecular function and cellular component terms (<xref ref-type="sec" rid="supplementary-materials">Supplementary Fig. S9</xref>). Many trans-eGenes were involved in photosynthesis-related pathways, including photosynthesis, light reaction, photosynthesis, light harvesting, tetrapyrrole metabolic process, and chloroplast organization. Additionally, they were enriched in hormone signaling and stress-responsive processes such as response to fatty acid, response to jasmonic acid, response to herbicide, intracellular monoatomic cation homeostasis, and protein K63-linked ubiquitination (<xref ref-type="sec" rid="supplementary-materials">Supplementary Fig. S9</xref>). Several eGenes were also associated with nicotine biosynthesis (<xref ref-type="sec" rid="supplementary-materials">Supplementary Table S13</xref>), providing candidate genes relevant to tobacco trait improvement.</p>
        <p>We further identified 1669 cis-eQTL hotspots and 1858 trans-eQTL hotspots across the genome (<xref ref-type="fig" rid="fig-5">Fig. 5</xref>E). Notably, the trans-eQTL hotspots contained 68 transcription factors, including members of the WRKY, bHLH, and MYB families (<xref ref-type="sec" rid="supplementary-materials">Supplementary Table S14</xref>), suggesting that these regions may exert broad regulatory influence through transcription factor&#x2013;mediated cascades. For example, within the trans-eQTL hotspot I47_C2, the locus eQTL (chr04:1227307) cis-regulated the transcription factor MYB (<italic>Nitab4.5_0001158g0050</italic>), a TF related to drought responses, while simultaneously trans-regulating a drought-induced protein (<italic>Nitab4.5_0001808g0020</italic>). This illustrates how single regulatory variants can coordinate hierarchical control of stress-responsive pathways. These findings provide a comprehensive view of the genetic regulation of gene expression in tobacco leaves.</p>
        <fig id="fig-5">
          <label>Figure 5</label>
          <caption>
            <p>(<bold>A</bold>) The distribution of tobacco SNPs across chromosomes. (<bold>B</bold>) The distribution of cis- and trans-eQTLs on chromosomes. (<bold>C</bold>) The distribution of genes regulated by cis- or trans-eQTLs in tobacco leaves. (<bold>D</bold>) Relationships between the number of eGenes and eQTLs. (<bold>E</bold>) Circos plot illustrating the genomic landscape of eQTL hotspots in tobacco. From the outermost to the innermost rings: the outer ring represents the 24 tobacco chromosomes; the second ring shows the genomic density of cis-eQTL hotspots; the third ring displays the density of trans-eQTL hotspots; the innermost layer depicts the trans-eQTL hotspot I47_C2, with lines connecting this hotspot to its significantly associated downstream genes across the genome.</p>
          </caption>
          <graphic mimetype="image" mime-subtype="tif" xlink:href="Phyton-95-73509-f005.tif"/>
        </fig>
      </sec>
    </sec>
    <sec id="s4">
      <label>4</label>
      <title>Discussion</title>
      <p>Comprehending the expression characteristics of genes in different plant organs, particularly under various stresses, is highly important [<xref ref-type="bibr" rid="ref-44">44</xref>]. However, it is challenging for a single laboratory to construct a large experimental design to conduct transcriptome profiling on hundreds or even thousands of samples. Transcriptome sequencing with small sample sizes has long been a common biological research tool, accumulating extensive transcriptomic data, and thereby providing opportunities for large-scale expression profiling studies in tobacco. Indeed, such opportunities are equally applicable to many other species [<xref ref-type="bibr" rid="ref-7">7</xref>]. This study collected a large quantity of tobacco transcriptome data, which also serves as a summary of tobacco transcriptomics, to provide a clearer understanding of the current status of the tobacco genome.</p>
      <p>The comprehensive comparative transcriptomic analysis yielded numerous intriguing findings such as the enrichment of genes specifically expressed in tobacco sepals involved in the synthesis pathways of certain terpenoids. Terpenoids play pivotal roles in various biological functions such as attracting pollinators and defending against biotic stresses [<xref ref-type="bibr" rid="ref-45">45</xref>,<xref ref-type="bibr" rid="ref-46">46</xref>]. This finding is particularly intriguing because the synthesis and accumulation of secondary metabolites in plants often exhibit strong tissue specificity [<xref ref-type="bibr" rid="ref-47">47</xref>,<xref ref-type="bibr" rid="ref-48">48</xref>]. Furthermore, many of these metabolites often possess significant chemical and ecological functions [<xref ref-type="bibr" rid="ref-49">49</xref>]. The abundant tissue-specific expression patterns provide crucial indications that employing molecular biology, metabolomics, and synthetic biology approaches to study the synthesis pathways and ecological functions of secondary metabolites in tobacco sepals holds significant value. Although the potential for terpenoid synthesis in sepals has been noted in other species, further in-depth investigations into their functionalities are lacking [<xref ref-type="bibr" rid="ref-50">50</xref>]. Furthermore, this study identified 128 tissue-specific TFs, among which MYB plays significant roles in regulating the cell cycle, secondary metabolite synthesis, and plant response to hormones [<xref ref-type="bibr" rid="ref-51">51</xref>,<xref ref-type="bibr" rid="ref-52">52</xref>]. Considering the tissue-specific expression patterns of genes related to plant secondary metabolites, these MYBs could serve as key regulators of secondary metabolite synthesis and are worthy of focused attention. ERFs are a family of TFs that are mainly present in plants and play crucial roles in plant growth and development, hormone responses, and plant stress. In many reports, ERFs are believed to be associated with flower growth, development, floral morphology, and flower senescence [<xref ref-type="bibr" rid="ref-53">53</xref>,<xref ref-type="bibr" rid="ref-54">54</xref>]. Thus, it is reasonable to speculate that ERFs that are specifically expressed in floral organs might be involved in tobacco flowering regulation. These findings provide guidance and candidate genes for studying tobacco development and defence mechanisms.</p>
      <p>The regulatory networks and mechanisms underlying plant responses to biotic and abiotic stresses are complex [<xref ref-type="bibr" rid="ref-55">55</xref>]. Understanding the similarities and differences in the response mechanisms of plants to these various stresses will help elucidate how plants integrate and respond to various environmental cues [<xref ref-type="bibr" rid="ref-44">44</xref>]. Although we cannot simultaneously impose different stresses on a single plant through data collection and analysis, we can delineate the response patterns of genes to stress. For instance, following the infection of tobacco roots by <italic>Phytophthora nicotianae</italic>, although the number of responsive genes differed from that induced by N treatment, the direction and fold change of these responsive genes exhibited a significant correlation. This finding implies the potential existence of overlap in response mechanisms between biotic and abiotic stresses. Through the above analysis, this study revealed that some genes may have universal responses to adversity. This understanding is valuable for understanding the mechanisms of tobacco response to different adverse conditions and for breeding tobacco varieties with multiple stress resistance mechanisms. The RNA-seq data utilized in this study originated from diverse samples, thereby enabling investigations into the impact of genomic variation on gene expression. Given the significance of tobacco leaves and the availability of data, this study conducted an analysis of eQTLs using RNA-seq data derived from tobacco leaves. Examination of the distance between cis-eQTLs and transcription start sites (TSSs) revealed a gradual decrease in the number of eQTLs as the distance from the TSS increased within a range of 250 K. Beyond 250 K from the TSSs, the count of eQTLs remained relatively low, possibly due to the decreasing impact of SNPs on TSSs as distance increased. Within 250 K, a closer distance had a greater potential impact on the TSSs (<xref ref-type="sec" rid="supplementary-materials">Supplementary Fig. S10</xref>). This study provides further insights into the polymorphisms of the tobacco genome and an overview of gene expression regulatory mechanisms. Utilizing large datasets from databases for integration and analysis contributes to a better understanding of the genetic architecture controlling agronomic traits, thereby facilitating crop improvement and quality enhancement.</p>
    </sec>
    <sec id="s5">
      <label>5</label>
      <title>Conclusions</title>
      <p>This study integrated large-scale transcriptome data involving multiple tobacco tissues and different treatments. A total of 1405 tissue-specific genes were identified. This study revealed the specific synthesis and accumulation of secondary metabolites such as terpenoids in organs such as sepals, providing important insights into the functionality of different tobacco organs. Additionally, comparative analysis of RNA-seq data under various stress conditions revealed gene differences between leaves and roots in response to biotic and abiotic stresses, offering crucial clues for understanding tobacco mechanisms in response to diverse stresses. Finally, by identifying 28,396 eQTLs in leaves, much information was provided on the genetic regulation of gene expression in tobacco leaves. In summary, this study provides important research references for understanding the characteristics of tissue-specific genes and their potential functions in tobacco, laying a foundation for a deeper understanding of tobacco biology and genetic regulatory mechanisms.</p>
    </sec>
  </body>
  <back>
    <ack>
      <p>Not applicable.</p>
    </ack>
    <sec>
      <title>Funding Statement</title>
      <p>This work was supported by the Guizhou Provincial Basic Research Program (Natural Science) [(2024) 648], the Program of China National Tobacco Corporation (110202101032(JY-09), 110202201003(JY-03)), the Program of Guizhou Branch of China National Tobacco Corporation (2023XM02, 2022XM05 and 2024XM01), the Qiankehe Platform Project (ZSYS [2025] 028), and the Program of China National Tobacco Corporation (110202102034).</p>
    </sec>
    <sec>
      <title>Author Contributions</title>
      <p>Shizhou Yu and Zhixiao Yang: Conceptualization, Methodology, Supervision, Writing&#x2014;review &amp; editing and Funding acquisition. Jie Zhang and Linggai Cao: Data curation, Visualization, Writing-Original draft preparation. Xueliang Ren and Jie Liu: Data curation, Visualization. Jiemeng Tao and Peng Lu: Data curation, Supervision. Guobo Chen: Writing-Reviewing and Editing, Supervision. All authors reviewed and approved the final version of the manuscript.</p>
    </sec>
    <sec sec-type="data-availability">
      <title>Availability of Data and Materials</title>
      <p>The authors confirm that the data supporting the findings of this study are available within the <xref ref-type="sec" rid="supplementary-materials">Supplementary Materials</xref>.</p>
    </sec>
    <sec>
      <title>Ethics Approval</title>
      <p>Not applicable.</p>
    </sec>
    <sec sec-type="COI-statement">
      <title>Conflicts of Interest</title>
      <p>The authors declare no conflicts of interest.</p>
    </sec>
    <sec id="supplementary-materials">
      <title>Supplementary Materials</title>
      <p>The supplementary material is available online at <ext-link ext-link-type="uri" xlink:href="https://www.techscience.com/doi/10.32604/phyton.2026.073509/s1">https://www.techscience.com/doi/10.32604/phyton.2026.073509/s1</ext-link>. Supplementary Table S1 Information on tissues of samples used in this study. Supplementary Table S2 TSI values in different tissues. Supplementary Table S3 Expression-based gene classification. Supplementary Table S4 Statistics of tissue-specific genes in each tissue. Supplementary Table S5 Go enrichment results for tissue-specific genes. Supplementary Table S6 Information on treatments of samples used in this study. Supplementary Table S7 Differentially expressed genes under different treatments. Supplementary Table S8 Go enrichment results for differentially expressed genes. Supplementary Table S9 Co-expression network of TFs and differentially expressed genes in roots. Supplementary Table S10 Co-expression network of TFs and differentially expressed genes in leaves. Supplementary Table S11 Co-expression network of DEGs and TFs that could bind to the common stable motifs of DEGs in tobacco roots and leaves (the co-expression PCC threshold was set to 0.8). Supplementary Table S12 Lead SNPs identified in this study. Supplementary Table S13 eQTLs associated with nicotine synthesis genes. Supplementary Table S14 Genes regulated by eQTL hotspot regions. Supplementary Fig. S1 tSNE clustering results based on expression levels of 84 samples with different treatments. Supplementary Fig. S2 GO enrichment analysis of tissue-specific genes. Supplementary Fig. S3 GO enrichment analysis of up-regulated differentially expressed genes. Supplementary Fig. S4 GO enrichment analysis of down-regulated differentially expressed genes. Supplementary Fig. S5 the left bar plot of the UpSet plot represents the number of DEGs for each treatment, whereas the top bar plot shows the number of DEGs shared between different treatments. The dots and lines in the figure represent DEGs shared among these treatments. Supplementary Fig. S6 the root bar plot of the UpSet plot represents the number of DEGs for each treatment, whereas the top bar plot shows the number of DEGs shared between different treatments. The dots and lines in the figure represent DEGs shared among these treatments. Supplementary Fig. S7 Co-expression network of DEGs and TFs that could bind to the common stable motifs of DEGs in tobacco leaves (the co-expression PCC threshold was set to 0.8). Supplementary Fig. S8 Co-expression network of DEGs and TFs that could bind to the common stable motifs of DEGs in tobacco roots (the co-expression PCC threshold was set to 0.8). Supplementary Fig. S9 GO enrichment analysis of trans-eGenes in leaves. Supplementary Fig. S10 Density curve of distance from transcription start sites for cis-eQTLs in leaves. Supplementary File: (Gene expression level in different samples) can be downloaded from <ext-link ext-link-type="uri" xlink:href="https://figshare.com">https://figshare.com</ext-link> (<ext-link ext-link-type="uri" xlink:href="https://doi.org/10.6084/m9.figshare.29666060">https://doi.org/10.6084/m9.figshare.29666060</ext-link>)</p>
      <supplementary-material id="SD-1" xlink:href="Phyton-95-73509-s001.zip"/>
    </sec>
    <glossary content-type="abbreviations" id="glossary-1">
      <title>Nomenclature</title>
      <array>
        <tbody>
          <tr>
            <td align="left" valign="middle">eQTLs</td>
            <td align="left" valign="middle">Expression quantitative trait loci</td>
          </tr>
          <tr>
            <td align="left" valign="middle">SNP</td>
            <td align="left" valign="middle">Single nucleotide polymorphism</td>
          </tr>
          <tr>
            <td align="left" valign="middle">tSNE</td>
            <td align="left" valign="middle">T-distributed stochastic neighbor embedding</td>
          </tr>
          <tr>
            <td align="left" valign="middle">UMAP</td>
            <td align="left" valign="middle">Uniform Manifold Approximation and Projection</td>
          </tr>
          <tr>
            <td align="left" valign="middle">TPM</td>
            <td align="left" valign="middle">Transcripts per million</td>
          </tr>
          <tr>
            <td align="left" valign="middle">TSI</td>
            <td align="left" valign="middle">Tissue specific index</td>
          </tr>
          <tr>
            <td align="left" valign="middle">GEC</td>
            <td align="left" valign="middle">Genetic Type I error calculator</td>
          </tr>
          <tr>
            <td align="left" valign="middle">GO</td>
            <td align="left" valign="middle">Gene ontology</td>
          </tr>
          <tr>
            <td align="left" valign="middle">TSSs</td>
            <td align="left" valign="middle">Transcription Start Sites</td>
          </tr>
          <tr>
            <td align="left" valign="middle">SA</td>
            <td align="left" valign="middle">Salicylic acid</td>
          </tr>
          <tr>
            <td align="left" valign="middle">MEL</td>
            <td align="left" valign="middle">Melatonin</td>
          </tr>
          <tr>
            <td align="left" valign="middle">ABA</td>
            <td align="left" valign="middle">Abscisic acid</td>
          </tr>
        </tbody>
      </array>
    </glossary>
    <ref-list content-type="authoryear">
      <title>References</title>
      <ref id="ref-1">
        <label>1.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Sinha</surname> 
<given-names>P</given-names>
</string-name>, 
<string-name>
<surname>Bajaj</surname> 
<given-names>P</given-names>
</string-name>, 
<string-name>
<surname>Pazhamala</surname> 
<given-names>LT</given-names>
</string-name>, 
<string-name>
<surname>Nayak</surname> 
<given-names>SN</given-names>
</string-name>, 
<string-name>
<surname>Pandey</surname> 
<given-names>MK</given-names>
</string-name>, 
<string-name>
<surname>Chitikineni</surname> 
<given-names>A</given-names>
</string-name>, 
<etal>et al</etal></person-group>. 
<article-title><italic>Arachis hypogaea</italic> gene expression atlas for fastigiata subspecies of cultivated groundnut to accelerate functional and translational genomics applications</article-title>. 
<source>Plant Biotechnol J</source>. 
<year>2020</year>;
<volume>18</volume>(
<issue>11</issue>):
<fpage>2187</fpage>&#x2013;
<lpage>200</lpage>. 
doi:<pub-id pub-id-type="doi">10.1111/pbi.13374</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-2">
        <label>2.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Liu</surname> 
<given-names>C</given-names>
</string-name>, 
<string-name>
<surname>Leng</surname> 
<given-names>J</given-names>
</string-name>, 
<string-name>
<surname>Li</surname> 
<given-names>Y</given-names>
</string-name>, 
<string-name>
<surname>Ge</surname> 
<given-names>T</given-names>
</string-name>, 
<string-name>
<surname>Li</surname> 
<given-names>J</given-names>
</string-name>, 
<string-name>
<surname>Chen</surname> 
<given-names>Y</given-names>
</string-name>, 
<etal>et al</etal></person-group>. 
<article-title>A spatiotemporal atlas of organogenesis in the development of orchid flowers</article-title>. 
<source>Nucleic Acids Res</source>. 
<year>2022</year>;
<volume>50</volume>(
<issue>17</issue>):
<fpage>9724</fpage>&#x2013;
<lpage>37</lpage>. 
doi:<pub-id pub-id-type="doi">10.1093/nar/gkac773</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-3">
        <label>3.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Meir</surname> 
<given-names>Z</given-names>
</string-name>, 
<string-name>
<surname>Aviezer</surname> 
<given-names>I</given-names>
</string-name>, 
<string-name>
<surname>Chongloi</surname> 
<given-names>GL</given-names>
</string-name>, 
<string-name>
<surname>Ben-Kiki</surname> 
<given-names>O</given-names>
</string-name>, 
<string-name>
<surname>Bronstein</surname> 
<given-names>R</given-names>
</string-name>, 
<string-name>
<surname>Mukamel</surname> 
<given-names>Z</given-names>
</string-name>, 
<etal>et al</etal></person-group>. 
<article-title>Dissection of floral transition by single-meristem transcriptomes at high temporal resolution</article-title>. 
<source>Nat Plants</source>. 
<year>2021</year>;
<volume>7</volume>(
<issue>6</issue>):
<fpage>800</fpage>&#x2013;
<lpage>13</lpage>. 
doi:<pub-id pub-id-type="doi">10.1038/s41477-021-00936-8</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-4">
        <label>4.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>George</surname> 
<given-names>N</given-names>
</string-name>, 
<string-name>
<surname>Fexova</surname> 
<given-names>S</given-names>
</string-name>, 
<string-name>
<surname>Fuentes</surname> 
<given-names>AM</given-names>
</string-name>, 
<string-name>
<surname>Madrigal</surname> 
<given-names>P</given-names>
</string-name>, 
<string-name>
<surname>Bi</surname> 
<given-names>Y</given-names>
</string-name>, 
<string-name>
<surname>Iqbal</surname> 
<given-names>H</given-names>
</string-name>, 
<etal>et al</etal></person-group>. 
<article-title>Expression Atlas update: insights from sequencing data at both bulk and single cell level</article-title>. 
<source>Nucleic Acids Res</source>. 
<year>2024</year>;
<volume>52</volume>(
<issue>D1</issue>):
<fpage>D107</fpage>&#x2013;
<lpage>14</lpage>. 
doi:<pub-id pub-id-type="doi">10.1093/nar/gkad1021</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-5">
        <label>5.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Tian</surname> 
<given-names>F</given-names>
</string-name>, 
<string-name>
<surname>Yang</surname> 
<given-names>DC</given-names>
</string-name>, 
<string-name>
<surname>Meng</surname> 
<given-names>YQ</given-names>
</string-name>, 
<string-name>
<surname>Jin</surname> 
<given-names>J</given-names>
</string-name>, 
<string-name>
<surname>Gao</surname> 
<given-names>G</given-names>
</string-name></person-group>. 
<article-title>PlantRegMap: charting functional regulatory maps in plants</article-title>. 
<source>Nucleic Acids Res</source>. 
<year>2020</year>;
<volume>48</volume>(
<issue>D1</issue>):
<fpage>D1104</fpage>&#x2013;
<lpage>13</lpage>. 
doi:<pub-id pub-id-type="doi">10.1093/nar/gkz1020</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-6">
        <label>6.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Jin</surname> 
<given-names>L</given-names>
</string-name>, 
<string-name>
<surname>Tang</surname> 
<given-names>Q</given-names>
</string-name>, 
<string-name>
<surname>Hu</surname> 
<given-names>S</given-names>
</string-name>, 
<string-name>
<surname>Chen</surname> 
<given-names>Z</given-names>
</string-name>, 
<string-name>
<surname>Zhou</surname> 
<given-names>X</given-names>
</string-name>, 
<string-name>
<surname>Zeng</surname> 
<given-names>B</given-names>
</string-name>, 
<etal>et al</etal></person-group>. 
<article-title>A pig BodyMap transcriptome reveals diverse tissue physiologies and evolutionary dynamics of transcription</article-title>. 
<source>Nat Commun</source>. 
<year>2021</year>;
<volume>12</volume>(
<issue>1</issue>):
<fpage>3715</fpage>. 
doi:<pub-id pub-id-type="doi">10.1038/s41467-021-23560-8</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-7">
        <label>7.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Almeida-Silva</surname> 
<given-names>F</given-names>
</string-name>, 
<string-name>
<surname>Pedrosa-Silva</surname> 
<given-names>F</given-names>
</string-name>, 
<string-name>
<surname>Venancio</surname> 
<given-names>TM</given-names>
</string-name></person-group>. 
<article-title>The Soybean Expression Atlas v2: a comprehensive database of over 5000 RNA-seq samples</article-title>. 
<source>Plant J</source>. 
<year>2023</year>;
<volume>116</volume>(
<issue>4</issue>):
<fpage>1041</fpage>&#x2013;
<lpage>51</lpage>. 
doi:<pub-id pub-id-type="doi">10.1111/tpj.16459</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-8">
        <label>8.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Xanthopoulou</surname> 
<given-names>A</given-names>
</string-name>, 
<string-name>
<surname>Montero-Pau</surname> 
<given-names>J</given-names>
</string-name>, 
<string-name>
<surname>Pic&#xF3;</surname> 
<given-names>B</given-names>
</string-name>, 
<string-name>
<surname>Boumpas</surname> 
<given-names>P</given-names>
</string-name>, 
<string-name>
<surname>Tsaliki</surname> 
<given-names>E</given-names>
</string-name>, 
<string-name>
<surname>Paris</surname> 
<given-names>HS</given-names>
</string-name>, 
<etal>et al</etal></person-group>. 
<article-title>A comprehensive RNA-Seq-based gene expression atlas of the summer squash (<italic>Cucurbita pepo</italic>) provides insights into fruit morphology and ripening mechanisms</article-title>. 
<source>BMC Genomics</source>. 
<year>2021</year>;
<volume>22</volume>(
<issue>1</issue>):
<fpage>341</fpage>. 
doi:<pub-id pub-id-type="doi">10.1186/s12864-021-07683-2</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-9">
        <label>9.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Liu</surname> 
<given-names>S</given-names>
</string-name>, 
<string-name>
<surname>Gao</surname> 
<given-names>Y</given-names>
</string-name>, 
<string-name>
<surname>Canela-Xandri</surname> 
<given-names>O</given-names>
</string-name>, 
<string-name>
<surname>Wang</surname> 
<given-names>S</given-names>
</string-name>, 
<string-name>
<surname>Yu</surname> 
<given-names>Y</given-names>
</string-name>, 
<string-name>
<surname>Cai</surname> 
<given-names>W</given-names>
</string-name>, 
<etal>et al</etal></person-group>. 
<article-title>A multi-tissue atlas of regulatory variants in cattle</article-title>. 
<source>Nat Genet</source>. 
<year>2022</year>;
<volume>54</volume>(
<issue>9</issue>):
<fpage>1438</fpage>&#x2013;
<lpage>47</lpage>. 
doi:<pub-id pub-id-type="doi">10.1038/s41588-022-01153-5</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-10">
        <label>10.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Teng</surname> 
<given-names>J</given-names>
</string-name>, 
<string-name>
<surname>Gao</surname> 
<given-names>Y</given-names>
</string-name>, 
<string-name>
<surname>Yin</surname> 
<given-names>H</given-names>
</string-name>, 
<string-name>
<surname>Bai</surname> 
<given-names>Z</given-names>
</string-name>, 
<string-name>
<surname>Liu</surname> 
<given-names>S</given-names>
</string-name>, 
<string-name>
<surname>Zeng</surname> 
<given-names>H</given-names>
</string-name>, 
<etal>et al</etal></person-group>. 
<article-title>A compendium of genetic regulatory effects across pig tissues</article-title>. 
<source>Nat Genet</source>. 
<year>2024</year>;
<volume>56</volume>(
<issue>1</issue>):
<fpage>112</fpage>&#x2013;
<lpage>23</lpage>. 
doi:<pub-id pub-id-type="doi">10.1038/s41588-023-01585-7</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-11">
        <label>11.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Liu</surname> 
<given-names>Z</given-names>
</string-name>, 
<string-name>
<surname>Wu</surname> 
<given-names>X</given-names>
</string-name>, 
<string-name>
<surname>Hou</surname> 
<given-names>L</given-names>
</string-name>, 
<string-name>
<surname>Ji</surname> 
<given-names>S</given-names>
</string-name>, 
<string-name>
<surname>Zhang</surname> 
<given-names>Y</given-names>
</string-name>, 
<string-name>
<surname>Fan</surname> 
<given-names>W</given-names>
</string-name>, 
<etal>et al</etal></person-group>. 
<article-title>Effects of cadmium on transcription, physiology, and ultrastructure of two tobacco cultivars</article-title>. 
<source>Sci Total Environ</source>. 
<year>2023</year>;
<volume>869</volume>:
<fpage>161751</fpage>. 
doi:<pub-id pub-id-type="doi">10.1016/j.scitotenv.2023.161751</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-12">
        <label>12.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Luo</surname> 
<given-names>Z</given-names>
</string-name>, 
<string-name>
<surname>Zhou</surname> 
<given-names>Z</given-names>
</string-name>, 
<string-name>
<surname>Li</surname> 
<given-names>Y</given-names>
</string-name>, 
<string-name>
<surname>Tao</surname> 
<given-names>S</given-names>
</string-name>, 
<string-name>
<surname>Hu</surname> 
<given-names>ZR</given-names>
</string-name>, 
<string-name>
<surname>Yang</surname> 
<given-names>JS</given-names>
</string-name>, 
<etal>et al</etal></person-group>. 
<article-title>Transcriptome-based gene regulatory network analyses of differential cold tolerance of two tobacco cultivars</article-title>. 
<source>BMC Plant Biol</source>. 
<year>2022</year>;
<volume>22</volume>(
<issue>1</issue>):
<fpage>369</fpage>. 
doi:<pub-id pub-id-type="doi">10.1186/s12870-022-03767-7</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-13">
        <label>13.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Edwards</surname> 
<given-names>KD</given-names>
</string-name>, 
<string-name>
<surname>Fernandez-Pozo</surname> 
<given-names>N</given-names>
</string-name>, 
<string-name>
<surname>Drake-Stowe</surname> 
<given-names>K</given-names>
</string-name>, 
<string-name>
<surname>Humphry</surname> 
<given-names>M</given-names>
</string-name>, 
<string-name>
<surname>Evans</surname> 
<given-names>AD</given-names>
</string-name>, 
<string-name>
<surname>Bombarely</surname> 
<given-names>A</given-names>
</string-name>, 
<etal>et al</etal></person-group>. 
<article-title>A reference genome for <italic>Nicotiana tabacum</italic> enables map-based cloning of homeologous loci implicated in nitrogen utilization efficiency</article-title>. 
<source>BMC Genomics</source>. 
<year>2017</year>;
<volume>18</volume>(
<issue>1</issue>):
<fpage>448</fpage>. 
doi:<pub-id pub-id-type="doi">10.1186/s12864-017-3791-6</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-14">
        <label>14.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Chen</surname> 
<given-names>S</given-names>
</string-name>, 
<string-name>
<surname>Zhou</surname> 
<given-names>Y</given-names>
</string-name>, 
<string-name>
<surname>Chen</surname> 
<given-names>Y</given-names>
</string-name>, 
<string-name>
<surname>Gu</surname> 
<given-names>J</given-names>
</string-name></person-group>. 
<article-title>Fastp: an ultra-fast all-in-one FASTQ preprocessor</article-title>. 
<source>Bioinformatics</source>. 
<year>2018</year>;
<volume>34</volume>(
<issue>17</issue>):
<fpage>i884</fpage>&#x2013;
<lpage>90</lpage>. 
doi:<pub-id pub-id-type="doi">10.1093/bioinformatics/bty560</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-15">
        <label>15.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Dobin</surname> 
<given-names>A</given-names>
</string-name>, 
<string-name>
<surname>Davis</surname> 
<given-names>CA</given-names>
</string-name>, 
<string-name>
<surname>Schlesinger</surname> 
<given-names>F</given-names>
</string-name>, 
<string-name>
<surname>Drenkow</surname> 
<given-names>J</given-names>
</string-name>, 
<string-name>
<surname>Zaleski</surname> 
<given-names>C</given-names>
</string-name>, 
<string-name>
<surname>Jha</surname> 
<given-names>S</given-names>
</string-name>, 
<etal>et al</etal></person-group>. 
<article-title>STAR: ultrafast universal RNA-seq aligner</article-title>. 
<source>Bioinformatics</source>. 
<year>2013</year>;
<volume>29</volume>(
<issue>1</issue>):
<fpage>15</fpage>&#x2013;
<lpage>21</lpage>. 
doi:<pub-id pub-id-type="doi">10.1093/bioinformatics/bts635</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-16">
        <label>16.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Pertea</surname> 
<given-names>M</given-names>
</string-name>, 
<string-name>
<surname>Pertea</surname> 
<given-names>GM</given-names>
</string-name>, 
<string-name>
<surname>Antonescu</surname> 
<given-names>CM</given-names>
</string-name>, 
<string-name>
<surname>Chang</surname> 
<given-names>TC</given-names>
</string-name>, 
<string-name>
<surname>Mendell</surname> 
<given-names>JT</given-names>
</string-name>, 
<string-name>
<surname>Salzberg</surname> 
<given-names>SL</given-names>
</string-name></person-group>. 
<article-title>StringTie enables improved reconstruction of a transcriptome from RNA-seq reads</article-title>. 
<source>Nat Biotechnol</source>. 
<year>2015</year>;
<volume>33</volume>(
<issue>3</issue>):
<fpage>290</fpage>&#x2013;
<lpage>5</lpage>. 
doi:<pub-id pub-id-type="doi">10.1038/nbt.3122</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-17">
        <label>17.</label>
        <mixed-citation publication-type="web">
<person-group person-group-type="author">
<string-name>
<surname>Krijthe</surname> 
<given-names>JH</given-names>
</string-name>, 
<string-name>
<surname>Van der Maaten</surname> 
<given-names>L</given-names>
</string-name></person-group>. 
<article-title>Rtsne: T-distributed stochastic neighbor embedding using Barnes-Hut implementation. Package &#x2018;Rtsne&#x2019; [Internet]</article-title>. [cited 
<date-in-citation>2026 Jan 1</date-in-citation>]. 
<comment>Available from: <ext-link ext-link-type="uri" xlink:href="https://cran.r-project.org/web/packages/Rtsne/Rtsne.pdf" xmlns:xlink="http://www.w3.org/1999/xlink">https://cran.r-project.org/web/packages/Rtsne/Rtsne.pdf</ext-link></comment>. 

        </mixed-citation>
    </ref>
      <ref id="ref-18">
        <label>18.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>McInnes</surname> 
<given-names>L</given-names>
</string-name>, 
<string-name>
<surname>Healy</surname> 
<given-names>J</given-names>
</string-name>, 
<string-name>
<surname>Saul</surname> 
<given-names>N</given-names>
</string-name>, 
<string-name>
<surname>Gro&#xDF;berger</surname> 
<given-names>L</given-names>
</string-name></person-group>. 
<article-title>UMAP: uniform manifold approximation and projection</article-title>. 
<source>J Open Source Softw</source>. 
<year>2018</year>;
<volume>3</volume>(
<issue>29</issue>):
<fpage>861</fpage>. 
doi:<pub-id pub-id-type="doi">10.21105/joss.00861</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-19">
        <label>19.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Garc&#xED;a-P&#xE9;rez</surname> 
<given-names>R</given-names>
</string-name>, 
<string-name>
<surname>Esteller-Cucala</surname> 
<given-names>P</given-names>
</string-name>, 
<string-name>
<surname>Mas</surname> 
<given-names>G</given-names>
</string-name>, 
<string-name>
<surname>Lob&#xF3;n</surname> 
<given-names>I</given-names>
</string-name>, 
<string-name>
<surname>Di Carlo</surname> 
<given-names>V</given-names>
</string-name>, 
<string-name>
<surname>Riera</surname> 
<given-names>M</given-names>
</string-name>, 
<etal>et al</etal></person-group>. 
<article-title>Epigenomic profiling of primate lymphoblastoid cell lines reveals the evolutionary patterns of epigenetic activities in gene regulatory architectures</article-title>. 
<source>Nat Commun</source>. 
<year>2021</year>;
<volume>12</volume>(
<issue>1</issue>):
<fpage>3116</fpage>. 
doi:<pub-id pub-id-type="doi">10.1038/s41467-021-23397-1</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-20">
        <label>20.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Cantalapiedra</surname> 
<given-names>CP</given-names>
</string-name>, 
<string-name>
<surname>Hern&#xE1;ndez-Plaza</surname> 
<given-names>A</given-names>
</string-name>, 
<string-name>
<surname>Letunic</surname> 
<given-names>I</given-names>
</string-name>, 
<string-name>
<surname>Bork</surname> 
<given-names>P</given-names>
</string-name>, 
<string-name>
<surname>Huerta-Cepas</surname> 
<given-names>J</given-names>
</string-name></person-group>. 
<article-title>eggNOG-mapper v2: functional annotation, orthology assignments, and domain prediction at the metagenomic scale</article-title>. 
<source>Mol Biol Evol</source>. 
<year>2021</year>;
<volume>38</volume>(
<issue>12</issue>):
<fpage>5825</fpage>&#x2013;
<lpage>9</lpage>. 
doi:<pub-id pub-id-type="doi">10.1093/molbev/msab293</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-21">
        <label>21.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Wu</surname> 
<given-names>T</given-names>
</string-name>, 
<string-name>
<surname>Hu</surname> 
<given-names>E</given-names>
</string-name>, 
<string-name>
<surname>Xu</surname> 
<given-names>S</given-names>
</string-name>, 
<string-name>
<surname>Chen</surname> 
<given-names>M</given-names>
</string-name>, 
<string-name>
<surname>Guo</surname> 
<given-names>P</given-names>
</string-name>, 
<string-name>
<surname>Dai</surname> 
<given-names>Z</given-names>
</string-name>, 
<etal>et al</etal></person-group>. 
<article-title>clusterProfiler 4.0: a universal enrichment tool for interpreting omics data</article-title>. 
<source>Innovation</source>. 
<year>2021</year>;
<volume>2</volume>(
<issue>3</issue>):
<fpage>100141</fpage>. 
doi:<pub-id pub-id-type="doi">10.1016/j.xinn.2021.100141</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-22">
        <label>22.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Kuznetsova</surname> 
<given-names>I</given-names>
</string-name>, 
<string-name>
<surname>Lugmayr</surname> 
<given-names>A</given-names>
</string-name>, 
<string-name>
<surname>Siira</surname> 
<given-names>SJ</given-names>
</string-name>, 
<string-name>
<surname>Rackham</surname> 
<given-names>O</given-names>
</string-name>, 
<string-name>
<surname>Filipovska</surname> 
<given-names>A</given-names>
</string-name></person-group>. 
<article-title>CirGO: an alternative circular way of visualising gene ontology terms</article-title>. 
<source>BMC Bioinform</source>. 
<year>2019</year>;
<volume>20</volume>(
<issue>1</issue>):
<fpage>84</fpage>. 
doi:<pub-id pub-id-type="doi">10.1186/s12859-019-2671-2</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-23">
        <label>23.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Jin</surname> 
<given-names>J</given-names>
</string-name>, 
<string-name>
<surname>Tian</surname> 
<given-names>F</given-names>
</string-name>, 
<string-name>
<surname>Yang</surname> 
<given-names>DC</given-names>
</string-name>, 
<string-name>
<surname>Meng</surname> 
<given-names>YQ</given-names>
</string-name>, 
<string-name>
<surname>Kong</surname> 
<given-names>L</given-names>
</string-name>, 
<string-name>
<surname>Luo</surname> 
<given-names>J</given-names>
</string-name>, 
<etal>et al</etal></person-group>. 
<article-title>PlantTFDB 4.0: toward a central hub for transcription factors and regulatory interactions in plants</article-title>. 
<source>Nucleic Acids Res</source>. 
<year>2017</year>;
<volume>45</volume>(
<issue>D1</issue>):
<fpage>D1040</fpage>&#x2013;
<lpage>5</lpage>. 
doi:<pub-id pub-id-type="doi">10.1093/nar/gkw982</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-24">
        <label>24.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Liao</surname> 
<given-names>Y</given-names>
</string-name>, 
<string-name>
<surname>Smyth</surname> 
<given-names>GK</given-names>
</string-name>, 
<string-name>
<surname>Shi</surname> 
<given-names>W</given-names>
</string-name></person-group>. 
<article-title>featureCounts: an efficient general purpose program for assigning sequence reads to genomic features</article-title>. 
<source>Bioinformatics</source>. 
<year>2014</year>;
<volume>30</volume>(
<issue>7</issue>):
<fpage>923</fpage>&#x2013;
<lpage>30</lpage>. 
doi:<pub-id pub-id-type="doi">10.1093/bioinformatics/btt656</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-25">
        <label>25.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Love</surname> 
<given-names>MI</given-names>
</string-name>, 
<string-name>
<surname>Huber</surname> 
<given-names>W</given-names>
</string-name>, 
<string-name>
<surname>Anders</surname> 
<given-names>S</given-names>
</string-name></person-group>. 
<article-title>Moderated estimation of fold change and dispersion for RNA-seq data with DESeq2</article-title>. 
<source>Genome Biol</source>. 
<year>2014</year>;
<volume>15</volume>(
<issue>12</issue>):
<fpage>550</fpage>. 
doi:<pub-id pub-id-type="doi">10.1186/s13059-014-0550-8</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-26">
        <label>26.</label>
        <mixed-citation publication-type="web">
<person-group person-group-type="author">
<string-name>
<surname>Wei</surname> 
<given-names>T</given-names>
</string-name>, 
<string-name>
<surname>Simko</surname> 
<given-names>V</given-names>
</string-name>, 
<string-name>
<surname>Levy</surname> 
<given-names>M</given-names>
</string-name>, 
<string-name>
<surname>Xie</surname> 
<given-names>Y</given-names>
</string-name>, 
<string-name>
<surname>Jin</surname> 
<given-names>YJ</given-names>
</string-name>, 
<string-name>
<surname>Zemla</surname> 
<given-names>J</given-names>
</string-name></person-group>. 
<article-title>Visualization of a Correlation Matrix. R Package &#x201C;corrplot&#x201D; [Internet]</article-title>. [cited 
<date-in-citation>2026 Jan 1</date-in-citation>]. 
<comment>Available from: <ext-link ext-link-type="uri" xlink:href="https://github.com/taiyun/corrplot" xmlns:xlink="http://www.w3.org/1999/xlink">https://github.com/taiyun/corrplot</ext-link></comment>. 

        </mixed-citation>
    </ref>
      <ref id="ref-27">
        <label>27.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Yu</surname> 
<given-names>G</given-names>
</string-name>, 
<string-name>
<surname>Wang</surname> 
<given-names>LG</given-names>
</string-name>, 
<string-name>
<surname>Han</surname> 
<given-names>Y</given-names>
</string-name>, 
<string-name>
<surname>He</surname> 
<given-names>QY</given-names>
</string-name></person-group>. 
<article-title>clusterProfiler: an R package for comparing biological themes among gene clusters</article-title>. 
<source>OMICS</source>. 
<year>2012</year>;
<volume>16</volume>(
<issue>5</issue>):
<fpage>284</fpage>&#x2013;
<lpage>7</lpage>. 
doi:<pub-id pub-id-type="doi">10.1089/omi.2011.0118</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-28">
        <label>28.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Heinz</surname> 
<given-names>S</given-names>
</string-name>, 
<string-name>
<surname>Benner</surname> 
<given-names>C</given-names>
</string-name>, 
<string-name>
<surname>Spann</surname> 
<given-names>N</given-names>
</string-name>, 
<string-name>
<surname>Bertolino</surname> 
<given-names>E</given-names>
</string-name>, 
<string-name>
<surname>Lin</surname> 
<given-names>YC</given-names>
</string-name>, 
<string-name>
<surname>Laslo</surname> 
<given-names>P</given-names>
</string-name>, 
<etal>et al</etal></person-group>. 
<article-title>Simple combinations of lineage-determining transcription factors prime <italic>cis</italic>-regulatory elements required for macrophage and B cell identities</article-title>. 
<source>Mol Cell</source>. 
<year>2010</year>;
<volume>38</volume>(
<issue>4</issue>):
<fpage>576</fpage>&#x2013;
<lpage>89</lpage>. 
doi:<pub-id pub-id-type="doi">10.1016/j.molcel.2010.05.004</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-29">
        <label>29.</label>
        <mixed-citation publication-type="book">
<person-group person-group-type="author">
<string-name>
<surname>Kohl</surname> 
<given-names>M</given-names>
</string-name>, 
<string-name>
<surname>Wiese</surname> 
<given-names>S</given-names>
</string-name>, 
<string-name>
<surname>Warscheid</surname> 
<given-names>B</given-names>
</string-name></person-group>. 
<chapter-title>Cytoscape: software for visualization and analysis of biological networks</chapter-title>. In: 
<person-group person-group-type="editor">
<string-name>
<surname>Hamacher</surname> 
<given-names>M</given-names>
</string-name>, 
<string-name>
<surname>Eisenacher</surname> 
<given-names>M</given-names>
</string-name>, 
<string-name>
<surname>Stephan</surname> 
<given-names>C</given-names>
</string-name></person-group>, editors. 
<source>Data mining in proteomics</source>. 
<publisher-loc>Totowa, NJ, USA</publisher-loc>: 
<publisher-name>Humana Press</publisher-name>; 
<year>2011</year>. p. 
<fpage>291</fpage>&#x2013;
<lpage>303</lpage>. 
doi:<pub-id pub-id-type="doi">10.1007/978-1-60761-987-1_18</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-30">
        <label>30.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Danecek</surname> 
<given-names>P</given-names>
</string-name>, 
<string-name>
<surname>Bonfield</surname> 
<given-names>JK</given-names>
</string-name>, 
<string-name>
<surname>Liddle</surname> 
<given-names>J</given-names>
</string-name>, 
<string-name>
<surname>Marshall</surname> 
<given-names>J</given-names>
</string-name>, 
<string-name>
<surname>Ohan</surname> 
<given-names>V</given-names>
</string-name>, 
<string-name>
<surname>Pollard</surname> 
<given-names>MO</given-names>
</string-name>, 
<etal>et al</etal></person-group>. 
<article-title>Twelve years of SAMtools and BCFtools</article-title>. 
<source>Gigascience</source>. 
<year>2021</year>;
<volume>10</volume>(
<issue>2</issue>):
<elocation-id>giab008</elocation-id>. 
doi:<pub-id pub-id-type="doi">10.1093/gigascience/giab008</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-31">
        <label>31.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Brouard</surname> 
<given-names>JS</given-names>
</string-name>, 
<string-name>
<surname>Schenkel</surname> 
<given-names>F</given-names>
</string-name>, 
<string-name>
<surname>Marete</surname> 
<given-names>A</given-names>
</string-name>, 
<string-name>
<surname>Bissonnette</surname> 
<given-names>N</given-names>
</string-name></person-group>. 
<article-title>The GATK joint genotyping workflow is appropriate for calling variants in RNA-seq experiments</article-title>. 
<source>J Anim Sci Biotechnol</source>. 
<year>2019</year>;
<volume>10</volume>:
<fpage>44</fpage>. 
doi:<pub-id pub-id-type="doi">10.1186/s40104-019-0359-0</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-32">
        <label>32.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Danecek</surname> 
<given-names>P</given-names>
</string-name>, 
<string-name>
<surname>Auton</surname> 
<given-names>A</given-names>
</string-name>, 
<string-name>
<surname>Abecasis</surname> 
<given-names>G</given-names>
</string-name>, 
<string-name>
<surname>Albers</surname> 
<given-names>CA</given-names>
</string-name>, 
<string-name>
<surname>Banks</surname> 
<given-names>E</given-names>
</string-name>, 
<string-name>
<surname>DePristo</surname> 
<given-names>MA</given-names>
</string-name>, 
<etal>et al</etal></person-group>. 
<article-title>The variant call format and VCFtools</article-title>. 
<source>Bioinformatics</source>. 
<year>2011</year>;
<volume>27</volume>(
<issue>15</issue>):
<fpage>2156</fpage>&#x2013;
<lpage>8</lpage>. 
doi:<pub-id pub-id-type="doi">10.1093/bioinformatics/btr330</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-33">
        <label>33.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Ongen</surname> 
<given-names>H</given-names>
</string-name>, 
<string-name>
<surname>Buil</surname> 
<given-names>A</given-names>
</string-name>, 
<string-name>
<surname>Brown</surname> 
<given-names>AA</given-names>
</string-name>, 
<string-name>
<surname>Dermitzakis</surname> 
<given-names>ET</given-names>
</string-name>, 
<string-name>
<surname>Delaneau</surname> 
<given-names>O</given-names>
</string-name></person-group>. 
<article-title>Fast and efficient QTL mapper for thousands of molecular phenotypes</article-title>. 
<source>Bioinformatics</source>. 
<year>2016</year>;
<volume>32</volume>(
<issue>10</issue>):
<fpage>1479</fpage>&#x2013;
<lpage>85</lpage>. 
doi:<pub-id pub-id-type="doi">10.1093/bioinformatics/btv722</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-34">
        <label>34.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Kang</surname> 
<given-names>HM</given-names>
</string-name>, 
<string-name>
<surname>Sul</surname> 
<given-names>JH</given-names>
</string-name>, 
<string-name>
<surname>Service</surname> 
<given-names>SK</given-names>
</string-name>, 
<string-name>
<surname>Zaitlen</surname> 
<given-names>NA</given-names>
</string-name>, 
<string-name>
<surname>Kong</surname> 
<given-names>SY</given-names>
</string-name>, 
<string-name>
<surname>Freimer</surname> 
<given-names>NB</given-names>
</string-name>, 
<etal>et al</etal></person-group>. 
<article-title>Variance component model to account for sample structure in genome-wide association studies</article-title>. 
<source>Nat Genet</source>. 
<year>2010</year>;
<volume>42</volume>(
<issue>4</issue>):
<fpage>348</fpage>&#x2013;
<lpage>54</lpage>. 
doi:<pub-id pub-id-type="doi">10.1038/ng.548</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-35">
        <label>35.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Purcell</surname> 
<given-names>S</given-names>
</string-name>, 
<string-name>
<surname>Neale</surname> 
<given-names>B</given-names>
</string-name>, 
<string-name>
<surname>Todd-Brown</surname> 
<given-names>K</given-names>
</string-name>, 
<string-name>
<surname>Thomas</surname> 
<given-names>L</given-names>
</string-name>, 
<string-name>
<surname>Ferreira</surname> 
<given-names>MAR</given-names>
</string-name>, 
<string-name>
<surname>Bender</surname> 
<given-names>D</given-names>
</string-name>, 
<etal>et al</etal></person-group>. 
<article-title>PLINK: a tool set for whole-genome association and population-based linkage analyses</article-title>. 
<source>Am J Hum Genet</source>. 
<year>2007</year>;
<volume>81</volume>(
<issue>3</issue>):
<fpage>559</fpage>&#x2013;
<lpage>75</lpage>. 
doi:<pub-id pub-id-type="doi">10.1086/519795</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-36">
        <label>36.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Fan</surname> 
<given-names>J</given-names>
</string-name>, 
<string-name>
<surname>Shen</surname> 
<given-names>Y</given-names>
</string-name>, 
<string-name>
<surname>Chen</surname> 
<given-names>C</given-names>
</string-name>, 
<string-name>
<surname>Chen</surname> 
<given-names>X</given-names>
</string-name>, 
<string-name>
<surname>Yang</surname> 
<given-names>X</given-names>
</string-name>, 
<string-name>
<surname>Liu</surname> 
<given-names>H</given-names>
</string-name>, 
<etal>et al</etal></person-group>. 
<article-title>A large-scale integrated transcriptomic atlas for soybean organ development</article-title>. 
<source>Mol Plant</source>. 
<year>2025</year>;
<volume>18</volume>(
<issue>4</issue>):
<fpage>669</fpage>&#x2013;
<lpage>89</lpage>. 
doi:<pub-id pub-id-type="doi">10.1016/j.molp.2025.02.003</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-37">
        <label>37.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Marcon</surname> 
<given-names>A</given-names>
</string-name>, 
<string-name>
<surname>Roma&#xF1;ach</surname> 
<given-names>LG</given-names>
</string-name>, 
<string-name>
<surname>Andr&#xE9;</surname> 
<given-names>D</given-names>
</string-name>, 
<string-name>
<surname>Ding</surname> 
<given-names>J</given-names>
</string-name>, 
<string-name>
<surname>Zhang</surname> 
<given-names>B</given-names>
</string-name>, 
<string-name>
<surname>Hvidsten</surname> 
<given-names>TR</given-names>
</string-name>, 
<etal>et al</etal></person-group>. 
<article-title>A transcriptional roadmap of the yearly growth cycle in <italic>Populus</italic> trees</article-title>. 
<source>Plant Cell</source>. 
<year>2025</year>;
<volume>37</volume>(
<issue>9</issue>):
<elocation-id>koaf208</elocation-id>. 
doi:<pub-id pub-id-type="doi">10.1093/plcell/koaf208</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-38">
        <label>38.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Slavkovi&#x107;</surname> 
<given-names>F</given-names>
</string-name>, 
<string-name>
<surname>Bendahmane</surname> 
<given-names>A</given-names>
</string-name></person-group>. 
<article-title>Floral phytochemistry: impact of volatile organic compounds and nectar secondary metabolites on pollinator behavior and health</article-title>. 
<source>Chem Biodivers</source>. 
<year>2023</year>;
<volume>20</volume>(
<issue>4</issue>):
<elocation-id>e202201139</elocation-id>. 
doi:<pub-id pub-id-type="doi">10.1002/cbdv.202201139</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-39">
        <label>39.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>D&#xF6;tterl</surname> 
<given-names>S</given-names>
</string-name>, 
<string-name>
<surname>Gershenzon</surname> 
<given-names>J</given-names>
</string-name></person-group>. 
<article-title>Chemistry, biosynthesis and biology of floral volatiles: roles in pollination and other functions</article-title>. 
<source>Nat Prod Rep</source>. 
<year>2023</year>;
<volume>40</volume>(
<issue>12</issue>):
<fpage>1901</fpage>&#x2013;
<lpage>37</lpage>. 
doi:<pub-id pub-id-type="doi">10.1039/D3NP00024A</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-40">
        <label>40.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Li</surname> 
<given-names>S</given-names>
</string-name>, 
<string-name>
<surname>He</surname> 
<given-names>X</given-names>
</string-name>, 
<string-name>
<surname>Gao</surname> 
<given-names>Y</given-names>
</string-name>, 
<string-name>
<surname>Zhou</surname> 
<given-names>C</given-names>
</string-name>, 
<string-name>
<surname>Chiang</surname> 
<given-names>VL</given-names>
</string-name>, 
<string-name>
<surname>Li</surname> 
<given-names>W</given-names>
</string-name></person-group>. 
<article-title>Histone acetylation changes in plant response to drought stress</article-title>. 
<source>Genes</source>. 
<year>2021</year>;
<volume>12</volume>(
<issue>9</issue>):
<fpage>1409</fpage>. 
doi:<pub-id pub-id-type="doi">10.3390/genes12091409</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-41">
        <label>41.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Dangl</surname> 
<given-names>JL</given-names>
</string-name>, 
<string-name>
<surname>Jones</surname> 
<given-names>JD</given-names>
</string-name></person-group>. 
<article-title>Plant pathogens and integrated defence responses to infection</article-title>. 
<source>Nature</source>. 
<year>2001</year>;
<volume>411</volume>(
<issue>6839</issue>):
<fpage>826</fpage>&#x2013;
<lpage>33</lpage>. 
doi:<pub-id pub-id-type="doi">10.1038/35081161</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-42">
        <label>42.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>de Freitas</surname> 
<given-names>ST</given-names>
</string-name>, 
<string-name>
<surname>Martinelli</surname> 
<given-names>F</given-names>
</string-name>, 
<string-name>
<surname>Feng</surname> 
<given-names>B</given-names>
</string-name>, 
<string-name>
<surname>Reitz</surname> 
<given-names>NF</given-names>
</string-name>, 
<string-name>
<surname>Mitcham</surname> 
<given-names>EJ</given-names>
</string-name></person-group>. 
<article-title>Transcriptome approach to understand the potential mechanisms inhibiting or triggering blossom-end rot development in tomato fruit in response to plant growth regulators</article-title>. 
<source>J Plant Growth Regul</source>. 
<year>2018</year>;
<volume>37</volume>(
<issue>1</issue>):
<fpage>183</fpage>&#x2013;
<lpage>98</lpage>. 
doi:<pub-id pub-id-type="doi">10.1007/s00344-017-9718-2</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-43">
        <label>43.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Pignocchi</surname> 
<given-names>C</given-names>
</string-name>, 
<string-name>
<surname>Fletcher</surname> 
<given-names>JM</given-names>
</string-name>, 
<string-name>
<surname>Wilkinson</surname> 
<given-names>JE</given-names>
</string-name>, 
<string-name>
<surname>Barnes</surname> 
<given-names>JD</given-names>
</string-name>, 
<string-name>
<surname>Foyer</surname> 
<given-names>CH</given-names>
</string-name></person-group>. 
<article-title>The function of ascorbate oxidase in tobacco</article-title>. 
<source>Plant Physiol</source>. 
<year>2003</year>;
<volume>132</volume>(
<issue>3</issue>):
<fpage>1631</fpage>&#x2013;
<lpage>41</lpage>. 
doi:<pub-id pub-id-type="doi">10.1104/pp.103.022798</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-44">
        <label>44.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Tan</surname> 
<given-names>QW</given-names>
</string-name>, 
<string-name>
<surname>Lim</surname> 
<given-names>PK</given-names>
</string-name>, 
<string-name>
<surname>Chen</surname> 
<given-names>Z</given-names>
</string-name>, 
<string-name>
<surname>Pasha</surname> 
<given-names>A</given-names>
</string-name>, 
<string-name>
<surname>Provart</surname> 
<given-names>N</given-names>
</string-name>, 
<string-name>
<surname>Arend</surname> 
<given-names>M</given-names>
</string-name>, 
<etal>et al</etal></person-group>. 
<article-title>Cross-stress gene expression atlas of <italic>Marchantia polymorpha</italic> reveals the hierarchy and regulatory principles of abiotic stress responses</article-title>. 
<source>Nat Commun</source>. 
<year>2023</year>;
<volume>14</volume>(
<issue>1</issue>):
<fpage>986</fpage>. 
doi:<pub-id pub-id-type="doi">10.1038/s41467-023-36517-w</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-45">
        <label>45.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Li</surname> 
<given-names>C</given-names>
</string-name>, 
<string-name>
<surname>Zha</surname> 
<given-names>W</given-names>
</string-name>, 
<string-name>
<surname>Li</surname> 
<given-names>W</given-names>
</string-name>, 
<string-name>
<surname>Wang</surname> 
<given-names>J</given-names>
</string-name>, 
<string-name>
<surname>You</surname> 
<given-names>A</given-names>
</string-name></person-group>. 
<article-title>Advances in the biosynthesis of terpenoids and their ecological functions in plant resistance</article-title>. 
<source>Int J Mol Sci</source>. 
<year>2023</year>;
<volume>24</volume>(
<issue>14</issue>):
<fpage>11561</fpage>. 
doi:<pub-id pub-id-type="doi">10.3390/ijms241411561</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-46">
        <label>46.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Cao</surname> 
<given-names>Y</given-names>
</string-name>, 
<string-name>
<surname>Liu</surname> 
<given-names>L</given-names>
</string-name>, 
<string-name>
<surname>Ma</surname> 
<given-names>K</given-names>
</string-name>, 
<string-name>
<surname>Wang</surname> 
<given-names>W</given-names>
</string-name>, 
<string-name>
<surname>Lv</surname> 
<given-names>H</given-names>
</string-name>, 
<string-name>
<surname>Gao</surname> 
<given-names>M</given-names>
</string-name>, 
<etal>et al</etal></person-group>. 
<article-title>The jasmonate-induced bHLH gene SlJIG functions in terpene biosynthesis and resistance to insects and fungus</article-title>. 
<source>J Integr Plant Biol</source>. 
<year>2022</year>;
<volume>64</volume>(
<issue>5</issue>):
<fpage>1102</fpage>&#x2013;
<lpage>15</lpage>. 
doi:<pub-id pub-id-type="doi">10.1111/jipb.13248</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-47">
        <label>47.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Jiang</surname> 
<given-names>C</given-names>
</string-name>, 
<string-name>
<surname>Fei</surname> 
<given-names>X</given-names>
</string-name>, 
<string-name>
<surname>Pan</surname> 
<given-names>X</given-names>
</string-name>, 
<string-name>
<surname>Huang</surname> 
<given-names>H</given-names>
</string-name>, 
<string-name>
<surname>Qi</surname> 
<given-names>Y</given-names>
</string-name>, 
<string-name>
<surname>Wang</surname> 
<given-names>X</given-names>
</string-name>, 
<etal>et al</etal></person-group>. 
<article-title>Tissue-specific transcriptome and metabolome analyses reveal a gene module regulating the terpenoid biosynthesis in <italic>Curcuma wenyujin</italic></article-title>. 
<source>Ind Crops Prod</source>. 
<year>2021</year>;
<volume>170</volume>:
<fpage>113758</fpage>. 
doi:<pub-id pub-id-type="doi">10.1016/j.indcrop.2021.113758</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-48">
        <label>48.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Zhang</surname> 
<given-names>K</given-names>
</string-name>, 
<string-name>
<surname>Wang</surname> 
<given-names>N</given-names>
</string-name>, 
<string-name>
<surname>Gao</surname> 
<given-names>X</given-names>
</string-name>, 
<string-name>
<surname>Ma</surname> 
<given-names>Q</given-names>
</string-name></person-group>. 
<article-title>Integrated metabolite profiling and transcriptome analysis reveals tissue-specific regulation of terpenoid biosynthesis in <italic>Artemisia argyi</italic></article-title>. 
<source>Genomics</source>. 
<year>2022</year>;
<volume>114</volume>(
<issue>4</issue>):
<fpage>110388</fpage>. 
doi:<pub-id pub-id-type="doi">10.1016/j.ygeno.2022.110388</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-49">
        <label>49.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Cheng</surname> 
<given-names>AX</given-names>
</string-name>, 
<string-name>
<surname>Lou</surname> 
<given-names>YG</given-names>
</string-name>, 
<string-name>
<surname>Mao</surname> 
<given-names>YB</given-names>
</string-name>, 
<string-name>
<surname>Lu</surname> 
<given-names>S</given-names>
</string-name>, 
<string-name>
<surname>Wang</surname> 
<given-names>LJ</given-names>
</string-name>, 
<string-name>
<surname>Chen</surname> 
<given-names>XY</given-names>
</string-name></person-group>. 
<article-title>Plant terpenoids: biosynthesis and ecological functions</article-title>. 
<source>J Integr Plant Biol</source>. 
<year>2007</year>;
<volume>49</volume>(
<issue>2</issue>):
<fpage>179</fpage>&#x2013;
<lpage>86</lpage>. 
doi:<pub-id pub-id-type="doi">10.1111/j.1744-7909.2007.00395.x</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-50">
        <label>50.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Li</surname> 
<given-names>J</given-names>
</string-name>, 
<string-name>
<surname>Wang</surname> 
<given-names>Y</given-names>
</string-name>, 
<string-name>
<surname>Dong</surname> 
<given-names>Y</given-names>
</string-name>, 
<string-name>
<surname>Zhang</surname> 
<given-names>W</given-names>
</string-name>, 
<string-name>
<surname>Wang</surname> 
<given-names>D</given-names>
</string-name>, 
<string-name>
<surname>Bai</surname> 
<given-names>H</given-names>
</string-name>, 
<etal>et al</etal></person-group>. 
<article-title>The chromosome-based lavender genome provides new insights into Lamiaceae evolution and terpenoid biosynthesis</article-title>. 
<source>Hortic Res</source>. 
<year>2021</year>;
<volume>8</volume>(
<issue>1</issue>):
<fpage>53</fpage>. 
doi:<pub-id pub-id-type="doi">10.1038/s41438-021-00490-6</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-51">
        <label>51.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Ortigosa</surname> 
<given-names>A</given-names>
</string-name>, 
<string-name>
<surname>Fonseca</surname> 
<given-names>S</given-names>
</string-name>, 
<string-name>
<surname>Franco-Zorrilla</surname> 
<given-names>JM</given-names>
</string-name>, 
<string-name>
<surname>Fern&#xE1;ndez-Calvo</surname> 
<given-names>P</given-names>
</string-name>, 
<string-name>
<surname>Zander</surname> 
<given-names>M</given-names>
</string-name>, 
<string-name>
<surname>Lewsey</surname> 
<given-names>MG</given-names>
</string-name>, 
<etal>et al</etal></person-group>. 
<article-title>The JA-pathway <italic>MYC</italic> transcription factors regulate photomorphogenic responses by targeting HY5 gene expression</article-title>. 
<source>Plant J</source>. 
<year>2020</year>;
<volume>102</volume>(
<issue>1</issue>):
<fpage>138</fpage>&#x2013;
<lpage>52</lpage>. 
doi:<pub-id pub-id-type="doi">10.1111/tpj.14618</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-52">
        <label>52.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Bessa</surname> 
<given-names>M</given-names>
</string-name>, 
<string-name>
<surname>Joaquin</surname> 
<given-names>M</given-names>
</string-name>, 
<string-name>
<surname>Tavner</surname> 
<given-names>F</given-names>
</string-name>, 
<string-name>
<surname>Saville</surname> 
<given-names>MK</given-names>
</string-name>, 
<string-name>
<surname>Watson</surname> 
<given-names>RJ</given-names>
</string-name></person-group>. 
<article-title>Regulation of the cell cycle by B-myb</article-title>. 
<source>Blood Cells Mol Dis</source>. 
<year>2001</year>;
<volume>27</volume>(
<issue>2</issue>):
<fpage>416</fpage>&#x2013;
<lpage>21</lpage>. 
doi:<pub-id pub-id-type="doi">10.1006/bcmd.2001.0399</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-53">
        <label>53.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Wang</surname> 
<given-names>Z</given-names>
</string-name>, 
<string-name>
<surname>Song</surname> 
<given-names>G</given-names>
</string-name>, 
<string-name>
<surname>Zhang</surname> 
<given-names>F</given-names>
</string-name>, 
<string-name>
<surname>Shu</surname> 
<given-names>X</given-names>
</string-name>, 
<string-name>
<surname>Wang</surname> 
<given-names>N</given-names>
</string-name></person-group>. 
<article-title>Functional characterization of <italic>AP2</italic>/<italic>ERF</italic> transcription factors during flower development and anthocyanin biosynthesis related candidate genes in <italic>Lycoris</italic></article-title>. 
<source>Int J Mol Sci</source>. 
<year>2023</year>;
<volume>24</volume>(
<issue>19</issue>):
<fpage>14464</fpage>. 
doi:<pub-id pub-id-type="doi">10.3390/ijms241914464</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-54">
        <label>54.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Zhang</surname> 
<given-names>H</given-names>
</string-name>, 
<string-name>
<surname>Pan</surname> 
<given-names>X</given-names>
</string-name>, 
<string-name>
<surname>Liu</surname> 
<given-names>S</given-names>
</string-name>, 
<string-name>
<surname>Lin</surname> 
<given-names>W</given-names>
</string-name>, 
<string-name>
<surname>Li</surname> 
<given-names>Y</given-names>
</string-name>, 
<string-name>
<surname>Zhang</surname> 
<given-names>X</given-names>
</string-name></person-group>. 
<article-title>Genome-wide analysis of AP2/ERF transcription factors in pineapple reveals functional divergence during flowering induction mediated by ethylene and floral organ development</article-title>. 
<source>Genomics</source>. 
<year>2021</year>;
<volume>113</volume>(
<issue>2</issue>):
<fpage>474</fpage>&#x2013;
<lpage>89</lpage>. 
doi:<pub-id pub-id-type="doi">10.1016/j.ygeno.2020.10.040</pub-id>. 

        </mixed-citation>
    </ref>
      <ref id="ref-55">
        <label>55.</label>
        <mixed-citation publication-type="journal">
<person-group person-group-type="author">
<string-name>
<surname>Gong</surname> 
<given-names>Z</given-names>
</string-name>, 
<string-name>
<surname>Xiong</surname> 
<given-names>L</given-names>
</string-name>, 
<string-name>
<surname>Shi</surname> 
<given-names>H</given-names>
</string-name>, 
<string-name>
<surname>Yang</surname> 
<given-names>S</given-names>
</string-name>, 
<string-name>
<surname>Herrera-Estrella</surname> 
<given-names>LR</given-names>
</string-name>, 
<string-name>
<surname>Xu</surname> 
<given-names>G</given-names>
</string-name>, 
<etal>et al</etal></person-group>. 
<article-title>Plant abiotic stress response and nutrient use efficiency</article-title>. 
<source>Sci China Life Sci</source>. 
<year>2020</year>;
<volume>63</volume>(
<issue>5</issue>):
<fpage>635</fpage>&#x2013;
<lpage>74</lpage>. 
doi:<pub-id pub-id-type="doi">10.1007/s11427-020-1683-x</pub-id>. 

        </mixed-citation>
    </ref>
    </ref-list>
  </back>
</article>
