<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article>
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" article-type="research-article" dtd-version="1.2" xml:lang="en"><front><journal-meta><journal-id journal-id-type="publisher-id">Ecological genetics</journal-id><journal-title-group><journal-title xml:lang="en">Ecological genetics</journal-title><trans-title-group xml:lang="ru"><trans-title>Экологическая генетика</trans-title></trans-title-group></journal-title-group><issn publication-format="print">1811-0932</issn><issn publication-format="electronic">2411-9202</issn><publisher><publisher-name xml:lang="en">Eco-Vector</publisher-name></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">696083</article-id><article-id pub-id-type="doi">10.17816/ecogen696083</article-id><article-id pub-id-type="edn">STZYGV</article-id><article-categories><subj-group subj-group-type="toc-heading" xml:lang="en"><subject>Methodology in ecological genetics</subject></subj-group><subj-group subj-group-type="toc-heading" xml:lang="ru"><subject>Методология экологической генетики</subject></subj-group><subj-group subj-group-type="article-type"><subject>Research Article</subject></subj-group></article-categories><title-group><article-title xml:lang="en">CTGA: a web-based functional genomic resource for <italic>Cyamopsis tetragonoloba</italic> (L.) Taub.</article-title><trans-title-group xml:lang="ru"><trans-title>CTGA: геномный веб-ресурс <italic>Cyamopsis tetragonoloba</italic> (L.) 
Taub.</trans-title></trans-title-group></title-group><contrib-group><contrib contrib-type="author"><contrib-id contrib-id-type="orcid">https://orcid.org/0000-0001-5666-3020</contrib-id><contrib-id contrib-id-type="spin">5048-0203</contrib-id><name-alternatives><name xml:lang="en"><surname>Zorin</surname><given-names>Evgeny A.</given-names></name><name xml:lang="ru"><surname>Зорин</surname><given-names>Евгений Андреевич</given-names></name></name-alternatives><address><country country="RU">Russian Federation</country></address><bio xml:lang="en"><p>Cand. Sci. (Biology)</p></bio><bio xml:lang="ru"><p>канд. биол. наук</p></bio><email>ezorin@arriam.ru</email><xref ref-type="aff" rid="aff1"/><xref ref-type="aff" rid="aff2"/></contrib><contrib contrib-type="author"><contrib-id contrib-id-type="orcid">https://orcid.org/0000-0003-2808-7745</contrib-id><contrib-id contrib-id-type="spin">2802-9614</contrib-id><name-alternatives><name xml:lang="en"><surname>Vishnyakova</surname><given-names>Margarita A.</given-names></name><name xml:lang="ru"><surname>Вишнякова</surname><given-names>Маргарита Афанасьевна</given-names></name></name-alternatives><address><country country="RU">Russian Federation</country></address><bio xml:lang="en"><p>Dr. Sci. (Biology), Professor</p></bio><bio xml:lang="ru"><p>д-р биол. наук, профессор</p></bio><email>m.vishnyakova@vir.nw.ru</email><xref ref-type="aff" rid="aff1"/></contrib><contrib contrib-type="author"><contrib-id contrib-id-type="orcid">https://orcid.org/0000-0002-2411-9191</contrib-id><contrib-id contrib-id-type="spin">2610-3670</contrib-id><name-alternatives><name xml:lang="en"><surname>Zhukov</surname><given-names>Vladimir A.</given-names></name><name xml:lang="ru"><surname>Жуков</surname><given-names>Владимир Александрович</given-names></name></name-alternatives><address><country country="RU">Russian Federation</country></address><bio xml:lang="en"><p>Cand. Sci. (Biology)</p></bio><bio xml:lang="ru"><p>канд. биол. 
наук</p></bio><email>vzhukov@arriam.ru</email><xref ref-type="aff" rid="aff1"/><xref ref-type="aff" rid="aff2"/></contrib></contrib-group><aff-alternatives id="aff1"><aff><institution xml:lang="en">N.I. Vavilov All-Russian Institute of Plant Genetic Resources</institution></aff><aff><institution xml:lang="ru">Федеральный исследовательский центр Всероссийский институт генетических ресурсов растений им. Н.И. Вавилова</institution></aff></aff-alternatives><aff-alternatives id="aff2"><aff><institution xml:lang="en">All-Russia Research Institute for Agricultural Microbiology</institution></aff><aff><institution xml:lang="ru">Всероссийский научно-исследовательский институт сельскохозяйственной микробиологии</institution></aff></aff-alternatives><pub-date date-type="preprint" iso-8601-date="2025-12-11" publication-format="electronic"><day>11</day><month>12</month><year>2025</year></pub-date><pub-date date-type="pub" iso-8601-date="2026-02-09" publication-format="electronic"><day>09</day><month>02</month><year>2026</year></pub-date><volume>23</volume><issue>4</issue><issue-title xml:lang="en"/><issue-title xml:lang="ru"/><fpage>391</fpage><lpage>408</lpage><history><date date-type="received" iso-8601-date="2025-11-11"><day>11</day><month>11</month><year>2025</year></date><date date-type="accepted" iso-8601-date="2025-12-11"><day>11</day><month>12</month><year>2025</year></date></history><permissions><copyright-statement xml:lang="en">Copyright © 2025, Eco-Vector</copyright-statement><copyright-statement xml:lang="ru">Copyright © 2025, Эко-Вектор</copyright-statement><copyright-year>2025</copyright-year><copyright-holder xml:lang="en">Eco-Vector</copyright-holder><copyright-holder xml:lang="ru">Эко-Вектор</copyright-holder><license><ali:license_ref xmlns:ali="http://www.niso.org/schemas/ali/1.0/">https://creativecommons.org/licenses/by-nc-nd/4.0/</ali:license_ref></license></permissions><self-uri 
xlink:href="https://journals.eco-vector.com/ecolgenet/article/view/696083">https://journals.eco-vector.com/ecolgenet/article/view/696083</self-uri><abstract xml:lang="en"><p><bold>BACKGROUND:</bold> Guar (Cyamopsis tetragonoloba), an industrially important crop, is valued for the galactomannan gum derived from its seeds. Recent advances in genomic and transcriptomic research have provided valuable resources such as the reference genome and several sets of gene expression profiles. However, these data are currently fragmented and therefore require bioinformatics expertise to access and analyze them. Additionally, several genomic assemblies have been recently published, but there are currently no bioinformatics platforms specifically dedicated to guar genomics and transcriptomics.</p> <p><bold>AIM:</bold> To address this challenge, we have developed CTGA, a comprehensive functional genomic web portal for guar.</p> <p><bold>METHODS:</bold> Using Flask, as well as popular Python, CSS, and HTML libraries, we have developed a backend and frontend for the genomic platform.</p> <p><bold>RESULTS:</bold> We have performed a de novo structural and functional annotation of the guar genome predicting 57,019 protein-coding genes with UTRs. Besides, expression data from 85 public RNA-seq libraries representing various tissues and conditions were collected to create a normalized gene expression atlas. CTGA features an intuitive web interface to provide interactive tools, including a genome browser (IGV), BLAST for homology searching, tools for the Gene Ontology enrichment analysis, for working with guar genomic sequences, as well as a tool for generating heatmaps for more convenient analysis of guar gene expression in various tissues and experimental conditions. 
It also includes detailed functional annotations from various sources (eggNOG, Mercator4, GO, and KEGG) and instant visualization of gene expression profiles.</p> <p><bold>CONCLUSION:</bold> CTGA is available at: <ext-link ext-link-type="uri" xlink:href="https://guar.arriam.ru">https://guar.arriam.ru/</ext-link></p></abstract><trans-abstract xml:lang="ru"><p><bold>Обоснование.</bold> Гуар (Cyamopsis tetragonoloba (L.) Taub.) — сельскохозяйственная культура, имеющая важное промышленное значение, в том числе благодаря камеди, получаемой из семян. Достижения в области геномных и транскриптомных исследований в последние годы привели к появлению референсной геномной сборки и множества наборов профилей экспрессии генов. Однако в настоящее время эти данные разрознены и для доступа и их анализа требуются навыки в области биоинформатики. Несмотря на все достижения, на данный момент не существует специализированных биоинформатических платформ, посвященных геномике и транскриптомике гуара, которые бы облегчили процесс работы с этими данными.</p> <p><bold>Цель исследования.</bold> Разработать комплексный веб-портал, посвященный функциональной геномике гуара.</p> <p><bold>Методы.</bold> Мы провели de novo структурную и функциональную аннотацию генома гуара, предсказав 57 019 белок-кодирующих генов и их нетранслируемые области (UTRs). Кроме того, были собраны данные экспрессии из 85 публичных RNA-seq библиотек, представляющих различные ткани и экспериментальные условия, чтобы создать исчерпывающий атлас экспрессии генов.</p> <p><bold>Результаты.</bold> CTGA обладает интуитивно понятным веб-интерфейсом и предоставляет интерактивные инструменты, включая геномный браузер, BLAST-сервис для поиска гомологии, инструменты для анализа обогащения в терминах Gene Ontology, для работы с геномными последовательностями, а также инструмент для построения тепловых карт для удобного анализа профилей экспрессии генов гуара в различных тканях и экспериментальных условиях. 
Портал также включает подробную функциональную аннотацию генов из различных источников (eggNOG, Mercator4, GO и KEGG) и мгновенную визуализацию профилей экспрессии генов.</p> <p><bold>Заключение.</bold> Платформа CTGA доступна по адресу: <ext-link ext-link-type="uri" xlink:href="https://guar.arriam.ru/">https://guar.arriam.ru/</ext-link></p></trans-abstract><kwd-group xml:lang="en"><kwd>guar</kwd><kwd>Cyamopsis tetragonoloba</kwd><kwd>genomics</kwd><kwd>transcriptomics</kwd><kwd>gene expression</kwd><kwd>gene annotation</kwd><kwd>genome browser</kwd></kwd-group><kwd-group xml:lang="ru"><kwd>гуар</kwd><kwd>Cyamopsis tetragonoloba</kwd><kwd>геномика</kwd><kwd>транскриптомика</kwd><kwd>экспрессия генов</kwd><kwd>аннотация генов</kwd><kwd>геномный браузер</kwd></kwd-group><funding-group><award-group><funding-source><institution-wrap><institution xml:lang="en">Russian Science Foundation</institution></institution-wrap><institution-wrap><institution xml:lang="ru">Российский научный фонд</institution></institution-wrap></funding-source><award-id>23-16-00195</award-id></award-group><funding-statement xml:lang="en">This research was funded by the Russian Science Foundation, project No. 23-16-00195 dated 15 May 2023</funding-statement><funding-statement xml:lang="ru">Данная работа целиком поддержана грантом Российского научного фонда (проект № 23-16-00195)</funding-statement></funding-group></article-meta></front><body></body><back><ref-list><ref id="B1"><label>1.</label><mixed-citation>Thombare N, Jha U, Mishra S, et al. Guar gum as a promising starting material for diverse applications: a review. Int J Biol Macromol. 2016;88:361–372. doi: 10.1016/j.ijbiomac.2016.04.001 EDN: WRSQWT</mixed-citation></ref><ref id="B2"><label>2.</label><mixed-citation>Naoumkina M, Torres-Jerez I, Allen S, et al. Analysis of cDNA libraries from developing seeds of guar (Cyamopsis tetragonoloba (L.) Taub). BMC Plant Biol. 2007;7:62. 
doi: 10.1186/1471-2229-7-62 EDN: NUVATW</mixed-citation></ref><ref id="B3"><label>3.</label><mixed-citation>Chaudhury A, Kaila T, Gaikwad K. Elucidation of galactomannan biosynthesis pathway genes through transcriptome sequencing of seeds collected at different developmental stages of commercially important Indian varieties of cluster bean (Cyamopsis tetragonoloba L.). Sci Rep. 2019;9(1):11539. doi: 10.1038/s41598-019-48072-w EDN: GEKMME</mixed-citation></ref><ref id="B4"><label>4.</label><mixed-citation>Hu H, Wang H, Zhang Y, et al. Characterization of genes in guar gum biosynthesis based on quantitative RNA-sequencing in guar bean (Cyamopsis tetragonoloba). Sci Rep. 2019;9(1):10991. doi: 10.1038/s41598-019-47518-5 EDN: XRKTMY</mixed-citation></ref><ref id="B5"><label>5.</label><mixed-citation>Sharma S, Tyagi A, Srivastava H, et al. Exploring the edible gum (galactomannan) biosynthesis and its regulation during pod developmental stages in clusterbean using comparative transcriptomic approach. Sci Rep. 2021;11(1):4000. doi: 10.1038/s41598-021-83507-3 EDN: JYLGKG</mixed-citation></ref><ref id="B6"><label>6.</label><mixed-citation>Gaikwad K, Ramakrishna G, Srivastava H, et al. The chromosome-scale genome assembly of cluster bean provides molecular insight into edible gum (galactomannan) biosynthesis family genes. Sci Rep. 2023;13(1):9941. doi: 10.1038/s41598-023-33762-3 EDN: ACCLTJ</mixed-citation></ref><ref id="B7"><label>7.</label><mixed-citation>Rawal HC, Kumar S, Mithra SVA, et al. High quality unigenes and microsatellite markers from tissue specific transcriptome and development of a database in clusterbean (Cyamopsis tetragonoloba, L. Taub). Genes. 2017;8(11):313. doi: 10.3390/genes8110313 EDN: YIOLPP</mixed-citation></ref><ref id="B8"><label>8.</label><mixed-citation>Thakur O, Randhawa GS. Identification and characterization of SSR, SNP and InDel molecular markers from RNA-Seq data of guar (Cyamopsis tetragonoloba, L. Taub.) roots. BMC Genomics. 
2018;19(1):951. doi: 10.1186/s12864-018-5205-9 EDN: HZOERI</mixed-citation></ref><ref id="B9"><label>9.</label><mixed-citation>Grigoreva E, Barbitoff Y, Changalidi A, et al. Development of SNP set for the marker-assisted selection of guar (Cyamopsis tetragonoloba (L.) Taub.) based on a custom reference genome assembly. Plants. 2021;10(10):2063. doi: 10.3390/plants10102063 EDN: OZJRYH</mixed-citation></ref><ref id="B10"><label>10.</label><mixed-citation>Arkhimandritova S, Shavarda A, Potokina E. Key metabolites associated with the onset of flowering of guar genotypes (Cyamopsis tetragonoloba (L.) Taub). BMC Plant Biology. 2020;20(Suppl 1):291. doi: 10.1186/s12870-020-02498-x EDN: VMAHIS</mixed-citation></ref><ref id="B11"><label>11.</label><mixed-citation>Grigoreva E, Tkachenko A, Arkhimandritova S, et al. Identification of key metabolic pathways and biomarkers underlying flowering time of guar (Cyamopsis tetragonoloba (L.) Taub.) via integrated transcriptome-metabolome analysis. Genes. 2021;12(7):952. doi: 10.3390/genes12070952 EDN: XBDJOP</mixed-citation></ref><ref id="B12"><label>12.</label><mixed-citation>Kaila T, Chaduvla PK, Rawal HC, et al. Chloroplast genome sequence of clusterbean (Cyamopsis tetragonoloba L.): genome structure and comparative analysis. Genes. 2017;8(9):212. doi: 10.3390/genes8090212</mixed-citation></ref><ref id="B13"><label>13.</label><mixed-citation>Altschul SF, Gish W, Miller W, et al. Basic local alignment search tool. J Mol Biol. 1990;215(3):403–410. doi: 10.1016/S0022-2836(05)80360-2 EDN: SGUJER</mixed-citation></ref><ref id="B14"><label>14.</label><mixed-citation>Li JH, Li MJ, Li WL, et al. Leguminous industrial crop guar (Cyamopsis tetragonoloba): the chromosome-level reference genome de novo assembly. Industrial Crops and Products. 2024;216:118748. doi: 10.1016/j.indcrop.2024.118748 EDN: AIAYXK</mixed-citation></ref><ref id="B15"><label>15.</label><mixed-citation>Brůna T, Hoff KJ, Lomsadze A, et al. 
BRAKER2: automatic eukaryotic genome annotation with GeneMark-EP+ and AUGUSTUS supported by a protein database. NAR Genom Bioinform. 2021;3(1):lqaa108. doi: 10.1093/nargab/lqaa108 EDN: UMWJZR</mixed-citation></ref><ref id="B16"><label>16.</label><mixed-citation>Brůna T, Lomsadze A, Borodovsky M. GeneMark-EP+: eukaryotic gene prediction with self-training in the space of genes and proteins. NAR Genom Bioinform. 2020;2(2):lqaa026. doi: 10.1093/nargab/lqaa026 EDN: AOAAGH</mixed-citation></ref><ref id="B17"><label>17.</label><mixed-citation>Stanke M, Steinkamp R, Waack S, et al. AUGUSTUS: a web server for gene finding in eukaryotes. Nucleic Acids Res. 2004;32(Web Server issue):W309–W312. doi: 10.1093/nar/gkh379 EDN: IUCVSZ</mixed-citation></ref><ref id="B18"><label>18.</label><mixed-citation>The Gene Ontology Consortium, Aleksander SA, Balhoff J, et al. The Gene Ontology knowledgebase in 2023. Genetics. 2023;224(1):iyad031. doi: 10.1093/genetics/iyad031 EDN: OIDRSY</mixed-citation></ref><ref id="B19"><label>19.</label><mixed-citation>Ashburner M, Ball CA, Blake JA, et al. Gene Ontology: tool for the unification of biology. Nat Genet. 2000;25(1):25–29. doi: 10.1038/75556 EDN: SPYGDX</mixed-citation></ref><ref id="B20"><label>20.</label><mixed-citation>Kanehisa M, Goto S. KEGG: Kyoto Encyclopedia of Genes and Genomes. Nucleic Acids Res. 2000;28(1):27–30. doi: 10.1093/nar/28.1.27 EDN: IUQVVD</mixed-citation></ref><ref id="B21"><label>21.</label><mixed-citation>Cantalapiedra CP, Hernández-Plaza A, Letunic I, et al. eggNOG-mapper v2: functional annotation, orthology assignments, and domain prediction at the metagenomic scale. Mol Biol Evol. 2021;38(12):5825–5829. doi: 10.1093/molbev/msab293 EDN: PFFLTN</mixed-citation></ref><ref id="B22"><label>22.</label><mixed-citation>Bolger M, Schwacke R, Usadel B. MapMan visualization of RNA-Seq data using Mercator4 functional annotations. Methods in Molecular Biology. 2021;2354:195–212. 
doi: 10.1007/978-1-0716-1609-3_9 EDN: DMLUEF</mixed-citation></ref><ref id="B23"><label>23.</label><mixed-citation>Schwacke R, Ponce-Soto GY, Krause K, et al. MapMan4: a refined protein classification and annotation framework applicable to multi-omics data analysis. Mol Plant. 2019;12(6):879–892. doi: 10.1016/j.molp.2019.01.003</mixed-citation></ref><ref id="B24"><label>24.</label><mixed-citation>Manni M, Berkeley MR, Seppey M, et al. BUSCO update: novel and streamlined workflows along with broader and deeper phylogenetic coverage for scoring of eukaryotic, prokaryotic, and viral genomes. Mol Biol Evol. 2021;38(10):4647–4654. doi: 10.1093/molbev/msab199 EDN: LULTEI</mixed-citation></ref><ref id="B25"><label>25.</label><mixed-citation>github.com [Internet]. SRA-toolkit. Available from: https://github.com/ncbi/sra-tools/wiki/01.-Downloading-SRA-Toolkit Accessed: October 02, 2025.</mixed-citation></ref><ref id="B26"><label>26.</label><mixed-citation>sourceforge.net [Internet]. BBMap. Available from: https://sourceforge.net/projects/bbmap/ Accessed: October 02, 2025.</mixed-citation></ref><ref id="B27"><label>27.</label><mixed-citation>Dobin A, Davis CA, Schlesinger F, et al. STAR: ultrafast universal RNA-seq aligner. Bioinformatics. 2013;29(1):15–21. doi: 10.1093/bioinformatics/bts635</mixed-citation></ref><ref id="B28"><label>28.</label><mixed-citation>Liao Y, Smyth GK, Shi W. featureCounts: an efficient general purpose program for assigning sequence reads to genomic features. Bioinformatics. 2014;30(7):923–930. doi: 10.1093/bioinformatics/btt656 EDN: YCINGW</mixed-citation></ref><ref id="B29"><label>29.</label><mixed-citation>flask.palletsprojects.com [Internet]. FLASK. Available from: https://flask.palletsprojects.com/en/stable/ Accessed: October 02, 2025.</mixed-citation></ref><ref id="B30"><label>30.</label><mixed-citation>Thorvaldsdottir H, Robinson JT, Mesirov JP. Integrative Genomics Viewer (IGV): high-performance genomics data visualization and exploration. 
Brief Bioinform. 2013;14(2):178–192. doi: 10.1093/bib/bbs017</mixed-citation></ref><ref id="B31"><label>31.</label><mixed-citation>Alexa A, Rahnenführer J. topGO. Bioconductor: Buffalo, NY, USA; 2017.</mixed-citation></ref><ref id="B32"><label>32.</label><mixed-citation>Boneva S, Schlecht A, Böhringer D, et al. 3' MACE RNA-sequencing allows for transcriptome profiling in human tissue samples after long-term storage. Lab Invest. 2020;100(10):1345–1355. doi: 10.1038/s41374-020-0446-z EDN: RJUKRN</mixed-citation></ref></ref-list></back></article>
