<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3.dtd">
<article article-type="research-article" dtd-version="1.3" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xml:lang="ru"><front><journal-meta><journal-id journal-id-type="publisher-id">vavilov</journal-id><journal-title-group><journal-title xml:lang="ru">Вавиловский журнал генетики и селекции</journal-title><trans-title-group xml:lang="en"><trans-title>Vavilov Journal of Genetics and Breeding</trans-title></trans-title-group></journal-title-group><issn pub-type="epub">2500-3259</issn><publisher><publisher-name>Institute of Cytology and Genetics of Siberian Branch of the RAS</publisher-name></publisher></journal-meta><article-meta><article-id pub-id-type="doi">10.18699/vjgb-25-35</article-id><article-id custom-type="elpub" pub-id-type="custom">vavilov-4551</article-id><article-categories><subj-group subj-group-type="heading"><subject>Research Article</subject></subj-group><subj-group subj-group-type="section-heading" xml:lang="ru"><subject>БИОИНФОРМАТИКА</subject></subj-group><subj-group subj-group-type="section-heading" xml:lang="en"><subject>BIOINFORMATICS</subject></subj-group></article-categories><title-group><article-title>CropGene: программный комплекс анализа геномных и транскриптомных данных сельскохозяйственных растений</article-title><trans-title-group xml:lang="en"><trans-title>CropGene: a software package for the analysis of genomic and transcriptomic data of agricultural plants</trans-title></trans-title-group></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><contrib-id contrib-id-type="orcid">https://orcid.org/0000-0002-3011-6288</contrib-id><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Пронозин</surname><given-names>А. Ю.</given-names></name><name name-style="western" xml:lang="en"><surname>Pronozin</surname><given-names>A. Yu.</given-names></name></name-alternatives><bio xml:lang="ru"><p>Новосибирск</p></bio><bio xml:lang="en"><p>Novosibirsk</p></bio><xref ref-type="aff" rid="aff-1"/></contrib><contrib contrib-type="author" corresp="yes"><contrib-id contrib-id-type="orcid">https://orcid.org/0009-0003-0918-8441</contrib-id><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Каретников</surname><given-names>Д. И.</given-names></name><name name-style="western" xml:lang="en"><surname>Karetnikov</surname><given-names>D.  I.</given-names></name></name-alternatives><bio xml:lang="ru"><p>Новосибирск</p></bio><bio xml:lang="en"><p>Novosibirsk</p></bio><xref ref-type="aff" rid="aff-1"/></contrib><contrib contrib-type="author" corresp="yes"><contrib-id contrib-id-type="orcid">https://orcid.org/0009-0001-6414-5562</contrib-id><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Шмаков</surname><given-names>Н. А.</given-names></name><name name-style="western" xml:lang="en"><surname>Shmakov</surname><given-names>N. A.</given-names></name></name-alternatives><bio xml:lang="ru"><p>Новосибирск</p></bio><bio xml:lang="en"><p>Novosibirsk</p></bio><xref ref-type="aff" rid="aff-1"/></contrib><contrib contrib-type="author" corresp="yes"><contrib-id contrib-id-type="orcid">https://orcid.org/0000-0002-3477-2047</contrib-id><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Бочарникова</surname><given-names>М. Е.</given-names></name><name name-style="western" xml:lang="en"><surname>Bocharnikova</surname><given-names>M. E.</given-names></name></name-alternatives><bio xml:lang="ru"><p>Новосибирск</p></bio><bio xml:lang="en"><p>Novosibirsk</p></bio><xref ref-type="aff" rid="aff-1"/></contrib><contrib contrib-type="author" corresp="yes"><contrib-id contrib-id-type="orcid">https://orcid.org/0000-0001-7969-8015</contrib-id><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Афонникова</surname><given-names>С. Д.</given-names></name><name name-style="western" xml:lang="en"><surname>Afonnikova</surname><given-names>S. D.</given-names></name></name-alternatives><bio xml:lang="ru"><p>Новосибирск</p></bio><bio xml:lang="en"><p>Novosibirsk</p></bio><xref ref-type="aff" rid="aff-1"/></contrib><contrib contrib-type="author" corresp="yes"><contrib-id contrib-id-type="orcid">https://orcid.org/0000-0001-9738-1409</contrib-id><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Афонников</surname><given-names>Д. А.</given-names></name><name name-style="western" xml:lang="en"><surname>Afonnikov</surname><given-names>D. A.</given-names></name></name-alternatives><bio xml:lang="ru"><p>Новосибирск</p></bio><bio xml:lang="en"><p>Novosibirsk</p></bio><xref ref-type="aff" rid="aff-1"/></contrib><contrib contrib-type="author" corresp="yes"><contrib-id contrib-id-type="orcid">https://orcid.org/0000-0001-6800-8787</contrib-id><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Колчанов</surname><given-names>Н. А.</given-names></name><name name-style="western" xml:lang="en"><surname>Kolchanov</surname><given-names>N. A.</given-names></name></name-alternatives><bio xml:lang="ru"><p>Новосибирск</p></bio><bio xml:lang="en"><p>Novosibirsk</p></bio><xref ref-type="aff" rid="aff-1"/></contrib></contrib-group><aff-alternatives id="aff-1"><aff xml:lang="ru">Федеральный исследовательский центр Институт цитологии и генетики Сибирского отделения Российской академии наук; Курчатовский геномный центр ИЦиГ СО РАН<country>Россия</country></aff><aff xml:lang="en">Institute of Cytology and Genetics of the Siberian Branch of the Russian Academy of Sciences; Kurchatov Genomic Center of ICG SB RAS<country>Russian Federation</country></aff></aff-alternatives><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>11</day><month>04</month><year>2025</year></pub-date><volume>29</volume><issue>2</issue><fpage>320</fpage><lpage>329</lpage><permissions><copyright-statement>Copyright &amp;#x00A9; Пронозин А.Ю., Каретников Д.И., Шмаков Н.А., Бочарникова М.Е., Афонникова С.Д., Афонников Д.А., Колчанов Н.А., 2025</copyright-statement><copyright-year>2025</copyright-year><copyright-holder xml:lang="ru">Пронозин А.Ю., Каретников Д.И., Шмаков Н.А., Бочарникова М.Е., Афонникова С.Д., Афонников Д.А., Колчанов Н.А.</copyright-holder><copyright-holder xml:lang="en">Pronozin A.Y., Karetnikov D.I., Shmakov N.A., Bocharnikova M.E., Afonnikova S.D., Afonnikov D.A., Kolchanov N.A.</copyright-holder><license license-type="creative-commons-attribution" xlink:href="https://creativecommons.org/licenses/by/4.0/" xlink:type="simple"><license-p>This work is licensed under a Creative Commons Attribution 4.0 License.</license-p></license></permissions><self-uri xlink:href="https://vavilov.elpub.ru/jour/article/view/4551">https://vavilov.elpub.ru/jour/article/view/4551</self-uri><abstract><p>В настоящее время селекция сельскохозяйственных растений все больше опирается на использование молекулярно-биологических данных о генетических последовательностях, что позволяет существенно ускорить селекционный процесс создания новых сортов растений за счет геномного редактирования. Эти данные имеют большой объем, разнообразны и требуют для анализа затрат большого количества ресурсов, как трудовых, так и вычислительных. Анализ данных с такими объемом и сложностью может быть эффективным лишь с применением современных методов биоинформатики, включающих алгоритмы идентификации генов, предсказания их функции, оценку влияния эффекта мутации на фенотип растений. Такой анализ в последнее время стал невозможным без использования интегрированных программных комплексов, решающих задачи разного уровня за счет выполнения вычислительных конвейеров. В статье описан программный комплекс CropGene, разработанный для комплексного анализа геномных и транскриптомных данных сельскохозяйственных растений. Система включает в себя несколько блоков биоинформатического анализа, таких как анализ вариаций генов, сборка геномов и транскриптомов, а также аннотация генов и белков. В комплексе реализованы новые методы анализа длинных некодирующих РНК, белковых доменов, поиска и анализа полиморфизмов и полногеномного исследования ассоциаций. В работе представлены примеры применения CropGene для анализа сельскохозяйственных организмов, таких как Solanum tuberosum, Zea mays. С помощью данного программного пакета найдены: генетические маркеры, объясняющие до 50 % изменчивости параметров окраски семян; потенциальные гены, которые могут стать перспективным материалом для получения сортов картофеля; более 100 тыс. новых длинных некодирующих РНК. Также обнаружены ортогруппы, доменная структура которых проявляет заметное сходство с доменной архитектурой характерных секретируемых фосфолипаз А2. Таким образом, CropGene представляет собой важный инструмент для ученых и практиков, работающих в области агробиотехнологий и генетики растений.</p></abstract><trans-abstract xml:lang="en"><p>Currently, the breeding of agricultural plants is increasingly based on the use of molecular biological data on genetic sequences, which makes it possible to significantly accelerate the breeding process, create new plant varieties through genomic editing. These data have a large volume, variety and require a large amount of resources, both labor and computing, to analyze the costs. Data analysis of such volume and complexity can be effective only when using modern bioinformatics methods, which include algorithms for identifying genes, predicting their function, and evaluating the effect of mutation on plant phenotype. Such an analysis has recently become impossible without the use of integrated software systems that solve problems of different levels by executing computational pipelines. The paper describes the CropGene software package developed for the comprehensive analysis of genomic and transcriptomic data of agricultural plants. CropGene includes several blocks of bioinformatic analysis, such as analysis of gene variations, assembly of genomes and transcriptomes, as well as annotation of genes and proteins. CropGene implements new methods for analyzing long non-coding RNAs, protein domains, searching and analyzing polymorphisms, and genomewide association research. CropGene has a user-friendly interface and supports working with various types of data, which greatly simplifies its use for researchers who do not have deep knowledge in the field of bioinformatics. The paper provides examples of the use of CropGene for the analysis of agricultural organisms such as Solanum tuberosum and Zea mays. With CropGene, genetic markers have been identified that explain up to 50 % of the variability in seed color parameters; potential genes that may become promising material for producing potato varieties; more than 100 thousand new long non-coding RNAs. Orthogroups were also found, the domain structure of which shows a marked similarity with the domain architecture of characteristic secreted A2 phospholipases. Thus, CropGene is an important tool for scientists and practitioners working in the field of agrobiotechnology and plant genetics.</p></trans-abstract><kwd-group xml:lang="ru"><kwd>биоинформатический конвейер</kwd><kwd>программный пакет</kwd><kwd>SNP</kwd><kwd>анализ полиморфизмов</kwd><kwd>идентификация генов</kwd></kwd-group><kwd-group xml:lang="en"><kwd>bioinformatics pipeline</kwd><kwd>software package</kwd><kwd>SNP</kwd><kwd>analyzing polymorphisms</kwd><kwd>identification of genes</kwd></kwd-group><funding-group xml:lang="en"><funding-statement>The work on the creation of the CropGene software package was carried out with the support of budget project No. FWNR-2022-0020.</funding-statement></funding-group></article-meta></front><back><ref-list><title>References</title><ref id="cit1"><label>1</label><citation-alternatives><mixed-citation xml:lang="ru">Afonnikova S.D., Kiseleva A.A., Fedyaeva A.V., Komyshev E.G., Koval V.S., Afonnikov D.A., Salina E.A. Identification of novel loci precisely modulating pre-harvest sprouting resistance and red color components of the seed coat in T. aestivum L. Plants. 2024;13(10): 1309. doi 10.3390/plants13101309</mixed-citation><mixed-citation xml:lang="en">Afonnikova S.D., Kiseleva A.A., Fedyaeva A.V., Komyshev E.G., Koval V.S., Afonnikov D.A., Salina E.A. Identification of novel loci precisely modulating pre-harvest sprouting resistance and red color components of the seed coat in T. aestivum L. Plants. 2024;13(10): 1309. doi 10.3390/plants13101309</mixed-citation></citation-alternatives></ref><ref id="cit2"><label>2</label><citation-alternatives><mixed-citation xml:lang="ru">Bray N.L., Pimentel H., Melsted P., Pachter L. Near-optimal probabilistic RNA-seq quantification. Nat Biotechnol. 2016;34(5):525-527. doi 10.1038/nbt.3519</mixed-citation><mixed-citation xml:lang="en">Bray N.L., Pimentel H., Melsted P., Pachter L. Near-optimal probabilistic RNA-seq quantification. Nat Biotechnol. 2016;34(5):525-527. doi 10.1038/nbt.3519</mixed-citation></citation-alternatives></ref><ref id="cit3"><label>3</label><citation-alternatives><mixed-citation xml:lang="ru">Browning B.L., Zhou Y., Browning S.R. A one-penny imputed genome from next-generation reference panels. Am J Hum Genet. 2018; 103(3):338-348. doi 10.1016/j.ajhg.2018.07.015</mixed-citation><mixed-citation xml:lang="en">Browning B.L., Zhou Y., Browning S.R. A one-penny imputed genome from next-generation reference panels. Am J Hum Genet. 2018; 103(3):338-348. doi 10.1016/j.ajhg.2018.07.015</mixed-citation></citation-alternatives></ref><ref id="cit4"><label>4</label><citation-alternatives><mixed-citation xml:lang="ru">Burghardt L.T., Young N.D., Tiffin P. A guide to genome‐wide association mapping in plants. Curr Protoc Plant Biol. 2017;2(1):22-38. doi 10.1002/cppb.20041</mixed-citation><mixed-citation xml:lang="en">Burghardt L.T., Young N.D., Tiffin P. A guide to genome‐wide association mapping in plants. Curr Protoc Plant Biol. 2017;2(1):22-38. doi 10.1002/cppb.20041</mixed-citation></citation-alternatives></ref><ref id="cit5"><label>5</label><citation-alternatives><mixed-citation xml:lang="ru">Bushmanova E., Antipov D., Lapidus A., Suvorov V., Prjibelski A.D. rnaQUAST: a quality assessment tool for de novo transcript assemblies. Bioinformatics. 2016;32(14):2210-2212. doi 10.1093/bioinformatics/btw218</mixed-citation><mixed-citation xml:lang="en">Bushmanova E., Antipov D., Lapidus A., Suvorov V., Prjibelski A.D. rnaQUAST: a quality assessment tool for de novo transcript assemblies. Bioinformatics. 2016;32(14):2210-2212. doi 10.1093/bioinformatics/btw218</mixed-citation></citation-alternatives></ref><ref id="cit6"><label>6</label><citation-alternatives><mixed-citation xml:lang="ru">Bushmanova E., Antipov D., Lapidus A., Prjibelski A.D. rnaSPAdes: a de novo transcriptome assembler and its application to RNA-Seq data. GigaScience. 2019;8(9):giz100. doi 10.1093/gigascience/giz100</mixed-citation><mixed-citation xml:lang="en">Bushmanova E., Antipov D., Lapidus A., Prjibelski A.D. rnaSPAdes: a de novo transcriptome assembler and its application to RNA-Seq data. GigaScience. 2019;8(9):giz100. doi 10.1093/gigascience/giz100</mixed-citation></citation-alternatives></ref><ref id="cit7"><label>7</label><citation-alternatives><mixed-citation xml:lang="ru">Cardoso-Silva C.B., Costa E.A., Mancini M.C., Balsalobre T.W.A., Canesin L.E.C., Pinto L.R., Carneiro M.S., Garcia A.A.F., de Souza A.P., Vicentini R. De novo assembly and transcriptome analysis of contrasting sugarcane varieties. PloS One. 2014;9(2):e88462. doi 10.1371/journal.pone.0088462</mixed-citation><mixed-citation xml:lang="en">Cardoso-Silva C.B., Costa E.A., Mancini M.C., Balsalobre T.W.A., Canesin L.E.C., Pinto L.R., Carneiro M.S., Garcia A.A.F., de Souza A.P., Vicentini R. De novo assembly and transcriptome analysis of contrasting sugarcane varieties. PloS One. 2014;9(2):e88462. doi 10.1371/journal.pone.0088462</mixed-citation></citation-alternatives></ref><ref id="cit8"><label>8</label><citation-alternatives><mixed-citation xml:lang="ru">Carninci P., Kasukawa T., Katayama S., Gough J., Frith M.C., Maeda N., Oyama R., … Watahiki A., Okamura-Oho Y., Suzuki H., Kawai J., Hayashizaki Y. The transcriptional landscape of the mammalian genome. Science. 2005;309(5740):1559-1563. doi 10.1126/science.1112014</mixed-citation><mixed-citation xml:lang="en">Carninci P., Kasukawa T., Katayama S., Gough J., Frith M.C., Maeda N., Oyama R., … Watahiki A., Okamura-Oho Y., Suzuki H., Kawai J., Hayashizaki Y. The transcriptional landscape of the mammalian genome. Science. 2005;309(5740):1559-1563. doi 10.1126/science.1112014</mixed-citation></citation-alternatives></ref><ref id="cit9"><label>9</label><citation-alternatives><mixed-citation xml:lang="ru">Chen S., Zhou Y., Chen Y., Gu J. fastp: an ultra-fast all-in-one FASTQ preprocessor. Bioinformatics. 2018;34(17):i884-i890. doi 10.1093/bioinformatics/bty560</mixed-citation><mixed-citation xml:lang="en">Chen S., Zhou Y., Chen Y., Gu J. fastp: an ultra-fast all-in-one FASTQ preprocessor. Bioinformatics. 2018;34(17):i884-i890. doi 10.1093/bioinformatics/bty560</mixed-citation></citation-alternatives></ref><ref id="cit10"><label>10</label><citation-alternatives><mixed-citation xml:lang="ru">Danecek P., Auton A., Abecasis G., Albers C.A., Banks E., DePristo M.A., Handsaker R.E., Lunter G., Marth G.T., Sherry S.T., McVean G., Durbin R.; 1000 Genomes Project Analysis Group. The variant call format and VCFtools. Bioinformatics. 2011;27(15): 2156-2158. doi 10.1093/bioinformatics/btr330</mixed-citation><mixed-citation xml:lang="en">Danecek P., Auton A., Abecasis G., Albers C.A., Banks E., DePristo M.A., Handsaker R.E., Lunter G., Marth G.T., Sherry S.T., McVean G., Durbin R.; 1000 Genomes Project Analysis Group. The variant call format and VCFtools. Bioinformatics. 2011;27(15): 2156-2158. doi 10.1093/bioinformatics/btr330</mixed-citation></citation-alternatives></ref><ref id="cit11"><label>11</label><citation-alternatives><mixed-citation xml:lang="ru">Danecek P., Bonfield J.K., Liddle J., Marshall J., Ohan V., Pollard M.O., Whitwham A., Keane T., McCarthy S.A., Davies R.M., Li H. Twelve years of SAMtools and BCFtools. GigaScience. 2021;10(2): giab008. doi 10.1093/gigascence/giab008</mixed-citation><mixed-citation xml:lang="en">Danecek P., Bonfield J.K., Liddle J., Marshall J., Ohan V., Pollard M.O., Whitwham A., Keane T., McCarthy S.A., Davies R.M., Li H. Twelve years of SAMtools and BCFtools. GigaScience. 2021;10(2): giab008. doi 10.1093/gigascence/giab008</mixed-citation></citation-alternatives></ref><ref id="cit12"><label>12</label><citation-alternatives><mixed-citation xml:lang="ru">Drewe P., Stegle O., Hartmann L., Kahles A., Bohnert R., Wachter A., Borgwardt K., Rätsch G. Accurate detection of differential RNA processing. Nucleic Acids Res. 2013;41(10):5189-5198. doi 10.1093/nar/gkt211</mixed-citation><mixed-citation xml:lang="en">Drewe P., Stegle O., Hartmann L., Kahles A., Bohnert R., Wachter A., Borgwardt K., Rätsch G. Accurate detection of differential RNA processing. Nucleic Acids Res. 2013;41(10):5189-5198. doi 10.1093/nar/gkt211</mixed-citation></citation-alternatives></ref><ref id="cit13"><label>13</label><citation-alternatives><mixed-citation xml:lang="ru">Emms D.M., Kelly S. OrthoFinder: phylogenetic orthology inference for comparative genomics. Genome Biol. 2019;20(1):238. doi 10.1186/s13059-019-1832-y</mixed-citation><mixed-citation xml:lang="en">Emms D.M., Kelly S. OrthoFinder: phylogenetic orthology inference for comparative genomics. Genome Biol. 2019;20(1):238. doi 10.1186/s13059-019-1832-y</mixed-citation></citation-alternatives></ref><ref id="cit14"><label>14</label><citation-alternatives><mixed-citation xml:lang="ru">Grabherr M.G., Haas B.J., Yassour M., Levin J.Z., Thompson D.A., Amit I., Adiconis X., … Birren B.W., Nusbaum C., Lindblad-Toh K., Friedman N., Regev A. Full-length transcriptome assembly from RNA-Seq data without a reference genome. Nat Biotechnol. 2011; 29(7):644-652. doi 10.1038/nbt.1883</mixed-citation><mixed-citation xml:lang="en">Grabherr M.G., Haas B.J., Yassour M., Levin J.Z., Thompson D.A., Amit I., Adiconis X., … Birren B.W., Nusbaum C., Lindblad-Toh K., Friedman N., Regev A. Full-length transcriptome assembly from RNA-Seq data without a reference genome. Nat Biotechnol. 2011; 29(7):644-652. doi 10.1038/nbt.1883</mixed-citation></citation-alternatives></ref><ref id="cit15"><label>15</label><citation-alternatives><mixed-citation xml:lang="ru">Grosjean P., Ibanez F., Etienne M., Grosjean M.P. Package ‘Pastecs’. 2018. Available online: http://masterdistfiles.gentoo.org/pub/cran/web/packages/pastecs/pastecs.pdf</mixed-citation><mixed-citation xml:lang="en">Grosjean P., Ibanez F., Etienne M., Grosjean M.P. Package ‘Pastecs’. 2018. Available online: http://masterdistfiles.gentoo.org/pub/cran/web/packages/pastecs/pastecs.pdf</mixed-citation></citation-alternatives></ref><ref id="cit16"><label>16</label><citation-alternatives><mixed-citation xml:lang="ru">Han S., Liang Y., Ma Q., Xu Y., Zhang Y., Du W., Wang C., Li Y. LncFinder: an integrated platform for long non-coding RNA identification utilizing sequence intrinsic composition, structural information and physicochemical property. Brief Bioinform. 2019;20(6): 2009-2027. doi 10.1093/bib/bby065</mixed-citation><mixed-citation xml:lang="en">Han S., Liang Y., Ma Q., Xu Y., Zhang Y., Du W., Wang C., Li Y. LncFinder: an integrated platform for long non-coding RNA identification utilizing sequence intrinsic composition, structural information and physicochemical property. Brief Bioinform. 2019;20(6): 2009-2027. doi 10.1093/bib/bby065</mixed-citation></citation-alternatives></ref><ref id="cit17"><label>17</label><citation-alternatives><mixed-citation xml:lang="ru">Hassani‐Pak K., Singh A., Brandizi M., Hearnshaw J., Parsons J.D., Amberkar S., Phillips A.L., Doonan J.H., Rawlings C. KnetMiner: a comprehensive approach for supporting evidence‐based gene discovery and complex trait analysis across species. Plant Biotechnol J. 2021;19(8):1670-1678. doi 10.1111/pbi.13583</mixed-citation><mixed-citation xml:lang="en">Hassani‐Pak K., Singh A., Brandizi M., Hearnshaw J., Parsons J.D., Amberkar S., Phillips A.L., Doonan J.H., Rawlings C. KnetMiner: a comprehensive approach for supporting evidence‐based gene discovery and complex trait analysis across species. Plant Biotechnol J. 2021;19(8):1670-1678. doi 10.1111/pbi.13583</mixed-citation></citation-alternatives></ref><ref id="cit18"><label>18</label><citation-alternatives><mixed-citation xml:lang="ru">Jia L., Liu N., Huang F., Zhou Z., He X., Li H., Wang Z., Yao W. intansv: an R package for integrative analysis of structural variations. PeerJ. 2020;8:e8867. doi 10.7717/peerj.8867</mixed-citation><mixed-citation xml:lang="en">Jia L., Liu N., Huang F., Zhou Z., He X., Li H., Wang Z., Yao W. intansv: an R package for integrative analysis of structural variations. PeerJ. 2020;8:e8867. doi 10.7717/peerj.8867</mixed-citation></citation-alternatives></ref><ref id="cit19"><label>19</label><citation-alternatives><mixed-citation xml:lang="ru">Jin M., Liu H., He C., Fu J., Xiao Y., Wang Y., Xie W., Wang G., Yan J. Maize pan-transcriptome provides novel insights into genome complexity and quantitative trait variation. Sci Rep. 2016;6(1):18936. doi 10.1038/srep18936</mixed-citation><mixed-citation xml:lang="en">Jin M., Liu H., He C., Fu J., Xiao Y., Wang Y., Xie W., Wang G., Yan J. Maize pan-transcriptome provides novel insights into genome complexity and quantitative trait variation. Sci Rep. 2016;6(1):18936. doi 10.1038/srep18936</mixed-citation></citation-alternatives></ref><ref id="cit20"><label>20</label><citation-alternatives><mixed-citation xml:lang="ru">Johnson K.A., Krishnan A. Robust normalization and transformation techniques for constructing gene coexpression networks from RNA-seq data. Genome Biol. 2022;23(1):1. doi 10.1186/s13059-021-02568-9</mixed-citation><mixed-citation xml:lang="en">Johnson K.A., Krishnan A. Robust normalization and transformation techniques for constructing gene coexpression networks from RNA-seq data. Genome Biol. 2022;23(1):1. doi 10.1186/s13059-021-02568-9</mixed-citation></citation-alternatives></ref><ref id="cit21"><label>21</label><citation-alternatives><mixed-citation xml:lang="ru">Karetnikov D.I., Vasiliev G.V., Toshchakov S.V., Shmakov N.A., Genaev M.A., Nesterov M.A., Ibragimova S.M., Rybakov D.A., Gavrilenko T.A., Salina E.A., Patrushev M.V., Kochetov A.V., Afonnikov D.A. Analysis of genome structure and its variations in potato cultivars grown in Russia. Int J Mol Sci. 2023;24(6):5713. doi 10.3390/ijms24065713</mixed-citation><mixed-citation xml:lang="en">Karetnikov D.I., Vasiliev G.V., Toshchakov S.V., Shmakov N.A., Genaev M.A., Nesterov M.A., Ibragimova S.M., Rybakov D.A., Gavrilenko T.A., Salina E.A., Patrushev M.V., Kochetov A.V., Afonnikov D.A. Analysis of genome structure and its variations in potato cultivars grown in Russia. Int J Mol Sci. 2023;24(6):5713. doi 10.3390/ijms24065713</mixed-citation></citation-alternatives></ref><ref id="cit22"><label>22</label><citation-alternatives><mixed-citation xml:lang="ru">Khlestkina E.K. Molecular markers in genetic studies and breeding. Russ J Genet Appl Res. 2014;4:236-244. doi 10.1134/S2079059714030022</mixed-citation><mixed-citation xml:lang="en">Khlestkina E.K. Molecular markers in genetic studies and breeding. Russ J Genet Appl Res. 2014;4:236-244. doi 10.1134/S2079059714030022</mixed-citation></citation-alternatives></ref><ref id="cit23"><label>23</label><citation-alternatives><mixed-citation xml:lang="ru">Kim E.-D., Sung S. Long noncoding RNA: unveiling hidden layer of gene regulatory networks. Trends Plant Sci. 2012;17(1):16-21. doi 10.1016/j.tplants.2011.10.008</mixed-citation><mixed-citation xml:lang="en">Kim E.-D., Sung S. Long noncoding RNA: unveiling hidden layer of gene regulatory networks. Trends Plant Sci. 2012;17(1):16-21. doi 10.1016/j.tplants.2011.10.008</mixed-citation></citation-alternatives></ref><ref id="cit24"><label>24</label><citation-alternatives><mixed-citation xml:lang="ru">Kochetov A.V., Afonnikov D.A., Shmakov N., Vasiliev G.V., Antonova O.Y., Shatskaya N.V., Glagoleva A.Y., Ibragimova S.M., Khiutti A., Afanasenko O.S., Gavrilenko T.A. NLR genes related transcript sets in potato cultivars bearing genetic material of wild Mexican Solanum species. Agronomy. 2021;11(12):2426. doi 10.3390/agronomy11122426</mixed-citation><mixed-citation xml:lang="en">Kochetov A.V., Afonnikov D.A., Shmakov N., Vasiliev G.V., Antonova O.Y., Shatskaya N.V., Glagoleva A.Y., Ibragimova S.M., Khiutti A., Afanasenko O.S., Gavrilenko T.A. NLR genes related transcript sets in potato cultivars bearing genetic material of wild Mexican Solanum species. Agronomy. 2021;11(12):2426. doi 10.3390/agronomy11122426</mixed-citation></citation-alternatives></ref><ref id="cit25"><label>25</label><citation-alternatives><mixed-citation xml:lang="ru">Larkin D.L., Lozada D.N., Mason R.E. Genomic selection – considerations for successful implementation in wheat breeding programs. Agronomy. 2019;9(9):479. doi 10.3390/agronomy9090479</mixed-citation><mixed-citation xml:lang="en">Larkin D.L., Lozada D.N., Mason R.E. Genomic selection – considerations for successful implementation in wheat breeding programs. Agronomy. 2019;9(9):479. doi 10.3390/agronomy9090479</mixed-citation></citation-alternatives></ref><ref id="cit26"><label>26</label><citation-alternatives><mixed-citation xml:lang="ru">Li H. A statistical framework for SNP calling, mutation discovery, association mapping and population genetical parameter estimation from sequencing data. Bioinformatics. 2011;27(21):2987-2993. doi 10.1093/bioinformatics/btr509</mixed-citation><mixed-citation xml:lang="en">Li H. A statistical framework for SNP calling, mutation discovery, association mapping and population genetical parameter estimation from sequencing data. Bioinformatics. 2011;27(21):2987-2993. doi 10.1093/bioinformatics/btr509</mixed-citation></citation-alternatives></ref><ref id="cit27"><label>27</label><citation-alternatives><mixed-citation xml:lang="ru">Li H. Aligning sequence reads, clone sequences and assembly contigs with BWA-MEM. ArXiv. 2013;1303.3997</mixed-citation><mixed-citation xml:lang="en">Li H. Aligning sequence reads, clone sequences and assembly contigs with BWA-MEM. ArXiv. 2013;1303.3997</mixed-citation></citation-alternatives></ref><ref id="cit28"><label>28</label><citation-alternatives><mixed-citation xml:lang="ru">Li H., Durbin R. Fast and accurate short read alignment with Burrows– Wheeler transform. Bioinformatics. 2009;25(14):1754-1760. doi 10.1093/bioinformatics/btp324</mixed-citation><mixed-citation xml:lang="en">Li H., Durbin R. Fast and accurate short read alignment with Burrows– Wheeler transform. Bioinformatics. 2009;25(14):1754-1760. doi 10.1093/bioinformatics/btp324</mixed-citation></citation-alternatives></ref><ref id="cit29"><label>29</label><citation-alternatives><mixed-citation xml:lang="ru">Li H., Handsaker B., Wysoker A., Fennell T., Ruan J., Homer N., Marth G., Abecasis G., Durbin R; 1000 Genome Project Data Processing Subgroup. The sequence alignment/map format and SAMtools. Bioinformatics. 2009;25(16):2078-2079. doi 10.1093/bioinformatics/btp352</mixed-citation><mixed-citation xml:lang="en">Li H., Handsaker B., Wysoker A., Fennell T., Ruan J., Homer N., Marth G., Abecasis G., Durbin R; 1000 Genome Project Data Processing Subgroup. The sequence alignment/map format and SAMtools. Bioinformatics. 2009;25(16):2078-2079. doi 10.1093/bioinformatics/btp352</mixed-citation></citation-alternatives></ref><ref id="cit30"><label>30</label><citation-alternatives><mixed-citation xml:lang="ru">Liao Y., Smyth G.K., Shi W. featureCounts: an efficient general purpose program for assigning sequence reads to genomic features. Bioinformatics. 2014;30(7):923-930. doi 10.1093/bioinformatics/btt656</mixed-citation><mixed-citation xml:lang="en">Liao Y., Smyth G.K., Shi W. featureCounts: an efficient general purpose program for assigning sequence reads to genomic features. Bioinformatics. 2014;30(7):923-930. doi 10.1093/bioinformatics/btt656</mixed-citation></citation-alternatives></ref><ref id="cit31"><label>31</label><citation-alternatives><mixed-citation xml:lang="ru">Lin H.-N., Hsu W.-L. DART: a fast and accurate RNA-seq mapper with a partitioning strategy. Bioinformatics. 2018;34(2):190-197. doi 10.1093/bioinformatics/btx558</mixed-citation><mixed-citation xml:lang="en">Lin H.-N., Hsu W.-L. DART: a fast and accurate RNA-seq mapper with a partitioning strategy. Bioinformatics. 2018;34(2):190-197. doi 10.1093/bioinformatics/btx558</mixed-citation></citation-alternatives></ref><ref id="cit32"><label>32</label><citation-alternatives><mixed-citation xml:lang="ru">Muqaddasi Q.H., Brassac J., Ebmeyer E., Kollers S., Korzun V., Argillier O., Stiewe G., Plieske J., Ganal M.W., Röder M.S. Prospects of GWAS and predictive breeding for European winter wheat’s grain protein content, grain starch content, and grain hardness. Sci Rep. 2020;10(1):12541. doi 10.1038/s41598-020-69381-5</mixed-citation><mixed-citation xml:lang="en">Muqaddasi Q.H., Brassac J., Ebmeyer E., Kollers S., Korzun V., Argillier O., Stiewe G., Plieske J., Ganal M.W., Röder M.S. Prospects of GWAS and predictive breeding for European winter wheat’s grain protein content, grain starch content, and grain hardness. Sci Rep. 2020;10(1):12541. doi 10.1038/s41598-020-69381-5</mixed-citation></citation-alternatives></ref><ref id="cit33"><label>33</label><citation-alternatives><mixed-citation xml:lang="ru">Nazipova N.N. Variety of non-coding RNAs in eukaryotic genomes. Matematicheskaya Biologiya i Bioinformatika = Mathematical Biology Bioinformatics. 2021;16(2):256-298. doi 10.17537/2021.16.256 (in Russian)</mixed-citation><mixed-citation xml:lang="en">Nazipova N.N. Variety of non-coding RNAs in eukaryotic genomes. Matematicheskaya Biologiya i Bioinformatika = Mathematical Biology Bioinformatics. 2021;16(2):256-298. doi 10.17537/2021.16.256 (in Russian)</mixed-citation></citation-alternatives></ref><ref id="cit34"><label>34</label><citation-alternatives><mixed-citation xml:lang="ru">Pedregosa F., Varoquaux G., Gramfort A., Michel V., Thirion B., Grisel O., Blondel M., … Passos A., Cournapeau D., Brucher M., Perrot M., Duchesnay E. Scikit-learn: machine learning in Python. J Mach Learn Res. 2011;12:2825-2830</mixed-citation><mixed-citation xml:lang="en">Pedregosa F., Varoquaux G., Gramfort A., Michel V., Thirion B., Grisel O., Blondel M., … Passos A., Cournapeau D., Brucher M., Perrot M., Duchesnay E. Scikit-learn: machine learning in Python. J Mach Learn Res. 2011;12:2825-2830</mixed-citation></citation-alternatives></ref><ref id="cit35"><label>35</label><citation-alternatives><mixed-citation xml:lang="ru">Piskol R., Ramaswami G., Li J.B. Reliable identification of genomic variants from RNA-seq data. Am J Hum Genet. 2013;93(4):641-651. doi 10.1016/j.ajhg.2013.08.008</mixed-citation><mixed-citation xml:lang="en">Piskol R., Ramaswami G., Li J.B. Reliable identification of genomic variants from RNA-seq data. Am J Hum Genet. 2013;93(4):641-651. doi 10.1016/j.ajhg.2013.08.008</mixed-citation></citation-alternatives></ref><ref id="cit36"><label>36</label><citation-alternatives><mixed-citation xml:lang="ru">Pronozin A.Yu., Afonnikov D.A. ICAnnoLncRNA: A Snakemake pipeline for a long non-coding-RNA search and annotation in transcriptomic sequences. Genes. 2023;14(7):1331. doi 10.3390/genes14071331</mixed-citation><mixed-citation xml:lang="en">Pronozin A.Yu., Afonnikov D.A. ICAnnoLncRNA: A Snakemake pipeline for a long non-coding-RNA search and annotation in transcriptomic sequences. Genes. 2023;14(7):1331. doi 10.3390/genes14071331</mixed-citation></citation-alternatives></ref><ref id="cit37"><label>37</label><citation-alternatives><mixed-citation xml:lang="ru">Pronozin A.Yu., Bragina M.K., Salina E.A. Crop pangenomes. Vavilovskii Zhurnal Genetiki i Selektsii = Vavilov J Genet Breed. 2021; 25(1):57-63. DOI 10.18699/VJ21.007</mixed-citation><mixed-citation xml:lang="en">Pronozin A.Yu., Bragina M.K., Salina E.A. Crop pangenomes. Vavilovskii Zhurnal Genetiki i Selektsii = Vavilov J Genet Breed. 2021; 25(1):57-63. DOI 10.18699/VJ21.007</mixed-citation></citation-alternatives></ref><ref id="cit38"><label>38</label><citation-alternatives><mixed-citation xml:lang="ru">Pronozin A.Yu., Salina E.A., Afonnikov D.A. GBS-DP: a bioinformatics pipeline for processing data coming from genotyping by sequencing. Vavilov J Genet Breed. 2023;27(7):737-745. doi 10.18699/VJGB-23-86</mixed-citation><mixed-citation xml:lang="en">Pronozin A.Yu., Salina E.A., Afonnikov D.A. GBS-DP: a bioinformatics pipeline for processing data coming from genotyping by sequencing. Vavilov J Genet Breed. 2023;27(7):737-745. doi 10.18699/VJGB-23-86</mixed-citation></citation-alternatives></ref><ref id="cit39"><label>39</label><citation-alternatives><mixed-citation xml:lang="ru">Robertson G., Schein J., Chiu R., Corbett R., Field M., Jackman S.D., Mungall K., … Hirst M., Marra M.A., Jones S.J., Hoodless P.A., Bi rol I. De novo assembly and analysis of RNA-seq data. Nat Methods. 2010;7(11):909-912. doi 10.1038/nmeth.1517</mixed-citation><mixed-citation xml:lang="en">Robertson G., Schein J., Chiu R., Corbett R., Field M., Jackman S.D., Mungall K., … Hirst M., Marra M.A., Jones S.J., Hoodless P.A., Bi rol I. De novo assembly and analysis of RNA-seq data. Nat Methods. 2010;7(11):909-912. doi 10.1038/nmeth.1517</mixed-citation></citation-alternatives></ref><ref id="cit40"><label>40</label><citation-alternatives><mixed-citation xml:lang="ru">Scheben A., Batley J., Edwards D. Genotyping-by-sequencing approaches to characterize crop genomes: choosing the right tool for the right application. Plant Biotechnol J. 2017;15(2):149-161. doi 10.1111/pbi.12645</mixed-citation><mixed-citation xml:lang="en">Scheben A., Batley J., Edwards D. Genotyping-by-sequencing approaches to characterize crop genomes: choosing the right tool for the right application. Plant Biotechnol J. 2017;15(2):149-161. doi 10.1111/pbi.12645</mixed-citation></citation-alternatives></ref><ref id="cit41"><label>41</label><citation-alternatives><mixed-citation xml:lang="ru">Shendure J. The beginning of the end for microarrays? Nat Methods. 2008;5(7):585-587. doi 10.1038/nmeth0708-585</mixed-citation><mixed-citation xml:lang="en">Shendure J. The beginning of the end for microarrays? Nat Methods. 2008;5(7):585-587. doi 10.1038/nmeth0708-585</mixed-citation></citation-alternatives></ref><ref id="cit42"><label>42</label><citation-alternatives><mixed-citation xml:lang="ru">Simão F.A., Waterhouse R.M., Ioannidis P., Kriventseva E.V., Zdobnov E.M. BUSCO: assessing genome assembly and annotation completeness with single-copy orthologs. Bioinformatics. 2015;31(19): 3210-3212. doi 10.1093/bioinformatics/btv351</mixed-citation><mixed-citation xml:lang="en">Simão F.A., Waterhouse R.M., Ioannidis P., Kriventseva E.V., Zdobnov E.M. BUSCO: assessing genome assembly and annotation completeness with single-copy orthologs. Bioinformatics. 2015;31(19): 3210-3212. doi 10.1093/bioinformatics/btv351</mixed-citation></citation-alternatives></ref><ref id="cit43"><label>43</label><citation-alternatives><mixed-citation xml:lang="ru">Stanke M., Steinkamp R., Waack S., Morgenstern B. AUGUSTUS: a web server for gene finding in eukaryotes. Nucleic Acids Res. 2004;32(Suppl. 2):W309-W312. doi 10.1093/nar/gkh379</mixed-citation><mixed-citation xml:lang="en">Stanke M., Steinkamp R., Waack S., Morgenstern B. AUGUSTUS: a web server for gene finding in eukaryotes. Nucleic Acids Res. 2004;32(Suppl. 2):W309-W312. doi 10.1093/nar/gkh379</mixed-citation></citation-alternatives></ref><ref id="cit44"><label>44</label><citation-alternatives><mixed-citation xml:lang="ru">Sukhareva A.S., Kuluev B.R. DNA markers for genetic analysis of crops. Biomika = Biomics. 2018;10(1):69-84. doi 10.31301/2221-6197.bmcs.2018-15 (in Russian)</mixed-citation><mixed-citation xml:lang="en">Sukhareva A.S., Kuluev B.R. DNA markers for genetic analysis of crops. Biomika = Biomics. 2018;10(1):69-84. doi 10.31301/2221-6197.bmcs.2018-15 (in Russian)</mixed-citation></citation-alternatives></ref><ref id="cit45"><label>45</label><citation-alternatives><mixed-citation xml:lang="ru">Suvakov M., Panda A., Diesh C., Holmes I., Abyzov A. CNVpytor: a tool for copy number variation detection and analysis from read depth and allele imbalance in whole-genome sequencing. GigaScience. 2021;10(11):giab074. doi 10.1093/gigascience/giab074</mixed-citation><mixed-citation xml:lang="en">Suvakov M., Panda A., Diesh C., Holmes I., Abyzov A. CNVpytor: a tool for copy number variation detection and analysis from read depth and allele imbalance in whole-genome sequencing. GigaScience. 2021;10(11):giab074. doi 10.1093/gigascience/giab074</mixed-citation></citation-alternatives></ref><ref id="cit46"><label>46</label><citation-alternatives><mixed-citation xml:lang="ru">Tsai M.-C., Manor O., Wan Y., Mosammaparast N., Wang J.K., Lan F., Shi Y., Segal E., Chang H.Y. Long noncoding RNA as modular scaffold of histone modification complexes. Science. 2010;329(5992): 689-693. doi 10.1126/science.1192002</mixed-citation><mixed-citation xml:lang="en">Tsai M.-C., Manor O., Wan Y., Mosammaparast N., Wang J.K., Lan F., Shi Y., Segal E., Chang H.Y. Long noncoding RNA as modular scaffold of histone modification complexes. Science. 2010;329(5992): 689-693. doi 10.1126/science.1192002</mixed-citation></citation-alternatives></ref><ref id="cit47"><label>47</label><citation-alternatives><mixed-citation xml:lang="ru">Velculescu V.E., Zhang L., Zhou W., Vogelstein J., Basrai M.A., Bassett D.E., Hieter P., Vogelstein B., Kinzler K.W. Characterization of the yeast transcriptome. Cell. 1997;88(2):243-251. doi 10.1016/S0092-8674(00)81845-0</mixed-citation><mixed-citation xml:lang="en">Velculescu V.E., Zhang L., Zhou W., Vogelstein J., Basrai M.A., Bassett D.E., Hieter P., Vogelstein B., Kinzler K.W. Characterization of the yeast transcriptome. Cell. 1997;88(2):243-251. doi 10.1016/S0092-8674(00)81845-0</mixed-citation></citation-alternatives></ref><ref id="cit48"><label>48</label><citation-alternatives><mixed-citation xml:lang="ru">Vernikos G., Medini D., Riley D.R., Tettelin H. Ten years of pangenome analyses. Curr Opin Microbiol. 2015;23:148-154. doi 10.1016/j.mib.2014.11.016</mixed-citation><mixed-citation xml:lang="en">Vernikos G., Medini D., Riley D.R., Tettelin H. Ten years of pangenome analyses. Curr Opin Microbiol. 2015;23:148-154. doi 10.1016/j.mib.2014.11.016</mixed-citation></citation-alternatives></ref><ref id="cit49"><label>49</label><citation-alternatives><mixed-citation xml:lang="ru">Wang J., Zhang Z. GAPIT version 3: boosting power and accuracy for genomic association and prediction. Genomics Proteomics Bioinformatics. 2021;19(4):629-640. doi 10.1016/j.gpb.2021.08.005</mixed-citation><mixed-citation xml:lang="en">Wang J., Zhang Z. GAPIT version 3: boosting power and accuracy for genomic association and prediction. Genomics Proteomics Bioinformatics. 2021;19(4):629-640. doi 10.1016/j.gpb.2021.08.005</mixed-citation></citation-alternatives></ref><ref id="cit50"><label>50</label><citation-alternatives><mixed-citation xml:lang="ru">Wu T.D., Watanabe C.K. GMAP: a genomic mapping and alignment program for mRNA and EST sequences. Bioinformatics. 2005; 21(9):1859-1875. doi 10.1093/bioinformatics/bti310</mixed-citation><mixed-citation xml:lang="en">Wu T.D., Watanabe C.K. GMAP: a genomic mapping and alignment program for mRNA and EST sequences. Bioinformatics. 2005; 21(9):1859-1875. doi 10.1093/bioinformatics/bti310</mixed-citation></citation-alternatives></ref><ref id="cit51"><label>51</label><citation-alternatives><mixed-citation xml:lang="ru">Zatybekov A., Abugalieva S., Didorenko S., Gerasimova Y., Sidorik I., Anuarbek S., Turuspekov Y. GWAS of agronomic traits in soybean collection included in breeding pool in Kazakhstan. BMC Plant Biol. 2017;17(S1):179. doi 10.1186/s12870-017-1125-0</mixed-citation><mixed-citation xml:lang="en">Zatybekov A., Abugalieva S., Didorenko S., Gerasimova Y., Sidorik I., Anuarbek S., Turuspekov Y. GWAS of agronomic traits in soybean collection included in breeding pool in Kazakhstan. BMC Plant Biol. 2017;17(S1):179. doi 10.1186/s12870-017-1125-0</mixed-citation></citation-alternatives></ref><ref id="cit52"><label>52</label><citation-alternatives><mixed-citation xml:lang="ru">Zheng X. A tutorial for the R Package SNPRelate. Washington, USA: University of Washington, 2013 Zimin A.V., Marçais G., Puiu D., Roberts M., Salzberg S.L., Yorke J.A. The MaSuRCA genome assembler. Bioinformatics. 2013;29(21): 2669-2677. doi 10.1093/bioinformatics/btt476</mixed-citation><mixed-citation xml:lang="en">Zheng X. A tutorial for the R Package SNPRelate. Washington, USA: University of Washington, 2013 Zimin A.V., Marçais G., Puiu D., Roberts M., Salzberg S.L., Yorke J.A. The MaSuRCA genome assembler. Bioinformatics. 2013;29(21): 2669-2677. doi 10.1093/bioinformatics/btt476</mixed-citation></citation-alternatives></ref></ref-list><fn-group><fn fn-type="conflict"><p>The authors declare that there are no conflicts of interest present.</p></fn></fn-group></back></article>
