<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3.dtd">
<article article-type="research-article" dtd-version="1.3" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xml:lang="ru"><front><journal-meta><journal-id journal-id-type="publisher-id">vavilov</journal-id><journal-title-group><journal-title xml:lang="ru">Вавиловский журнал генетики и селекции</journal-title><trans-title-group xml:lang="en"><trans-title>Vavilov Journal of Genetics and Breeding</trans-title></trans-title-group></journal-title-group><issn pub-type="epub">2500-3259</issn><publisher><publisher-name>Institute of Cytology and Genetics of Siberian Branch of the RAS</publisher-name></publisher></journal-meta><article-meta><article-id pub-id-type="doi">10.18699/vjgb-25-99</article-id><article-id custom-type="elpub" pub-id-type="custom">vavilov-4876</article-id><article-categories><subj-group subj-group-type="heading"><subject>Research Article</subject></subj-group><subj-group subj-group-type="section-heading" xml:lang="ru"><subject>КОМПЬЮТЕРНАЯ ГЕНОМИКА</subject></subj-group><subj-group subj-group-type="section-heading" xml:lang="en"><subject>MICROBIAL GENETICS AND BIOTECHNOLOGY</subject></subj-group></article-categories><title-group><article-title>Связь иерархической классификации транскрипционных факторов по структуре ДНК-связывающего домена и вариабельности мотивов сайтов связывания этих факторов</article-title><trans-title-group xml:lang="en"><trans-title>Linking hierarchical classification of transcription factors by the structure of their DNA-binding domains to the variability of their binding site motifs</trans-title></trans-title-group></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><contrib-id contrib-id-type="orcid">https://orcid.org/0000-0002-4905-3088</contrib-id><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Левицкий</surname><given-names>В. Г.</given-names></name><name name-style="western" xml:lang="en"><surname>Levitsky</surname><given-names>V. G.</given-names></name></name-alternatives><bio xml:lang="ru"><p>Новосибирск</p></bio><bio xml:lang="en"><p>Novosibirsk</p></bio><email xlink:type="simple">levitsky@bionet.nsc.ru</email><xref ref-type="aff" rid="aff-1"/></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Ватолина</surname><given-names>Т. Ю.</given-names></name><name name-style="western" xml:lang="en"><surname>Vatolina</surname><given-names>T. Yu.</given-names></name></name-alternatives><bio xml:lang="ru"><p>Новосибирск</p></bio><bio xml:lang="en"><p>Novosibirsk</p></bio><xref ref-type="aff" rid="aff-2"/></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Радица</surname><given-names>В. В.</given-names></name><name name-style="western" xml:lang="en"><surname>Raditsa</surname><given-names>V. V.</given-names></name></name-alternatives><bio xml:lang="ru"><p>Новосибирск</p></bio><bio xml:lang="en"><p>Novosibirsk</p></bio><xref ref-type="aff" rid="aff-3"/></contrib></contrib-group><aff-alternatives id="aff-1"><aff xml:lang="ru">Федеральный исследовательский центр Институт цитологии и генетики Сибирского отделения Российской академии наук; Институт молекулярной и клеточной биологии Сибирского отделения Российской академии наук<country>Россия</country></aff><aff xml:lang="en">Institute of Cytology and Genetics of the Siberian Branch of the Russian Academy of Sciences; Institute of Molecular and Cellular Biology of the Siberian Branch of the Russian Academy of Sciences<country>Russian Federation</country></aff></aff-alternatives><aff-alternatives id="aff-2"><aff xml:lang="ru">Институт молекулярной и клеточной биологии Сибирского отделения Российской академии наук<country>Россия</country></aff><aff xml:lang="en">Institute of Molecular and Cellular Biology of the Siberian Branch of the Russian Academy of Sciences<country>Russian Federation</country></aff></aff-alternatives><aff-alternatives id="aff-3"><aff xml:lang="ru">Федеральный исследовательский центр Институт цитологии и генетики Сибирского отделения Российской академии наук<country>Россия</country></aff><aff xml:lang="en">Institute of Cytology and Genetics of the Siberian Branch of the Russian Academy of Sciences<country>Russian Federation</country></aff></aff-alternatives><pub-date pub-type="collection"><year>2025</year></pub-date><pub-date pub-type="epub"><day>12</day><month>12</month><year>2025</year></pub-date><volume>29</volume><issue>7</issue><fpage>925</fpage><lpage>939</lpage><permissions><copyright-statement>Copyright &amp;#x00A9; Левицкий В.Г., Ватолина Т.Ю., Радица В.В., 2025</copyright-statement><copyright-year>2025</copyright-year><copyright-holder xml:lang="ru">Левицкий В.Г., Ватолина Т.Ю., Радица В.В.</copyright-holder><copyright-holder xml:lang="en">Levitsky V.G., Vatolina T.Y., Raditsa V.V.</copyright-holder><license license-type="creative-commons-attribution" xlink:href="https://creativecommons.org/licenses/by/4.0/" xlink:type="simple"><license-p>This work is licensed under a Creative Commons Attribution 4.0 License.</license-p></license></permissions><self-uri xlink:href="https://vavilov.elpub.ru/jour/article/view/4876">https://vavilov.elpub.ru/jour/article/view/4876</self-uri><abstract><p>   Поиск мотивов de novo – базовый подход определения нуклеотидной с  пецифичности связывания важнейших регуляторов транскрипции генов, транскрипционных факторов (ТФ), на основе данных массового полногеномного секвенирования районов их сайтов связывания in vivo, таких как ChIP-seq. Количество известных мотивов сайтов связывания ТФ (ССТФ) возросло в несколько раз в последние годы. Из-за сходства структуры ДНК-связывающих доменов ТФ многие структурно родственные ТФ имеют сходные или даже неразличимые мотивы сайтов связывания. Классификация ТФ по структуре ДНК-связывающих доменов из базы данных TFClass определяет верхние уровни иерархии (суперклассы и классы ТФ) по структуре этих доменов, а следующие уровни (семейства и подсемейства ТФ) по выравниваниям аминокислотных последовательностей доменов. Однако эта классификация не учитывает сходство мотивов ССТФ, а для идентификации действующих ТФ по данным массового секвенирования ССТФ ChIP-seq приходится иметь дело с мотивами ССТФ, а не с самими ТФ. Поэтому в данной работе мы взяли из баз данных Hocomoco/Jaspar мотивы CCТФ человека/плодовой мушки Drosophila melanogaster и рассмотрели сходство мотивов сайтов связывания в парах родственных ТФ согласно их классификации в базе данных TFClass. Показано, что общее дерево иерархии ТФ по структуре ДНК-связывающих доменов можно разделить на отдельные неперекрывающиеся множества ТФ – ветви. В пределах каждой ветви большинство пар ТФ имеет значимо похожие мотивы сайтов связывания. Каждая ветвь включает одну или несколько сестринских элементарных единиц иерархии и все более низкие ее/их уровни: один или несколько ТФ одного подсемейства или целое подсемейство, одно или несколько подсемейств одного семейства, целое семейство и т. д. до целого класса. Анализ семи крупнейших классов ТФ человека и двух плодовой мушки показал, что сходство ТФ по мотивам ССТФ для разных соответствующих уровней (классов, семейств) заметно отличается. Дополнение иерархической классификации ТФ ветвями, объединяющими значимо сходные мотивы ССТФ, может повысить эффективность идентификации ТФ, вовлеченных в регуляцию транскрипции, по результатам de novo поиска обогащенных мотивов для данных массового секвенирования ССТФ с помощью технологии ChIP-seq.</p></abstract><trans-abstract xml:lang="en"><p>   De novo motif search is the main approach for determining the nucleotide specificity of binding of the key regulators of gene transcription, transcription factors (TFs), based on data from massive genome-wide sequencing of their binding site regions in vivo, such as ChIP-seq. The number of motifs of known TF binding sites (TFBSs) has increased several times in recent years. Due to the similarity in the structure of the DNA-binding domains of TFs, many structurally cognate TFs have similar and sometimes almost indistinguishable binding site motifs. The classification of TFs by the structure of the DNA-binding domains from the TFClass database defines the top levels of the hierarchy (superclasses and classes of TFs) by the structure of these domains, and the next levels (families and subfamilies of TFs) by the alignments of amino acid sequences of domains. However, this classification does not take into account the similarity of TFBS motifs, whereas identification of valid TFs from massive sequencing data of TFBSs, such as ChIP-seq, requires working with TFBS motifs rather than TFs themselves. Therefore, in this study we extracted from the Hocomoco and Jaspar databases the TFBS motifs for human and fruit fly Drosophila melanogaster, and considered the pairwise similarity of binding site motifs of cognate TFs according to their classification from the TFClass database. We have shown that the common tree of the TF hierarchy by the structure of DNA-binding domains can be split into separate branches representing non-overlapping sets of TFs. Within each branch, the majority of TF pairs have significantly similar binding site motifs. Each branch can include one or more sister elementary units of the hierarchy and all its/their lower levels: one or more TFs of the same subfamily, or the whole subfamily, one or several subfamilies of the same family, an entire family, etc., up to the entire class. Analysis of the seven largest human and two largest Drosophila TF classes showed that the similarity of TFs in terms of TFBS motifs for different corresponding levels (classes, families) is noticeably different. Supplementing the hierarchical classification of TFs with branches combining significantly similar motifs of TFBSs can increase the efficiency of identifying involved TFs through enriched motifs detected by de novo motif search for massive sequencing data of TFBSs from the ChIP-seq technology.</p></trans-abstract><kwd-group xml:lang="ru"><kwd>de novo поиск мотивов</kwd><kwd>мотивы сайтов связывания транскрипционных факторов</kwd><kwd>структурные варианты мотивов сайтов связывания транскрипционных факторов</kwd><kwd>сходство мотивов сайтов связывания транскрипционных факторов</kwd><kwd>кооперативное действие транскрипционных факторов</kwd><kwd>массовое полногеномное секвенирование сайтов связывания транскрипционных факторов</kwd></kwd-group><kwd-group xml:lang="en"><kwd>de novo motif search</kwd><kwd>motifs of transcription factor binding sites</kwd><kwd>structural variants of motifs of transcription factor binding sites</kwd><kwd>similarity of motifs of transcription factor binding sites</kwd><kwd>cooperative action of transcription factors</kwd><kwd>massive whole-genome sequencing of transcription factor binding sites</kwd></kwd-group><funding-group xml:lang="en"><funding-statement>The work was supported by the Russian Science Foundation, grant No. 24-14-00133</funding-statement></funding-group></article-meta></front><back><ref-list><title>References</title><ref id="cit1"><label>1</label><citation-alternatives><mixed-citation xml:lang="ru">Ambrosini G., Vorontsov I., Penzar D., Groux R., Fornes O., Nikolaeva D.D., Ballester B., Grau J., Grosse I., Makeev V., Kulakovskiy I., Bucher P. Insights gained from a comprehensive all-against-all transcription factor binding motif benchmarking study. Genome Biol. 2020;21(1):114. doi: 10.1186/s13059-020-01996-3</mixed-citation><mixed-citation xml:lang="en">Ambrosini G., Vorontsov I., Penzar D., Groux R., Fornes O., Nikolaeva D.D., Ballester B., Grau J., Grosse I., Makeev V., Kulakovskiy I., Bucher P. Insights gained from a comprehensive all-against-all transcription factor binding motif benchmarking study. Genome Biol. 2020;21(1):114. doi: 10.1186/s13059-020-01996-3</mixed-citation></citation-alternatives></ref><ref id="cit2"><label>2</label><citation-alternatives><mixed-citation xml:lang="ru">Amoutzias G.D., Robertson D.L., Van de Peer Y., Oliver S.G. Choose your partners: dimerization in eukaryotic transcription factors. Trends Biochem Sci. 2008;33(5):220-229. doi: 10.1016/j.tibs.2008.02.002</mixed-citation><mixed-citation xml:lang="en">Amoutzias G.D., Robertson D.L., Van de Peer Y., Oliver S.G. Choose your partners: dimerization in eukaryotic transcription factors. Trends Biochem Sci. 2008;33(5):220-229. doi: 10.1016/j.tibs.2008.02.002</mixed-citation></citation-alternatives></ref><ref id="cit3"><label>3</label><citation-alternatives><mixed-citation xml:lang="ru">Bailey T.L. STREME: Accurate and versatile sequence motif discovery. Bioinformatics 2021;37(18):2834-2840. doi: 10.1093/bioinformatics/btab203</mixed-citation><mixed-citation xml:lang="en">Bailey T.L. STREME: Accurate and versatile sequence motif discovery. Bioinformatics 2021;37(18):2834-2840. doi: 10.1093/bioinformatics/btab203</mixed-citation></citation-alternatives></ref><ref id="cit4"><label>4</label><citation-alternatives><mixed-citation xml:lang="ru">Blanc-Mathieu R., Dumas R., Turchi L., Lucas J., Parcy F. Plant- TFClass: a structural classification for plant transcription factors. Trends Plant Sci. 2024;29(1):40-51. doi: 10.1016/j.tplants.2023.06.023</mixed-citation><mixed-citation xml:lang="en">Blanc-Mathieu R., Dumas R., Turchi L., Lucas J., Parcy F. Plant- TFClass: a structural classification for plant transcription factors. Trends Plant Sci. 2024;29(1):40-51. doi: 10.1016/j.tplants.2023.06.023</mixed-citation></citation-alternatives></ref><ref id="cit5"><label>5</label><citation-alternatives><mixed-citation xml:lang="ru">D’haeseleer P. What are DNA sequence motifs? Nat Biotechnol. 2006; 24(4):423-425. doi: 10.1038/nbt0406-423</mixed-citation><mixed-citation xml:lang="en">D’haeseleer P. What are DNA sequence motifs? Nat Biotechnol. 2006; 24(4):423-425. doi: 10.1038/nbt0406-423</mixed-citation></citation-alternatives></ref><ref id="cit6"><label>6</label><citation-alternatives><mixed-citation xml:lang="ru">de Martin X., Sodaei R., Santpere G. Mechanisms of binding specificity among bHLH transcription factors. Int J Mol Sci. 2021;22(17): 9150. doi: 10.3390/ijms22179150</mixed-citation><mixed-citation xml:lang="en">de Martin X., Sodaei R., Santpere G. Mechanisms of binding specificity among bHLH transcription factors. Int J Mol Sci. 2021;22(17): 9150. doi: 10.3390/ijms22179150</mixed-citation></citation-alternatives></ref><ref id="cit7"><label>7</label><citation-alternatives><mixed-citation xml:lang="ru">Franco-Zorrilla J.M., López-Vidriero I., Carrasco J.L., Godoy M., Vera P., Solano R. DNA-binding specificities of plant transcription factors and their potential to define target genes. Proc Natl Acad Sci USA. 2014;111(6):2367-2372. doi: 10.1073/pnas.1316278111</mixed-citation><mixed-citation xml:lang="en">Franco-Zorrilla J.M., López-Vidriero I., Carrasco J.L., Godoy M., Vera P., Solano R. DNA-binding specificities of plant transcription factors and their potential to define target genes. Proc Natl Acad Sci USA. 2014;111(6):2367-2372. doi: 10.1073/pnas.1316278111</mixed-citation></citation-alternatives></ref><ref id="cit8"><label>8</label><citation-alternatives><mixed-citation xml:lang="ru">Gupta S., Stamatoyannopolous J.A., Bailey T.L., Noble W.S. Quantifying similarity between motifs. Genome Biol. 2007;8(2):R24. doi: 10.1186/gb-2007-8-2-r24</mixed-citation><mixed-citation xml:lang="en">Gupta S., Stamatoyannopolous J.A., Bailey T.L., Noble W.S. Quantifying similarity between motifs. Genome Biol. 2007;8(2):R24. doi: 10.1186/gb-2007-8-2-r24</mixed-citation></citation-alternatives></ref><ref id="cit9"><label>9</label><citation-alternatives><mixed-citation xml:lang="ru">Hammal F., de Langen P., Bergon A., Lopez F., Ballester B. ReMap 2022: A database of Human, Mouse, Drosophila and Arabidopsis regulatory regions from an integrative analysis of DNA-binding sequencing experiments. Nucleic Acids Res. 2022;50(D1):D316-D325. doi: 10.1093/nar/gkab996</mixed-citation><mixed-citation xml:lang="en">Hammal F., de Langen P., Bergon A., Lopez F., Ballester B. ReMap 2022: A database of Human, Mouse, Drosophila and Arabidopsis regulatory regions from an integrative analysis of DNA-binding sequencing experiments. Nucleic Acids Res. 2022;50(D1):D316-D325. doi: 10.1093/nar/gkab996</mixed-citation></citation-alternatives></ref><ref id="cit10"><label>10</label><citation-alternatives><mixed-citation xml:lang="ru">Johnson D.S., Mortazavi A., Myers R.M., Wold B. Genome-wide mapping of in vivo protein-DNA interactions. Science. 2007;316(5830): 1497-1502. doi: 10.1126/science.1141319</mixed-citation><mixed-citation xml:lang="en">Johnson D.S., Mortazavi A., Myers R.M., Wold B. Genome-wide mapping of in vivo protein-DNA interactions. Science. 2007;316(5830): 1497-1502. doi: 10.1126/science.1141319</mixed-citation></citation-alternatives></ref><ref id="cit11"><label>11</label><citation-alternatives><mixed-citation xml:lang="ru">Jolma A., Yan J., Whitington T., Toivonen J., Nitta K.R., Rastas P., Morgunova E., … Hughes T.R., Lemaire P., Ukkonen E., Kivioja T., Taipale J. DNA-binding specificities of human transcription factors. Cell. 2013;152(1-2):327-339. doi: 10.1016/j.cell.2012.12.009</mixed-citation><mixed-citation xml:lang="en">Jolma A., Yan J., Whitington T., Toivonen J., Nitta K.R., Rastas P., Morgunova E., … Hughes T.R., Lemaire P., Ukkonen E., Kivioja T., Taipale J. DNA-binding specificities of human transcription factors. Cell. 2013;152(1-2):327-339. doi: 10.1016/j.cell.2012.12.009</mixed-citation></citation-alternatives></ref><ref id="cit12"><label>12</label><citation-alternatives><mixed-citation xml:lang="ru">Kolmykov S., Yevshin I., Kulyashov M., Sharipov R., Kondrakhin Y., Makeev V.J., Kulakovskiy I.V., Kel A., Kolpakov F. GTRD: An integrated view of transcription regulation. Nucleic Acids Res. 2021; 49(D1):D104-D111. doi: 10.1093/nar/gkaa1057</mixed-citation><mixed-citation xml:lang="en">Kolmykov S., Yevshin I., Kulyashov M., Sharipov R., Kondrakhin Y., Makeev V.J., Kulakovskiy I.V., Kel A., Kolpakov F. GTRD: An integrated view of transcription regulation. Nucleic Acids Res. 2021; 49(D1):D104-D111. doi: 10.1093/nar/gkaa1057</mixed-citation></citation-alternatives></ref><ref id="cit13"><label>13</label><citation-alternatives><mixed-citation xml:lang="ru">Lambert S.A., Jolma A., Campitelli L.F., Das P.K., Yin Y., Albu M., Chen X., Taipale J., Hughes T.R., Weirauch M.T. The human transcription factors. Cell. 2018;172(4):650-665. doi: 10.1016/j.cell.2018.01.029</mixed-citation><mixed-citation xml:lang="en">Lambert S.A., Jolma A., Campitelli L.F., Das P.K., Yin Y., Albu M., Chen X., Taipale J., Hughes T.R., Weirauch M.T. The human transcription factors. Cell. 2018;172(4):650-665. doi: 10.1016/j.cell.2018.01.029</mixed-citation></citation-alternatives></ref><ref id="cit14"><label>14</label><citation-alternatives><mixed-citation xml:lang="ru">Lambert S.A., Yan A.W.H., Sasse A., Cowley G., Albu M., Caddick M.X., Morris Q.D., Weirauch M.T., Hughes T.R. Similarity regression predicts evolution of transcription factor sequence specificity. Nat Genet. 2019;51(6):981-989. doi: 10.1038/s41588-019-0411-1</mixed-citation><mixed-citation xml:lang="en">Lambert S.A., Yan A.W.H., Sasse A., Cowley G., Albu M., Caddick M.X., Morris Q.D., Weirauch M.T., Hughes T.R. Similarity regression predicts evolution of transcription factor sequence specificity. Nat Genet. 2019;51(6):981-989. doi: 10.1038/s41588-019-0411-1</mixed-citation></citation-alternatives></ref><ref id="cit15"><label>15</label><citation-alternatives><mixed-citation xml:lang="ru">Levitsky V., Zemlyanskaya E., Oshchepkov D., Podkolodnaya O., Ignatieva E., Grosse I., Mironova V., Merkulova T. A single ChIP-seq dataset is sufficient for comprehensive analysis of motifs co-occurrence with MCOT package. Nucleic Acids Res. 2019;47(21):e139. doi: 10.1093/nar/gkz800</mixed-citation><mixed-citation xml:lang="en">Levitsky V., Zemlyanskaya E., Oshchepkov D., Podkolodnaya O., Ignatieva E., Grosse I., Mironova V., Merkulova T. A single ChIP-seq dataset is sufficient for comprehensive analysis of motifs co-occurrence with MCOT package. Nucleic Acids Res. 2019;47(21):e139. doi: 10.1093/nar/gkz800</mixed-citation></citation-alternatives></ref><ref id="cit16"><label>16</label><citation-alternatives><mixed-citation xml:lang="ru">Liu B., Yang J., Li Y., McDermaid A., Ma Q. An algorithmic perspective of de novo cis-regulatory motif finding based on ChIP-seq data. Brief Bioinform. 2018;19(5):1069-1081. doi: 10.1093/bib/bbx026</mixed-citation><mixed-citation xml:lang="en">Liu B., Yang J., Li Y., McDermaid A., Ma Q. An algorithmic perspective of de novo cis-regulatory motif finding based on ChIP-seq data. Brief Bioinform. 2018;19(5):1069-1081. doi: 10.1093/bib/bbx026</mixed-citation></citation-alternatives></ref><ref id="cit17"><label>17</label><citation-alternatives><mixed-citation xml:lang="ru">Lloyd S.M., Bao X. Pinpointing the genomic localizations of chromatin-associated proteins: the yesterday, today, and tomorrow of ChIP-seq. Curr Protoc Cell Biol. 2019;84(1):e89. doi: 10.1002/cpcb.89</mixed-citation><mixed-citation xml:lang="en">Lloyd S.M., Bao X. Pinpointing the genomic localizations of chromatin-associated proteins: the yesterday, today, and tomorrow of ChIP-seq. Curr Protoc Cell Biol. 2019;84(1):e89. doi: 10.1002/cpcb.89</mixed-citation></citation-alternatives></ref><ref id="cit18"><label>18</label><citation-alternatives><mixed-citation xml:lang="ru">Morgunova E., Taipale J. Structural perspective of cooperative transcription factor binding. Curr Opin Struct Biol. 2017;47:1-8. doi: 10.1016/j.sbi.2017.03.006</mixed-citation><mixed-citation xml:lang="en">Morgunova E., Taipale J. Structural perspective of cooperative transcription factor binding. Curr Opin Struct Biol. 2017;47:1-8. doi: 10.1016/j.sbi.2017.03.006</mixed-citation></citation-alternatives></ref><ref id="cit19"><label>19</label><citation-alternatives><mixed-citation xml:lang="ru">Nagy G., Nagy L. Motif grammar: The basis of the language of gene expression. Comput Struct Biotechnol J. 2020;18:2026-2032. doi: 10.1016/j.csbj.2020.07.007</mixed-citation><mixed-citation xml:lang="en">Nagy G., Nagy L. Motif grammar: The basis of the language of gene expression. Comput Struct Biotechnol J. 2020;18:2026-2032. doi: 10.1016/j.csbj.2020.07.007</mixed-citation></citation-alternatives></ref><ref id="cit20"><label>20</label><citation-alternatives><mixed-citation xml:lang="ru">Najafabadi H.S., Mnaimneh S., Schmitges F.W., Garton M., Lam K.N., Yang A., Albu M., Weirauch M.T., Radovani E., Kim P.M., Greenblatt J., Frey B.J., Hughes T.R. C&lt;sub&gt;2&lt;/sub&gt;H&lt;sub&gt;2&lt;/sub&gt; zinc finger proteins greatly expand the human regulatory lexicon. Nat Biotechnol. 2015;33(5): 555-562. doi: 10.1038/nbt.3128</mixed-citation><mixed-citation xml:lang="en">Najafabadi H.S., Mnaimneh S., Schmitges F.W., Garton M., Lam K.N., Yang A., Albu M., Weirauch M.T., Radovani E., Kim P.M., Greenblatt J., Frey B.J., Hughes T.R. C&lt;sub&gt;2&lt;/sub&gt;H&lt;sub&gt;2&lt;/sub&gt; zinc finger proteins greatly expand the human regulatory lexicon. Nat Biotechnol. 2015;33(5): 555-562. doi: 10.1038/nbt.3128</mixed-citation></citation-alternatives></ref><ref id="cit21"><label>21</label><citation-alternatives><mixed-citation xml:lang="ru">Nakato R., Shirahige K. Recent advances in ChIP-seq analysis: from quality management to whole-genome annotation. Brief Bioinform. 2017;18(2):279-290. doi: 10.1093/bib/bbw023</mixed-citation><mixed-citation xml:lang="en">Nakato R., Shirahige K. Recent advances in ChIP-seq analysis: from quality management to whole-genome annotation. Brief Bioinform. 2017;18(2):279-290. doi: 10.1093/bib/bbw023</mixed-citation></citation-alternatives></ref><ref id="cit22"><label>22</label><citation-alternatives><mixed-citation xml:lang="ru">Nitta K.R., Jolma A., Yin Y., Morgunova E., Kivioja T., Akhtar J., Hens K., Toivonen J., Deplancke B., Furlong E.E., Taipale J. Conservation of transcription factor binding specificities across 600 million years of bilateria evolution. eLife. 2015;4:e04837. doi: 10.7554/eLife.04837</mixed-citation><mixed-citation xml:lang="en">Nitta K.R., Jolma A., Yin Y., Morgunova E., Kivioja T., Akhtar J., Hens K., Toivonen J., Deplancke B., Furlong E.E., Taipale J. Conservation of transcription factor binding specificities across 600 million years of bilateria evolution. eLife. 2015;4:e04837. doi: 10.7554/eLife.04837</mixed-citation></citation-alternatives></ref><ref id="cit23"><label>23</label><citation-alternatives><mixed-citation xml:lang="ru">Rauluseviciute I., Riudavets-Puig R., Blanc-Mathieu R., Castro-Mondragon J.A., Ferenc K., Kumar V., Lemma R.B., … Lenhard B., Sandelin A., Wasserman W.W., Parcy F., Mathelier A. JASPAR 2024: 20&lt;sup&gt;th&lt;/sup&gt; anniversary of the open-access database of transcription factor binding profiles. Nucleic Acids Res. 2024;52(D1):D174-D182. doi: 10.1093/nar/gkad1059</mixed-citation><mixed-citation xml:lang="en">Rauluseviciute I., Riudavets-Puig R., Blanc-Mathieu R., Castro-Mondragon J.A., Ferenc K., Kumar V., Lemma R.B., … Lenhard B., Sandelin A., Wasserman W.W., Parcy F., Mathelier A. JASPAR 2024: 20&lt;sup&gt;th&lt;/sup&gt; anniversary of the open-access database of transcription factor binding profiles. Nucleic Acids Res. 2024;52(D1):D174-D182. doi: 10.1093/nar/gkad1059</mixed-citation></citation-alternatives></ref><ref id="cit24"><label>24</label><citation-alternatives><mixed-citation xml:lang="ru">Schneider T.D., Stephens R.M. Sequence logos: a new way to display consensus sequences. Nucleic Acids Res. 1990;18(20):6097-6100. doi: 10.1093/nar/18.20.6097</mixed-citation><mixed-citation xml:lang="en">Schneider T.D., Stephens R.M. Sequence logos: a new way to display consensus sequences. Nucleic Acids Res. 1990;18(20):6097-6100. doi: 10.1093/nar/18.20.6097</mixed-citation></citation-alternatives></ref><ref id="cit25"><label>25</label><citation-alternatives><mixed-citation xml:lang="ru">Shen W.K., Chen S.Y., Gan Z.Q., Zhang Y.Z., Yue T., Chen M.M., Xue Y., Hu H., Guo A.Y. AnimalTFDB 4.0: a comprehensive animal transcription factor database updated with variation and expression annotations. Nucleic Acids Res. 2023;51(D1):D39-D45. doi: 10.1093/nar/gkac907</mixed-citation><mixed-citation xml:lang="en">Shen W.K., Chen S.Y., Gan Z.Q., Zhang Y.Z., Yue T., Chen M.M., Xue Y., Hu H., Guo A.Y. AnimalTFDB 4.0: a comprehensive animal transcription factor database updated with variation and expression annotations. Nucleic Acids Res. 2023;51(D1):D39-D45. doi: 10.1093/nar/gkac907</mixed-citation></citation-alternatives></ref><ref id="cit26"><label>26</label><citation-alternatives><mixed-citation xml:lang="ru">Skene P.J., Henikoff S. An efficient targeted nuclease strategy for high-resolution mapping of DNA binding sites. eLife. 2017;6:e21856. doi: 10.7554/eLife.21856</mixed-citation><mixed-citation xml:lang="en">Skene P.J., Henikoff S. An efficient targeted nuclease strategy for high-resolution mapping of DNA binding sites. eLife. 2017;6:e21856. doi: 10.7554/eLife.21856</mixed-citation></citation-alternatives></ref><ref id="cit27"><label>27</label><citation-alternatives><mixed-citation xml:lang="ru">Slattery M., Zhou T., Yang L., Dantas Machado A.C., Gordân R., Rohs R. Absence of a simple code: how transcription factors read the genome. Trends Biochem Sci. 2014;39(9):381-399. doi: 10.1016/j.tibs.2014.07.002</mixed-citation><mixed-citation xml:lang="en">Slattery M., Zhou T., Yang L., Dantas Machado A.C., Gordân R., Rohs R. Absence of a simple code: how transcription factors read the genome. Trends Biochem Sci. 2014;39(9):381-399. doi: 10.1016/j.tibs.2014.07.002</mixed-citation></citation-alternatives></ref><ref id="cit28"><label>28</label><citation-alternatives><mixed-citation xml:lang="ru">Sokal R.R., Michener C.D. A statistical method for evaluating systematic relationships. Univ Kansas Sci Bull. 1958;38:1409-1438. Available: https://archive.org/details/cbarchive_33927_astatisticalmethodforevaluatin1902/page/n1/mode/2up</mixed-citation><mixed-citation xml:lang="en">Sokal R.R., Michener C.D. A statistical method for evaluating systematic relationships. Univ Kansas Sci Bull. 1958;38:1409-1438. Available: https://archive.org/details/cbarchive_33927_astatisticalmethodforevaluatin1902/page/n1/mode/2up</mixed-citation></citation-alternatives></ref><ref id="cit29"><label>29</label><citation-alternatives><mixed-citation xml:lang="ru">Spitz F., Furlong E.E. Transcription factors: from enhancer binding to developmental control. Nat Rev Genet. 2012;13(9):613-626. doi: 10.1038/nrg3207</mixed-citation><mixed-citation xml:lang="en">Spitz F., Furlong E.E. Transcription factors: from enhancer binding to developmental control. Nat Rev Genet. 2012;13(9):613-626. doi: 10.1038/nrg3207</mixed-citation></citation-alternatives></ref><ref id="cit30"><label>30</label><citation-alternatives><mixed-citation xml:lang="ru">Stormo G.D., Zhao Y. Determining the specificity of protein-DNA interactions. Nat Rev Genet. 2010;11(11):751-760. doi: 10.1038/nrg2845</mixed-citation><mixed-citation xml:lang="en">Stormo G.D., Zhao Y. Determining the specificity of protein-DNA interactions. Nat Rev Genet. 2010;11(11):751-760. doi: 10.1038/nrg2845</mixed-citation></citation-alternatives></ref><ref id="cit31"><label>31</label><citation-alternatives><mixed-citation xml:lang="ru">Taing L., Dandawate A., L’Yi S., Gehlenborg N., Brown M., Meyer C.A. Cistrome Data Browser: integrated search, analysis and visualization of chromatin data. Nucleic Acids Res. 2024;52(D1):D61-D66. doi: 10.1093/nar/gkad1069</mixed-citation><mixed-citation xml:lang="en">Taing L., Dandawate A., L’Yi S., Gehlenborg N., Brown M., Meyer C.A. Cistrome Data Browser: integrated search, analysis and visualization of chromatin data. Nucleic Acids Res. 2024;52(D1):D61-D66. doi: 10.1093/nar/gkad1069</mixed-citation></citation-alternatives></ref><ref id="cit32"><label>32</label><citation-alternatives><mixed-citation xml:lang="ru">Vorontsov I.E., Eliseeva I.A., Zinkevich A., Nikonov M., Abramov S., Boytsov A., Kamenets V., … Medvedeva Y.A., Jolma A., Kolpakov F., Makeev V.J., Kulakovskiy I.V. HOCOMOCO in 2024: a rebuild of the curated collection of binding models for human and mouse transcription factors. Nucleic Acids Res. 2024;52(D1):D154-D163. doi: 10.1093/nar/gkad1077</mixed-citation><mixed-citation xml:lang="en">Vorontsov I.E., Eliseeva I.A., Zinkevich A., Nikonov M., Abramov S., Boytsov A., Kamenets V., … Medvedeva Y.A., Jolma A., Kolpakov F., Makeev V.J., Kulakovskiy I.V. HOCOMOCO in 2024: a rebuild of the curated collection of binding models for human and mouse transcription factors. Nucleic Acids Res. 2024;52(D1):D154-D163. doi: 10.1093/nar/gkad1077</mixed-citation></citation-alternatives></ref><ref id="cit33"><label>33</label><citation-alternatives><mixed-citation xml:lang="ru">Wasserman W.W., Sandelin A. Applied bioinformatics for the identification of regulatory elements. Nat Rev Genet. 2004;5(4):276-287. doi: 10.1038/nrg1315</mixed-citation><mixed-citation xml:lang="en">Wasserman W.W., Sandelin A. Applied bioinformatics for the identification of regulatory elements. Nat Rev Genet. 2004;5(4):276-287. doi: 10.1038/nrg1315</mixed-citation></citation-alternatives></ref><ref id="cit34"><label>34</label><citation-alternatives><mixed-citation xml:lang="ru">Weirauch M.T., Yang A., Albu M., Cote A.G., Montenegro-Monter A., Drewe P., Najafabadi H.S., … Bouget F.Y., Ratsch G., Larrondo L.F., Ecker J.R., Hughes T.R. Determination and inference of eukaryotic transcription factor sequence specificity. Cell. 2014;158(6):1431-1443. doi: 10.1016/j.cell.2014.08.009</mixed-citation><mixed-citation xml:lang="en">Weirauch M.T., Yang A., Albu M., Cote A.G., Montenegro-Monter A., Drewe P., Najafabadi H.S., … Bouget F.Y., Ratsch G., Larrondo L.F., Ecker J.R., Hughes T.R. Determination and inference of eukaryotic transcription factor sequence specificity. Cell. 2014;158(6):1431-1443. doi: 10.1016/j.cell.2014.08.009</mixed-citation></citation-alternatives></ref><ref id="cit35"><label>35</label><citation-alternatives><mixed-citation xml:lang="ru">Wingender E. Classification scheme of eukaryotic transcription factors. Mol Biol. 1997:31(4):483-497. (translated from Вингендер Э. Классификация транскрипционных факторов эукариот. Молекулярная биология. 1997;31(4):584-600. Russian)</mixed-citation><mixed-citation xml:lang="en">Wingender E. Classification scheme of eukaryotic transcription factors. Mol Biol. 1997:31(4):483-497. (translated from Вингендер Э. Классификация транскрипционных факторов эукариот. Молекулярная биология. 1997;31(4):584-600. Russian)</mixed-citation></citation-alternatives></ref><ref id="cit36"><label>36</label><citation-alternatives><mixed-citation xml:lang="ru">Wingender E. Criteria for an updated classification of human transcription factor DNA-binding domains. J Bioinform Comput Biol. 2013;11(1):1340007. doi: 10.1142/S0219720013400076</mixed-citation><mixed-citation xml:lang="en">Wingender E. Criteria for an updated classification of human transcription factor DNA-binding domains. J Bioinform Comput Biol. 2013;11(1):1340007. doi: 10.1142/S0219720013400076</mixed-citation></citation-alternatives></ref><ref id="cit37"><label>37</label><citation-alternatives><mixed-citation xml:lang="ru">Wingender E., Schoeps T., Dönitz J. TFClass: an expandable hierarchical classification of human transcription factors. Nucleic Acids Res. 2013;41(D1):D165-D170. doi: 10.1093/nar/gks1123</mixed-citation><mixed-citation xml:lang="en">Wingender E., Schoeps T., Dönitz J. TFClass: an expandable hierarchical classification of human transcription factors. Nucleic Acids Res. 2013;41(D1):D165-D170. doi: 10.1093/nar/gks1123</mixed-citation></citation-alternatives></ref><ref id="cit38"><label>38</label><citation-alternatives><mixed-citation xml:lang="ru">Wingender E., Schoeps T., Haubrock M., Dönitz J. TFClass: a classification of human transcription factors and their rodent orthologs. Nucleic Acids Res. 2015;43(D1):D97-D102. doi: 10.1093/nar/gku1064</mixed-citation><mixed-citation xml:lang="en">Wingender E., Schoeps T., Haubrock M., Dönitz J. TFClass: a classification of human transcription factors and their rodent orthologs. Nucleic Acids Res. 2015;43(D1):D97-D102. doi: 10.1093/nar/gku1064</mixed-citation></citation-alternatives></ref><ref id="cit39"><label>39</label><citation-alternatives><mixed-citation xml:lang="ru">Wingender E., Schoeps T., Haubrock M., Krull M., Dönitz J. TFClass: expanding the classification of human transcription factors to their mammalian orthologs. Nucleic Acids Res. 2018;46(D1):D343-D347. doi: 10.1093/nar/gkx987</mixed-citation><mixed-citation xml:lang="en">Wingender E., Schoeps T., Haubrock M., Krull M., Dönitz J. TFClass: expanding the classification of human transcription factors to their mammalian orthologs. Nucleic Acids Res. 2018;46(D1):D343-D347. doi: 10.1093/nar/gkx987</mixed-citation></citation-alternatives></ref><ref id="cit40"><label>40</label><citation-alternatives><mixed-citation xml:lang="ru">Zambelli F., Pesole G., Pavesi G. Motif discovery and transcription factor binding sites before and after the next-generation sequencing era. Brief Bioinform. 2013;14(2):225-237. doi: 10.1093/bib/bbs016</mixed-citation><mixed-citation xml:lang="en">Zambelli F., Pesole G., Pavesi G. Motif discovery and transcription factor binding sites before and after the next-generation sequencing era. Brief Bioinform. 2013;14(2):225-237. doi: 10.1093/bib/bbs016</mixed-citation></citation-alternatives></ref><ref id="cit41"><label>41</label><citation-alternatives><mixed-citation xml:lang="ru">Zenker S., Wulf D., Meierhenrich A., Viehöver P., Becker S., Eisenhut M., Stracke R., Weisshaar B., Bräutigam A. Many transcription factor families have evolutionarily conserved binding motifs in plants. Plant Physiol. 2025;198(2):kiaf205. doi: 10.1093/plphys/kiaf205</mixed-citation><mixed-citation xml:lang="en">Zenker S., Wulf D., Meierhenrich A., Viehöver P., Becker S., Eisenhut M., Stracke R., Weisshaar B., Bräutigam A. Many transcription factor families have evolutionarily conserved binding motifs in plants. Plant Physiol. 2025;198(2):kiaf205. doi: 10.1093/plphys/kiaf205</mixed-citation></citation-alternatives></ref></ref-list><fn-group><fn fn-type="conflict"><p>The authors declare that there are no conflicts of interest present.</p></fn></fn-group></back></article>
