<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3.dtd">
<article article-type="research-article" dtd-version="1.3" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xml:lang="ru"><front><journal-meta><journal-id journal-id-type="publisher-id">vavilov</journal-id><journal-title-group><journal-title xml:lang="ru">Вавиловский журнал генетики и селекции</journal-title><trans-title-group xml:lang="en"><trans-title>Vavilov Journal of Genetics and Breeding</trans-title></trans-title-group></journal-title-group><issn pub-type="epub">2500-3259</issn><publisher><publisher-name>Institute of Cytology and Genetics of Siberian Branch of the RAS</publisher-name></publisher></journal-meta><article-meta><article-id pub-id-type="doi">10.18699/VJGB-22-100</article-id><article-id custom-type="elpub" pub-id-type="custom">vavilov-3585</article-id><article-categories><subj-group subj-group-type="heading"><subject>Research Article</subject></subj-group><subj-group subj-group-type="section-heading" xml:lang="ru"><subject>КОМПЬЮТЕРНАЯ ГЕНОМИКА</subject></subj-group><subj-group subj-group-type="section-heading" xml:lang="en"><subject>COMPUTATIONAL GENOMICS</subject></subj-group></article-categories><title-group><article-title>Свойства малого мира научных организаций  определяют динамику публикационной активности  в области миРНК</article-title><trans-title-group xml:lang="en"><trans-title>Small world of the miRNA science  drives its publication dynamics</trans-title></trans-title-group></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><contrib-id contrib-id-type="orcid">https://orcid.org/0000-0002-7681-1032</contrib-id><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Фирсов</surname><given-names>А. Б.</given-names></name><name name-style="western" xml:lang="en"><surname>Firsov</surname><given-names>A. 
B.</given-names></name></name-alternatives><bio xml:lang="ru"><p>Новосибирск</p></bio><bio xml:lang="en"><p>Novosibirsk</p></bio><email xlink:type="simple">artyomfirsov@mail.ru</email><xref ref-type="aff" rid="aff-1"/></contrib><contrib contrib-type="author" corresp="yes"><contrib-id contrib-id-type="orcid">https://orcid.org/0000-0002-2691-3292</contrib-id><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Титов</surname><given-names>И. И.</given-names></name><name name-style="western" xml:lang="en"><surname>Titov</surname><given-names>I. I.</given-names></name></name-alternatives><bio xml:lang="ru"><p>Новосибирск</p></bio><bio xml:lang="en"><p>Novosibirsk</p></bio><xref ref-type="aff" rid="aff-2"/></contrib></contrib-group><aff-alternatives id="aff-1"><aff xml:lang="ru">Институт систем информатики им. А.П. Ершова Сибирского отделения Российской академии наук<country>Россия</country></aff><aff xml:lang="en">A.P. Ershov Institute of Informatics Systems of the Siberian Branch of the Russian Academy of Sciences<country>Russian Federation</country></aff></aff-alternatives><aff-alternatives id="aff-2"><aff xml:lang="ru">Федеральный исследовательский центр Институт цитологии и генетики Сибирского отделения Российской академии наук; Новосибирский национальный исследовательский государственный университет<country>Россия</country></aff><aff xml:lang="en">Institute of Cytology and Genetics of the Siberian Branch of the Russian Academy of Sciences; Novosibirsk State University<country>Russian Federation</country></aff></aff-alternatives><pub-date pub-type="collection"><year>2022</year></pub-date><pub-date pub-type="epub"><day>05</day><month>01</month><year>2023</year></pub-date><volume>26</volume><issue>8</issue><fpage>826</fpage><lpage>829</lpage><permissions><copyright-statement>Copyright &#x00A9; Фирсов А.Б., Титов И.И., 2023</copyright-statement><copyright-year>2023</copyright-year><copyright-holder xml:lang="ru">Фирсов А.Б., Титов 
И.И.</copyright-holder><copyright-holder xml:lang="en">Firsov A.B., Titov I.I.</copyright-holder><license license-type="creative-commons-attribution" xlink:href="https://creativecommons.org/licenses/by/4.0/" xlink:type="simple"><license-p>This work is licensed under a Creative Commons Attribution 4.0 License.</license-p></license></permissions><self-uri xlink:href="https://vavilov.elpub.ru/jour/article/view/3585">https://vavilov.elpub.ru/jour/article/view/3585</self-uri><abstract><p>Многие научные статьи стали доступны в цифровом виде, что позволяет запрашивать данные статей и, в частности, автоматически собирать метаданные, включая данные об аффилиации. Это, в свою очередь, можно использовать для количественных оценок научной области, например для идентификации организаций и анализа графа соавторства этих организаций для извлечения базовой структуры науки. В настоящей работе рассмотрена область исследования микроРНК, а именно граф соавторства организаций и анализ его эволюции. </p><p>Чтобы решить проблему вариативности написания названия организаций, был предложен алгоритм сортировки логических векторов признаков k-mer/n-gram. В нем используется тот факт, что содержание аффилиации довольно консистентно для одной и той же организации. Для учета ошибок написания и других артефактов названия организации в поле метаданных аффилиации наш подход преобразует упоминание организации внутри аффилиации в K-Mer (n-gram) булевый вектор присутствия. Далее векторы всех аффилиаций из набора данных лексикографически сортируются, образуя группы упоминаний организаций. Таким подходом был кластеризован набор данных аффилиаций в области исследования микроРНК и определены названия уникальных организаций, что позволило построить граф соавторства на уровне научных организаций. 
С помощью этого графа показано, что рост области исследования микроРНК контролируется архитектурой малого мира сети научных организаций и испытывает степенной рост с показателем степени 2.64 ± 0.23 для числа организаций в соответствии с диаметром сети, предлагая модель роста новых научных направлений. Скорость публикации первой статьи по микроРНК у организации при ее взаимодействии с другой организацией, уже публиковавшейся в этой области, аппроксимируется как 0.184 ± 0.002 год<sup>–1</sup>.</p></abstract><trans-abstract xml:lang="en"><p>Many scientific articles became available in the digital form which allows for querying articles data, and specifically the automated metadata gathering, which includes the affiliation data. This in turn can be used in the quantitative characterization of the scientific field, such as organizations identification, and analysis of the co-authorship graph of those organizations to extract the underlying structure of science. In our work, we focus on the miRNA science field, building the organization co-authorship network to provide the higher-level analysis of scientific community evolution rather than analyzing author-level characteristics. To tackle the problem of the institution name writing variability, we proposed the k-mer/n-gram boolean feature vector sorting algorithm, KOFER in short. This approach utilizes the fact that the contents of the affiliation are rather consistent for the same organization, and to account for writing errors and other organization name variations within the affiliation metadata field, it converts the organization mention within the affiliation to the K-Mer (n-gram) Boolean presence vector. Those vectors for all affiliations in the dataset are further lexicographically sorted, forming groups of organization mentions. With that approach, we clustered the miRNA field affiliation dataset and extracted unique organization names, which allowed us to build the co-authorship graph on the organization level. 
Using this graph, we show that the growth of the miRNA field is governed by the small-world architecture of the scientific institution network and experiences power-law growth with exponent 2.64 ± 0.23 for organization number, in accordance with network diameter, proposing the growth model for emerging scientific fields. The first miRNA publication rate of an organization interacting with already publishing organization is estimated as 0.184 ± 0.002 year<sup>–1</sup>. </p></trans-abstract><kwd-group xml:lang="ru"><kwd>k-mer</kwd><kwd>n-gram</kwd><kwd>миРНК</kwd><kwd>электронная библиотека</kwd><kwd>соавторство организаций</kwd><kwd>малый мир</kwd></kwd-group><kwd-group xml:lang="en"><kwd>k-mer</kwd><kwd>n-gram</kwd><kwd>miRNA</kwd><kwd>digital library</kwd><kwd>organization co-authorship</kwd><kwd>small world</kwd></kwd-group></article-meta></front><back><ref-list><title>References</title><ref id="cit1"><label>1</label><citation-alternatives><mixed-citation xml:lang="ru">Goffman W., Newill V.A. Generalization of epidemic theory. An application to the transmission of ideas. Nature. 1964;204(4955):225-228. DOI 10.1038/204225a0.</mixed-citation><mixed-citation xml:lang="en">Goffman W., Newill V.A. Generalization of epidemic theory. An application to the transmission of ideas. Nature. 1964;204(4955):225-228. DOI 10.1038/204225a0.</mixed-citation></citation-alternatives></ref><ref id="cit2"><label>2</label><citation-alternatives><mixed-citation xml:lang="ru">Humphries M.D., Gurney K. Network ‘small-world-ness’: a quantitative method for determining canonical network equivalence. PLoS One. 2008;3(4):e0002051. DOI 10.1371/journal.pone.0002051.</mixed-citation><mixed-citation xml:lang="en">Humphries M.D., Gurney K. Network ‘small-world-ness’: a quantitative method for determining canonical network equivalence. PLoS One. 2008;3(4):e0002051. 
DOI 10.1371/journal.pone.0002051.</mixed-citation></citation-alternatives></ref><ref id="cit3"><label>3</label><citation-alternatives><mixed-citation xml:lang="ru">Leydesdorff L., Wagner C., Park H., Adams J. International collaboration in science: the global map and the network. Prof. Inf. 2013; 22(1):1-18. DOI 10.3145/epi.2013.ene.12.</mixed-citation><mixed-citation xml:lang="en">Leydesdorff L., Wagner C., Park H., Adams J. International collaboration in science: the global map and the network. Prof. Inf. 2013; 22(1):1-18. DOI 10.3145/epi.2013.ene.12.</mixed-citation></citation-alternatives></ref><ref id="cit4"><label>4</label><citation-alternatives><mixed-citation xml:lang="ru">Liu M., Li D., Qin P., Liu C., Wang H., Wang F. Epidemics in interconnected small-world networks. PLoS One. 2015;10(3):e0120701. DOI 10.1371/journal.pone.0120701.</mixed-citation><mixed-citation xml:lang="en">Liu M., Li D., Qin P., Liu C., Wang H., Wang F. Epidemics in interconnected small-world networks. PLoS One. 2015;10(3):e0120701. DOI 10.1371/journal.pone.0120701.</mixed-citation></citation-alternatives></ref><ref id="cit5"><label>5</label><citation-alternatives><mixed-citation xml:lang="ru">Muldoon S., Bridgeford E., Bassett D. Small-world propensity and weighted brain networks. Sci. Rep. 2016;6:22057. DOI 10.1038/srep22057.</mixed-citation><mixed-citation xml:lang="en">Muldoon S., Bridgeford E., Bassett D. Small-world propensity and weighted brain networks. Sci. Rep. 2016;6:22057. DOI 10.1038/srep22057.</mixed-citation></citation-alternatives></ref><ref id="cit6"><label>6</label><citation-alternatives><mixed-citation xml:lang="ru">Newman M.E.J., Moore C., Watts D.J. Mean-field solution of the small-world network model. Phys. Rev. Lett. 2000;84(14):3201-3204. DOI 10.1103/PhysRevLett.84.3201.</mixed-citation><mixed-citation xml:lang="en">Newman M.E.J., Moore C., Watts D.J. Mean-field solution of the small-world network model. Phys. Rev. Lett. 2000;84(14):3201-3204. 
DOI 10.1103/PhysRevLett.84.3201.</mixed-citation></citation-alternatives></ref><ref id="cit7"><label>7</label><citation-alternatives><mixed-citation xml:lang="ru">Ribeiro L., Rapini M., Silva L., Albuquerque E.M. Growth patterns of the network of international collaboration in science. Scientometrics. 2018;114:159-179. DOI 10.1007/s11192-017-2573-x.</mixed-citation><mixed-citation xml:lang="en">Ribeiro L., Rapini M., Silva L., Albuquerque E.M. Growth patterns of the network of international collaboration in science. Scientometrics. 2018;114:159-179. DOI 10.1007/s11192-017-2573-x.</mixed-citation></citation-alternatives></ref><ref id="cit8"><label>8</label><citation-alternatives><mixed-citation xml:lang="ru">Shi Y., Guan J. Small-world network effects on innovation: evidences from nanotechnology patenting. J. Nanopart. Res. 2016;18:329. DOI 10.1007/s11051-016-3637-1.</mixed-citation><mixed-citation xml:lang="en">Shi Y., Guan J. Small-world network effects on innovation: evidences from nanotechnology patenting. J. Nanopart. Res. 2016;18:329. DOI 10.1007/s11051-016-3637-1.</mixed-citation></citation-alternatives></ref><ref id="cit9"><label>9</label><citation-alternatives><mixed-citation xml:lang="ru">Vazquez A. Spreading dynamics on small-world networks with connectivity fluctuations and correlations. Phys. Rev. E. Stat. Nonlin. Soft Matter Phys. 2006;74:056101. DOI 10.1103/PhysRevE.74.056101.</mixed-citation><mixed-citation xml:lang="en">Vazquez A. Spreading dynamics on small-world networks with connectivity fluctuations and correlations. Phys. Rev. E. Stat. Nonlin. Soft Matter Phys. 2006;74:056101. DOI 10.1103/PhysRevE.74.056101.</mixed-citation></citation-alternatives></ref><ref id="cit10"><label>10</label><citation-alternatives><mixed-citation xml:lang="ru">Wagner C., Leydesdorff L. Network structure, self-organization and the growth of international collaboration in science. Res. Policy. 2005; 34(10):1608-1618. 
DOI 10.1016/j.respol.2005.08.002.</mixed-citation><mixed-citation xml:lang="en">Wagner C., Leydesdorff L. Network structure, self-organization and the growth of international collaboration in science. Res. Policy. 2005; 34(10):1608-1618. DOI 10.1016/j.respol.2005.08.002.</mixed-citation></citation-alternatives></ref><ref id="cit11"><label>11</label><citation-alternatives><mixed-citation xml:lang="ru">Watts D.J., Strogatz S.H. Collective dynamics of ‘small-world’ networks. Nature. 1998;393(6684):440-442. DOI 10.1038/30918.</mixed-citation><mixed-citation xml:lang="en">Watts D.J., Strogatz S.H. Collective dynamics of ‘small-world’ networks. Nature. 1998;393(6684):440-442. DOI 10.1038/30918.</mixed-citation></citation-alternatives></ref></ref-list><fn-group><fn fn-type="conflict"><p>The authors declare that there are no conflicts of interest present.</p></fn></fn-group></back></article>
