<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE article PUBLIC "-//NLM//DTD JATS (Z39.96) Journal Publishing DTD v1.3 20210610//EN" "JATS-journalpublishing1-3.dtd">
<article article-type="research-article" dtd-version="1.3" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xml:lang="ru"><front><journal-meta><journal-id journal-id-type="publisher-id">dan</journal-id><journal-title-group><journal-title xml:lang="ru">Доклады Национальной академии наук Беларуси</journal-title><trans-title-group xml:lang="en"><trans-title>Doklady of the National Academy of Sciences of Belarus</trans-title></trans-title-group></journal-title-group><issn pub-type="ppub">1561-8323</issn><issn pub-type="epub">2524-2431</issn><publisher><publisher-name>The Republican Unitary Enterprise Publishing House "Belaruskaya Navuka"</publisher-name></publisher></journal-meta><article-meta><article-id pub-id-type="doi">10.29235/1561-8323-2023-67-5-388-398</article-id><article-id custom-type="elpub" pub-id-type="custom">dan-1152</article-id><article-categories><subj-group subj-group-type="heading"><subject>Research Article</subject></subj-group><subj-group subj-group-type="section-heading" xml:lang="ru"><subject>ХИМИЯ</subject></subj-group><subj-group subj-group-type="section-heading" xml:lang="en"><subject>CHEMISTRY</subject></subj-group></article-categories><title-group><article-title>Прогностическая модель идентификации новых лигандов CYP19A1 на аналитической платформе KNIME</article-title><trans-title-group xml:lang="en"><trans-title>Predictive model for identifying new CYP19A1 ligands on the KNIME analytical platform</trans-title></trans-title-group></title-group><contrib-group><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Шаладонова</surname><given-names>М. И.</given-names></name><name name-style="western" xml:lang="en"><surname>Shaladonova</surname><given-names>M. I.</given-names></name></name-alternatives><bio xml:lang="ru"><p>Марина Игоревна Шаладонова, магистрант</p><p>220070</p><p>ул. Радиальная, 38Б</p><p>Минск</p></bio><bio xml:lang="en"><p>Marina I. Shaladonova, Master’s Student</p><p>220070</p><p>38B, Radialnaya Str.</p><p>Minsk</p></bio><email xlink:type="simple">shalmari@tut.by</email><xref ref-type="aff" rid="aff-1"/></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Диченко</surname><given-names>Я. В.</given-names></name><name name-style="western" xml:lang="en"><surname>Dzichenka</surname><given-names>Ya. V.</given-names></name></name-alternatives><bio xml:lang="ru"><p>Ярослав Владимирович Диченко, канд. хим. наук, доцент, вед. науч. сотрудник</p><p>220084</p><p>ул. Купревича, 5/2</p><p>Минск</p></bio><bio xml:lang="en"><p>Yaraslau V. Dzichenka, Ph. D. (Chemistry), Associate Professor, Leading Researcher</p><p>220084</p><p>5/2, Kuprevich Str.</p><p>Minsk</p></bio><email xlink:type="simple">dichenko@iboch.by</email><xref ref-type="aff" rid="aff-2"/></contrib><contrib contrib-type="author" corresp="yes"><name-alternatives><name name-style="eastern" xml:lang="ru"><surname>Усанов</surname><given-names>С. А.</given-names></name><name name-style="western" xml:lang="en"><surname>Usanov</surname><given-names>S. A.</given-names></name></name-alternatives><bio xml:lang="ru"><p>Сергей Александрович Усанов, член-корреспондент, д-р хим. наук, профессор</p><p>220084</p><p>ул. Купревича, 5/2</p><p>Минск</p></bio><bio xml:lang="en"><p>Sergei A. Usanov, Corresponding Memberr, D. Sc. (Chemistry), Professor</p><p>220084</p><p>5/2, Kuprevich Str.</p><p>Minsk</p></bio><email xlink:type="simple">usanov@iboch.by</email><xref ref-type="aff" rid="aff-2"/></contrib></contrib-group><aff-alternatives id="aff-1"><aff xml:lang="ru"><institution>Университет Национальной академии наук Беларуси</institution></aff><aff xml:lang="en"><institution>University of the National Academy of Sciences of Belarus</institution></aff></aff-alternatives><aff-alternatives id="aff-2"><aff xml:lang="ru"><institution>Институт биоорганической химии Национальной академии наук Беларуси</institution></aff><aff xml:lang="en"><institution>Institute of Bioorganic Chemistry of the National Academy of Sciences of Belarus</institution></aff></aff-alternatives><pub-date pub-type="collection"><year>2023</year></pub-date><pub-date pub-type="epub"><day>31</day><month>10</month><year>2023</year></pub-date><volume>67</volume><issue>5</issue><fpage>388</fpage><lpage>398</lpage><permissions><copyright-statement>Copyright &amp;#x00A9; Шаладонова М.И., Диченко Я.В., Усанов С.А., 2023</copyright-statement><copyright-year>2023</copyright-year><copyright-holder xml:lang="ru">Шаладонова М.И., Диченко Я.В., Усанов С.А.</copyright-holder><copyright-holder xml:lang="en">Shaladonova M.I., Dzichenka Y.V., Usanov S.A.</copyright-holder><license xml:lang="ru" license-type="creative-commons-attribution" xlink:href="https://creativecommons.org/licenses/by/4.0/" xlink:type="simple"><license-p>Данная работа распространяется под лицензией Creative Commons Attribution 4.0.</license-p></license><license xml:lang="en" license-type="creative-commons-attribution" xlink:href="https://creativecommons.org/licenses/by/4.0/" xlink:type="simple"><license-p>This work is licensed under a Creative Commons Attribution 4.0 License.</license-p></license></permissions><self-uri xlink:href="https://doklady.belnauka.by/jour/article/view/1152">https://doklady.belnauka.by/jour/article/view/1152</self-uri><abstract><p>   Сформирована база данных химических соединений – низкомолекулярных лигандов CYP19A1 (ароматазы) человека на основании проанализированных данных, полученных in vitro. С использованием полученной базы данных при помощи метода машинного обучения «случайный лес деревьев принятия решений» на аналитической платформе KNIME построены две прогностические модели для идентификации активности лигандов стероидной (I типа) и нестероидной (II типа) структуры. В качестве обучающих данных при построении модели применялись топологические дескрипторы химической структуры, учитывающие корреляцию между структурой молекулы и биологическим эффектом. Для каждой модели был осуществлен отбор наиболее значимых признаков (дескрипторов), произведено вычисление оптимальных параметров и найдена область применимости моделей. На основании результатов показателей качества AUC проведена оценка способности моделей предсказывать результаты тестовой выборки. Полученные показатели качества свидетельствуют о достаточно высокой прогностической способности моделей и перспективности их использования для идентификации новых лигандов CYP19A1 человека. Найденные таким способом соединения могут рассматриваться как потенциальные к созданию лекарственные препараты для лечения гормон-зависимых опухолей.</p></abstract><trans-abstract xml:lang="en"><p>   The purpose of this study was to create a database of the chemical compounds – ligands of human steroid-hydroxylating cytochrome CYP19A1 (aromatase) in order to build a predictive model.</p><p>   The idea was to create a model on the basis of the machinery learning method such as random forest for two types of ligands – with steroidal (I type) and non-steroidal structure (II type). Two predictive models were built with the help of the KNIME analytical platform. Topological descriptors of the chemical structure were used as training data when building a model that takes into account their correlation between the structure of the molecule and the biological effect. The selection of the feature importance of the descriptors, optimal parameters of random forest and the definition of applicability domain of the models were carried out. The assessment of the ability to predict the results of a test sample was performed for each model. The quality marks of the obtained models indicated a rather high predictive ability of the models and the prospects of their use for identification of new human CYP19A1 ligands as potential drugs for treatment of hormone-dependent tumors.</p></trans-abstract><kwd-group xml:lang="ru"><kwd>CYP19A1 человека</kwd><kwd>ингибиторы ароматазы</kwd><kwd>лиганд</kwd><kwd>топологические дескрипторы</kwd><kwd>машинное обучение</kwd><kwd>прогностическая модель</kwd><kwd>область применимости</kwd><kwd>идентификация препаратов</kwd></kwd-group><kwd-group xml:lang="en"><kwd>human CYP19A1</kwd><kwd>aromatase inhibitors</kwd><kwd>ligand</kwd><kwd>topological descriptors</kwd><kwd>machinery learning</kwd><kwd>predictive model</kwd><kwd>applicability domain</kwd><kwd>drug identification</kwd></kwd-group></article-meta></front><back><ref-list><title>References</title><ref id="cit1"><label>1</label><citation-alternatives><mixed-citation xml:lang="ru">Guha, R. Development of Linear, Ensemble, and Nonlinear Models for the Prediction and Interpretation of the Biological Activity of a Set of PDGFR Inhibitors / R. Guha, P. C. Jurs // J. Chem. Inf. Comput. Sci. – 2004. – Vol. 44, N 6. – P. 2179–2189. doi: 10.1021/ci049849f</mixed-citation><mixed-citation xml:lang="en">Guha R., Jurs P. C. Development of Linear, Ensemble, and Nonlinear Models for the Prediction and Interpretation of the Biological Activity of a Set of PDGFR Inhibitors. Journal of Chemical Information and Computer Sciences, 2004, vol. 44, no. 6, pp. 2179–2189. doi: 10.1021/ci049849f</mixed-citation></citation-alternatives></ref><ref id="cit2"><label>2</label><citation-alternatives><mixed-citation xml:lang="ru">Novel triazole-tetrahydroisoquinoline hybrids as human aromatase inhibitors / C. Chamduang [et al.] // Bioorg. Chem. – 2019. – Vol. 93. – Art. 103327. doi: 10.1016/j.bioorg.2019.103327</mixed-citation><mixed-citation xml:lang="en">Chamduang C., Pingaew R., Prachayasittikul V., Prachayasittikul S., Ruchirawat S., Prahayasit tikul V. Novel triazole-tetrahydroisoquinoline hybrids as human aromatase inhibitors. Bioorganic Chemistry, 2019, vol. 93, art. 103327. doi: 10.1016/j.bioorg.2019.103327</mixed-citation></citation-alternatives></ref><ref id="cit3"><label>3</label><citation-alternatives><mixed-citation xml:lang="ru">Brueggemeier, R. W. Aromatase Inhibitors in the Treatment of Breast Cancer / R. W. Brueggemeier, J. C. Hackett, E. S. Diaz-Cruz // Endocrine Rev. – 2005. – Vol. 26, N 3. – P. 331–345. doi: 10.1210/er.2004-0015</mixed-citation><mixed-citation xml:lang="en">Brueggemeier R. W., Hackett J. C., Diaz-Cruz E. S. Aromatase Inhibitors in the Treatment of Breast Cancer. Endocrine Reviews, 2005, vol. 26, no. 3, pp. 331–345. doi: 10.1210/er.2004-0015</mixed-citation></citation-alternatives></ref><ref id="cit4"><label>4</label><citation-alternatives><mixed-citation xml:lang="ru">Bertelli, G. Sequencing of aromatase inhibitors / G. Bertelli // Br. J. Cancer. – 2005. – Vol. 93, N S1. – P. 6–9. doi: 10.1038/sj.bjc.6602689</mixed-citation><mixed-citation xml:lang="en">Bertelli G. Sequencing of aromatase inhibitors. British Journal of Cancer, 2005, vol. 93, no. S1, pp. 6–9. doi: 10.1038/sj.bjc.6602689</mixed-citation></citation-alternatives></ref><ref id="cit5"><label>5</label><citation-alternatives><mixed-citation xml:lang="ru">Studies on non-steroidal inhibitors of aromatase enzyme; 4-(aryl/heteroaryl)-2-(pyrimidin-2-yl) thiazole derivatives / Z. Sahin [et al.] // Bioorg. Med. Chem. – 2018. – Vol. 26, N 8. – P. 1986–1995. doi: 10.1016/j.bmc.2018.02.048</mixed-citation><mixed-citation xml:lang="en">Sahin Z., Ertas M., Berk B., Biltekin S. N., Yurttas L., Demirayak S. Studies on non-steroidal inhibitors of aromatase enzyme; 4-(aryl/heteroaryl)-2-(pyrimidin-2-yl)thiazole derivatives. Bioorganic &amp; Medicinal Chemistry, 2018, vol. 26, no. 8, pp. 1986–1995. doi: 10.1016/j.bmc.2018.02.048</mixed-citation></citation-alternatives></ref><ref id="cit6"><label>6</label><citation-alternatives><mixed-citation xml:lang="ru">Aromatase Inhibitors Evolution as Potential Class of Drugs in the Treatment of Postmenopausal Brest Cancer Women / S. Avvaru [et al.] // Mini-Rev. Med. Chem. – 2018. – Vol. 18, N 7. – P. 609–621. doi: 10.2174/1389557517666171101100902</mixed-citation><mixed-citation xml:lang="en">Avvaru S. P., Noolvi M. N., Aminbhavi T. M., Chkraborty S., Dash A., Shukla S. S. Aromatase Inhibitors Evolution as Potential Class of Drugs in the Treatment of Postmenopausal Brest Cancer Women. Mini-Reviews in Medicinal Chemistry, 2018, vol. 18, no. 7, pp. 609–621. doi: 10.2174/1389557517666171101100902</mixed-citation></citation-alternatives></ref><ref id="cit7"><label>7</label><citation-alternatives><mixed-citation xml:lang="ru">Determining the IC50 Values for Vorozole and Letrozole, on a Series of Human Liver Cytochrome P450s, to Help Determine the Binding Site of Vorozole in the Liver / L. Raymond [et al.] // Enzyme Research. – 2015. – Vol. 2015. – P. 1–4. doi: 10.1155/2015/321820</mixed-citation><mixed-citation xml:lang="en">Raymond L., Rayani N., Polson G., Sikorski K., Lian A., VanAlstine-Parris M. A. Determining the IC50 Values for Vorozole and Letrozole, on a Series of Human Liver Cytochrome P450s, to Help Determine the Binding Site of Vorozole in the Liver. Enzyme Research, 2015, vol. 2015, pp. 1–4. doi: 10.1155/2015/321820</mixed-citation></citation-alternatives></ref><ref id="cit8"><label>8</label><citation-alternatives><mixed-citation xml:lang="ru">Synthesis of Aromatase Inhibitors and Dual Aromatase Steroid Sulfatase Inhibitors by Linking an Arylsulfamate Motif to 4-(4H-1,2,4-triazol-4-ylamino)benzonitrile: SAR, Crystal Structures, in vitro and in vivo Activities / C. Bubert [et al.] // ChemMedChem. – 2008. – Vol. 3, N 11. – P. 1708–1730. doi: 10.1002/cmdc.200800164</mixed-citation><mixed-citation xml:lang="en">Bubert C., Woo L. W. L., Sutcliffe O. B., Mahon M. F., Chander S. K., Purohit A., Reed M. J., Potter B. V. L. Synthesis of Aromatase Inhibitors and Dual Aromatase Steroid Sulfatase Inhibitors by Linking an Arylsulfamate Motif to 4-(4H-1,2,4-triazol-4-ylamino)benzonitrile: SAR, Crystal Structures, in vitro and in vivo Activities. ChemMedChem, 2008, vol. 3, no. 11, pp. 1708–1730. doi: 10.1002/cmdc.200800164</mixed-citation></citation-alternatives></ref><ref id="cit9"><label>9</label><citation-alternatives><mixed-citation xml:lang="ru">Баскин, И. И. Введение в хемоинформатику / И. И. Баскин, Т. И. Маджидов, А. А. Варнек. – М., Казань, Страсбург, 2020. – Ч. 4: Методы машинного обучения. – 321 с.</mixed-citation><mixed-citation xml:lang="en">Baskin I. I., Madzhilov T. I., Varnek A. A. Introduction to Chemoinformatics. Vol. 4: Machine learning methods. Moscow, Kazan, Strasburg, 2020. 321 р. (in Russian).</mixed-citation></citation-alternatives></ref><ref id="cit10"><label>10</label><citation-alternatives><mixed-citation xml:lang="ru">Application of the Random Forest Method in Studies of Local Lymph Node Assay Based Skin Sensitization Data / S. Li [et al.] // J. Chem. Inf. Model. – 2005. – Vol. 45, N 4. – P. 952–964. doi: 10.1021/ci050049u</mixed-citation><mixed-citation xml:lang="en">Li S., Fedorowicz A., Singh H., Soderholm S. C. Application of the Random Forest Method in Studies of Local Lymph Node Assay Based Skin Sensitization Data. Journal of Chemical Information and Modeling, 2005, vol. 45, no. 4, pp. 952–964. doi: 10.1021/ci050049u</mixed-citation></citation-alternatives></ref><ref id="cit11"><label>11</label><citation-alternatives><mixed-citation xml:lang="ru">Применение метода количественных корреляций структура–свойство (ККСС) с использованием топологического индекса Балабана на примере группы сульфаниламидов / А. В. Сыроешкин [и др.] // Вестн. Рос. ун-та дружбы народов. Сер. Медицина. – 2000. – № 2. – С. 80–83.</mixed-citation><mixed-citation xml:lang="en">Syroeshkin A. V., Kovaleva A. N., Kandalaft E., Pleteneva T. V. Application of a method of quantitative correlations frame – property with usage of a topological coefficient on an example of group of sulfanilamidums. Vestnik Rossiiskogo universiteta druzhby narodov. Seriya: Meditsina = RUDN Journal of Medicine, 2000, no. 2, pp. 80–83 (in Russian).</mixed-citation></citation-alternatives></ref><ref id="cit12"><label>12</label><citation-alternatives><mixed-citation xml:lang="ru">Optimisation and evaluation of the random forest model in the efficacy prediction of chemoradiotherapy for advanced cervical cancer based on radiomics signature from high-resolution T2 weighted images / D. Liu [et al.] // Arch. Gynecol. Obstet. – 2021. – Vol. 303, N 3. – Р. 811–820. doi: 10.1007/s00404-020-05908-5</mixed-citation><mixed-citation xml:lang="en">Liu D., Zhang X., Zheng T., Shi Q., Cui Y., Wang Y., Liu L. Optimisation and evaluation of the random forest model in the efficacy prediction of chemoradiotherapy for advanced cervical cancer based on radiomics signature from high-resolution T2 weighted images. Archives of Gynecology and Obstetrics, 2021, vol. 303, no. 3, pp. 811–820. doi: 10.1007/s00404-020-05908-5</mixed-citation></citation-alternatives></ref><ref id="cit13"><label>13</label><citation-alternatives><mixed-citation xml:lang="ru">Janitza, S. An AUC-based permutation variable importance measure for random forests / S. Janitza, C. Strobl, A.-L. Boulesteix // BMC Bioinformatics. – 2013. – Vol. 14, N 1. – Р. 1–11. doi: 10.1186/1471-2105-14-119</mixed-citation><mixed-citation xml:lang="en">Janitza S., Strobl C., Boulesteix A.-L. An AUC-based permutation variable importance measure for random forests. BMC Bioinformatics, 2013, vol. 14, no. 1, pp. 1–11. doi: 10.1186/1471-2105-14-119</mixed-citation></citation-alternatives></ref></ref-list><fn-group><fn fn-type="conflict"><p>The authors declare that there are no conflicts of interest present.</p></fn></fn-group></back></article>
