<?xml version="1.0" encoding="UTF-8"?>
<article article-type="research-article" dtd-version="1.3" xml:lang="ru" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:noNamespaceSchemaLocation="https://metafora.rcsi.science/xsd_files/journal3.xsd">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">moitvivt</journal-id>
      <journal-title-group>
        <journal-title xml:lang="ru">Моделирование, оптимизация и информационные технологии</journal-title>
        <trans-title-group xml:lang="en">
          <trans-title>Modeling, Optimization and Information Technology</trans-title>
        </trans-title-group>
      </journal-title-group>
      <issn pub-type="epub">2310-6018</issn>
      <publisher>
        <publisher-name>Издательство</publisher-name>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="doi">10.26102/2310-6018/2023.40.1.028</article-id>
      <article-id pub-id-type="custom" custom-type="elpub">1301</article-id>
      <title-group>
        <article-title xml:lang="ru">Применение машинного обучения для определения порядка прилагательных в английском языке</article-title>
        <trans-title-group xml:lang="en">
          <trans-title>Application of machine learning for adjective ordering in English sentences</trans-title>
        </trans-title-group>
      </title-group>
      <contrib-group>
        <contrib contrib-type="author" corresp="yes">
          <contrib-id contrib-id-type="orcid">0000-0001-7667-7059</contrib-id>
          <name-alternatives>
            <name name-style="eastern" xml:lang="ru">
              <surname>Терехова</surname>
              <given-names>Анастасия Дмитриевна</given-names>
            </name>
            <name name-style="western" xml:lang="en">
              <surname>Terekhova</surname>
              <given-names>Anastasia Dmitrievna</given-names>
            </name>
          </name-alternatives>
          <email>nastyakr@list.ru</email>
          <xref ref-type="aff">aff-1</xref>
        </contrib>
        <contrib contrib-type="author" corresp="yes">
          <contrib-id contrib-id-type="orcid">0000-0002-0289-1834</contrib-id>
          <name-alternatives>
            <name name-style="eastern" xml:lang="ru">
              <surname>Терехов</surname>
              <given-names>Григорий Владимирович</given-names>
            </name>
            <name name-style="western" xml:lang="en">
              <surname>Terekhov</surname>
              <given-names>Grigory Vladimirovich</given-names>
            </name>
          </name-alternatives>
          <email>grvlter@gmail.com</email>
          <xref ref-type="aff">aff-2</xref>
        </contrib>
        <contrib contrib-type="author" corresp="yes">
          <contrib-id contrib-id-type="orcid">0000-0002-7296-2538</contrib-id>
          <name-alternatives>
            <name name-style="eastern" xml:lang="ru">
              <surname>Сычев</surname>
              <given-names>Олег Александрович</given-names>
            </name>
            <name name-style="western" xml:lang="en">
              <surname>Sychev</surname>
              <given-names>Oleg Aleksandrovich</given-names>
            </name>
          </name-alternatives>
          <email>oasychev@gmail.com</email>
          <xref ref-type="aff">aff-3</xref>
        </contrib>
      </contrib-group>
      <aff-alternatives id="aff-1">
        <aff xml:lang="ru">Волгоградский государственный технический университет Озон Технологии</aff>
        <aff xml:lang="en">Volgograd State Technical University OZON Tech</aff>
      </aff-alternatives>
      <aff-alternatives id="aff-2">
        <aff xml:lang="ru">Волгоградский государственный технический университет</aff>
        <aff xml:lang="en">Volgograd State Technical University</aff>
      </aff-alternatives>
      <aff-alternatives id="aff-3">
        <aff xml:lang="ru">Волгоградский государственный технический университет</aff>
        <aff xml:lang="en">Volgograd State Technical University</aff>
      </aff-alternatives>
      <pub-date pub-type="epub">
        <day>01</day>
        <month>01</month>
        <year>2026</year>
      </pub-date>
      <volume>1</volume>
      <issue>1</issue>
      <elocation-id>10.26102/2310-6018/2023.40.1.028</elocation-id>
      <permissions>
        <copyright-statement>Copyright © Авторы, 2026</copyright-statement>
        <copyright-year>2026</copyright-year>
        <license license-type="creative-commons-attribution" xlink:href="https://creativecommons.org/licenses/by/4.0/">
          <license-p>This work is licensed under a Creative Commons Attribution 4.0 International License</license-p>
        </license>
      </permissions>
      <self-uri xlink:href="https://moitvivt.ru/ru/journal/article?id=1301"/>
      <abstract xml:lang="ru">
        <p>В статье рассматривается способ решения задачи упорядочивания прилагательных в предложении на английском языке путем определения их гиперонимов. Определение гиперонима можно свести к задаче классификации, поэтому в данной работе произведено сравнение наиболее популярных методов классификации в машинном обучении: метод поиска ближайших соседей, логистическая регрессия, классификатор дерева решений, метод опорных векторов и наивный байесовский метод. Модели были обучены на выборке, содержащей прилагательные и их гиперонимы. Для анализируемого прилагательного отбираются схожие уже классифицированные прилагательные из обучающей выборки и на основе этих данных определяется наиболее семантически подходящий гипероним. Информацию о схожести слов предлагается брать из готовых эмбеддингов GloVe. Используя технику gridsearch, были подобраны оптимальные значения гиперпараметров для метода поиска ближайших соседей K-Nearest Neighbors. С помощью метрик точности (precision), полноты (recall) и F1-меры было проанализировано качество классификации данных при использовании каждого из перечисленных выше методов. Так как готовых датасетов, состоящих из классифицированных прилагательных, на данный момент нет, то для измерений вручную было классифицировано 300 прилагательных.</p>
      </abstract>
      <trans-abstract xml:lang="en">
        <p>The article presents a methodology for solving the adjective ordering problem in English sentences by determining their hypernyms. The determining of a hypernym can be represented as a classification task; therefore, the most popular machine-learning classification methods were compared, they include the following: nearest neighbors method, logistic regression, decision classifier, support vector machine and naive Bayes method. The models were trained on a sample that contained adjectives and their hypernyms. For each adjective, similar adjectives from the training sample were selected; the most semantically appropriate hypernym was determined based on them. The use of information about word similarity from GloVe embeddings is proposed. The optimal values of hyperparameters for the K-Nearest Neighbors method were selected by means of the gridsearch technique. The quality of data classification was evaluated applying the metrics of precision, recall, and F1-measure for each of the methods. Since there were no ready-made datasets of classified adjectives, 300 adjectives were classified manually to create necessary samples.</p>
      </trans-abstract>
      <kwd-group xml:lang="ru">
        <kwd>порядок прилагательных</kwd>
        <kwd>обработка естественного языка</kwd>
        <kwd>векторное представление слов</kwd>
        <kwd>GloVe</kwd>
        <kwd>методы классификации</kwd>
        <kwd>гиперонимы</kwd>
      </kwd-group>
      <kwd-group xml:lang="en">
        <kwd>adjective ordering</kwd>
        <kwd>natural language processing</kwd>
        <kwd>word vector representation</kwd>
        <kwd>GloVe</kwd>
        <kwd>classification methods</kwd>
        <kwd>hypernyms</kwd>
      </kwd-group>
      <funding-group>
        <funding-statement xml:lang="ru">Исследование выполнено без спонсорской поддержки.</funding-statement>
        <funding-statement xml:lang="en">The study was performed without external funding.</funding-statement>
      </funding-group>
    </article-meta>
  </front>
  <back>
    <ref-list>
      <title>References</title>
      <ref id="cit1">
        <label>1</label>
        <mixed-citation xml:lang="ru">Mitrovic A., Koedinger K.R., Martin B. A comparative analysis of cognitive tutoring and constraint-based modeling. Lecture Notes in Computer Science. 2003;2702:313–322. DOI: 10.1007/3-540-44963-9_42.</mixed-citation>
      </ref>
      <ref id="cit2">
        <label>2</label>
        <mixed-citation xml:lang="ru">Углев В.А., Сычев О.А., Аникин А.В. Интеллектуальный анализ цифрового следа при оценке контрольно-измерительных материалов для поддержки принятия решений в образовательном процессе. Журнал Сибирского федерального университета. Техника и технологии. 2022;15(1):121–136. DOI: 10.17516/1999-494X-0378.</mixed-citation>
      </ref>
      <ref id="cit3">
        <label>3</label>
        <mixed-citation xml:lang="ru">Malkani N. A Comprehensive guide on General English for competitive examinations. Agra, Oswal Publishers; 2020. 518 p.</mixed-citation>
      </ref>
      <ref id="cit4">
        <label>4</label>
        <mixed-citation xml:lang="ru">Yogish D., Manjunath T. N., Hegadi S.R. Review on natural language processing trends and techniques using NLTK. Recent Trends in Image Processing and Pattern Recognition. 2018;1037:589–606. DOI: 10.1007/978-981-13-9187-3_53.</mixed-citation>
      </ref>
      <ref id="cit5">
        <label>5</label>
        <mixed-citation xml:lang="ru">Bird S, Klein E, Loper E. Natural language processing with Python: analyzing text with the natural language toolkit. O’Reilly Media, Inc; 2009. 502 p.</mixed-citation>
      </ref>
      <ref id="cit6">
        <label>6</label>
        <mixed-citation xml:lang="ru">Cheng X., Kong X., Liao L., Li B. A combined method for usage of NLP libraries towards analyzing software documents. Advanced Information Systems Engineering. CAiSE 2020. Lecture Notes in Computer Science. 2020;12127:515–529. DOI: 10.1007/978-3-030-49435-3_32.</mixed-citation>
      </ref>
      <ref id="cit7">
        <label>7</label>
        <mixed-citation xml:lang="ru">Sarkar D. Text Analytics with Python: A Practitioner's Guide to Natural Language Processing. New York, Apress; 2019. 698 p.</mixed-citation>
      </ref>
      <ref id="cit8">
        <label>8</label>
        <mixed-citation xml:lang="ru">Fellbaum C. WordNet: an Electronic Lexical Database. Cambridge, MIT Press; 1998. 422 p. DOI: 10.7551/mitpress/7287.001.0001.</mixed-citation>
      </ref>
      <ref id="cit9">
        <label>9</label>
        <mixed-citation xml:lang="ru">Pennington J., Socher R., Manning C.D. Glove: Global vectors for word representation. Proceedings of the 2014 Conference on Empirical Methods in Natural Language Processing (EMNLP). 2014:1532–1543. DOI: 10.3115/v1/D14-1162.</mixed-citation>
      </ref>
      <ref id="cit10">
        <label>10</label>
        <mixed-citation xml:lang="ru">Daniel T.L., Chantal D.L. Discovering knowledge in data: an introduction to data mining. New Jersey, Wiley-interscience. John Wiley &amp; Sons, Inc; 2005. 222 p.</mixed-citation>
      </ref>
      <ref id="cit11">
        <label>11</label>
        <mixed-citation xml:lang="ru">Haneen A.A.A., Ahmad B.A.H. Effects of distance measure choice on K-nearest neighbor classifier performance: a review. Big Data. 2019:221–248</mixed-citation>
      </ref>
      <ref id="cit12">
        <label>12</label>
        <mixed-citation xml:lang="ru">Li B. Importance weighted feature selection strategy for text classification. International Conference on Asian Language Processing (IALP). 2016:344–347.</mixed-citation>
      </ref>
      <ref id="cit13">
        <label>13</label>
        <mixed-citation xml:lang="ru">Cristianini N., Shawe-Taylor J. An introduction to support vector machines: and other kernel-based learning methods. Cambridge, Cambridge University Press; 2000. 204 p. DOI: 10.1017/CBO9780511801389.</mixed-citation>
      </ref>
      <ref id="cit14">
        <label>14</label>
        <mixed-citation xml:lang="ru">Shafieezadeh-Abadeh S., Esfahani P.M., Kuhn D., Distributionally robust logistic regression. Advances in Neural Information Processing Systems. 2015:1576–1584.</mixed-citation>
      </ref>
      <ref id="cit15">
        <label>15</label>
        <mixed-citation xml:lang="ru">Champandard A.J. AI Game Development: Synthetic Creatures with Learning and Reactive Behaviors. San Francisco, New Riders Pub; 2003. 500 p.</mixed-citation>
      </ref>
    </ref-list>
    <fn-group>
      <fn fn-type="conflict">
        <p>The authors declare that there are no conflicts of interest present.</p>
      </fn>
    </fn-group>
  </back>
</article>