<?xml version="1.0" encoding="UTF-8"?>
<article article-type="research-article" dtd-version="1.3" xml:lang="ru" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xsi:noNamespaceSchemaLocation="https://metafora.rcsi.science/xsd_files/journal3.xsd">
  <front>
    <journal-meta>
      <journal-id journal-id-type="publisher-id">moitvivt</journal-id>
      <journal-title-group>
        <journal-title xml:lang="ru">Моделирование, оптимизация и информационные технологии</journal-title>
        <trans-title-group xml:lang="en">
          <trans-title>Modeling, Optimization and Information Technology</trans-title>
        </trans-title-group>
      </journal-title-group>
      <issn pub-type="epub">2310-6018</issn>
      <publisher>
        <publisher-name>Издательство</publisher-name>
      </publisher>
    </journal-meta>
    <article-meta>
      <article-id pub-id-type="doi">10.26102/2310-6018/2026.57.6.009</article-id>
      <article-id pub-id-type="custom" custom-type="elpub">2368</article-id>
      <title-group>
        <article-title xml:lang="ru">Обнаружение фейковых новостей в малоресурсных языках с использованием больших языковых моделей</article-title>
        <trans-title-group xml:lang="en">
          <trans-title>Fake news detection in low-resource languages with LLMs</trans-title>
        </trans-title-group>
      </title-group>
      <contrib-group>
        <contrib contrib-type="author">
          <name-alternatives>
            <name name-style="eastern" xml:lang="ru">
              <surname>Кабир</surname>
              <given-names>А. С. M. Хумаюн</given-names>
            </name>
            <name name-style="western" xml:lang="en">
              <surname>Kabir</surname>
              <given-names>A. S. M. Humaun</given-names>
            </name>
          </name-alternatives>
          <email>humaun.kabir@phystech.edu</email>
          <xref ref-type="aff">aff-1</xref>
        </contrib>
        <contrib contrib-type="author">
          <name-alternatives>
            <name name-style="eastern" xml:lang="ru">
              <surname>Кхан</surname>
              <given-names>Самеед Ахмед</given-names>
            </name>
            <name name-style="western" xml:lang="en">
              <surname>Khan</surname>
              <given-names>Sameed Ahmed</given-names>
            </name>
          </name-alternatives>
          <email>sameedkhandurrani@gmail.com</email>
          <xref ref-type="aff">aff-2</xref>
        </contrib>
        <contrib contrib-type="author">
          <name-alternatives>
            <name name-style="eastern" xml:lang="ru">
              <surname>Харламов</surname>
              <given-names>Александр Александрович</given-names>
            </name>
            <name name-style="western" xml:lang="en">
              <surname>Kharlamov</surname>
              <given-names>Alexander Alexandrovich</given-names>
            </name>
          </name-alternatives>
          <email>kharlamov@analyst.ru</email>
          <xref ref-type="aff">aff-3</xref>
        </contrib>
        <contrib contrib-type="author">
          <name-alternatives>
            <name name-style="eastern" xml:lang="ru">
              <surname>Воронков</surname>
              <given-names>Илья Михайлович</given-names>
            </name>
            <name name-style="western" xml:lang="en">
              <surname>Voronkov</surname>
              <given-names>Ilia Mikhailovich</given-names>
            </name>
          </name-alternatives>
          <email>voronkov.im@phystech.edu</email>
          <xref ref-type="aff">aff-4</xref>
        </contrib>
      </contrib-group>
      <aff-alternatives id="aff-1">
        <aff xml:lang="ru">Московский физико-технический институт</aff>
        <aff xml:lang="en">Moscow Institute of Physics and Technology</aff>
      </aff-alternatives>
      <aff-alternatives id="aff-2">
        <aff xml:lang="ru">Университет Иннополис</aff>
        <aff xml:lang="en">Innopolis University</aff>
      </aff-alternatives>
      <aff-alternatives id="aff-3">
        <aff xml:lang="ru">Московский физико-технический институт</aff>
        <aff xml:lang="en">Moscow Institute of Physics and Technology</aff>
      </aff-alternatives>
      <aff-alternatives id="aff-4">
        <aff xml:lang="ru">Московский физико-технический институт</aff>
        <aff xml:lang="en">Moscow Institute of Physics and Technology</aff>
      </aff-alternatives>
      <pub-date pub-type="epub">
        <day>01</day>
        <month>01</month>
        <year>2026</year>
      </pub-date>
      <volume>1</volume>
      <issue>1</issue>
      <elocation-id>10.26102/2310-6018/2026.57.6.009</elocation-id>
      <permissions>
        <copyright-statement>Copyright © Авторы, 2026</copyright-statement>
        <copyright-year>2026</copyright-year>
        <license license-type="creative-commons-attribution" xlink:href="https://creativecommons.org/licenses/by/4.0/">
          <license-p>This work is licensed under a Creative Commons Attribution 4.0 International License</license-p>
        </license>
      </permissions>
      <self-uri xlink:href="https://moitvivt.ru/ru/journal/article?id=2368"/>
      <abstract xml:lang="ru">
        <p>Распространение фейковых новостей представляет собой глобальную проблему в цифровую эпоху доступности информации. Языки с богатыми ресурсами активно решают эту проблему благодаря значительным исследовательским усилиям, тогда как языки с ограниченными ресурсами остаются недостаточно охваченными в этом направлении. Бенгальский язык является одним из таких языков с ограниченными вычислительными ресурсами несмотря на то, что он входит в десятку самых распространённых языков мира. С целью внесения вклада в данную область и решения проблемы фейковых новостей, данное исследование сосредоточено на их обнаружении в бенгальском языке с использованием современных достижений в области языковых моделей, включая методы кросс-лингвистического промтинга для повышения качества ответов больших языковых моделей. В работе используются модели с открытым исходным кодом для обеспечения доступности ресурсов, а именно большие языковые модели DeepSeek-R1, Llama 3.2 и Qwen 2.5. Проводится подробный анализ способности каждой модели обнаруживать фейковые новости на бенгальском языке. Результаты показывают, что модель Qwen 2.5 превосходит другие модели в данной задаче, достигая максимальной точности 97,5 %, при этом не демонстрируя неопределённых ответов.</p>
      </abstract>
      <trans-abstract xml:lang="en">
        <p>The proliferation of fake news is a global challenge to tackle in the digital era of information availability. The resourceful languages are tackling this issue through enormous research works whereas the low-resource languages are left behind to address the issue adequately. Bangla is one of the low-resource languages in computation despite being in the top ten most spoken languages in the world. To contribute in the field and address the issue of fake news, this research work focuses on the fake news detection in Bangla language leveraging large recent advancement of language models using cross-lingual prompting techniques for better response from the large language models. We leverage the open source models for resource accessibility and utilize DeepSeek-R1, Llama 3.2 and Qwen 2.5 large language models in our experiments and extensively analyze the fake news detection capacity of each model in Bangla language. We find that Qwen 2.5 outperforms the other models in this specific task achieving a maximum accuracy of 97.5 while it also reports no inconclusive response.</p>
      </trans-abstract>
      <kwd-group xml:lang="ru">
        <kwd>фейковые новости</kwd>
        <kwd>бенгальский язык</kwd>
        <kwd>большие языковые модели</kwd>
        <kwd>языки с ограниченными ресурсами</kwd>
        <kwd>кросс-языковой промтинг</kwd>
      </kwd-group>
      <kwd-group xml:lang="en">
        <kwd>fake news</kwd>
        <kwd>bangla</kwd>
        <kwd>large language models</kwd>
        <kwd>low-resource language</kwd>
        <kwd>cross-lingual prompting</kwd>
      </kwd-group>
      <funding-group>
        <funding-statement xml:lang="ru">Исследование выполнено без спонсорской поддержки.</funding-statement>
        <funding-statement xml:lang="en">The study was performed without external funding.</funding-statement>
      </funding-group>
    </article-meta>
  </front>
  <back>
    <ref-list>
      <title>References</title>
      <ref id="cit1">
        <label>1</label>
        <mixed-citation xml:lang="ru">Darvin R. Language and identity in the digital age. In: The Routledge Handbook of Language and Identity. Routledge; 2016. P. 523–540.</mixed-citation>
      </ref>
      <ref id="cit2">
        <label>2</label>
        <mixed-citation xml:lang="ru">Lee N., Li B.Z., Wang S., et al. Language Models as Fact Checkers? In: Proceedings of the Third Workshop on Fact Extraction and VERification (FEVER), 09 July 2020, Seattle, WA, USA. Association for Computational Linguistics; 2020. P. 36–41. https://doi.org/10.18653/v1/2020.fever-1.5</mixed-citation>
      </ref>
      <ref id="cit3">
        <label>3</label>
        <mixed-citation xml:lang="ru">Hoes E., Altay S., Bermeo J. Leveraging ChatGPT for Efficient Fact-Checking. OSF. URL: https://doi.org/10.31234/osf.io/qnjkf [Accessed 19th April 2026].</mixed-citation>
      </ref>
      <ref id="cit4">
        <label>4</label>
        <mixed-citation xml:lang="ru">DeepSeek-AI, Guo D., Yang D., et al. DeepSeek-R1: Incentivizing Reasoning Capability in LLMs via Reinforcement Learning. arXiv. URL: https://arxiv.org/abs/2501.12948 [Accessed 19th April 2026].</mixed-citation>
      </ref>
      <ref id="cit5">
        <label>5</label>
        <mixed-citation xml:lang="ru">Grattafiori A., Dubey A., Jauhri A., et al. The Llama 3 Herd of Models. arXiv. URL: https://arxiv.org/abs/2407.21783 [Accessed 19th April 2026].</mixed-citation>
      </ref>
      <ref id="cit6">
        <label>6</label>
        <mixed-citation xml:lang="ru">Hossain M.Z., Rahman M.A., Islam M.S., et al. BanFakeNews: A Dataset for Detecting Fake News in Bangla. In: Proceedings of the Twelfth Language Resources and Evaluation Conference (LREC 2020), 11–16 May 2020, Marseille, France. European Language Resources Association; 2020. P. 2862–2871. URL: https://aclanthology.org/2020.lrec-1.349</mixed-citation>
      </ref>
      <ref id="cit7">
        <label>7</label>
        <mixed-citation xml:lang="ru">Kabir A.S.M.H., Kharlamov A.A., Voronkov I.M. Research Methods for Fake News Detection in Bangla Text. In: Advances in Neural Computation, Machine Learning, and Cognitive Research VII: Selected Papers from the XXV International Conference on Neuroinformatics, 23–27 October 2023, Moscow, Russia. Cham: Springer; 2023. P. 54–60. https://doi.org/10.1007/978-3-031-44865-2_6</mixed-citation>
      </ref>
      <ref id="cit8">
        <label>8</label>
        <mixed-citation xml:lang="ru">Shibu H.M., Datta Sh., Miah M.S., et al. From Scarcity to Capability: Empowering Fake News Detection in Low-Resource Languages with LLMs. In: Proceedings of the 31st International Conference on Computational Linguistics, COLING 2025 – Workshops, 19–24 January 2025, Abu Dhabi, UAE. Association for Computational Linguistics; 2025. P. 100–107. URL: https://aclanthology.org/2025.indonlp-1.12</mixed-citation>
      </ref>
      <ref id="cit9">
        <label>9</label>
        <mixed-citation xml:lang="ru">Rubin V., Conroy N., Chen Y., et al. Fake News or Truth? Using Satirical Cues to Detect Potentially Misleading News. In: Proceedings of the Second Workshop on Computational Approaches to Deception Detection, 17 June 2016, San Diego, CA, USA. Association for Computational Linguistics; 2016. P. 7–17. https://doi.org/10.18653/v1/W16-0802</mixed-citation>
      </ref>
      <ref id="cit10">
        <label>10</label>
        <mixed-citation xml:lang="ru">Hossain E., Kaysar M.N., Jalal Uddin Joy A.Z.M., et al. A Study Towards Bangla Fake News Detection Using Machine Learning and Deep Learning. In: Sentimental Analysis and Deep Learning: Proceedings of ICSADL 2021, 18–19 June 2021, Songkhla, Thailand. Singapore: Springer; 2021. P. 79–95. https://doi.org/10.1007/978-981-16-5157-1_7</mixed-citation>
      </ref>
      <ref id="cit11">
        <label>11</label>
        <mixed-citation xml:lang="ru">Shu K., Sliva A., Wang S., et al. Fake News Detection on Social Media: A Data Mining Perspective. ACM SIGKDD Explorations Newsletter. 2017;19(1):22–36. https://doi.org/10.1145/3137597.3137600</mixed-citation>
      </ref>
      <ref id="cit12">
        <label>12</label>
        <mixed-citation xml:lang="ru">Vaswani A., Shazeer N., Parmar N., et al. Attention is All You Need. In: Advances in Neural Information Processing Systems 30: Annual Conference on Neural Information Processing Systems, 04–09 December 2017, Long Beach, CA, USA. 2017. P. 5998–6008.</mixed-citation>
      </ref>
      <ref id="cit13">
        <label>13</label>
        <mixed-citation xml:lang="ru">Devlin J., Chang M.-W., Lee K., et al. BERT: Pre-training of Deep Bidirectional Transformers for Language Understanding. In: Proceedings of the 2019 Conference of the North American Chapter of the Association for Computational Linguistics: Human Language Technologies (NAACL-HLT 2019): Volume 1, 02–07 June 2019, Minneapolis, MN, USA. Association for Computational Linguistics; 2019. P. 4171–4186. https://doi.org/10.18653/v1/N19-1423</mixed-citation>
      </ref>
      <ref id="cit14">
        <label>14</label>
        <mixed-citation xml:lang="ru">Qin L., Chen Q., Wei F., et al. Cross-lingual Prompting: Improving Zero-shot Chain-of-Thought Reasoning across Languages. In: Proceedings of the 2023 Conference on Empirical Methods in Natural Language Processing (EMNLP 2023), 06–10 December 2023, Singapore. Association for Computational Linguistics; 2023. P. 2695–2709. https://doi.org/10.18653/v1/2023.emnlp-main.163</mixed-citation>
      </ref>
    </ref-list>
    <fn-group>
      <fn fn-type="conflict">
        <p>The authors declare that there are no conflicts of interest present.</p>
      </fn>
    </fn-group>
  </back>
</article>