<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE root>
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" article-type="research-article" dtd-version="1.2" xml:lang="en"><front><journal-meta><journal-id journal-id-type="publisher-id">Informacionnye Tehnologii</journal-id><journal-title-group><journal-title xml:lang="en">Informacionnye Tehnologii</journal-title><trans-title-group xml:lang="ru"><trans-title>Информационные технологии</trans-title></trans-title-group></journal-title-group><issn publication-format="print">1684-6400</issn><publisher><publisher-name xml:lang="en">New Technologies Publishing House</publisher-name></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">702054</article-id><article-id pub-id-type="doi">10.17587/it.31.649-658</article-id><article-categories><subj-group subj-group-type="toc-heading" xml:lang="en"><subject>Computing systems and networks</subject></subj-group><subj-group subj-group-type="toc-heading" xml:lang="ru"><subject>Вычислительные системы и сети</subject></subj-group><subj-group subj-group-type="article-type"><subject>Research Article</subject></subj-group></article-categories><title-group><article-title xml:lang="en">Optimization of the matching process in computing systems implementing a dataflow computing model with a dynamically formed context</article-title><trans-title-group xml:lang="ru"><trans-title>Оптимизация процесса сопоставлений в вычислительных системах, реализующих потоковую модель вычислений с динамически формируемым контекстом</trans-title></trans-title-group></title-group><contrib-group><contrib contrib-type="author"><name-alternatives><name xml:lang="en"><surname>Bobkov</surname><given-names>S. G.</given-names></name><name xml:lang="ru"><surname>Бобков</surname><given-names>С. Г.</given-names></name></name-alternatives><address><country country="RU">Russian Federation</country></address><bio xml:lang="en"><p>PhD, Professor, Deputy Head of the Department, Department for Design Problems in Microelectronics of the Center for Advanced Microelectronics</p></bio><bio xml:lang="ru"><p>д-р техн. наук, проф., зам. руководителя, отделение проблем проектирования в микроэлектронике Центра перспективной микроэлектроники</p></bio><email>s_g_bob@mail.ru</email><xref ref-type="aff" rid="aff1"/></contrib><contrib contrib-type="author"><name-alternatives><name xml:lang="en"><surname>Zmejev</surname><given-names>D. N.</given-names></name><name xml:lang="ru"><surname>Змеев</surname><given-names>Д. Н.</given-names></name></name-alternatives><address><country country="RU">Russian Federation</country></address><bio xml:lang="en"><p>Researcher, Department for Design Problems in Microelectronics of the Center for Advanced Microelectronics</p></bio><bio xml:lang="ru"><p>науч. сотр., отделение проблем проектирования в микроэлектронике Центра перспективной микроэлектроники</p></bio><email>zmejevdn@list.ru</email><xref ref-type="aff" rid="aff1"/></contrib><contrib contrib-type="author"><name-alternatives><name xml:lang="en"><surname>Klimov</surname><given-names>A. V.</given-names></name><name xml:lang="ru"><surname>Климов</surname><given-names>А. В.</given-names></name></name-alternatives><address><country country="RU">Russian Federation</country></address><bio xml:lang="en"><p>Senior Researcher, Department for Design Problems in Microelectronics of the Center for Advanced Microelectronics</p></bio><bio xml:lang="ru"><p>ст. науч. сотр., отделение проблем проектирования в микроэлектронике Центра перспективной микроэлектроники</p></bio><email>arkady.klimov@gmail.com</email><xref ref-type="aff" rid="aff1"/></contrib><contrib contrib-type="author"><name-alternatives><name xml:lang="en"><surname>Levchenko</surname><given-names>N. N.</given-names></name><name xml:lang="ru"><surname>Левченко</surname><given-names>Н. Н.</given-names></name></name-alternatives><address><country country="RU">Russian Federation</country></address><bio xml:lang="en"><p>PhD, Leading Researcher, Department for Design Problems in Microelectronics of the Center for Advanced Microelectronics</p></bio><bio xml:lang="ru"><p>канд. техн. наук, вед. науч. сотр., отделение проблем проектирования в микроэлектронике Центра перспективной микроэлектроники</p></bio><email>nick@burcom.ru</email><xref ref-type="aff" rid="aff1"/></contrib></contrib-group><aff-alternatives id="aff1"><aff><institution xml:lang="en">NRC "Kurchatov institute"</institution></aff><aff><institution xml:lang="ru">НИЦ "Курчатовский институт"</institution></aff></aff-alternatives><pub-date date-type="pub" iso-8601-date="2025-12-15" publication-format="electronic"><day>15</day><month>12</month><year>2025</year></pub-date><volume>31</volume><issue>12</issue><issue-title xml:lang="en"/><issue-title xml:lang="ru"/><fpage>649</fpage><lpage>658</lpage><history><date date-type="received" iso-8601-date="2026-02-02"><day>02</day><month>02</month><year>2026</year></date><date date-type="accepted" iso-8601-date="2026-02-02"><day>02</day><month>02</month><year>2026</year></date></history><permissions><copyright-statement xml:lang="en">Copyright ©; 2025, Informacionnye Tehnologii</copyright-statement><copyright-statement xml:lang="ru">Copyright ©; 2025, Информационные технологии</copyright-statement><copyright-year>2025</copyright-year><copyright-holder xml:lang="en">Informacionnye Tehnologii</copyright-holder><copyright-holder xml:lang="ru">Информационные технологии</copyright-holder></permissions><self-uri xlink:href="https://journals.eco-vector.com/1684-6400/article/view/702054">https://journals.eco-vector.com/1684-6400/article/view/702054</self-uri><abstract xml:lang="en"><p>The paper considers the problem of a drop in real performance with an increase in the number of computing cores on supercomputer systems. The results of the first three systems from the TOP500 List are analyzed. The main approaches to solving the problem of increasing real performance are given.</p> <p>A dataflow computing model with a dynamically formed context is considered. The architecture of a parallel dataflow computing system implementing this model is described. The model and architecture are one of the approaches to improving the real performance of computing systems. The principles of functioning of hardware ternary content-addressable memory, which implements the dataflow computing model in the most efficient way, are described. This is due to the fact that the concept of the computing model, such as a token workspace, involves the simultaneous comparison of an incoming token with all tokens present in this space. One of the key problems of content-addressable memory is analyzed — high power consumption when performing matching operations. Methods for optimizing the matching process are proposed, which are divided into three groups — hardware, software, and hardware-software. Optimization methods are aimed at overall reducing the number of "parasitic" comparisons, as well as reducing the number of compared bits. An analysis of its effectiveness was carried out for each method. One of the effective methods of reducing the number of matchings in the content-addressable memory of the keys of the matching processor of the parallel dataflow computing system is the use of special "Double grouped" tokens. These tokens allow not only to reduce the total number of task tokens, but also to reduce the load on the communication network, reduce the number of comparisons, and free up execution units by transferring part of the load to the matching processor.</p> <p>The research results obtained when performing various tasks on the behavioral block-register model of the system and the emulator are presented. The results demonstrate the effectiveness of the proposed methods.</p></abstract><trans-abstract xml:lang="ru"><p>Рассматривается один из подходов к повышению реальной производительности вычислительных систем на основе потоковой модели вычислений с динамически формируемым контекстом и реализующей ее архитектуры параллельной потоковой вычислительной системы. Описываются принципы функционирования аппаратной ассоциативной памяти, которая наиболее эффективно реализует данную модель вычислений. Кроме того, обсуждается одна из ключевых проблем ассоциативной памяти — высокое энергопотребление при выполнении операций сопоставления. Предлагаются методы оптимизации процесса сопоставлений, направленные на общее уменьшение числа "лишних" сопоставлений, а также уменьшение числа сопоставляемых битов, участвующих в процессе сопоставления токенов. Приведены результаты исследований, полученные при выполнении различных программ на поведенческой блочно-регистровой модели системы и эмуляторе, демонстрирующие эффективность предложенных методов.</p></trans-abstract><kwd-group xml:lang="en"><kwd>content-addressable memory</kwd><kwd>parallel dataflow computing system</kwd><kwd>dataflow computing model</kwd><kwd>matching process</kwd></kwd-group><kwd-group xml:lang="ru"><kwd>ассоциативная память</kwd><kwd>параллельная потоковая вычислительная система</kwd><kwd>потоковая модель вычислений</kwd><kwd>процесс сопоставлений</kwd></kwd-group><funding-group><award-group><funding-source><institution-wrap><institution xml:lang="ru">Правительство РФ</institution></institution-wrap><institution-wrap><institution xml:lang="en">Government of the Russian Federation</institution></institution-wrap></funding-source></award-group><funding-statement xml:lang="en">The work was carried out within the state assignment of NRC "Kurchatov institute".</funding-statement><funding-statement xml:lang="ru">Работа проведена в рамках выполнения государственного задания НИЦ "Курчатовский институт"</funding-statement></funding-group></article-meta></front><body></body><back><ref-list><ref id="B1"><label>1.</label><citation-alternatives><mixed-citation xml:lang="en">Kokosinski Z., Malus B. FPGA implementations of a parallel associative processor with multi-comparand multi-search operations, in International Symposium on Parallel and Distributed Computing 2008, 1-5 July 2008, Krakow, Poland, pp. 444—448, DOI: 10.1109/ISPDC.2008.42.</mixed-citation><mixed-citation xml:lang="ru">Kokosinski Z., Malus B. FPGA implementations of a parallel associative processor with multi-comparand multi-search operations // In International Symposium on Parallel and Distributed Computing 2008. 1—5 July 2008. Krakow, Poland. P. 444—448. DOI: 10.1109/ISPDC.2008.42.</mixed-citation></citation-alternatives></ref><ref id="B2"><label>2.</label><citation-alternatives><mixed-citation xml:lang="en">Levin I. I., Dordopulo A. I., Kaljaev I. A., Doronchen- ko Ju. I., Raskladkin M. K. Modern and next-generation high- performance computer systems with reconfigurable architecture, Vestn. JuUrGU. Ser. Vych. matem. Inform, 2015б vol. 4, no. 3, pp. 24—39, DOI: 10.14529/cmse150303 (in Russian).</mixed-citation><mixed-citation xml:lang="ru">Левин И. И., Дордопуло А. И., Каляев И. А., Дорончен- ко Ю. И., Раскладкин М. К. Современные и перспективные высокопроизводительные вычислительные системы с реконфигурируемой архитектурой // Вестн. ЮУрГУ. Сер. Выч. матем. информ. 2015. Т. 4, № 3. С. 24—39. DOI: 10.14529/cmse150303.</mixed-citation></citation-alternatives></ref><ref id="B3"><label>3.</label><citation-alternatives><mixed-citation xml:lang="en">Cicconetti C. А practical introduction to quantum computing and networking, in proceedings of the 33rd International Symposium on High-Performance Parallel and Distributed Computing (HPDC ‘24), Association for Computing Machinery, New York, NY, USA, 2024, pp. 348—349, DOI: 10.1145/3625549.3660507.</mixed-citation><mixed-citation xml:lang="ru">Cicconetti C. А practical introduction to quantum computing and networking // Proceedings of the 33rd International Symposium on High-Performance Parallel and Distributed Computing (HPDC ‘24). Association for Computing Machinery. New York, NY, USA. 2024. P. 348—349. DOI: 10.1145/3625549.3660507.</mixed-citation></citation-alternatives></ref><ref id="B4"><label>4.</label><citation-alternatives><mixed-citation xml:lang="en">Abdeldayem H., Frazier D. O. Optical computing: need and challenge, Communications of the ACM, 01 September 2007, vol. 50, issue 9, pp. 60—62, DOI: 10.1145/1284621.1284649.</mixed-citation><mixed-citation xml:lang="ru">Abdeldayem H., Frazier D. O. Optical computing: need and challenge // Communications of the ACM. 01 September 2007. Vol. 50, Iss. 9. P. 60—62. DOI: 10.1145/1284621.1284649.</mixed-citation></citation-alternatives></ref><ref id="B5"><label>5.</label><citation-alternatives><mixed-citation xml:lang="en">Burcev В. C. About the need to create a supercomputer in Russia, Cbornik statej "Parallelizm vychislitel’nyh processov i razvitie arhitektury superJeVM", Moscow, IVVS RA, 1997 (in Russian).</mixed-citation><mixed-citation xml:lang="ru">Бурцев B. C. О необходимости создания суперЭВМ в России // Сборник статей "Параллелизм вычислительных процессов и развитие архитектуры суперЭВМ". М.: ИВВС РАН, 1997.</mixed-citation></citation-alternatives></ref><ref id="B6"><label>6.</label><citation-alternatives><mixed-citation xml:lang="en">Smith K. C., Sedra А. S. Associative memory, Encyclopedia of Computer Science, John Wiley and Sons Ltd., GBR, 2003, pp. 105—106.</mixed-citation><mixed-citation xml:lang="ru">Smith K. C., Sedra А. S. Associative memory // Encyclopedia of Computer Science. GBR: John Wiley and Sons Ltd., 2003. P. 105—106.</mixed-citation></citation-alternatives></ref><ref id="B7"><label>7.</label><citation-alternatives><mixed-citation xml:lang="en">Bohm A. P. W. Dataflow and hybrid dataflow architecture summary, Parallel computer systems, Rebecca Koskela and Margaret Simmons (Eds.), New York, NY, USA, ACM, 1990, pp. 281—286.</mixed-citation><mixed-citation xml:lang="ru">Bohm A. P. W. Dataflow and hybrid dataflow architecture summary // Parallel computer systems. Rebecca Koskela and Margaret Simmons (Eds.). New York, NY, USA: ACM, 1990. P. 281—286.</mixed-citation></citation-alternatives></ref><ref id="B8"><label>8.</label><citation-alternatives><mixed-citation xml:lang="en">Arvind A., Brobst S. The evolution of dataflow architectures: from static dataflow to P-RISC, International Journal of High Speed Computing, 1993, vol. 5, no. 2, pp. 125—153.</mixed-citation><mixed-citation xml:lang="ru">Arvind A., Brobst S. The evolution of dataflow architectures: from static dataflow to P-RISC // International Journal of High Speed Computing. 1993. Vol. 5, N. 2. P. 125—153.</mixed-citation></citation-alternatives></ref><ref id="B9"><label>9.</label><citation-alternatives><mixed-citation xml:lang="en">Lee B., Hurson А. R. Dataflow Architectures and Multithreading, Computer, Aug 1994, vol. 27, no. 8, pp. 27—39.</mixed-citation><mixed-citation xml:lang="ru">Lee B., Hurson А. R. Dataflow Architectures and Multithreading // Computer. Aug 1994. Vol. 27, N. 8. P. 27—39.</mixed-citation></citation-alternatives></ref><ref id="B10"><label>10.</label><citation-alternatives><mixed-citation xml:lang="en">Silc J., Robic B., Ungerer T. Asynchrony in parallel computing: From dataflow to multithreading, Parallel and Distributed Computing Practices, 1998, vol. 1, no. 1, pp. 3—30.</mixed-citation><mixed-citation xml:lang="ru">Silc J., Robic B., Ungerer T. Asynchrony in parallel computing: From dataflow to multithreading // Parallel and Distributed Computing Practices. 1998. Vol. 1, N. 1. P. 3—30.</mixed-citation></citation-alternatives></ref><ref id="B11"><label>11.</label><citation-alternatives><mixed-citation xml:lang="en">Zmeev D. N., Klimov A. V., Levchenko N. N., Okunev A. S., Stempkovskii А. L. Features of the architecture implementing the dataflow computational model and its application in the creation of microelectronic high-performance computing systems, Russian Microelectronics, 2019, vol. 48, no. 5, pp. 292—298.</mixed-citation><mixed-citation xml:lang="ru">Zmeev D. N., Klimov A. V., Levchenko N. N., Okunev A. S., Stempkovskii А. L. Features of the architecture implementing the dataflow computational model and its application in the creation of microelectronic high-performance computing systems // Russian Microelectronics. 2019. Vol. 48, N. 5. P. 292—298.</mixed-citation></citation-alternatives></ref><ref id="B12"><label>12.</label><citation-alternatives><mixed-citation xml:lang="en">Stempkovskij A. L., Levchenko N. N., Okunev A. S., Cvetkov V. V. Parallel stream computing system — further development of architecture and structural organization of computing system with automatic resource allocation, Informacionnye Tehnologii, 2008, no. 10, pp. 2—7 (in Russian).</mixed-citation><mixed-citation xml:lang="ru">Стемпковский А. Л., Левченко Н. Н., Окунев А. С., Цветков В. В. Параллельная потоковая вычислительная система — дальнейшее развитие архитектуры и структурной организации вычислительной системы с автоматическим распределением ресурсов // Информационные технологии. 2008. № 10. С. 2—7.</mixed-citation></citation-alternatives></ref><ref id="B13"><label>13.</label><citation-alternatives><mixed-citation xml:lang="en">Zmeev D. N. Design tools of high-performance dataflow computing systems, Problemy razrabotki perspektivnyh mikro- i nanojelektronnyh sistem - 2016. Sbornik trudov, А. L. Stempkovskii ed., Moscow, IPPM RAN, 2016, part II, pp. 159—163 (in Russian).</mixed-citation><mixed-citation xml:lang="ru">Змеев Д. Н. Средства проектирования высокопроизводительных потоковых вычислительных систем // Проблемы разработки перспективных микро- и наноэлектронных систем — 2016. Сб. тр. под общ. ред. академика РАН А. Л. Стемпковского. М.: ИППМ РАН. 2016. Часть II. С. 159—163.</mixed-citation></citation-alternatives></ref><ref id="B14"><label>14.</label><citation-alternatives><mixed-citation xml:lang="en">Levchenko N. N., Okunev A. S., Zmejev D. N. Development tools for high-performance computing systems using associative environment for computing process organization, in Proceedings of IEEE EAST-WEST DESIGN &amp; TEST SYMPOSIUM (EWDTS’2016), Yerevan, Armenia, 2016, October 14—17, pp. 359 —362.</mixed-citation><mixed-citation xml:lang="ru">Levchenko N. N., Okunev A. S., Zmejev D. N. Development tools for high-performance computing systems using associative environment for computing process organization // Proceedings of IEEE EAST-WEST DESIGN &amp; TEST SYMPOSIUM (EWDTS’2016). Yerevan, Armenia, October 14—17. 2016. P. 359—362.</mixed-citation></citation-alternatives></ref><ref id="B15"><label>15.</label><citation-alternatives><mixed-citation xml:lang="en">Soleimani P., Capson D. W., Li K. F. А partitioned CAM architecture with FPGA acceleration for binary descriptor matching, ACM Transactions on Reconfigurable Technology and Systems, March 2024, vol. 17, no. 1, article 10, pp. 1—21, DOI: 10.1145/3624749.</mixed-citation><mixed-citation xml:lang="ru">Soleimani P., Capson D. W., Li K. F. А partitioned CAM architecture with FPGA acceleration for binary descriptor matching // ACM Transactions on Reconfigurable Technology and Systems. March 2024. Vol. 17, N. 1. Article 10. P. 1—21. DOI: 10.1145/3624749.</mixed-citation></citation-alternatives></ref></ref-list></back></article>
