<?xml version="1.0" encoding="UTF-8"?>
<!DOCTYPE root>
<article xmlns:mml="http://www.w3.org/1998/Math/MathML" xmlns:xlink="http://www.w3.org/1999/xlink" xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance" xmlns:ali="http://www.niso.org/schemas/ali/1.0/" article-type="research-article" dtd-version="1.2" xml:lang="en"><front><journal-meta><journal-id journal-id-type="publisher-id">Computational nanotechnology</journal-id><journal-title-group><journal-title xml:lang="en">Computational nanotechnology</journal-title><trans-title-group xml:lang="ru"><trans-title>Computational nanotechnology</trans-title></trans-title-group></journal-title-group><issn publication-format="print">2313-223X</issn><issn publication-format="electronic">2587-9693</issn><publisher><publisher-name xml:lang="en">YUR-VAK</publisher-name></publisher></journal-meta><article-meta><article-id pub-id-type="publisher-id">380199</article-id><article-id pub-id-type="doi">10.33693/2313-223X-2025-12-4-187-194</article-id><article-id pub-id-type="edn">GSYBAH</article-id><article-categories><subj-group subj-group-type="toc-heading" xml:lang="en"><subject>INFORMATICS AND INFORMATION PROCESSING</subject></subj-group><subj-group subj-group-type="toc-heading" xml:lang="ru"><subject>ИНФОРМАТИКА И ИНФОРМАЦИОННЫЕ ПРОЦЕССЫ</subject></subj-group><subj-group subj-group-type="article-type"><subject>Research Article</subject></subj-group></article-categories><title-group><article-title xml:lang="en">Analysis of storage formats for multidimensional data models in the context of multidimensional cubes</article-title><trans-title-group xml:lang="ru"><trans-title>Анализ форматов хранения многомерных моделей данных в контексте многомерных кубов</trans-title></trans-title-group></title-group><contrib-group><contrib contrib-type="author"><contrib-id contrib-id-type="orcid">https://orcid.org/0009-0006-3090-7473</contrib-id><contrib-id contrib-id-type="spin">8207-1550</contrib-id><name-alternatives><name xml:lang="en"><surname>Frolov</surname><given-names>Vladimir A.</given-names></name><name xml:lang="ru"><surname>Фролов</surname><given-names>Владимир Андреевич</given-names></name></name-alternatives><address><country country="RU">Russian Federation</country></address><bio xml:lang="en"><p>postgraduate student, Department of Information Processing and Control Systems</p></bio><bio xml:lang="ru"><p>аспирант, кафедра «Системы обработки информации и управления»</p></bio><email>vladimir.frolov.99@mail.ru</email><xref ref-type="aff" rid="aff1"/></contrib><contrib contrib-type="author"><contrib-id contrib-id-type="orcid">https://orcid.org/0000-0002-0596-4955</contrib-id><contrib-id contrib-id-type="scopus">4036</contrib-id><contrib-id contrib-id-type="spin">6631-0932</contrib-id><name-alternatives><name xml:lang="en"><surname>Khayrullin</surname><given-names>Rustam Z.</given-names></name><name xml:lang="ru"><surname>Хайруллин</surname><given-names>Рустам Зиннатуллович</given-names></name></name-alternatives><address><country country="RU">Russian Federation</country></address><bio xml:lang="en"><p>Dr. Sci. (Phys.-Math.), Senior Researcher, Professor</p></bio><bio xml:lang="ru"><p>доктор физико-математических наук, старший научный сотрудник, профессор</p></bio><email>zrkzrk@list.ru</email><xref ref-type="aff" rid="aff1"/></contrib><contrib contrib-type="author"><contrib-id contrib-id-type="spin">7790-1645</contrib-id><name-alternatives><name xml:lang="en"><surname>Afanasyev</surname><given-names>Gennady I.</given-names></name><name xml:lang="ru"><surname>Афанасьев</surname><given-names>Геннадий Иванович</given-names></name></name-alternatives><address><country country="RU">Russian Federation</country></address><bio xml:lang="en"><p>Cand. Sci. (Eng.), Associate Professor</p></bio><bio xml:lang="ru"><p>кандидат технических наук, доцент</p></bio><email>gaipcs@bmstu.ru</email><xref ref-type="aff" rid="aff1"/></contrib></contrib-group><aff-alternatives id="aff1"><aff><institution xml:lang="en">Bauman Moscow State Technical University</institution></aff><aff><institution xml:lang="ru">Московский государственный технический университет имени Н.Э. Баумана</institution></aff></aff-alternatives><pub-date date-type="pub" iso-8601-date="2025-12-12" publication-format="electronic"><day>12</day><month>12</month><year>2025</year></pub-date><volume>12</volume><issue>4</issue><issue-title xml:lang="en">Computational nanotechnology</issue-title><issue-title xml:lang="ru">Computational nanotechnology</issue-title><fpage>187</fpage><lpage>194</lpage><history><date date-type="received" iso-8601-date="2026-02-02"><day>02</day><month>02</month><year>2026</year></date></history><permissions><copyright-statement xml:lang="en">Copyright ©; 2025, Yur-VAK</copyright-statement><copyright-statement xml:lang="ru">Copyright ©; 2025, Юр-ВАК</copyright-statement><copyright-year>2025</copyright-year><copyright-holder xml:lang="en">Yur-VAK</copyright-holder><copyright-holder xml:lang="ru">Юр-ВАК</copyright-holder><license><ali:license_ref xmlns:ali="http://www.niso.org/schemas/ali/1.0/">https://www.urvak.ru/contacts/</ali:license_ref></license></permissions><self-uri xlink:href="https://journals.rcsi.science/2313-223X/article/view/380199">https://journals.rcsi.science/2313-223X/article/view/380199</self-uri><abstract xml:lang="en"><p>The<bold> </bold>article considers the issues of efficient storage of multidimensional data models in the context of modern analytical systems. Particular attention is paid to the architecture of multidimensional cubes, which involve storing aggregated facts at the intersection of many dimensions. A review of modern data storage formats is provided – Parquet, ORC, Iceberg, Delta Lake, Hudi – from the standpoint of their applicability to multidimensional analytics tasks. It is shown that existing solutions are focused mainly on tabular structures and do not provide full support for multidimensional relationships, hierarchies and aggregations. The difficulties of integration between different storage formats and the lack of a unified approach to describing metadata are analyzed. Based on the identified limitations, design tasks facing the multidimensional cube storage format are formulated. A conceptual storage model is proposed that combines the principles of relational and multidimensional data organization. The multidimensional model is a table of facts, dimensions, as well as a metadata level and an API interface.</p></abstract><trans-abstract xml:lang="ru"><p>В статье рассматриваются вопросы эффективного хранения многомерных моделей данных в контексте современных аналитических систем. Особое внимание уделяется архитектуре многомерных кубов, которые предполагают хранение агрегированных фактов на пересечении множества измерений. Проведен обзор современных форматов хранения данных – Parquet, ORC, Iceberg, Delta Lake, Hudi – с позиции их применимости к задачам многомерной аналитики. Показано, что существующие решения ориентированы преимущественно на табличные структуры и не обеспечивают полноценной поддержки многомерных взаимосвязей, иерархий и агрегаций. Анализируются сложности интеграции между различными форматами хранения и отсутствие унифицированного подхода к описанию метаданных. На основе выявленных ограничений сформулированы проектные задачи, стоящие перед форматом хранения многомерных кубов. Предложена концептуальная модель хранения, сочетающая принципы реляционной и многомерной организации данных. Многомерная модель представляет собой таблицы фактов, измерений, а также уровень метаданных и API-интерфейс.</p></trans-abstract><kwd-group xml:lang="en"><kwd>multidimensional cubes</kwd><kwd>OLAP systems</kwd><kwd>data storage model</kwd><kwd>metadata</kwd><kwd>integration</kwd><kwd>data cube</kwd></kwd-group><kwd-group xml:lang="ru"><kwd>многомерные кубы</kwd><kwd>OLAP-системы</kwd><kwd>модель хранения данных</kwd><kwd>метаданные</kwd><kwd>интеграция</kwd><kwd>куб данных</kwd></kwd-group></article-meta></front><body></body><back><ref-list><ref id="B1"><label>1.</label><mixed-citation>Agrawal R., Gupta A., Sarawagi S. Modeling multidimensional databases. In: IBM research report. IBM Almaden Research Center, 1995. Pp. 1–17.</mixed-citation></ref><ref id="B2"><label>2.</label><mixed-citation>Arnas D., Rodríguez M. Range searching in multidimensional databases using navigation metadata. Applied Mathematics and Computation. 2020. Pp. 1–8. DOI: 10.1016/j.amc.2020.125510.</mixed-citation></ref><ref id="B3"><label>3.</label><mixed-citation>Basani M., Kandi A. Optimizing Cloud Data Storage: Evaluating File Formats for Efficient Data Warehousing. International Journal for Research in Applied Science &amp; Engineering Technology. 2024. Pp. 922–930. DOI: 10.22214/ijraset.2024.64753.</mixed-citation></ref><ref id="B4"><label>4.</label><mixed-citation>Boukraâ D., Latreche O. Self-service, on-demand construction of OLAP cubes from data lakes: Application to Twitter. ResearchGate. 2020. Pp. 1–10. DOI: 10.13140/RG.2.2.29163.36646.</mixed-citation></ref><ref id="B5"><label>5.</label><mixed-citation>Djiroun R., Boukhalfa K., Alimazighi Z. Data cubes retrieval and design in OLAP systems: From query analysis to visualization tool. Int. J. Business Intelligence and Data Mining. 2019. Vol. 14. No. 1/2. Pp. 267–270. DOI: 10.1504/IJBIDM.2019.096813.</mixed-citation></ref><ref id="B6"><label>6.</label><mixed-citation>Djiroun R., Boukhalfa K., Alimazighi Z. Designing data cubes in OLAP systems: A decision makers’ requirements-based approach. Cluster Computing. 2018. Pp. 1–14. DOI: 10.1007/s10586-018-2883-7.</mixed-citation></ref><ref id="B7"><label>7.</label><mixed-citation>Etcheverry L., Vaisman A.A. Enhancing OLAP analysis with Web cubes. LNCS. 2012. Vol. 7295. Pp. 469–482. DOI: 10.1007/978-3-642-30284-8_38.</mixed-citation></ref><ref id="B8"><label>8.</label><mixed-citation>Fan J., Han F., Liu H. Challenges of Big Data analysis. National Science Review. 2014. Vol. 1. No. 2. Pp. 293–299. DOI: 10.1093/nsr/nwt032.</mixed-citation></ref><ref id="B9"><label>9.</label><mixed-citation>Gray J., Bosworth A., Layman A., Pirahesh H. Data cube: A relational aggregation operator generalizing Group-By, Cross-Tab, and Sub-Totals. Proceedings of ICDE. 1996. Pp. 152–159.</mixed-citation></ref><ref id="B10"><label>10.</label><mixed-citation>Gyssens M., Lakshmanan L.V.S. A Foundation for multi-dimensional databases. In: Proceedings of the 23rd International Conference on Very Large Data Bases VLDB’97. 1997. Pp. 1–10.</mixed-citation></ref><ref id="B11"><label>11.</label><mixed-citation>Haelen B., Davis D. Delta lake: Up and running. O’Relly Media, 2023. Pp. 26–44.</mixed-citation></ref><ref id="B12"><label>12.</label><mixed-citation>Kuznetsov S.D., Kudryavtsev Yu.A. A mathematical model of the OLAP cubes. Programming and Computer Software. 2009. Vol. 35. No. 5. Pp. 257–265. DOI: 10.1134/S0361768809050028.</mixed-citation></ref><ref id="B13"><label>13.</label><mixed-citation>Letrache K., El Beggar O., Ramdani M. The automatic creation of OLAP cube using an MDA approach. In: Software: Practice and experience. 2017. Pp. 3–14. DOI: 10.1002/spe.2512.</mixed-citation></ref><ref id="B14"><label>14.</label><mixed-citation>Nanda N., Gupta S., Vijrania M. A comprehensive survey of OLAP: Recent trends. In: Proceedings of the Third International Conference on Electronics Communication and Aerospace Technology ICECA 2019. IEEE, 2019. Pp. 425–427. DOI: 10.1109/ICECA.2019.8822203.</mixed-citation></ref><ref id="B15"><label>15.</label><mixed-citation>Ron C., L’Esteve. Delta lake. In: The deinitive guide to azure data engineering. 2021. Pp. 293–295. DOI: 10.1007/978-1-4842-7182-7_15.</mixed-citation></ref><ref id="B16"><label>16.</label><mixed-citation>Saha D. Disruptor in data engineering – comprehensive review of apache iceberg. SSRN preprint. 2024. No. 4987315. Pp. 5–11. DOI: 10.2139/ssrn.4987315.</mixed-citation></ref><ref id="B17"><label>17.</label><mixed-citation>Vassiliadis P. A cube algebra with comparative operations: Containment, overlap, distance, and usability. arXiv.org. 2023. Pp. 2–58. DOI: 10.48550/arXiv.2203.09390v2.</mixed-citation></ref><ref id="B18"><label>18.</label><mixed-citation>Vassiliadis P. Modeling multidimensional databases, cubes, and cube operations. Proceedings of SSDM. 1998. Pp. 1–9. DOI: 10.1109/SSDM.1998.688111.</mixed-citation></ref><ref id="B19"><label>19.</label><mixed-citation>Vohra D. Apache parquet. In: Practical Hadoop ecosystem. Berkeley, CA: Apress, 2016. Pp. 325–328. DOI: 10.1007/978-1-4842-2199-0_8.</mixed-citation></ref><ref id="B20"><label>20.</label><mixed-citation>Wang Z., Chu Y., Tan K.-L. et al. Scalable data cube analysis over big data. arXiv.org. 2013. Pp. 1–12. DOI: 10.13140/RG.2.2.35874.25282.</mixed-citation></ref><ref id="B21"><label>21.</label><mixed-citation>Tennick A. Practical MDX queries: For Microsoft SQL server analysis services 2008. McGraw-Hill Education Group. 2010. Pp. 5–25.</mixed-citation></ref><ref id="B22"><label>22.</label><mixed-citation>Piasevoli T., Li S. MDX with Microsoft SQL Server 2016 Analysis Services Cookbook. 3rd ed. Packt Publishing, 2016. Pp. 401–440.</mixed-citation></ref></ref-list></back></article>
