From 745dff97de117ab3a84e5bd111281deb74477859 Mon Sep 17 00:00:00 2001 From: Xinyi Zou Date: Mon, 9 Dec 2024 14:52:52 +0800 Subject: [PATCH] [fix](memory) Fix init segment map check memory exceeds limit (#44092) ### What problem does this PR solve? Problem Summary: `RowIdConversion::init_segment_map` may use a lot of memory in compaction. however, this part of memory is not controlled, the process may OOM crash. If process has less than 10M available memory before generating `rowid_map` for each segment in `init_segment_map`, it will terminate. ![image](https://github.com/user-attachments/assets/652fadc9-bca0-4edd-a03e-04f2546cdf76) --- be/src/olap/rowid_conversion.h | 30 +++++++++++++++-------- be/src/olap/rowset/beta_rowset_reader.cpp | 3 ++- be/test/olap/rowid_conversion_test.cpp | 6 +++-- 3 files changed, 26 insertions(+), 13 deletions(-) diff --git a/be/src/olap/rowid_conversion.h b/be/src/olap/rowid_conversion.h index 01a2cea0d5e308..8f9d96a136aab4 100644 --- a/be/src/olap/rowid_conversion.h +++ b/be/src/olap/rowid_conversion.h @@ -37,21 +37,33 @@ class RowIdConversion { ~RowIdConversion() { RELEASE_THREAD_MEM_TRACKER(_seg_rowid_map_mem_used); } // resize segment rowid map to its rows num - void init_segment_map(const RowsetId& src_rowset_id, const std::vector& num_rows) { - size_t delta_std_pair_cap = 0; + Status init_segment_map(const RowsetId& src_rowset_id, const std::vector& num_rows) { for (size_t i = 0; i < num_rows.size(); i++) { + constexpr size_t RESERVED_MEMORY = 10 * 1024 * 1024; // 10M + if (doris::GlobalMemoryArbitrator::is_exceed_hard_mem_limit(RESERVED_MEMORY)) { + return Status::MemoryLimitExceeded(fmt::format( + "RowIdConversion init_segment_map failed, memory exceed limit, {}, " + "consuming " + "tracker:<{}>, peak used {}, current used {}.", + doris::GlobalMemoryArbitrator::process_limit_exceeded_errmsg_str(), + doris::thread_context()->thread_mem_tracker()->label(), + doris::thread_context()->thread_mem_tracker()->peak_consumption(), + doris::thread_context()->thread_mem_tracker()->consumption())); + } + uint32_t id = _segments_rowid_map.size(); _segment_to_id_map.emplace(std::pair {src_rowset_id, i}, id); _id_to_segment_map.emplace_back(src_rowset_id, i); std::vector> vec( num_rows[i], std::pair(UINT32_MAX, UINT32_MAX)); - delta_std_pair_cap += vec.capacity(); + + //NOTE: manually count _segments_rowid_map's memory here, because _segments_rowid_map could be used by indexCompaction. + // indexCompaction is a thridparty code, it's too complex to modify it. + // refer compact_column. + track_mem_usage(vec.capacity()); _segments_rowid_map.emplace_back(std::move(vec)); } - //NOTE: manually count _segments_rowid_map's memory here, because _segments_rowid_map could be used by indexCompaction. - // indexCompaction is a thridparty code, it's too complex to modify it. - // refer compact_column. - track_mem_usage(delta_std_pair_cap); + return Status::OK(); } // set dst rowset id @@ -124,9 +136,7 @@ class RowIdConversion { size_t new_size = _std_pair_cap * sizeof(std::pair) + _segments_rowid_map.capacity() * sizeof(std::vector>); - - RELEASE_THREAD_MEM_TRACKER(_seg_rowid_map_mem_used); - CONSUME_THREAD_MEM_TRACKER(new_size); + CONSUME_THREAD_MEM_TRACKER(new_size - _seg_rowid_map_mem_used); _seg_rowid_map_mem_used = new_size; } diff --git a/be/src/olap/rowset/beta_rowset_reader.cpp b/be/src/olap/rowset/beta_rowset_reader.cpp index e8923522f2e5b3..13bf1f6d8c84ae 100644 --- a/be/src/olap/rowset/beta_rowset_reader.cpp +++ b/be/src/olap/rowset/beta_rowset_reader.cpp @@ -220,7 +220,8 @@ Status BetaRowsetReader::get_segment_iterators(RowsetReaderContext* read_context // init segment rowid map for rowid conversion std::vector segment_num_rows; RETURN_IF_ERROR(get_segment_num_rows(&segment_num_rows)); - _read_context->rowid_conversion->init_segment_map(rowset()->rowset_id(), segment_num_rows); + RETURN_IF_ERROR(_read_context->rowid_conversion->init_segment_map(rowset()->rowset_id(), + segment_num_rows)); } auto [seg_start, seg_end] = _segment_offsets; diff --git a/be/test/olap/rowid_conversion_test.cpp b/be/test/olap/rowid_conversion_test.cpp index a9c966acf369ac..8f933eccbd3848 100644 --- a/be/test/olap/rowid_conversion_test.cpp +++ b/be/test/olap/rowid_conversion_test.cpp @@ -495,10 +495,12 @@ TEST_F(TestRowIdConversion, Basic) { RowIdConversion rowid_conversion; src_rowset.init(0); std::vector rs0_segment_num_rows = {4, 3}; - rowid_conversion.init_segment_map(src_rowset, rs0_segment_num_rows); + auto st = rowid_conversion.init_segment_map(src_rowset, rs0_segment_num_rows); + EXPECT_EQ(st.ok(), true); src_rowset.init(1); std::vector rs1_segment_num_rows = {4}; - rowid_conversion.init_segment_map(src_rowset, rs1_segment_num_rows); + st = rowid_conversion.init_segment_map(src_rowset, rs1_segment_num_rows); + EXPECT_EQ(st.ok(), true); rowid_conversion.set_dst_rowset_id(dst_rowset); std::vector dst_segment_num_rows = {4, 3, 4};