/* * Copyright (C) 2017 The Android Open Source Project * * Licensed under the Apache License, Version 2.0 (the "License"); * you may not use this file except in compliance with the License. * You may obtain a copy of the License at * * http://www.apache.org/licenses/LICENSE-2.0 * * Unless required by applicable law or agreed to in writing, software * distributed under the License is distributed on an "AS IS" BASIS, * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. * See the License for the specific language governing permissions and * limitations under the License. */ #include "otautil/rangeset.h" #include #include #include #include #include #include #include #include #include #include RangeSet::RangeSet(std::vector&& pairs) { blocks_ = 0; if (pairs.empty()) { LOG(ERROR) << "Invalid number of tokens"; return; } for (const auto& range : pairs) { if (!PushBack(range)) { Clear(); return; } } } RangeSet RangeSet::Parse(const std::string& range_text) { std::vector pieces = android::base::Split(range_text, ","); if (pieces.size() < 3) { LOG(ERROR) << "Invalid range text: " << range_text; return {}; } size_t num; if (!android::base::ParseUint(pieces[0], &num, static_cast(INT_MAX))) { LOG(ERROR) << "Failed to parse the number of tokens: " << range_text; return {}; } if (num == 0) { LOG(ERROR) << "Invalid number of tokens: " << range_text; return {}; } if (num % 2 != 0) { LOG(ERROR) << "Number of tokens must be even: " << range_text; return {}; } if (num != pieces.size() - 1) { LOG(ERROR) << "Mismatching number of tokens: " << range_text; return {}; } std::vector pairs; for (size_t i = 0; i < num; i += 2) { size_t first; size_t second; if (!android::base::ParseUint(pieces[i + 1], &first, static_cast(INT_MAX)) || !android::base::ParseUint(pieces[i + 2], &second, static_cast(INT_MAX))) { return {}; } pairs.emplace_back(first, second); } return RangeSet(std::move(pairs)); } bool RangeSet::PushBack(Range range) { if (range.first >= range.second) { LOG(ERROR) << "Empty or negative range: " << range.first << ", " << range.second; return false; } size_t sz = range.second - range.first; if (blocks_ >= SIZE_MAX - sz) { LOG(ERROR) << "RangeSet size overflow"; return false; } ranges_.push_back(std::move(range)); blocks_ += sz; return true; } void RangeSet::Clear() { ranges_.clear(); blocks_ = 0; } std::vector RangeSet::Split(size_t groups) const { if (ranges_.empty() || groups == 0) return {}; if (blocks_ < groups) { groups = blocks_; } // Evenly distribute blocks, with the first few groups possibly containing one more. size_t mean = blocks_ / groups; std::vector blocks_per_group(groups, mean); std::fill_n(blocks_per_group.begin(), blocks_ % groups, mean + 1); std::vector result; // Forward iterate Ranges and fill up each group with the desired number of blocks. auto it = ranges_.cbegin(); Range range = *it; for (const auto& blocks : blocks_per_group) { RangeSet buffer; size_t needed = blocks; while (needed > 0) { size_t range_blocks = range.second - range.first; if (range_blocks > needed) { // Split the current range and don't advance the iterator. buffer.PushBack({ range.first, range.first + needed }); range.first = range.first + needed; break; } buffer.PushBack(range); it++; if (it != ranges_.cend()) { range = *it; } needed -= range_blocks; } result.push_back(std::move(buffer)); } return result; } std::string RangeSet::ToString() const { if (ranges_.empty()) { return ""; } std::string result = std::to_string(ranges_.size() * 2); for (const auto& [begin, end] : ranges_) { result += android::base::StringPrintf(",%zu,%zu", begin, end); } return result; } // Get the block number for the i-th (starting from 0) block in the RangeSet. size_t RangeSet::GetBlockNumber(size_t idx) const { CHECK_LT(idx, blocks_) << "Out of bound index " << idx << " (total blocks: " << blocks_ << ")"; for (const auto& [begin, end] : ranges_) { if (idx < end - begin) { return begin + idx; } idx -= (end - begin); } CHECK(false) << "Failed to find block number for index " << idx; return 0; // Unreachable, but to make compiler happy. } // RangeSet has half-closed half-open bounds. For example, "3,5" contains blocks 3 and 4. So "3,5" // and "5,7" are not overlapped. bool RangeSet::Overlaps(const RangeSet& other) const { for (const auto& [begin, end] : ranges_) { for (const auto& [other_begin, other_end] : other.ranges_) { // [begin, end) vs [other_begin, other_end) if (!(other_begin >= end || begin >= other_end)) { return true; } } } return false; } std::optional RangeSet::GetSubRanges(size_t start_index, size_t num_of_blocks) const { size_t end_index = start_index + num_of_blocks; // The index of final block to read plus one if (start_index > end_index || end_index > blocks_) { LOG(ERROR) << "Failed to get the sub ranges for start_index " << start_index << " num_of_blocks " << num_of_blocks << " total number of blocks the range contains is " << blocks_; return std::nullopt; } if (num_of_blocks == 0) { LOG(WARNING) << "num_of_blocks is zero when calling GetSubRanges()"; return RangeSet(); } RangeSet result; size_t current_index = 0; for (const auto& [range_start, range_end] : ranges_) { CHECK_LT(range_start, range_end); size_t blocks_in_range = range_end - range_start; // Linear search to skip the ranges until we reach start_block. if (current_index + blocks_in_range <= start_index) { current_index += blocks_in_range; continue; } size_t trimmed_range_start = range_start; // We have found the first block range to read, trim the heading blocks. if (current_index < start_index) { trimmed_range_start += start_index - current_index; } // Trim the trailing blocks if the last range has more blocks than desired; also return the // result. if (current_index + blocks_in_range >= end_index) { size_t trimmed_range_end = range_end - (current_index + blocks_in_range - end_index); if (!result.PushBack({ trimmed_range_start, trimmed_range_end })) { return std::nullopt; } return result; } if (!result.PushBack({ trimmed_range_start, range_end })) { return std::nullopt; } current_index += blocks_in_range; } LOG(ERROR) << "Failed to construct byte ranges to read, start_block: " << start_index << ", num_of_blocks: " << num_of_blocks << " total number of blocks: " << blocks_; return std::nullopt; } // Ranges in the the set should be mutually exclusive; and they're sorted by the start block. SortedRangeSet::SortedRangeSet(std::vector&& pairs) : RangeSet(std::move(pairs)) { std::sort(ranges_.begin(), ranges_.end()); } void SortedRangeSet::Insert(const Range& to_insert) { SortedRangeSet rs({ to_insert }); Insert(rs); } // Insert the input SortedRangeSet; keep the ranges sorted and merge the overlap ranges. void SortedRangeSet::Insert(const SortedRangeSet& rs) { if (rs.size() == 0) { return; } // Merge and sort the two RangeSets. std::vector temp = std::move(ranges_); std::copy(rs.begin(), rs.end(), std::back_inserter(temp)); std::sort(temp.begin(), temp.end()); Clear(); // Trim overlaps and insert the result back to ranges_. Range to_insert = temp.front(); for (auto it = temp.cbegin() + 1; it != temp.cend(); it++) { if (it->first <= to_insert.second) { to_insert.second = std::max(to_insert.second, it->second); } else { ranges_.push_back(to_insert); blocks_ += (to_insert.second - to_insert.first); to_insert = *it; } } ranges_.push_back(to_insert); blocks_ += (to_insert.second - to_insert.first); } // Compute the block range the file occupies, and insert that range. void SortedRangeSet::Insert(size_t start, size_t len) { Range to_insert{ start / kBlockSize, (start + len - 1) / kBlockSize + 1 }; Insert(to_insert); } bool SortedRangeSet::Overlaps(size_t start, size_t len) const { RangeSet rs({ { start / kBlockSize, (start + len - 1) / kBlockSize + 1 } }); return Overlaps(rs); } // Given an offset of the file, checks if the corresponding block (by considering the file as // 0-based continuous block ranges) is covered by the SortedRangeSet. If so, returns the offset // within this SortedRangeSet. // // For example, the 4106-th byte of a file is from block 1, assuming a block size of 4096-byte. // The mapped offset within a SortedRangeSet("1-9 15-19") is 10. // // An offset of 65546 falls into the 16-th block in a file. Block 16 is contained as the 10-th // item in SortedRangeSet("1-9 15-19"). So its data can be found at offset 40970 (i.e. 4096 * 10 // + 10) in a range represented by this SortedRangeSet. size_t SortedRangeSet::GetOffsetInRangeSet(size_t old_offset) const { size_t old_block_start = old_offset / kBlockSize; size_t new_block_start = 0; for (const auto& [start, end] : ranges_) { // Find the index of old_block_start. if (old_block_start >= end) { new_block_start += (end - start); } else if (old_block_start >= start) { new_block_start += (old_block_start - start); return (new_block_start * kBlockSize + old_offset % kBlockSize); } else { CHECK(false) << "block_start " << old_block_start << " is missing between two ranges: " << ToString(); return 0; } } CHECK(false) << "block_start " << old_block_start << " exceeds the limit of current RangeSet: " << ToString(); return 0; }