|
| 1 | +// Copyright (c) 2013, Facebook, Inc. All rights reserved. |
| 2 | +// This source code is licensed under the BSD-style license found in the |
| 3 | +// LICENSE file in the root directory of this source tree. An additional grant |
| 4 | +// of patent rights can be found in the PATENTS file in the same directory. |
| 5 | +// |
| 6 | +// Copyright (c) 2011 The LevelDB Authors. All rights reserved. |
| 7 | +// Use of this source code is governed by a BSD-style license that can be |
| 8 | +// found in the LICENSE file. See the AUTHORS file for names of contributors. |
| 9 | + |
| 10 | +#include "db/file_indexer.h" |
| 11 | +#include <algorithm> |
| 12 | +#include "rocksdb/comparator.h" |
| 13 | +#include "db/version_edit.h" |
| 14 | + |
| 15 | +namespace rocksdb { |
| 16 | + |
| 17 | +FileIndexer::FileIndexer(const uint32_t num_levels, |
| 18 | + const Comparator* ucmp) |
| 19 | + : num_levels_(num_levels), |
| 20 | + ucmp_(ucmp), |
| 21 | + next_level_index_(num_levels), |
| 22 | + level_rb_(num_levels, -1) { |
| 23 | +} |
| 24 | + |
| 25 | + |
| 26 | +uint32_t FileIndexer::NumLevelIndex() { |
| 27 | + return next_level_index_.size(); |
| 28 | +} |
| 29 | + |
| 30 | +uint32_t FileIndexer::LevelIndexSize(uint32_t level) { |
| 31 | + return next_level_index_[level].size(); |
| 32 | +} |
| 33 | + |
| 34 | +void FileIndexer::GetNextLevelIndex( |
| 35 | + const uint32_t level, const uint32_t file_index, const int cmp_smallest, |
| 36 | + const int cmp_largest, int32_t* left_bound, int32_t* right_bound) { |
| 37 | + assert(level > 0); |
| 38 | + |
| 39 | + // Last level, no hint |
| 40 | + if (level == num_levels_ - 1) { |
| 41 | + *left_bound = 0; |
| 42 | + *right_bound = -1; |
| 43 | + return; |
| 44 | + } |
| 45 | + |
| 46 | + assert(level < num_levels_ - 1); |
| 47 | + assert(static_cast<int32_t>(file_index) <= level_rb_[level]); |
| 48 | + |
| 49 | + const auto& index = next_level_index_[level][file_index]; |
| 50 | + |
| 51 | + if (cmp_smallest < 0) { |
| 52 | + *left_bound = (level > 0 && file_index > 0) ? |
| 53 | + next_level_index_[level][file_index - 1].largest_lb : 0; |
| 54 | + *right_bound = index.smallest_rb; |
| 55 | + } else if (cmp_smallest == 0) { |
| 56 | + *left_bound = index.smallest_lb; |
| 57 | + *right_bound = index.smallest_rb; |
| 58 | + } else if (cmp_smallest > 0 && cmp_largest < 0) { |
| 59 | + *left_bound = index.smallest_lb; |
| 60 | + *right_bound = index.largest_rb; |
| 61 | + } else if (cmp_largest == 0) { |
| 62 | + *left_bound = index.largest_lb; |
| 63 | + *right_bound = index.largest_rb; |
| 64 | + } else if (cmp_largest > 0) { |
| 65 | + *left_bound = index.largest_lb; |
| 66 | + *right_bound = level_rb_[level + 1]; |
| 67 | + } else { |
| 68 | + assert(false); |
| 69 | + } |
| 70 | + |
| 71 | + assert(*left_bound >= 0); |
| 72 | + assert(*left_bound <= *right_bound + 1); |
| 73 | + assert(*right_bound <= level_rb_[level + 1]); |
| 74 | +} |
| 75 | + |
| 76 | +void FileIndexer::ClearIndex() { |
| 77 | + for (uint32_t level = 1; level < num_levels_; ++level) { |
| 78 | + next_level_index_[level].clear(); |
| 79 | + } |
| 80 | +} |
| 81 | + |
| 82 | +void FileIndexer::UpdateIndex(std::vector<FileMetaData*>* const files) { |
| 83 | + if (files == nullptr) { |
| 84 | + return; |
| 85 | + } |
| 86 | + |
| 87 | + // L1 - Ln-1 |
| 88 | + for (uint32_t level = 1; level < num_levels_ - 1; ++level) { |
| 89 | + const auto& upper_files = files[level]; |
| 90 | + const int32_t upper_size = upper_files.size(); |
| 91 | + const auto& lower_files = files[level + 1]; |
| 92 | + level_rb_[level] = upper_files.size() - 1; |
| 93 | + if (upper_size == 0) { |
| 94 | + continue; |
| 95 | + } |
| 96 | + auto& index = next_level_index_[level]; |
| 97 | + index.resize(upper_size); |
| 98 | + |
| 99 | + CalculateLB(upper_files, lower_files, &index, |
| 100 | + [this](const FileMetaData* a, const FileMetaData* b) -> int { |
| 101 | + return ucmp_->Compare(a->smallest.user_key(), b->largest.user_key()); |
| 102 | + }, |
| 103 | + [](IndexUnit* index, int32_t f_idx) { |
| 104 | + index->smallest_lb = f_idx; |
| 105 | + }); |
| 106 | + CalculateLB(upper_files, lower_files, &index, |
| 107 | + [this](const FileMetaData* a, const FileMetaData* b) -> int { |
| 108 | + return ucmp_->Compare(a->largest.user_key(), b->largest.user_key()); |
| 109 | + }, |
| 110 | + [](IndexUnit* index, int32_t f_idx) { |
| 111 | + index->largest_lb = f_idx; |
| 112 | + }); |
| 113 | + CalculateRB(upper_files, lower_files, &index, |
| 114 | + [this](const FileMetaData* a, const FileMetaData* b) -> int { |
| 115 | + return ucmp_->Compare(a->smallest.user_key(), b->smallest.user_key()); |
| 116 | + }, |
| 117 | + [](IndexUnit* index, int32_t f_idx) { |
| 118 | + index->smallest_rb = f_idx; |
| 119 | + }); |
| 120 | + CalculateRB(upper_files, lower_files, &index, |
| 121 | + [this](const FileMetaData* a, const FileMetaData* b) -> int { |
| 122 | + return ucmp_->Compare(a->largest.user_key(), b->smallest.user_key()); |
| 123 | + }, |
| 124 | + [](IndexUnit* index, int32_t f_idx) { |
| 125 | + index->largest_rb = f_idx; |
| 126 | + }); |
| 127 | + } |
| 128 | + level_rb_[num_levels_ - 1] = files[num_levels_ - 1].size() - 1; |
| 129 | +} |
| 130 | + |
| 131 | +void FileIndexer::CalculateLB(const std::vector<FileMetaData*>& upper_files, |
| 132 | + const std::vector<FileMetaData*>& lower_files, |
| 133 | + std::vector<IndexUnit>* index, |
| 134 | + std::function<int(const FileMetaData*, const FileMetaData*)> cmp_op, |
| 135 | + std::function<void(IndexUnit*, int32_t)> set_index) { |
| 136 | + const int32_t upper_size = upper_files.size(); |
| 137 | + const int32_t lower_size = lower_files.size(); |
| 138 | + int32_t upper_idx = 0; |
| 139 | + int32_t lower_idx = 0; |
| 140 | + while (upper_idx < upper_size && lower_idx < lower_size) { |
| 141 | + int cmp = cmp_op(upper_files[upper_idx], lower_files[lower_idx]); |
| 142 | + |
| 143 | + if (cmp == 0) { |
| 144 | + set_index(&(*index)[upper_idx], lower_idx); |
| 145 | + ++upper_idx; |
| 146 | + ++lower_idx; |
| 147 | + } else if (cmp > 0) { |
| 148 | + // Lower level's file (largest) is smaller, a key won't hit in that |
| 149 | + // file. Move to next lower file |
| 150 | + ++lower_idx; |
| 151 | + } else { |
| 152 | + // Lower level's file becomes larger, update the index, and |
| 153 | + // move to the next upper file |
| 154 | + set_index(&(*index)[upper_idx], lower_idx); |
| 155 | + ++upper_idx; |
| 156 | + } |
| 157 | + } |
| 158 | + |
| 159 | + while (upper_idx < upper_size) { |
| 160 | + // Lower files are exhausted, that means the remaining upper files are |
| 161 | + // greater than any lower files. Set the index to be the lower level size. |
| 162 | + set_index(&(*index)[upper_idx], lower_size); |
| 163 | + ++upper_idx; |
| 164 | + } |
| 165 | +} |
| 166 | + |
| 167 | +void FileIndexer::CalculateRB(const std::vector<FileMetaData*>& upper_files, |
| 168 | + const std::vector<FileMetaData*>& lower_files, |
| 169 | + std::vector<IndexUnit>* index, |
| 170 | + std::function<int(const FileMetaData*, const FileMetaData*)> cmp_op, |
| 171 | + std::function<void(IndexUnit*, int32_t)> set_index) { |
| 172 | + const int32_t upper_size = upper_files.size(); |
| 173 | + const int32_t lower_size = lower_files.size(); |
| 174 | + int32_t upper_idx = upper_size - 1; |
| 175 | + int32_t lower_idx = lower_size - 1; |
| 176 | + while (upper_idx >= 0 && lower_idx >= 0) { |
| 177 | + int cmp = cmp_op(upper_files[upper_idx], lower_files[lower_idx]); |
| 178 | + |
| 179 | + if (cmp == 0) { |
| 180 | + set_index(&(*index)[upper_idx], lower_idx); |
| 181 | + --upper_idx; |
| 182 | + --lower_idx; |
| 183 | + } else if (cmp < 0) { |
| 184 | + // Lower level's file (smallest) is larger, a key won't hit in that |
| 185 | + // file. Move to next lower file. |
| 186 | + --lower_idx; |
| 187 | + } else { |
| 188 | + // Lower level's file becomes smaller, update the index, and move to |
| 189 | + // the next the upper file |
| 190 | + set_index(&(*index)[upper_idx], lower_idx); |
| 191 | + --upper_idx; |
| 192 | + } |
| 193 | + } |
| 194 | + while (upper_idx >= 0) { |
| 195 | + // Lower files are exhausted, that means the remaining upper files are |
| 196 | + // smaller than any lower files. Set it to -1. |
| 197 | + set_index(&(*index)[upper_idx], -1); |
| 198 | + --upper_idx; |
| 199 | + } |
| 200 | +} |
| 201 | + |
| 202 | +} // namespace rocksdb |
0 commit comments