001/* 002 * Licensed to the Apache Software Foundation (ASF) under one 003 * or more contributor license agreements. See the NOTICE file 004 * distributed with this work for additional information 005 * regarding copyright ownership. The ASF licenses this file 006 * to you under the Apache License, Version 2.0 (the 007 * "License"); you may not use this file except in compliance 008 * with the License. You may obtain a copy of the License at 009 * 010 * http://www.apache.org/licenses/LICENSE-2.0 011 * 012 * Unless required by applicable law or agreed to in writing, software 013 * distributed under the License is distributed on an "AS IS" BASIS, 014 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 015 * See the License for the specific language governing permissions and 016 * limitations under the License. 017 */ 018package org.apache.hadoop.hbase.master.normalizer; 019 020import static org.apache.hadoop.hbase.master.normalizer.RegionNormalizerWorker.CUMULATIVE_SIZE_LIMIT_MB_KEY; 021import static org.apache.hadoop.hbase.master.normalizer.RegionNormalizerWorker.DEFAULT_CUMULATIVE_SIZE_LIMIT_MB; 022import static org.apache.hbase.thirdparty.org.apache.commons.collections4.CollectionUtils.isEmpty; 023 024import java.time.Instant; 025import java.time.Period; 026import java.util.ArrayList; 027import java.util.Collections; 028import java.util.LinkedList; 029import java.util.List; 030import java.util.Objects; 031import java.util.function.BooleanSupplier; 032import java.util.function.Function; 033import org.apache.hadoop.conf.Configuration; 034import org.apache.hadoop.hbase.HBaseInterfaceAudience; 035import org.apache.hadoop.hbase.RegionMetrics; 036import org.apache.hadoop.hbase.ServerMetrics; 037import org.apache.hadoop.hbase.ServerName; 038import org.apache.hadoop.hbase.Size; 039import org.apache.hadoop.hbase.TableName; 040import org.apache.hadoop.hbase.client.MasterSwitchType; 041import org.apache.hadoop.hbase.client.RegionInfo; 042import org.apache.hadoop.hbase.client.TableDescriptor; 043import org.apache.hadoop.hbase.conf.ConfigurationObserver; 044import org.apache.hadoop.hbase.master.MasterServices; 045import org.apache.hadoop.hbase.master.RegionState; 046import org.apache.hadoop.hbase.master.assignment.RegionStates; 047import org.apache.hadoop.hbase.util.EnvironmentEdgeManager; 048import org.apache.yetus.audience.InterfaceAudience; 049import org.slf4j.Logger; 050import org.slf4j.LoggerFactory; 051 052/** 053 * Simple implementation of region normalizer. Logic in use: 054 * <ol> 055 * <li>Get all regions of a given table</li> 056 * <li>Get avg size S of the regions in the table (by total size of store files reported in 057 * RegionMetrics)</li> 058 * <li>For each region R0, if R0 is bigger than S * 2, it is kindly requested to split.</li> 059 * <li>Otherwise, for the next region in the chain R1, if R0 + R1 is smaller then S, R0 and R1 are 060 * kindly requested to merge.</li> 061 * </ol> 062 */ 063@InterfaceAudience.LimitedPrivate(HBaseInterfaceAudience.CONFIG) 064class SimpleRegionNormalizer implements RegionNormalizer, ConfigurationObserver { 065 private static final Logger LOG = LoggerFactory.getLogger(SimpleRegionNormalizer.class); 066 067 static final String SPLIT_ENABLED_KEY = "hbase.normalizer.split.enabled"; 068 static final boolean DEFAULT_SPLIT_ENABLED = true; 069 static final String MERGE_ENABLED_KEY = "hbase.normalizer.merge.enabled"; 070 static final boolean DEFAULT_MERGE_ENABLED = true; 071 /** 072 * @deprecated since 2.5.0 and will be removed in 4.0.0. Use 073 * {@link SimpleRegionNormalizer#MERGE_MIN_REGION_COUNT_KEY} instead. 074 * @see <a href="https://issues.apache.org/jira/browse/HBASE-25745">HBASE-25745</a> 075 */ 076 @Deprecated 077 static final String MIN_REGION_COUNT_KEY = "hbase.normalizer.min.region.count"; 078 static final String MERGE_MIN_REGION_COUNT_KEY = "hbase.normalizer.merge.min.region.count"; 079 static final int DEFAULT_MERGE_MIN_REGION_COUNT = 3; 080 static final String MERGE_MIN_REGION_AGE_DAYS_KEY = "hbase.normalizer.merge.min_region_age.days"; 081 static final int DEFAULT_MERGE_MIN_REGION_AGE_DAYS = 3; 082 static final String MERGE_MIN_REGION_SIZE_MB_KEY = "hbase.normalizer.merge.min_region_size.mb"; 083 static final int DEFAULT_MERGE_MIN_REGION_SIZE_MB = 0; 084 static final String MERGE_REQUEST_MAX_NUMBER_OF_REGIONS_COUNT_KEY = 085 "hbase.normalizer.merge.merge_request_max_number_of_regions"; 086 static final long DEFAULT_MERGE_REQUEST_MAX_NUMBER_OF_REGIONS_COUNT = 100; 087 088 private MasterServices masterServices; 089 private NormalizerConfiguration normalizerConfiguration; 090 091 public SimpleRegionNormalizer() { 092 masterServices = null; 093 normalizerConfiguration = new NormalizerConfiguration(); 094 } 095 096 @Override 097 public Configuration getConf() { 098 return normalizerConfiguration.getConf(); 099 } 100 101 @Override 102 public void setConf(final Configuration conf) { 103 if (conf == null) { 104 return; 105 } 106 normalizerConfiguration = new NormalizerConfiguration(conf, normalizerConfiguration); 107 } 108 109 @Override 110 public void onConfigurationChange(Configuration conf) { 111 LOG.debug("Updating configuration parameters according to new configuration instance."); 112 setConf(conf); 113 } 114 115 private static int parseMergeMinRegionCount(final Configuration conf) { 116 final int parsedValue = conf.getInt(MERGE_MIN_REGION_COUNT_KEY, DEFAULT_MERGE_MIN_REGION_COUNT); 117 final int settledValue = Math.max(1, parsedValue); 118 if (parsedValue != settledValue) { 119 warnInvalidValue(MERGE_MIN_REGION_COUNT_KEY, parsedValue, settledValue); 120 } 121 return settledValue; 122 } 123 124 private static Period parseMergeMinRegionAge(final Configuration conf) { 125 final int parsedValue = 126 conf.getInt(MERGE_MIN_REGION_AGE_DAYS_KEY, DEFAULT_MERGE_MIN_REGION_AGE_DAYS); 127 final int settledValue = Math.max(0, parsedValue); 128 if (parsedValue != settledValue) { 129 warnInvalidValue(MERGE_MIN_REGION_AGE_DAYS_KEY, parsedValue, settledValue); 130 } 131 return Period.ofDays(settledValue); 132 } 133 134 private static long parseMergeMinRegionSizeMb(final Configuration conf) { 135 final long parsedValue = 136 conf.getLong(MERGE_MIN_REGION_SIZE_MB_KEY, DEFAULT_MERGE_MIN_REGION_SIZE_MB); 137 final long settledValue = Math.max(0, parsedValue); 138 if (parsedValue != settledValue) { 139 warnInvalidValue(MERGE_MIN_REGION_SIZE_MB_KEY, parsedValue, settledValue); 140 } 141 return settledValue; 142 } 143 144 private static long parseMergeRequestMaxNumberOfRegionsCount(final Configuration conf) { 145 final long parsedValue = conf.getLong(MERGE_REQUEST_MAX_NUMBER_OF_REGIONS_COUNT_KEY, 146 DEFAULT_MERGE_REQUEST_MAX_NUMBER_OF_REGIONS_COUNT); 147 final long settledValue = Math.max(2, parsedValue); 148 if (parsedValue != settledValue) { 149 warnInvalidValue(MERGE_REQUEST_MAX_NUMBER_OF_REGIONS_COUNT_KEY, parsedValue, settledValue); 150 } 151 return settledValue; 152 } 153 154 private static <T> void warnInvalidValue(final String key, final T parsedValue, 155 final T settledValue) { 156 LOG.warn("Configured value {}={} is invalid. Setting value to {}.", key, parsedValue, 157 settledValue); 158 } 159 160 private static <T> void logConfigurationUpdated(final String key, final T oldValue, 161 final T newValue) { 162 if (!Objects.equals(oldValue, newValue)) { 163 LOG.info("Updated configuration for key '{}' from {} to {}", key, oldValue, newValue); 164 } 165 } 166 167 /** 168 * Return this instance's configured value for {@value #SPLIT_ENABLED_KEY}. 169 */ 170 public boolean isSplitEnabled() { 171 return normalizerConfiguration.isSplitEnabled(); 172 } 173 174 /** 175 * Return this instance's configured value for {@value #MERGE_ENABLED_KEY}. 176 */ 177 public boolean isMergeEnabled() { 178 return normalizerConfiguration.isMergeEnabled(); 179 } 180 181 /** 182 * Return this instance's configured value for {@value #MERGE_MIN_REGION_COUNT_KEY}. 183 */ 184 public int getMergeMinRegionCount() { 185 return normalizerConfiguration.getMergeMinRegionCount(); 186 } 187 188 /** 189 * Return this instance's configured value for {@value #MERGE_MIN_REGION_AGE_DAYS_KEY}. 190 */ 191 public Period getMergeMinRegionAge() { 192 return normalizerConfiguration.getMergeMinRegionAge(); 193 } 194 195 /** 196 * Return this instance's configured value for {@value #MERGE_MIN_REGION_SIZE_MB_KEY}. 197 */ 198 public long getMergeMinRegionSizeMb() { 199 return normalizerConfiguration.getMergeMinRegionSizeMb(); 200 } 201 202 public long getMergeRequestMaxNumberOfRegionsCount() { 203 return normalizerConfiguration.getMergeRequestMaxNumberOfRegionsCount(); 204 } 205 206 @Override 207 public void setMasterServices(final MasterServices masterServices) { 208 this.masterServices = masterServices; 209 } 210 211 @Override 212 public List<NormalizationPlan> computePlansForTable(final TableDescriptor tableDescriptor) { 213 if (tableDescriptor == null) { 214 return Collections.emptyList(); 215 } 216 TableName table = tableDescriptor.getTableName(); 217 if (table.isSystemTable()) { 218 LOG.debug("Normalization of system table {} isn't allowed", table); 219 return Collections.emptyList(); 220 } 221 222 final boolean proceedWithSplitPlanning = proceedWithSplitPlanning(tableDescriptor); 223 final boolean proceedWithMergePlanning = proceedWithMergePlanning(tableDescriptor); 224 if (!proceedWithMergePlanning && !proceedWithSplitPlanning) { 225 LOG.debug("Both split and merge are disabled. Skipping normalization of table: {}", table); 226 return Collections.emptyList(); 227 } 228 229 final NormalizeContext ctx = new NormalizeContext(tableDescriptor); 230 if (isEmpty(ctx.getTableRegions())) { 231 return Collections.emptyList(); 232 } 233 234 LOG.debug("Computing normalization plan for table: {}, number of regions: {}", table, 235 ctx.getTableRegions().size()); 236 237 final List<NormalizationPlan> plans = new ArrayList<>(); 238 int splitPlansCount = 0; 239 if (proceedWithSplitPlanning) { 240 List<NormalizationPlan> splitPlans = computeSplitNormalizationPlans(ctx); 241 splitPlansCount = splitPlans.size(); 242 plans.addAll(splitPlans); 243 } 244 int mergePlansCount = 0; 245 if (proceedWithMergePlanning) { 246 List<NormalizationPlan> mergePlans = computeMergeNormalizationPlans(ctx); 247 mergePlansCount = mergePlans.size(); 248 plans.addAll(mergePlans); 249 } 250 251 if ( 252 normalizerConfiguration.getCumulativePlansSizeLimitMb() != DEFAULT_CUMULATIVE_SIZE_LIMIT_MB 253 ) { 254 // If we are going to truncate our list of plans, shuffle the split and merge plans together 255 // so that the merge plans, which are listed last, are not starved out. 256 shuffleNormalizationPlans(plans); 257 } 258 259 LOG.debug("Computed normalization plans for table {}. Total plans: {}, split plans: {}, " 260 + "merge plans: {}", table, plans.size(), splitPlansCount, mergePlansCount); 261 return plans; 262 } 263 264 /** Returns size of region in MB and if region is not found than -1 */ 265 private long getRegionSizeMB(RegionInfo hri) { 266 ServerName sn = 267 masterServices.getAssignmentManager().getRegionStates().getRegionServerOfRegion(hri); 268 if (sn == null) { 269 LOG.debug("{} region was not found on any Server", hri.getRegionNameAsString()); 270 return -1; 271 } 272 ServerMetrics serverMetrics = masterServices.getServerManager().getLoad(sn); 273 if (serverMetrics == null) { 274 LOG.debug("server {} was not found in ServerManager", sn.getServerName()); 275 return -1; 276 } 277 RegionMetrics regionLoad = serverMetrics.getRegionMetrics().get(hri.getRegionName()); 278 if (regionLoad == null) { 279 LOG.debug("{} was not found in RegionsLoad", hri.getRegionNameAsString()); 280 return -1; 281 } 282 return (long) regionLoad.getStoreFileSize().get(Size.Unit.MEGABYTE); 283 } 284 285 private boolean isMasterSwitchEnabled(final MasterSwitchType masterSwitchType) { 286 return masterServices.isSplitOrMergeEnabled(masterSwitchType); 287 } 288 289 private boolean proceedWithSplitPlanning(TableDescriptor tableDescriptor) { 290 String value = tableDescriptor.getValue(SPLIT_ENABLED_KEY); 291 return (value == null ? isSplitEnabled() : Boolean.parseBoolean(value)) 292 && isMasterSwitchEnabled(MasterSwitchType.SPLIT); 293 } 294 295 private boolean proceedWithMergePlanning(TableDescriptor tableDescriptor) { 296 String value = tableDescriptor.getValue(MERGE_ENABLED_KEY); 297 return (value == null ? isMergeEnabled() : Boolean.parseBoolean(value)) 298 && isMasterSwitchEnabled(MasterSwitchType.MERGE); 299 } 300 301 /** 302 * Also make sure tableRegions contains regions of the same table 303 * @param tableRegions regions of table to normalize 304 * @param tableDescriptor the TableDescriptor 305 * @return average region size depending on 306 * @see TableDescriptor#getNormalizerTargetRegionCount() 307 */ 308 private double getAverageRegionSizeMb(final List<RegionInfo> tableRegions, 309 final TableDescriptor tableDescriptor) { 310 if (isEmpty(tableRegions)) { 311 throw new IllegalStateException( 312 "Cannot calculate average size of a table without any regions."); 313 } 314 TableName table = tableDescriptor.getTableName(); 315 double avgRegionSize; 316 int targetRegionCount = tableDescriptor.getNormalizerTargetRegionCount(); 317 long targetRegionSize = tableDescriptor.getNormalizerTargetRegionSize(); 318 LOG.debug("Table {} configured with target region count {}, target region size {} MB", table, 319 targetRegionCount, targetRegionSize); 320 321 if (targetRegionSize > 0) { 322 avgRegionSize = targetRegionSize; 323 } else { 324 final int regionCount = tableRegions.size(); 325 final long totalSizeMb = tableRegions.stream().mapToLong(this::getRegionSizeMB).sum(); 326 if (targetRegionCount > 0) { 327 avgRegionSize = totalSizeMb / (double) targetRegionCount; 328 } else { 329 avgRegionSize = totalSizeMb / (double) regionCount; 330 } 331 LOG.debug("Table {}, total aggregated regions size: {} MB and average region size {} MB", 332 table, totalSizeMb, String.format("%.3f", avgRegionSize)); 333 } 334 335 return avgRegionSize; 336 } 337 338 /** 339 * Determine if a {@link RegionInfo} should be considered for a merge operation. 340 * </p> 341 * Callers beware: for safe concurrency, be sure to pass in the local instance of 342 * {@link NormalizerConfiguration}, don't use {@code this}'s instance. 343 */ 344 private boolean skipForMerge(final NormalizerConfiguration normalizerConfiguration, 345 final NormalizeContext ctx, final RegionInfo regionInfo) { 346 final RegionState state = ctx.getRegionStates().getRegionState(regionInfo); 347 final String name = regionInfo.getEncodedName(); 348 return logTraceReason(() -> state == null, 349 "skipping merge of region {} because no state information is available.", name) 350 || logTraceReason(() -> !Objects.equals(state.getState(), RegionState.State.OPEN), 351 "skipping merge of region {} because it is not open.", name) 352 || logTraceReason(() -> !isOldEnoughForMerge(normalizerConfiguration, ctx, regionInfo), 353 "skipping merge of region {} because it is not old enough.", name) 354 || logTraceReason(() -> !isLargeEnoughForMerge(normalizerConfiguration, ctx, regionInfo), 355 "skipping merge region {} because it is not large enough.", name); 356 } 357 358 /** 359 * Computes the merge plans that should be executed for this table to converge average region 360 * towards target average or target region count. 361 */ 362 private List<NormalizationPlan> computeMergeNormalizationPlans(final NormalizeContext ctx) { 363 final NormalizerConfiguration configuration = normalizerConfiguration; 364 if (ctx.getTableRegions().size() < configuration.getMergeMinRegionCount(ctx)) { 365 LOG.debug( 366 "Table {} has {} regions, required min number of regions for normalizer to run" 367 + " is {}, not computing merge plans.", 368 ctx.getTableName(), ctx.getTableRegions().size(), configuration.getMergeMinRegionCount()); 369 return Collections.emptyList(); 370 } 371 372 final long avgRegionSizeMb = (long) ctx.getAverageRegionSizeMb(); 373 if (avgRegionSizeMb < configuration.getMergeMinRegionSizeMb(ctx)) { 374 return Collections.emptyList(); 375 } 376 LOG.debug("Computing normalization plan for table {}. average region size: {} MB, number of" 377 + " regions: {}.", ctx.getTableName(), avgRegionSizeMb, ctx.getTableRegions().size()); 378 379 // this nested loop walks the table's region chain once, looking for contiguous sequences of 380 // regions that meet the criteria for merge. The outer loop tracks the starting point of the 381 // next sequence, the inner loop looks for the end of that sequence. A single sequence becomes 382 // an instance of MergeNormalizationPlan. 383 384 final List<NormalizationPlan> plans = new LinkedList<>(); 385 final List<NormalizationTarget> rangeMembers = new LinkedList<>(); 386 long sumRangeMembersSizeMb; 387 int current = 0; 388 for (int rangeStart = 0; rangeStart < ctx.getTableRegions().size() - 1 389 && current < ctx.getTableRegions().size();) { 390 // walk the region chain looking for contiguous sequences of regions that can be merged. 391 rangeMembers.clear(); 392 sumRangeMembersSizeMb = 0; 393 for (current = rangeStart; current < ctx.getTableRegions().size(); current++) { 394 final RegionInfo regionInfo = ctx.getTableRegions().get(current); 395 final long regionSizeMb = getRegionSizeMB(regionInfo); 396 if (skipForMerge(configuration, ctx, regionInfo)) { 397 // this region cannot participate in a range. resume the outer loop. 398 rangeStart = Math.max(current, rangeStart + 1); 399 break; 400 } 401 if ( 402 // when there are no range members, seed the range with whatever we have. this way we're 403 // prepared in case the next region is 0-size. 404 rangeMembers.isEmpty() 405 // when there is only one region and the size is 0, seed the range with whatever we 406 // have. 407 || (rangeMembers.size() == 1 && sumRangeMembersSizeMb == 0) 408 // add an empty region to the current range only if it doesn't exceed max merge request 409 // region count 410 || (regionSizeMb == 0 && rangeMembers.size() < getMergeRequestMaxNumberOfRegionsCount()) 411 // add region if current range region size is less than avg region size of table 412 // and current range doesn't exceed max merge request region count 413 || ((regionSizeMb + sumRangeMembersSizeMb <= avgRegionSizeMb) 414 && (rangeMembers.size() < getMergeRequestMaxNumberOfRegionsCount())) 415 ) { 416 // add the current region to the range when there's capacity remaining. 417 rangeMembers.add(new NormalizationTarget(regionInfo, regionSizeMb)); 418 sumRangeMembersSizeMb += regionSizeMb; 419 continue; 420 } 421 // we have accumulated enough regions to fill a range. resume the outer loop. 422 rangeStart = Math.max(current, rangeStart + 1); 423 break; 424 } 425 if (rangeMembers.size() > 1) { 426 plans.add(new MergeNormalizationPlan.Builder().setTargets(rangeMembers).build()); 427 } 428 } 429 return plans; 430 } 431 432 /** 433 * Determine if a region in {@link RegionState} should be considered for a split operation. 434 */ 435 private static boolean skipForSplit(final RegionState state, final RegionInfo regionInfo) { 436 final String name = regionInfo.getEncodedName(); 437 return logTraceReason(() -> state == null, 438 "skipping split of region {} because no state information is available.", name) 439 || logTraceReason(() -> !Objects.equals(state.getState(), RegionState.State.OPEN), 440 "skipping merge of region {} because it is not open.", name); 441 } 442 443 /** 444 * Computes the split plans that should be executed for this table to converge average region size 445 * towards target average or target region count. <br /> 446 * if the region is > 2 times larger than average, we split it. split is more high priority 447 * normalization action than merge. 448 */ 449 private List<NormalizationPlan> computeSplitNormalizationPlans(final NormalizeContext ctx) { 450 final double avgRegionSize = ctx.getAverageRegionSizeMb(); 451 LOG.debug("Table {}, average region size: {} MB", ctx.getTableName(), 452 String.format("%.3f", avgRegionSize)); 453 454 final List<NormalizationPlan> plans = new ArrayList<>(); 455 for (final RegionInfo hri : ctx.getTableRegions()) { 456 if (skipForSplit(ctx.getRegionStates().getRegionState(hri), hri)) { 457 continue; 458 } 459 final long regionSizeMb = getRegionSizeMB(hri); 460 if (regionSizeMb > 2 * avgRegionSize) { 461 LOG.info( 462 "Table {}, large region {} has size {} MB, more than twice avg size {} MB, " 463 + "splitting", 464 ctx.getTableName(), hri.getRegionNameAsString(), regionSizeMb, 465 String.format("%.3f", avgRegionSize)); 466 plans.add(new SplitNormalizationPlan(hri, regionSizeMb)); 467 } 468 } 469 return plans; 470 } 471 472 /** 473 * Return {@code true} when {@code regionInfo} has a creation date that is old enough to be 474 * considered for a merge operation, {@code false} otherwise. 475 */ 476 private static boolean isOldEnoughForMerge(final NormalizerConfiguration normalizerConfiguration, 477 final NormalizeContext ctx, final RegionInfo regionInfo) { 478 final Instant currentTime = Instant.ofEpochMilli(EnvironmentEdgeManager.currentTime()); 479 final Instant regionCreateTime = Instant.ofEpochMilli(regionInfo.getRegionId()); 480 return currentTime 481 .isAfter(regionCreateTime.plus(normalizerConfiguration.getMergeMinRegionAge(ctx))); 482 } 483 484 /** 485 * Return {@code true} when {@code regionInfo} has a size that is sufficient to be considered for 486 * a merge operation, {@code false} otherwise. 487 * </p> 488 * Callers beware: for safe concurrency, be sure to pass in the local instance of 489 * {@link NormalizerConfiguration}, don't use {@code this}'s instance. 490 */ 491 private boolean isLargeEnoughForMerge(final NormalizerConfiguration normalizerConfiguration, 492 final NormalizeContext ctx, final RegionInfo regionInfo) { 493 return getRegionSizeMB(regionInfo) >= normalizerConfiguration.getMergeMinRegionSizeMb(ctx); 494 } 495 496 /** 497 * This very simple method exists so we can verify it was called in a unit test. Visible for 498 * testing. 499 */ 500 void shuffleNormalizationPlans(List<NormalizationPlan> plans) { 501 Collections.shuffle(plans); 502 } 503 504 private static boolean logTraceReason(final BooleanSupplier predicate, final String fmtWhenTrue, 505 final Object... args) { 506 final boolean value = predicate.getAsBoolean(); 507 if (value) { 508 LOG.trace(fmtWhenTrue, args); 509 } 510 return value; 511 } 512 513 /** 514 * Holds the configuration values read from {@link Configuration}. Encapsulation in a POJO enables 515 * atomic hot-reloading of configs without locks. 516 */ 517 private static final class NormalizerConfiguration { 518 private final Configuration conf; 519 private final boolean splitEnabled; 520 private final boolean mergeEnabled; 521 private final int mergeMinRegionCount; 522 private final Period mergeMinRegionAge; 523 private final long mergeMinRegionSizeMb; 524 private final long mergeRequestMaxNumberOfRegionsCount; 525 private final long cumulativePlansSizeLimitMb; 526 527 private NormalizerConfiguration() { 528 conf = null; 529 splitEnabled = DEFAULT_SPLIT_ENABLED; 530 mergeEnabled = DEFAULT_MERGE_ENABLED; 531 mergeMinRegionCount = DEFAULT_MERGE_MIN_REGION_COUNT; 532 mergeMinRegionAge = Period.ofDays(DEFAULT_MERGE_MIN_REGION_AGE_DAYS); 533 mergeMinRegionSizeMb = DEFAULT_MERGE_MIN_REGION_SIZE_MB; 534 mergeRequestMaxNumberOfRegionsCount = DEFAULT_MERGE_REQUEST_MAX_NUMBER_OF_REGIONS_COUNT; 535 cumulativePlansSizeLimitMb = DEFAULT_CUMULATIVE_SIZE_LIMIT_MB; 536 } 537 538 private NormalizerConfiguration(final Configuration conf, 539 final NormalizerConfiguration currentConfiguration) { 540 this.conf = conf; 541 splitEnabled = conf.getBoolean(SPLIT_ENABLED_KEY, DEFAULT_SPLIT_ENABLED); 542 mergeEnabled = conf.getBoolean(MERGE_ENABLED_KEY, DEFAULT_MERGE_ENABLED); 543 mergeMinRegionCount = parseMergeMinRegionCount(conf); 544 mergeMinRegionAge = parseMergeMinRegionAge(conf); 545 mergeMinRegionSizeMb = parseMergeMinRegionSizeMb(conf); 546 mergeRequestMaxNumberOfRegionsCount = parseMergeRequestMaxNumberOfRegionsCount(conf); 547 cumulativePlansSizeLimitMb = 548 conf.getLong(CUMULATIVE_SIZE_LIMIT_MB_KEY, DEFAULT_CUMULATIVE_SIZE_LIMIT_MB); 549 logConfigurationUpdated(SPLIT_ENABLED_KEY, currentConfiguration.isSplitEnabled(), 550 splitEnabled); 551 logConfigurationUpdated(MERGE_ENABLED_KEY, currentConfiguration.isMergeEnabled(), 552 mergeEnabled); 553 logConfigurationUpdated(MERGE_MIN_REGION_COUNT_KEY, 554 currentConfiguration.getMergeMinRegionCount(), mergeMinRegionCount); 555 logConfigurationUpdated(MERGE_MIN_REGION_AGE_DAYS_KEY, 556 currentConfiguration.getMergeMinRegionAge(), mergeMinRegionAge); 557 logConfigurationUpdated(MERGE_MIN_REGION_SIZE_MB_KEY, 558 currentConfiguration.getMergeMinRegionSizeMb(), mergeMinRegionSizeMb); 559 logConfigurationUpdated(MERGE_REQUEST_MAX_NUMBER_OF_REGIONS_COUNT_KEY, 560 currentConfiguration.getMergeRequestMaxNumberOfRegionsCount(), 561 mergeRequestMaxNumberOfRegionsCount); 562 } 563 564 public Configuration getConf() { 565 return conf; 566 } 567 568 public boolean isSplitEnabled() { 569 return splitEnabled; 570 } 571 572 public boolean isMergeEnabled() { 573 return mergeEnabled; 574 } 575 576 public int getMergeMinRegionCount() { 577 return mergeMinRegionCount; 578 } 579 580 public int getMergeMinRegionCount(NormalizeContext context) { 581 String stringValue = 582 context.getOrDefault(MERGE_MIN_REGION_COUNT_KEY, Function.identity(), null); 583 if (stringValue == null) { 584 stringValue = context.getOrDefault(MIN_REGION_COUNT_KEY, Function.identity(), null); 585 if (stringValue != null) { 586 LOG.debug( 587 "The config key {} in table descriptor is deprecated. Instead please use {}. " 588 + "In future release we will remove the deprecated config.", 589 MIN_REGION_COUNT_KEY, MERGE_MIN_REGION_COUNT_KEY); 590 } 591 } 592 final int mergeMinRegionCount = stringValue == null ? 0 : Integer.parseInt(stringValue); 593 if (mergeMinRegionCount <= 0) { 594 return getMergeMinRegionCount(); 595 } 596 return mergeMinRegionCount; 597 } 598 599 public Period getMergeMinRegionAge() { 600 return mergeMinRegionAge; 601 } 602 603 public Period getMergeMinRegionAge(NormalizeContext context) { 604 final int mergeMinRegionAge = 605 context.getOrDefault(MERGE_MIN_REGION_AGE_DAYS_KEY, Integer::parseInt, -1); 606 if (mergeMinRegionAge < 0) { 607 return getMergeMinRegionAge(); 608 } 609 return Period.ofDays(mergeMinRegionAge); 610 } 611 612 public long getMergeMinRegionSizeMb() { 613 return mergeMinRegionSizeMb; 614 } 615 616 public long getMergeMinRegionSizeMb(NormalizeContext context) { 617 final long mergeMinRegionSizeMb = 618 context.getOrDefault(MERGE_MIN_REGION_SIZE_MB_KEY, Long::parseLong, (long) -1); 619 if (mergeMinRegionSizeMb < 0) { 620 return getMergeMinRegionSizeMb(); 621 } 622 return mergeMinRegionSizeMb; 623 } 624 625 public long getMergeRequestMaxNumberOfRegionsCount() { 626 return mergeRequestMaxNumberOfRegionsCount; 627 } 628 629 private long getCumulativePlansSizeLimitMb() { 630 return cumulativePlansSizeLimitMb; 631 } 632 } 633 634 /** 635 * Inner class caries the state necessary to perform a single invocation of 636 * {@link #computePlansForTable(TableDescriptor)}. Grabbing this data from the assignment manager 637 * up-front allows any computed values to be realized just once. 638 */ 639 private class NormalizeContext { 640 private final TableName tableName; 641 private final RegionStates regionStates; 642 private final List<RegionInfo> tableRegions; 643 private final double averageRegionSizeMb; 644 private final TableDescriptor tableDescriptor; 645 646 public NormalizeContext(final TableDescriptor tableDescriptor) { 647 this.tableDescriptor = tableDescriptor; 648 tableName = tableDescriptor.getTableName(); 649 regionStates = 650 SimpleRegionNormalizer.this.masterServices.getAssignmentManager().getRegionStates(); 651 tableRegions = regionStates.getRegionsOfTable(tableName); 652 // The list of regionInfo from getRegionsOfTable() is ordered by regionName. 653 // regionName does not necessary guarantee the order by STARTKEY (let's say 'aa1', 'aa1!', 654 // in order by regionName, it will be 'aa1!' followed by 'aa1'). 655 // This could result in normalizer merging non-adjacent regions into one and creates overlaps. 656 // In order to avoid that, sort the list by RegionInfo.COMPARATOR. 657 // See HBASE-24376 658 tableRegions.sort(RegionInfo.COMPARATOR); 659 averageRegionSizeMb = 660 SimpleRegionNormalizer.this.getAverageRegionSizeMb(this.tableRegions, this.tableDescriptor); 661 } 662 663 public TableName getTableName() { 664 return tableName; 665 } 666 667 public RegionStates getRegionStates() { 668 return regionStates; 669 } 670 671 public List<RegionInfo> getTableRegions() { 672 return tableRegions; 673 } 674 675 public double getAverageRegionSizeMb() { 676 return averageRegionSizeMb; 677 } 678 679 public <T> T getOrDefault(String key, Function<String, T> function, T defaultValue) { 680 String value = tableDescriptor.getValue(key); 681 if (value == null) { 682 return defaultValue; 683 } else { 684 return function.apply(value); 685 } 686 } 687 } 688}