001/*
002 * Licensed to the Apache Software Foundation (ASF) under one
003 * or more contributor license agreements.  See the NOTICE file
004 * distributed with this work for additional information
005 * regarding copyright ownership.  The ASF licenses this file
006 * to you under the Apache License, Version 2.0 (the
007 * "License"); you may not use this file except in compliance
008 * with the License.  You may obtain a copy of the License at
009 *
010 *     http://www.apache.org/licenses/LICENSE-2.0
011 *
012 * Unless required by applicable law or agreed to in writing, software
013 * distributed under the License is distributed on an "AS IS" BASIS,
014 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
015 * See the License for the specific language governing permissions and
016 * limitations under the License.
017 */
018package org.apache.hadoop.hbase.master;
019
020import java.io.IOException;
021import java.io.UncheckedIOException;
022import java.util.HashMap;
023import org.apache.hadoop.conf.Configuration;
024import org.apache.hadoop.hbase.CompatibilityFactory;
025import org.apache.hadoop.hbase.HBaseClassTestRule;
026import org.apache.hadoop.hbase.HBaseTestingUtility;
027import org.apache.hadoop.hbase.MiniHBaseCluster;
028import org.apache.hadoop.hbase.ServerMetricsBuilder;
029import org.apache.hadoop.hbase.ServerName;
030import org.apache.hadoop.hbase.StartMiniClusterOption;
031import org.apache.hadoop.hbase.YouAreDeadException;
032import org.apache.hadoop.hbase.regionserver.RSRpcServices;
033import org.apache.hadoop.hbase.test.MetricsAssertHelper;
034import org.apache.hadoop.hbase.testclassification.MasterTests;
035import org.apache.hadoop.hbase.testclassification.MediumTests;
036import org.apache.hadoop.hbase.util.EnvironmentEdgeManager;
037import org.apache.zookeeper.KeeperException;
038import org.junit.AfterClass;
039import org.junit.BeforeClass;
040import org.junit.ClassRule;
041import org.junit.Test;
042import org.junit.experimental.categories.Category;
043import org.slf4j.Logger;
044import org.slf4j.LoggerFactory;
045
046import org.apache.hbase.thirdparty.com.google.protobuf.RpcController;
047import org.apache.hbase.thirdparty.com.google.protobuf.ServiceException;
048
049import org.apache.hadoop.hbase.shaded.protobuf.ProtobufUtil;
050import org.apache.hadoop.hbase.shaded.protobuf.generated.ClusterStatusProtos;
051import org.apache.hadoop.hbase.shaded.protobuf.generated.RegionServerStatusProtos;
052import org.apache.hadoop.hbase.shaded.protobuf.generated.RegionServerStatusProtos.RegionServerStartupRequest;
053import org.apache.hadoop.hbase.shaded.protobuf.generated.RegionServerStatusProtos.RegionServerStartupResponse;
054
055@Category({ MasterTests.class, MediumTests.class })
056public class TestMasterMetrics {
057
058  @ClassRule
059  public static final HBaseClassTestRule CLASS_RULE =
060    HBaseClassTestRule.forClass(TestMasterMetrics.class);
061
062  private static final Logger LOG = LoggerFactory.getLogger(TestMasterMetrics.class);
063  private static final MetricsAssertHelper metricsHelper =
064    CompatibilityFactory.getInstance(MetricsAssertHelper.class);
065
066  private static MiniHBaseCluster cluster;
067  private static HMaster master;
068  private static HBaseTestingUtility TEST_UTIL;
069
070  public static class MyMaster extends HMaster {
071    public MyMaster(Configuration conf) throws IOException, KeeperException, InterruptedException {
072      super(conf);
073    }
074
075    @Override
076    protected void tryRegionServerReport(long reportStartTime, long reportEndTime) {
077      // do nothing
078    }
079
080    @Override
081    protected RSRpcServices createRpcServices() throws IOException {
082      return new MasterRpcServices(this) {
083
084        @Override
085        public RegionServerStartupResponse regionServerStartup(RpcController controller,
086          RegionServerStartupRequest request) throws ServiceException {
087          RegionServerStartupResponse resp = super.regionServerStartup(controller, request);
088          ServerManager serverManager = getServerManager();
089          // to let the region server actual online otherwise we can not assign meta region
090          new HashMap<>(serverManager.getOnlineServers()).forEach((sn, sm) -> {
091            if (sm.getLastReportTimestamp() <= 0) {
092              try {
093                serverManager.regionServerReport(sn,
094                  ServerMetricsBuilder.newBuilder(sn).setVersionNumber(sm.getVersionNumber())
095                    .setVersion(sm.getVersion())
096                    .setLastReportTimestamp(EnvironmentEdgeManager.currentTime()).build());
097              } catch (YouAreDeadException e) {
098                throw new UncheckedIOException(e);
099              }
100            }
101          });
102          return resp;
103        }
104      };
105    }
106  }
107
108  @BeforeClass
109  public static void startCluster() throws Exception {
110    LOG.info("Starting cluster");
111    TEST_UTIL = new HBaseTestingUtility();
112    // Set master class and use default values for other options.
113    StartMiniClusterOption option =
114      StartMiniClusterOption.builder().masterClass(MyMaster.class).build();
115    TEST_UTIL.startMiniCluster(option);
116    cluster = TEST_UTIL.getHBaseCluster();
117    LOG.info("Waiting for active/ready master");
118    cluster.waitForActiveAndReadyMaster();
119    master = cluster.getMaster();
120  }
121
122  @AfterClass
123  public static void after() throws Exception {
124    if (TEST_UTIL != null) {
125      TEST_UTIL.shutdownMiniCluster();
126    }
127  }
128
129  @Test
130  public void testClusterRequests() throws Exception {
131
132    // sending fake request to master to see how metric value has changed
133
134    RegionServerStatusProtos.RegionServerReportRequest.Builder request =
135      RegionServerStatusProtos.RegionServerReportRequest.newBuilder();
136    ServerName serverName = cluster.getMaster(0).getServerName();
137    request.setServer(ProtobufUtil.toServerName(serverName));
138    long expectedRequestNumber = 10000;
139
140    MetricsMasterSource masterSource = master.getMasterMetrics().getMetricsSource();
141    ClusterStatusProtos.ServerLoad sl = ClusterStatusProtos.ServerLoad.newBuilder()
142      .setTotalNumberOfRequests(expectedRequestNumber).build();
143    request.setLoad(sl);
144
145    master.getMasterRpcServices().regionServerReport(null, request.build());
146    boolean tablesOnMaster = LoadBalancer.isTablesOnMaster(TEST_UTIL.getConfiguration());
147    if (tablesOnMaster) {
148      metricsHelper.assertCounter("cluster_requests", expectedRequestNumber, masterSource);
149    } else {
150      metricsHelper.assertCounterGt("cluster_requests", expectedRequestNumber, masterSource);
151
152    }
153
154    expectedRequestNumber = 15000;
155
156    sl = ClusterStatusProtos.ServerLoad.newBuilder().setTotalNumberOfRequests(expectedRequestNumber)
157      .build();
158    request.setLoad(sl);
159
160    master.getMasterRpcServices().regionServerReport(null, request.build());
161    if (tablesOnMaster) {
162      metricsHelper.assertCounter("cluster_requests", expectedRequestNumber, masterSource);
163    } else {
164      metricsHelper.assertCounterGt("cluster_requests", expectedRequestNumber, masterSource);
165    }
166
167    master.stopMaster();
168  }
169
170  @Test
171  public void testDefaultMasterMetrics() throws Exception {
172    MetricsMasterSource masterSource = master.getMasterMetrics().getMetricsSource();
173    boolean tablesOnMaster = LoadBalancer.isTablesOnMaster(TEST_UTIL.getConfiguration());
174    metricsHelper.assertGauge("numRegionServers", 1 + (tablesOnMaster ? 1 : 0), masterSource);
175    metricsHelper.assertGauge("averageLoad", 1 + (tablesOnMaster ? 0 : 1), masterSource);
176    metricsHelper.assertGauge("numDeadRegionServers", 0, masterSource);
177    metricsHelper.assertGauge("numDrainingRegionServers", 0, masterSource);
178
179    metricsHelper.assertGauge("masterStartTime", master.getMasterStartTime(), masterSource);
180    metricsHelper.assertGauge("masterActiveTime", master.getMasterActiveTime(), masterSource);
181
182    metricsHelper.assertTag("isActiveMaster", "true", masterSource);
183    metricsHelper.assertTag("serverName", master.getServerName().toString(), masterSource);
184    metricsHelper.assertTag("clusterId", master.getClusterId(), masterSource);
185    metricsHelper.assertTag("zookeeperQuorum", master.getZooKeeper().getQuorum(), masterSource);
186
187    metricsHelper.assertCounter(MetricsMasterSource.SERVER_CRASH_METRIC_PREFIX + "SubmittedCount",
188      0, masterSource);
189    metricsHelper.assertGauge("oldWALsDirSize", master.getMasterWalManager().getOldWALsDirSize(),
190      masterSource);
191  }
192
193  @Test
194  public void testDefaultMasterProcMetrics() throws Exception {
195    MetricsMasterProcSource masterSource = master.getMasterMetrics().getMetricsProcSource();
196    metricsHelper.assertGauge("numMasterWALs", master.getNumWALFiles(), masterSource);
197  }
198}