001/*
002 * Licensed to the Apache Software Foundation (ASF) under one
003 * or more contributor license agreements.  See the NOTICE file
004 * distributed with this work for additional information
005 * regarding copyright ownership.  The ASF licenses this file
006 * to you under the Apache License, Version 2.0 (the
007 * "License"); you may not use this file except in compliance
008 * with the License.  You may obtain a copy of the License at
009 *
010 *     http://www.apache.org/licenses/LICENSE-2.0
011 *
012 * Unless required by applicable law or agreed to in writing, software
013 * distributed under the License is distributed on an "AS IS" BASIS,
014 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
015 * See the License for the specific language governing permissions and
016 * limitations under the License.
017 */
018package org.apache.hadoop.hbase.chaos.factories;
019
020import org.apache.hadoop.hbase.chaos.actions.Action;
021import org.apache.hadoop.hbase.chaos.actions.DumpClusterStatusAction;
022import org.apache.hadoop.hbase.chaos.actions.DumpHdfsClusterStatusAction;
023import org.apache.hadoop.hbase.chaos.actions.ForceBalancerAction;
024import org.apache.hadoop.hbase.chaos.actions.GracefulRollingRestartRsAction;
025import org.apache.hadoop.hbase.chaos.actions.RestartActiveMasterAction;
026import org.apache.hadoop.hbase.chaos.actions.RestartActiveNameNodeAction;
027import org.apache.hadoop.hbase.chaos.actions.RestartRandomDataNodeAction;
028import org.apache.hadoop.hbase.chaos.actions.RestartRandomJournalNodeAction;
029import org.apache.hadoop.hbase.chaos.actions.RestartRandomRsExceptMetaAction;
030import org.apache.hadoop.hbase.chaos.actions.RestartRandomZKNodeAction;
031import org.apache.hadoop.hbase.chaos.actions.RollingBatchRestartRsAction;
032import org.apache.hadoop.hbase.chaos.actions.RollingBatchSuspendResumeRsAction;
033import org.apache.hadoop.hbase.chaos.monkies.ChaosMonkey;
034import org.apache.hadoop.hbase.chaos.monkies.PolicyBasedChaosMonkey;
035import org.apache.hadoop.hbase.chaos.policies.CompositeSequentialPolicy;
036import org.apache.hadoop.hbase.chaos.policies.DoActionsOncePolicy;
037import org.apache.hadoop.hbase.chaos.policies.PeriodicRandomActionPolicy;
038
039/**
040 * Creates ChaosMonkeys for doing server restart actions, but not flush / compact / snapshot kind of
041 * actions.
042 */
043public class ServerAndDependenciesKillingMonkeyFactory extends MonkeyFactory {
044
045  @Override
046  public ChaosMonkey build() {
047    loadProperties();
048
049    // Destructive actions to mess things around. Cannot run batch restart.
050    // @formatter:off
051    Action[] actions1 = new Action[] {
052      new RestartRandomRsExceptMetaAction(restartRandomRsExceptMetaSleepTime),
053      new RestartActiveMasterAction(restartActiveMasterSleepTime),
054      // only allow 2 servers to be dead.
055      new RollingBatchRestartRsAction(rollingBatchRestartRSSleepTime, 1.0f, 2, true),
056      new ForceBalancerAction(),
057      new RestartActiveNameNodeAction(restartActiveNameNodeSleepTime),
058      new RestartRandomDataNodeAction(restartRandomDataNodeSleepTime),
059      new RestartRandomJournalNodeAction(restartRandomJournalNodeSleepTime),
060      new RestartRandomZKNodeAction(restartRandomZKNodeSleepTime),
061      new GracefulRollingRestartRsAction(gracefulRollingRestartTSSLeepTime),
062      new RollingBatchSuspendResumeRsAction(rollingBatchSuspendRSSleepTime,
063          rollingBatchSuspendRSRatio)
064    };
065    // @formatter:on
066
067    // Action to log more info for debugging
068    Action[] actions2 =
069      new Action[] { new DumpClusterStatusAction(), new DumpHdfsClusterStatusAction() };
070
071    return new PolicyBasedChaosMonkey(properties, util,
072      new CompositeSequentialPolicy(new DoActionsOncePolicy(action1Period, actions1),
073        new PeriodicRandomActionPolicy(action1Period, actions1)),
074      new PeriodicRandomActionPolicy(action1Period, actions2));
075  }
076}