001/* 002 * Licensed to the Apache Software Foundation (ASF) under one 003 * or more contributor license agreements. See the NOTICE file 004 * distributed with this work for additional information 005 * regarding copyright ownership. The ASF licenses this file 006 * to you under the Apache License, Version 2.0 (the 007 * "License"); you may not use this file except in compliance 008 * with the License. You may obtain a copy of the License at 009 * 010 * http://www.apache.org/licenses/LICENSE-2.0 011 * 012 * Unless required by applicable law or agreed to in writing, software 013 * distributed under the License is distributed on an "AS IS" BASIS, 014 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. 015 * See the License for the specific language governing permissions and 016 * limitations under the License. 017 */ 018package org.apache.hadoop.hbase.chaos.factories; 019 020import org.apache.hadoop.hbase.chaos.actions.Action; 021import org.apache.hadoop.hbase.chaos.actions.DumpClusterStatusAction; 022import org.apache.hadoop.hbase.chaos.actions.DumpHdfsClusterStatusAction; 023import org.apache.hadoop.hbase.chaos.actions.ForceBalancerAction; 024import org.apache.hadoop.hbase.chaos.actions.GracefulRollingRestartRsAction; 025import org.apache.hadoop.hbase.chaos.actions.RestartActiveMasterAction; 026import org.apache.hadoop.hbase.chaos.actions.RestartActiveNameNodeAction; 027import org.apache.hadoop.hbase.chaos.actions.RestartRandomDataNodeAction; 028import org.apache.hadoop.hbase.chaos.actions.RestartRandomJournalNodeAction; 029import org.apache.hadoop.hbase.chaos.actions.RestartRandomRsExceptMetaAction; 030import org.apache.hadoop.hbase.chaos.actions.RestartRandomZKNodeAction; 031import org.apache.hadoop.hbase.chaos.actions.RollingBatchRestartRsAction; 032import org.apache.hadoop.hbase.chaos.actions.RollingBatchSuspendResumeRsAction; 033import org.apache.hadoop.hbase.chaos.monkies.ChaosMonkey; 034import org.apache.hadoop.hbase.chaos.monkies.PolicyBasedChaosMonkey; 035import org.apache.hadoop.hbase.chaos.policies.CompositeSequentialPolicy; 036import org.apache.hadoop.hbase.chaos.policies.DoActionsOncePolicy; 037import org.apache.hadoop.hbase.chaos.policies.PeriodicRandomActionPolicy; 038 039/** 040 * Creates ChaosMonkeys for doing server restart actions, but not flush / compact / snapshot kind of 041 * actions. 042 */ 043public class ServerAndDependenciesKillingMonkeyFactory extends MonkeyFactory { 044 045 @Override 046 public ChaosMonkey build() { 047 loadProperties(); 048 049 // Destructive actions to mess things around. Cannot run batch restart. 050 // @formatter:off 051 Action[] actions1 = new Action[] { 052 new RestartRandomRsExceptMetaAction(restartRandomRsExceptMetaSleepTime), 053 new RestartActiveMasterAction(restartActiveMasterSleepTime), 054 // only allow 2 servers to be dead. 055 new RollingBatchRestartRsAction(rollingBatchRestartRSSleepTime, 1.0f, 2, true), 056 new ForceBalancerAction(), 057 new RestartActiveNameNodeAction(restartActiveNameNodeSleepTime), 058 new RestartRandomDataNodeAction(restartRandomDataNodeSleepTime), 059 new RestartRandomJournalNodeAction(restartRandomJournalNodeSleepTime), 060 new RestartRandomZKNodeAction(restartRandomZKNodeSleepTime), 061 new GracefulRollingRestartRsAction(gracefulRollingRestartTSSLeepTime), 062 new RollingBatchSuspendResumeRsAction(rollingBatchSuspendRSSleepTime, 063 rollingBatchSuspendRSRatio) 064 }; 065 // @formatter:on 066 067 // Action to log more info for debugging 068 Action[] actions2 = 069 new Action[] { new DumpClusterStatusAction(), new DumpHdfsClusterStatusAction() }; 070 071 return new PolicyBasedChaosMonkey(properties, util, 072 new CompositeSequentialPolicy(new DoActionsOncePolicy(action1Period, actions1), 073 new PeriodicRandomActionPolicy(action1Period, actions1)), 074 new PeriodicRandomActionPolicy(action1Period, actions2)); 075 } 076}