View Javadoc

1   /**
2    * Licensed to the Apache Software Foundation (ASF) under one
3    * or more contributor license agreements.  See the NOTICE file
4    * distributed with this work for additional information
5    * regarding copyright ownership.  The ASF licenses this file
6    * to you under the Apache License, Version 2.0 (the
7    * "License"); you may not use this file except in compliance
8    * with the License.  You may obtain a copy of the License at
9    *
10   *     http://www.apache.org/licenses/LICENSE-2.0
11   *
12   * Unless required by applicable law or agreed to in writing, software
13   * distributed under the License is distributed on an "AS IS" BASIS,
14   * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
15   * See the License for the specific language governing permissions and
16   * limitations under the License.
17   */
18  package org.apache.hadoop.hbase.master.snapshot;
19  
20  import java.io.IOException;
21  import java.util.HashSet;
22  import java.util.List;
23  import java.util.Set;
24  
25  import org.apache.commons.logging.Log;
26  import org.apache.commons.logging.LogFactory;
27  import org.apache.hadoop.classification.InterfaceAudience;
28  import org.apache.hadoop.fs.Path;
29  import org.apache.hadoop.hbase.HRegionInfo;
30  import org.apache.hadoop.hbase.ServerName;
31  import org.apache.hadoop.hbase.errorhandling.ForeignException;
32  import org.apache.hadoop.hbase.master.MasterServices;
33  import org.apache.hadoop.hbase.master.metrics.MasterMetrics;
34  import org.apache.hadoop.hbase.procedure.Procedure;
35  import org.apache.hadoop.hbase.procedure.ProcedureCoordinator;
36  import org.apache.hadoop.hbase.protobuf.generated.HBaseProtos.SnapshotDescription;
37  import org.apache.hadoop.hbase.regionserver.HRegion;
38  import org.apache.hadoop.hbase.snapshot.HBaseSnapshotException;
39  import org.apache.hadoop.hbase.snapshot.SnapshotDescriptionUtils;
40  import org.apache.hadoop.hbase.util.Pair;
41  
42  import com.google.common.collect.Lists;
43  
44  /**
45   * Handle the master side of taking a snapshot of an online table, regardless of snapshot type.
46   * Uses a {@link Procedure} to run the snapshot across all the involved region servers.
47   * @see ProcedureCoordinator
48   */
49  @InterfaceAudience.Private
50  public class EnabledTableSnapshotHandler extends TakeSnapshotHandler {
51  
52    private static final Log LOG = LogFactory.getLog(EnabledTableSnapshotHandler.class);
53    private final ProcedureCoordinator coordinator;
54  
55    public EnabledTableSnapshotHandler(SnapshotDescription snapshot, MasterServices master,
56        final SnapshotManager manager, final MasterMetrics metricsMaster) {
57      super(snapshot, master, metricsMaster);
58      this.coordinator = manager.getCoordinator();
59    }
60  
61    // TODO consider switching over to using regionnames, rather than server names. This would allow
62    // regions to migrate during a snapshot, and then be involved when they are ready. Still want to
63    // enforce a snapshot time constraints, but lets us be potentially a bit more robust.
64  
65    /**
66     * This method kicks off a snapshot procedure.  Other than that it hangs around for various
67     * phases to complete.
68     */
69    @Override
70    protected void snapshotRegions(List<Pair<HRegionInfo, ServerName>> regions)
71        throws HBaseSnapshotException, IOException {
72      Set<String> regionServers = new HashSet<String>(regions.size());
73      for (Pair<HRegionInfo, ServerName> region : regions) {
74        if (region != null && region.getFirst() != null && region.getSecond() != null) {
75          HRegionInfo hri = region.getFirst();
76          if (hri.isOffline() && (hri.isSplit() || hri.isSplitParent())) continue;
77          regionServers.add(region.getSecond().toString());
78        }
79      }
80  
81      // start the snapshot on the RS
82      Procedure proc = coordinator.startProcedure(this.monitor, this.snapshot.getName(),
83        this.snapshot.toByteArray(), Lists.newArrayList(regionServers));
84      if (proc == null) {
85        String msg = "Failed to submit distributed procedure for snapshot '"
86            + snapshot.getName() + "'";
87        LOG.error(msg);
88        throw new HBaseSnapshotException(msg);
89      }
90  
91      try {
92        // wait for the snapshot to complete.  A timer thread is kicked off that should cancel this
93        // if it takes too long.
94        proc.waitForCompleted();
95        LOG.info("Done waiting - online snapshot for " + this.snapshot.getName());
96  
97        // Take the offline regions as disabled
98        Path snapshotDir = SnapshotDescriptionUtils.getWorkingSnapshotDir(snapshot, rootDir);
99        for (Pair<HRegionInfo, ServerName> region : regions) {
100         HRegionInfo regionInfo = region.getFirst();
101         if (regionInfo.isOffline() && (regionInfo.isSplit() || regionInfo.isSplitParent())) {
102           if (!fs.exists(new Path(snapshotDir, regionInfo.getEncodedName()))) {
103             LOG.info("Take disabled snapshot of offline region=" + regionInfo);
104             snapshotDisabledRegion(regionInfo);
105           }
106         }
107       }
108     } catch (InterruptedException e) {
109       ForeignException ee =
110           new ForeignException("Interrupted while waiting for snapshot to finish", e);
111       monitor.receive(ee);
112       Thread.currentThread().interrupt();
113     } catch (ForeignException e) {
114       monitor.receive(e);
115     }
116   }
117 }