1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19 package org.apache.hadoop.hbase.master;
20
21 import java.io.File;
22 import java.io.IOException;
23 import java.util.List;
24
25 import org.apache.commons.cli.CommandLine;
26 import org.apache.commons.cli.GnuParser;
27 import org.apache.commons.cli.Options;
28 import org.apache.commons.cli.ParseException;
29 import org.apache.commons.logging.Log;
30 import org.apache.commons.logging.LogFactory;
31 import org.apache.hadoop.hbase.classification.InterfaceAudience;
32 import org.apache.hadoop.conf.Configuration;
33 import org.apache.hadoop.hbase.CoordinatedStateManager;
34 import org.apache.hadoop.hbase.CoordinatedStateManagerFactory;
35 import org.apache.hadoop.hbase.HConstants;
36 import org.apache.hadoop.hbase.LocalHBaseCluster;
37 import org.apache.hadoop.hbase.MasterNotRunningException;
38 import org.apache.hadoop.hbase.ZNodeClearer;
39 import org.apache.hadoop.hbase.ZooKeeperConnectionException;
40 import org.apache.hadoop.hbase.client.Admin;
41 import org.apache.hadoop.hbase.client.HBaseAdmin;
42 import org.apache.hadoop.hbase.regionserver.HRegionServer;
43 import org.apache.hadoop.hbase.util.JVMClusterUtil;
44 import org.apache.hadoop.hbase.util.ServerCommandLine;
45 import org.apache.hadoop.hbase.zookeeper.MiniZooKeeperCluster;
46 import org.apache.hadoop.hbase.zookeeper.ZKUtil;
47 import org.apache.hadoop.metrics2.lib.DefaultMetricsSystem;
48 import org.apache.zookeeper.KeeperException;
49
50 @InterfaceAudience.Private
51 public class HMasterCommandLine extends ServerCommandLine {
52 private static final Log LOG = LogFactory.getLog(HMasterCommandLine.class);
53
54 private static final String USAGE =
55 "Usage: Master [opts] start|stop|clear\n" +
56 " start Start Master. If local mode, start Master and RegionServer in same JVM\n" +
57 " stop Start cluster shutdown; Master signals RegionServer shutdown\n" +
58 " clear Delete the master znode in ZooKeeper after a master crashes\n "+
59 " where [opts] are:\n" +
60 " --minRegionServers=<servers> Minimum RegionServers needed to host user tables.\n" +
61 " --localRegionServers=<servers> " +
62 "RegionServers to start in master process when in standalone mode.\n" +
63 " --masters=<servers> Masters to start in this process.\n" +
64 " --backup Master should start in backup mode";
65
66 private final Class<? extends HMaster> masterClass;
67
/**
 * Creates a command-line driver bound to a particular master implementation.
 *
 * @param masterClass the master class to remember; it is stored as-is in {@code masterClass}
 */
public HMasterCommandLine(final Class<? extends HMaster> masterClass) {
  this.masterClass = masterClass;
}
71
72 protected String getUsage() {
73 return USAGE;
74 }
75
76
77 public int run(String args[]) throws Exception {
78 Options opt = new Options();
79 opt.addOption("localRegionServers", true,
80 "RegionServers to start in master process when running standalone");
81 opt.addOption("masters", true, "Masters to start in this process");
82 opt.addOption("minRegionServers", true, "Minimum RegionServers needed to host user tables");
83 opt.addOption("backup", false, "Do not try to become HMaster until the primary fails");
84
85 CommandLine cmd;
86 try {
87 cmd = new GnuParser().parse(opt, args);
88 } catch (ParseException e) {
89 LOG.error("Could not parse: ", e);
90 usage(null);
91 return 1;
92 }
93
94
95 if (cmd.hasOption("minRegionServers")) {
96 String val = cmd.getOptionValue("minRegionServers");
97 getConf().setInt("hbase.regions.server.count.min",
98 Integer.valueOf(val));
99 LOG.debug("minRegionServers set to " + val);
100 }
101
102
103 if (cmd.hasOption("minServers")) {
104 String val = cmd.getOptionValue("minServers");
105 getConf().setInt("hbase.regions.server.count.min",
106 Integer.valueOf(val));
107 LOG.debug("minServers set to " + val);
108 }
109
110
111 if (cmd.hasOption("backup")) {
112 getConf().setBoolean(HConstants.MASTER_TYPE_BACKUP, true);
113 }
114
115
116
117 if (cmd.hasOption("localRegionServers")) {
118 String val = cmd.getOptionValue("localRegionServers");
119 getConf().setInt("hbase.regionservers", Integer.valueOf(val));
120 LOG.debug("localRegionServers set to " + val);
121 }
122
123 if (cmd.hasOption("masters")) {
124 String val = cmd.getOptionValue("masters");
125 getConf().setInt("hbase.masters", Integer.valueOf(val));
126 LOG.debug("masters set to " + val);
127 }
128
129 @SuppressWarnings("unchecked")
130 List<String> remainingArgs = cmd.getArgList();
131 if (remainingArgs.size() != 1) {
132 usage(null);
133 return 1;
134 }
135
136 String command = remainingArgs.get(0);
137
138 if ("start".equals(command)) {
139 return startMaster();
140 } else if ("stop".equals(command)) {
141 return stopMaster();
142 } else if ("clear".equals(command)) {
143 return (ZNodeClearer.clear(getConf()) ? 0 : 1);
144 } else {
145 usage("Invalid command: " + command);
146 return 1;
147 }
148 }
149
150 private int startMaster() {
151 Configuration conf = getConf();
152 try {
153
154
155 if (LocalHBaseCluster.isLocal(conf)) {
156 DefaultMetricsSystem.setMiniClusterMode(true);
157 final MiniZooKeeperCluster zooKeeperCluster = new MiniZooKeeperCluster(conf);
158 File zkDataPath = new File(conf.get(HConstants.ZOOKEEPER_DATA_DIR));
159
160
161 int zkClientPort = 0;
162
163
164 String zkserver = conf.get(HConstants.ZOOKEEPER_QUORUM);
165 if (zkserver != null) {
166 String[] zkservers = zkserver.split(",");
167
168 if (zkservers.length > 1) {
169
170
171 String errorMsg = "Could not start ZK with " + zkservers.length +
172 " ZK servers in local mode deployment. Aborting as clients (e.g. shell) will not "
173 + "be able to find this ZK quorum.";
174 System.err.println(errorMsg);
175 throw new IOException(errorMsg);
176 }
177
178 String[] parts = zkservers[0].split(":");
179
180 if (parts.length == 2) {
181
182 zkClientPort = Integer.parseInt(parts [1]);
183 }
184 }
185
186 if (zkClientPort == 0) {
187 zkClientPort = conf.getInt(HConstants.ZOOKEEPER_CLIENT_PORT, 0);
188
189 if (zkClientPort == 0) {
190 throw new IOException("No config value for " + HConstants.ZOOKEEPER_CLIENT_PORT);
191 }
192 }
193 zooKeeperCluster.setDefaultClientPort(zkClientPort);
194
195 int zkTickTime = conf.getInt(HConstants.ZOOKEEPER_TICK_TIME, 0);
196 if (zkTickTime > 0) {
197 zooKeeperCluster.setTickTime(zkTickTime);
198 }
199
200
201 ZKUtil.loginServer(conf, "hbase.zookeeper.server.keytab.file",
202 "hbase.zookeeper.server.kerberos.principal", null);
203 int localZKClusterSessionTimeout =
204 conf.getInt(HConstants.ZK_SESSION_TIMEOUT + ".localHBaseCluster", 10*1000);
205 conf.setInt(HConstants.ZK_SESSION_TIMEOUT, localZKClusterSessionTimeout);
206 LOG.info("Starting a zookeeper cluster");
207 int clientPort = zooKeeperCluster.startup(zkDataPath);
208 if (clientPort != zkClientPort) {
209 String errorMsg = "Could not start ZK at requested port of " +
210 zkClientPort + ". ZK was started at port: " + clientPort +
211 ". Aborting as clients (e.g. shell) will not be able to find " +
212 "this ZK quorum.";
213 System.err.println(errorMsg);
214 throw new IOException(errorMsg);
215 }
216 conf.set(HConstants.ZOOKEEPER_CLIENT_PORT, Integer.toString(clientPort));
217
218
219
220 int mastersCount = conf.getInt("hbase.masters", 1);
221 int regionServersCount = conf.getInt("hbase.regionservers", 1);
222
223 conf.setIfUnset("hbase.master.start.timeout.localHBaseCluster", "300000");
224 LOG.info("Starting up instance of localHBaseCluster; master=" + mastersCount +
225 ", regionserversCount=" + regionServersCount);
226 LocalHBaseCluster cluster = new LocalHBaseCluster(conf, mastersCount, regionServersCount,
227 LocalHMaster.class, HRegionServer.class);
228 ((LocalHMaster)cluster.getMaster(0)).setZKCluster(zooKeeperCluster);
229 cluster.startup();
230 waitOnMasterThreads(cluster);
231 } else {
232 logProcessInfo(getConf());
233 CoordinatedStateManager csm =
234 CoordinatedStateManagerFactory.getCoordinatedStateManager(conf);
235 HMaster master = HMaster.constructMaster(masterClass, conf, csm);
236 if (master.isStopped()) {
237 LOG.info("Won't bring the Master up as a shutdown is requested");
238 return 1;
239 }
240 master.start();
241 master.join();
242 if(master.isAborted())
243 throw new RuntimeException("HMaster Aborted");
244 }
245 } catch (Throwable t) {
246 LOG.error("Master exiting", t);
247 return 1;
248 }
249 return 0;
250 }
251
252 @SuppressWarnings("resource")
253 private int stopMaster() {
254 Admin adm = null;
255 try {
256 Configuration conf = getConf();
257
258 conf.setInt(HConstants.HBASE_CLIENT_RETRIES_NUMBER, 1);
259 adm = new HBaseAdmin(getConf());
260 } catch (MasterNotRunningException e) {
261 LOG.error("Master not running");
262 return 1;
263 } catch (ZooKeeperConnectionException e) {
264 LOG.error("ZooKeeper not available");
265 return 1;
266 } catch (IOException e) {
267 LOG.error("Got IOException: " +e.getMessage(), e);
268 return 1;
269 }
270 try {
271 adm.shutdown();
272 } catch (Throwable t) {
273 LOG.error("Failed to stop master", t);
274 return 1;
275 }
276 return 0;
277 }
278
279 private void waitOnMasterThreads(LocalHBaseCluster cluster) throws InterruptedException{
280 List<JVMClusterUtil.MasterThread> masters = cluster.getMasters();
281 List<JVMClusterUtil.RegionServerThread> regionservers = cluster.getRegionServers();
282
283 if (masters != null) {
284 for (JVMClusterUtil.MasterThread t : masters) {
285 t.join();
286 if(t.getMaster().isAborted()) {
287 closeAllRegionServerThreads(regionservers);
288 throw new RuntimeException("HMaster Aborted");
289 }
290 }
291 }
292 }
293
294 private static void closeAllRegionServerThreads(
295 List<JVMClusterUtil.RegionServerThread> regionservers) {
296 for(JVMClusterUtil.RegionServerThread t : regionservers){
297 t.getRegionServer().stop("HMaster Aborted; Bringing down regions servers");
298 }
299 }
300
301
302
303
304 public static class LocalHMaster extends HMaster {
305 private MiniZooKeeperCluster zkcluster = null;
306
307 public LocalHMaster(Configuration conf, CoordinatedStateManager csm)
308 throws IOException, KeeperException, InterruptedException {
309 super(conf, csm);
310 }
311
312 @Override
313 public void run() {
314 super.run();
315 if (this.zkcluster != null) {
316 try {
317 this.zkcluster.shutdown();
318 } catch (IOException e) {
319 e.printStackTrace();
320 }
321 }
322 }
323
324 void setZKCluster(final MiniZooKeeperCluster zkcluster) {
325 this.zkcluster = zkcluster;
326 }
327 }
328 }