masterd.py 21.4 KB
Newer Older
1
#
Iustin Pop's avatar
Iustin Pop committed
2
3
#

4
# Copyright (C) 2006, 2007, 2010, 2011 Google Inc.
Iustin Pop's avatar
Iustin Pop committed
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful, but
# WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
# General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
# 02110-1301, USA.


"""Master daemon program.

Some classes deviate from the standard style guide since the
inheritance from parent classes requires it.

"""

Iustin Pop's avatar
Iustin Pop committed
29
30
# pylint: disable-msg=C0103
# C0103: Invalid name ganeti-masterd
Iustin Pop's avatar
Iustin Pop committed
31

32
33
34
import grp
import os
import pwd
35
import sys
36
import socket
Iustin Pop's avatar
Iustin Pop committed
37
import time
38
import tempfile
39
import logging
Iustin Pop's avatar
Iustin Pop committed
40

41
from optparse import OptionParser
Iustin Pop's avatar
Iustin Pop committed
42

43
from ganeti import config
Iustin Pop's avatar
Iustin Pop committed
44
from ganeti import constants
45
from ganeti import daemon
Iustin Pop's avatar
Iustin Pop committed
46
47
48
from ganeti import mcpu
from ganeti import opcodes
from ganeti import jqueue
49
from ganeti import locking
Iustin Pop's avatar
Iustin Pop committed
50
51
from ganeti import luxi
from ganeti import utils
52
53
from ganeti import errors
from ganeti import ssconf
54
from ganeti import workerpool
55
from ganeti import rpc
56
from ganeti import bootstrap
57
from ganeti import netutils
58
from ganeti import objects
59
from ganeti import query
60
61


62
63
# Passed to workerpool.WorkerPool when the "ClientReq" pool is created;
# presumably the number of ClientRequestWorker threads (confirm against
# workerpool.WorkerPool)
CLIENT_REQUEST_WORKERS = 16

# Module-level aliases for exit codes defined in the constants module
EXIT_NOTMASTER = constants.EXIT_NOTMASTER
EXIT_NODESETUP_ERROR = constants.EXIT_NODESETUP_ERROR
Iustin Pop's avatar
Iustin Pop committed
66
67


68
class ClientRequestWorker(workerpool.BaseWorker):
69
  # pylint: disable-msg=W0221
70
  def RunTask(self, server, message, client):
71
72
73
    """Process the request.

    """
74
75
    client_ops = ClientOps(server)

76
    try:
77
      (method, args, version) = luxi.ParseRequest(message)
78
79
80
81
82
83
84
    except luxi.ProtocolError, err:
      logging.error("Protocol Error: %s", err)
      client.close_log()
      return

    success = False
    try:
85
86
87
88
89
      # Verify client's version if there was one in the request
      if version is not None and version != constants.LUXI_VERSION:
        raise errors.LuxiError("LUXI version mismatch, server %s, request %s" %
                               (constants.LUXI_VERSION, version))

90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
      result = client_ops.handle_request(method, args)
      success = True
    except errors.GenericError, err:
      logging.exception("Unexpected exception")
      success = False
      result = errors.EncodeException(err)
    except:
      logging.exception("Unexpected exception")
      err = sys.exc_info()
      result = "Caught exception: %s" % str(err[1])

    try:
      reply = luxi.FormatResponse(success, result)
      client.send_message(reply)
      # awake the main thread so that it can write out the data.
      server.awaker.signal()
106
    except: # pylint: disable-msg=W0702
107
108
109
110
111
112
113
114
115
116
117
118
119
120
121
122
123
      logging.exception("Send error")
      client.close_log()


class MasterClientHandler(daemon.AsyncTerminatedMessageStream):
  """Handler for master peers.

  """
  # Passed as the last argument to the base class constructor; presumably the
  # number of not-yet-handled messages allowed per client (confirm against
  # daemon.AsyncTerminatedMessageStream)
  _MAX_UNHANDLED = 1

  def __init__(self, server, connected_socket, client_address, family):
    """Initializes the handler for one connected client.

    @param server: the server object owning this connection; its
        C{request_workers} pool receives the incoming messages
    @param connected_socket: passed through to the base class
    @param client_address: passed through to the base class
    @param family: passed through to the base class

    """
    daemon.AsyncTerminatedMessageStream.__init__(self, connected_socket,
                                                 client_address,
                                                 constants.LUXI_EOM,
                                                 family, self._MAX_UNHANDLED)
    self.server = server

  def handle_message(self, message, _):
    """Queues a received message on the server's request worker pool.

    The task consists of the server, the message and this handler.

    """
    self.server.request_workers.AddTask((self.server, message, self))
125
126


127
128
class MasterServer(daemon.AsyncStreamServer):
  """Master Server.
Iustin Pop's avatar
Iustin Pop committed
129

130
131
  This is the main asynchronous master server. It handles connections to the
  master socket.
Iustin Pop's avatar
Iustin Pop committed
132
133

  """
134
135
136
  family = socket.AF_UNIX

  def __init__(self, mainloop, address, uid, gid):
137
    """MasterServer constructor
138

139
140
141
    @type mainloop: ganeti.daemon.Mainloop
    @param mainloop: Mainloop used to poll for I/O events
    @param address: the unix socket address to bind the MasterServer to
142
143
    @param uid: The uid of the owner of the socket
    @param gid: The gid of the owner of the socket
144
145

    """
146
    temp_name = tempfile.mktemp(dir=os.path.dirname(address))
147
    daemon.AsyncStreamServer.__init__(self, self.family, temp_name)
148
149
150
151
    os.chmod(temp_name, 0770)
    os.chown(temp_name, uid, gid)
    os.rename(temp_name, address)

152
    self.mainloop = mainloop
153
    self.awaker = daemon.AsyncAwaker()
154
155

    # We'll only start threads once we've forked.
156
    self.context = None
157
    self.request_workers = None
158

159
  def handle_connection(self, connected_socket, client_address):
160
161
162
    # TODO: add connection count and limit the number of open connections to a
    # maximum number to avoid breaking for lack of file descriptors or memory.
    MasterClientHandler(self, connected_socket, client_address, self.family)
163

164
  def setup_queue(self):
165
    self.context = GanetiContext()
166
167
    self.request_workers = workerpool.WorkerPool("ClientReq",
                                                 CLIENT_REQUEST_WORKERS,
168
                                                 ClientRequestWorker)
Iustin Pop's avatar
Iustin Pop committed
169

170
171
172
173
174
175
176
  def server_cleanup(self):
    """Cleanup the server.

    This involves shutting down the processor threads and the master
    socket.

    """
177
    try:
178
      self.close()
179
    finally:
180
      if self.request_workers:
181
        self.request_workers.TerminateWorkers()
182
183
      if self.context:
        self.context.jobqueue.Shutdown()
Iustin Pop's avatar
Iustin Pop committed
184
185
186
187
188
189
190


class ClientOps:
  """Class holding high-level client operations."""
  def __init__(self, server):
    """Stores the server whose context is used to serve requests.

    """
    self.server = server

  def handle_request(self, method, args): # pylint: disable-msg=R0911
    """Executes the operation selected by a client request.

    @param method: the request type, compared against the C{luxi.REQ_*}
        constants
    @param args: the request arguments; their layout depends on C{method}
    @return: the result of the selected operation
    @raise ValueError: if C{method} is not a known request type

    """
    queue = self.server.context.jobqueue

    # TODO: Parameter validation

    # TODO: Rewrite to not exit in each 'if/elif' branch

    if method == luxi.REQ_SUBMIT_JOB:
      logging.info("Received new job")
      ops = [opcodes.OpCode.LoadOpCode(state) for state in args]
      return queue.SubmitJob(ops)

    elif method == luxi.REQ_SUBMIT_MANY_JOBS:
      logging.info("Received multiple jobs")
      jobs = []
      for ops in args:
        jobs.append([opcodes.OpCode.LoadOpCode(state) for state in ops])
      return queue.SubmitManyJobs(jobs)

    elif method == luxi.REQ_CANCEL_JOB:
      job_id = args
      logging.info("Received job cancel request for %s", job_id)
      return queue.CancelJob(job_id)

    elif method == luxi.REQ_ARCHIVE_JOB:
      job_id = args
      logging.info("Received job archive request for %s", job_id)
      return queue.ArchiveJob(job_id)

    elif method == luxi.REQ_AUTOARCHIVE_JOBS:
      (age, timeout) = args
      logging.info("Received job autoarchive request for age %s, timeout %s",
                   age, timeout)
      return queue.AutoArchiveJobs(age, timeout)

    elif method == luxi.REQ_WAIT_FOR_JOB_CHANGE:
      (job_id, fields, prev_job_info, prev_log_serial, timeout) = args
      logging.info("Received job poll request for %s", job_id)
      return queue.WaitForJobChanges(job_id, fields, prev_job_info,
                                     prev_log_serial, timeout)

    elif method == luxi.REQ_QUERY:
      req = objects.QueryRequest.FromDict(args)

      if req.what in constants.QR_OP_QUERY:
        result = self._Query(opcodes.OpQuery(what=req.what, fields=req.fields,
                                             filter=req.filter))
      elif req.what == constants.QR_LOCK:
        # Locks are queried directly from the lock manager, not via an opcode
        if req.filter is not None:
          raise errors.OpPrereqError("Lock queries can't be filtered",
                                     errors.ECODE_INVAL)
        return self.server.context.glm.QueryLocks(req.fields)
      elif req.what in constants.QR_OP_LUXI:
        raise NotImplementedError
      else:
        raise errors.OpPrereqError("Resource type '%s' unknown" % req.what,
                                   errors.ECODE_INVAL)

      return result

    elif method == luxi.REQ_QUERY_FIELDS:
      req = objects.QueryFieldsRequest.FromDict(args)

      if req.what in constants.QR_OP_QUERY:
        result = self._Query(opcodes.OpQueryFields(what=req.what,
                                                   fields=req.fields))
      elif req.what == constants.QR_LOCK:
        return query.QueryFields(query.LOCK_FIELDS, req.fields)
      elif req.what in constants.QR_OP_LUXI:
        raise NotImplementedError
      else:
        raise errors.OpPrereqError("Resource type '%s' unknown" % req.what,
                                   errors.ECODE_INVAL)

      return result

    elif method == luxi.REQ_QUERY_JOBS:
      (job_ids, fields) = args
      if isinstance(job_ids, (tuple, list)) and job_ids:
        msg = utils.CommaJoin(job_ids)
      else:
        msg = str(job_ids)
      logging.info("Received job query request for %s", msg)
      return queue.QueryJobs(job_ids, fields)

    elif method == luxi.REQ_QUERY_INSTANCES:
      (names, fields, use_locking) = args
      logging.info("Received instance query request for %s", names)
      if use_locking:
        raise errors.OpPrereqError("Sync queries are not allowed",
                                   errors.ECODE_INVAL)
      op = opcodes.OpInstanceQuery(names=names, output_fields=fields,
                                   use_locking=use_locking)
      return self._Query(op)

    elif method == luxi.REQ_QUERY_NODES:
      (names, fields, use_locking) = args
      logging.info("Received node query request for %s", names)
      if use_locking:
        raise errors.OpPrereqError("Sync queries are not allowed",
                                   errors.ECODE_INVAL)
      op = opcodes.OpNodeQuery(names=names, output_fields=fields,
                               use_locking=use_locking)
      return self._Query(op)

    elif method == luxi.REQ_QUERY_GROUPS:
      (names, fields, use_locking) = args
      logging.info("Received group query request for %s", names)
      if use_locking:
        raise errors.OpPrereqError("Sync queries are not allowed",
                                   errors.ECODE_INVAL)
      op = opcodes.OpGroupQuery(names=names, output_fields=fields)
      return self._Query(op)

    elif method == luxi.REQ_QUERY_EXPORTS:
      nodes, use_locking = args
      if use_locking:
        raise errors.OpPrereqError("Sync queries are not allowed",
                                   errors.ECODE_INVAL)
      logging.info("Received exports query request")
      op = opcodes.OpBackupQuery(nodes=nodes, use_locking=use_locking)
      return self._Query(op)

    elif method == luxi.REQ_QUERY_CONFIG_VALUES:
      fields = args
      logging.info("Received config values query request for %s", fields)
      op = opcodes.OpClusterConfigQuery(output_fields=fields)
      return self._Query(op)

    elif method == luxi.REQ_QUERY_CLUSTER_INFO:
      logging.info("Received cluster info query request")
      op = opcodes.OpClusterQuery()
      return self._Query(op)

    elif method == luxi.REQ_QUERY_TAGS:
      kind, name = args
      logging.info("Received tags query request")
      op = opcodes.OpTagsGet(kind=kind, name=name)
      return self._Query(op)

    elif method == luxi.REQ_QUERY_LOCKS:
      (fields, sync) = args
      logging.info("Received locks query request")
      if sync:
        raise NotImplementedError("Synchronous queries are not implemented")
      return self.server.context.glm.OldStyleQueryLocks(fields)

    elif method == luxi.REQ_QUEUE_SET_DRAIN_FLAG:
      drain_flag = args
      logging.info("Received queue drain flag change request to %s",
                   drain_flag)
      return queue.SetDrainFlag(drain_flag)

    elif method == luxi.REQ_SET_WATCHER_PAUSE:
      (until, ) = args

      if until is None:
        logging.info("Received request to no longer pause the watcher")
      else:
        if not isinstance(until, (int, float)):
          raise TypeError("Duration must be an integer or float")

        if until < time.time():
          raise errors.GenericError("Unable to set pause end time in the past")

        logging.info("Received request to pause the watcher until %s", until)

      return _SetWatcherPause(until)

    else:
      logging.info("Received invalid request '%s'", method)
      raise ValueError("Invalid operation '%s'" % method)

  def _Query(self, op):
    """Runs the specified opcode and returns the result.

    @param op: the opcode to execute
    @return: whatever C{mcpu.Processor.ExecOpCode} returns for the opcode

    """
    # Queries don't have a job id
    proc = mcpu.Processor(self.server.context, None)

    # TODO: Executing an opcode using locks will acquire them in blocking mode.
    # Consider using a timeout for retries.
    return proc.ExecOpCode(op, None)
373

Iustin Pop's avatar
Iustin Pop committed
374

375
376
377
378
379
380
class GanetiContext(object):
  """Context common to all ganeti threads.

  This class creates and holds common objects shared by all threads.

  """
  # pylint: disable-msg=W0212
  # we do want to ensure a singleton here
  _instance = None

  def __init__(self):
    """Constructs a new GanetiContext object.

    There should be only a GanetiContext object at any time, so this
    function raises an error if this is not the case.

    """
    assert self.__class__._instance is None, "double GanetiContext instance"

    # Create global configuration object
    self.cfg = config.ConfigWriter()

    # Locking manager
    self.glm = locking.GanetiLockManager(
                self.cfg.GetNodeList(),
                self.cfg.GetNodeGroupList(),
                self.cfg.GetInstanceList())

    # Job queue
    self.jobqueue = jqueue.JobQueue(self)

    # setting this also locks the class against attribute modifications
    self.__class__._instance = self

  def __setattr__(self, name, value):
    """Setting GanetiContext attributes is forbidden after initialization.

    The check is an assertion on the class-level C{_instance} marker, which
    is set at the very end of C{__init__}.

    """
    assert self.__class__._instance is None, "Attempt to modify Ganeti Context"
    object.__setattr__(self, name, value)

  def AddNode(self, node, ec_id):
    """Adds a node to the configuration and lock manager.

    @param node: the node object to add; its C{name} attribute is used for
        the node lock
    @param ec_id: passed through to the configuration's C{AddNode}

    """
    # Add it to the configuration
    self.cfg.AddNode(node, ec_id)

    # If preseeding fails it'll not be added
    self.jobqueue.AddNode(node)

    # Add the new node to the Ganeti Lock Manager
    self.glm.add(locking.LEVEL_NODE, node.name)

  def ReaddNode(self, node):
    """Updates a node that's already in the configuration

    @param node: the node object, passed to the job queue's C{AddNode}

    """
    # Synchronize the queue again
    self.jobqueue.AddNode(node)

  def RemoveNode(self, name):
    """Removes a node from the configuration and lock manager.

    @param name: the name of the node to remove

    """
    # Remove node from configuration
    self.cfg.RemoveNode(name)

    # Notify job queue
    self.jobqueue.RemoveNode(name)

    # Remove the node from the Ganeti Lock Manager
    self.glm.remove(locking.LEVEL_NODE, name)

449

450
451
452
453
454
455
456
457
458
459
460
461
462
def _SetWatcherPause(until):
  """Creates or removes the watcher pause file.

  @type until: None, int or float
  @param until: Unix timestamp saying until when the watcher shouldn't run;
      C{None} removes the pause file
  @return: the value passed as C{until}

  """
  if until is None:
    utils.RemoveFile(constants.WATCHER_PAUSEFILE)
  else:
    # The timestamp is written as an integer followed by a newline
    utils.WriteFile(constants.WATCHER_PAUSEFILE,
                    data="%d\n" % (until, ))

  return until

465

466
@rpc.RunWithRPC
def CheckAgreement():
  """Check the agreement on who is the master.

  The function uses a very simple algorithm: we must get more positive
  than negative answers. Since in most of the cases we are the master,
  we'll use our own config file for getting the node list. In the
  future we could collect the current node list from our (possibly
  obsolete) known nodes.

  In order to account for cold-start of all nodes, we retry for up to
  a minute until we get a real answer as the top-voted one. If the
  nodes are more out-of-sync, for now manual startup of the master
  should be attempted.

  Note that for an even number of nodes cluster, we need at least half
  of the nodes (beside ourselves) to vote for us. This creates a
  problem on two-node clusters, since in this case we require the
  other node to be up too to confirm our status.

  @rtype: boolean
  @return: True if no votes were gathered at all or if this node is the
      top-voted one with at least as many votes for as against; False
      otherwise

  """
  myself = netutils.Hostname.GetSysName()
  #temp instantiation of a config writer, used only to get the node list
  cfg = config.ConfigWriter()
  node_list = cfg.GetNodeList()
  del cfg
  # Six attempts with ten seconds of sleep in between
  retries = 6
  while retries > 0:
    votes = bootstrap.GatherMasterVotes(node_list)
    if not votes:
      # empty node list, this is a one node cluster
      return True
    if votes[0][0] is None:
      retries -= 1
      time.sleep(10)
      continue
    break
  if retries == 0:
    logging.critical("Cluster inconsistent, most of the nodes didn't answer"
                     " after multiple retries. Aborting startup")
    logging.critical("Use the --no-voting option if you understand what"
                     " effects it has on the cluster state")
    return False
  # here a real node is at the top of the list
  all_votes = sum(item[1] for item in votes)
  top_node, top_votes = votes[0]

  result = False
  if top_node != myself:
    logging.critical("It seems we are not the master (top-voted node"
                     " is %s with %d out of %d votes)", top_node, top_votes,
                     all_votes)
  elif top_votes < all_votes - top_votes:
    logging.critical("It seems we are not the master (%d votes for,"
                     " %d votes against)", top_votes, all_votes - top_votes)
  else:
    result = True

  return result
525

Michael Hanselmann's avatar
Michael Hanselmann committed
526

527
528
529
530
531
532
533
534
535
536
@rpc.RunWithRPC
def ActivateMasterIP():
  """Asks the master node to start the master role and logs any failure.

  The master node name is read from ssconf. A failure reported by the RPC
  call is only logged; nothing is raised or returned.

  """
  store = ssconf.SimpleStore()
  outcome = rpc.RpcRunner.call_node_start_master(store.GetMasterNode(),
                                                 False, False)
  failure = outcome.fail_msg
  if not failure:
    return
  logging.error("Can't activate master IP address: %s", failure)


537
538
539
540
def CheckMasterd(options, args):
  """Initial checks whether to run or exit with a failure.

  """
541
542
543
544
  if args: # masterd doesn't take any arguments
    print >> sys.stderr, ("Usage: %s [-f] [-d]" % sys.argv[0])
    sys.exit(constants.EXIT_FAILURE)

545
546
  ssconf.CheckMaster(options.debug)

547
548
549
550
551
552
553
554
  try:
    options.uid = pwd.getpwnam(constants.MASTERD_USER).pw_uid
    options.gid = grp.getgrnam(constants.DAEMONS_GROUP).gr_gid
  except KeyError:
    print >> sys.stderr, ("User or group not existing on system: %s:%s" %
                          (constants.MASTERD_USER, constants.DAEMONS_GROUP))
    sys.exit(constants.EXIT_FAILURE)

555
556
557
558
559
560
561
562
563
564
565
566
567
568
569
570
571
572
573
574
575
576
  # Check the configuration is sane before anything else
  try:
    config.ConfigWriter()
  except errors.ConfigVersionMismatch, err:
    v1 = "%s.%s.%s" % constants.SplitVersion(err.args[0])
    v2 = "%s.%s.%s" % constants.SplitVersion(err.args[1])
    print >> sys.stderr,  \
        ("Configuration version mismatch. The current Ganeti software"
         " expects version %s, but the on-disk configuration file has"
         " version %s. This is likely the result of upgrading the"
         " software without running the upgrade procedure. Please contact"
         " your cluster administrator or complete the upgrade using the"
         " cfgupgrade utility, after reading the upgrade notes." %
         (v1, v2))
    sys.exit(constants.EXIT_FAILURE)
  except errors.ConfigurationError, err:
    print >> sys.stderr, \
        ("Configuration error while opening the configuration file: %s\n"
         "This might be caused by an incomplete software upgrade or"
         " by a corrupted configuration file. Until the problem is fixed"
         " the master daemon cannot start." % str(err))
    sys.exit(constants.EXIT_FAILURE)
577

578
579
580
581
582
583
584
585
586
587
588
589
590
  # If CheckMaster didn't fail we believe we are the master, but we have to
  # confirm with the other nodes.
  if options.no_voting:
    if options.yes_do_it:
      return

    sys.stdout.write("The 'no voting' option has been selected.\n")
    sys.stdout.write("This is dangerous, please confirm by"
                     " typing uppercase 'yes': ")
    sys.stdout.flush()

    confirmation = sys.stdin.readline().strip()
    if confirmation != "YES":
Iustin Pop's avatar
Iustin Pop committed
591
      print >> sys.stderr, "Aborting."
592
593
594
595
596
597
      sys.exit(constants.EXIT_FAILURE)

    return

  # CheckAgreement uses RPC and threads, hence it needs to be run in a separate
  # process before we call utils.Daemonize in the current process.
598
  if not utils.RunInSeparateProcess(CheckAgreement):
599
600
    sys.exit(constants.EXIT_FAILURE)

601
602
603
604
605
606
  # ActivateMasterIP also uses RPC/threads, so we run it again via a
  # separate process.

  # TODO: decide whether failure to activate the master IP is a fatal error
  utils.RunInSeparateProcess(ActivateMasterIP)

607

608
609
def PrepMasterd(options, _):
  """Prep master daemon function, executed with the PID file held.

  @param options: the parsed command line options; C{uid} and C{gid} are
      used as owner of the master socket
  @return: tuple of (mainloop, master server)

  """
  # This is safe to do as the pid file guarantees against
  # concurrent execution.
  utils.RemoveFile(constants.MASTER_SOCKET)

  mainloop = daemon.Mainloop()
  master = MasterServer(mainloop, constants.MASTER_SOCKET,
                        options.uid, options.gid)
  return (mainloop, master)


def ExecMasterd(options, args, prep_data): # pylint: disable-msg=W0613
  """Main master daemon function, executed with the PID file held.

  @param options: unused
  @param args: unused
  @param prep_data: tuple of (mainloop, master server), as returned by
      L{PrepMasterd}

  """
  (mainloop, master) = prep_data
  # Each setup step is undone in reverse order, even if a later step fails
  try:
    rpc.Init()
    try:
      master.setup_queue()
      try:
        mainloop.Run()
      finally:
        master.server_cleanup()
    finally:
      rpc.Shutdown()
  finally:
    utils.RemoveFile(constants.MASTER_SOCKET)
639

Iustin Pop's avatar
Iustin Pop committed
640

641
def Main():
  """Main function

  Builds the option parser with the masterd-specific options and hands
  control over to C{daemon.GenericMain}.

  """
  parser = OptionParser(description="Ganeti master daemon",
                        usage="%prog [-f] [-d]",
                        version="%%prog (ganeti) %s" %
                        constants.RELEASE_VERSION)
  parser.add_option("--no-voting", dest="no_voting",
                    help="Do not check that the nodes agree on this node"
                    " being the master and start the daemon unconditionally",
                    default=False, action="store_true")
  parser.add_option("--yes-do-it", dest="yes_do_it",
                    help="Override interactive check for --no-voting",
                    default=False, action="store_true")
  daemon.GenericMain(constants.MASTERD, parser, CheckMasterd, PrepMasterd,
                     ExecMasterd, multithreaded=True)