#
#

# Copyright (C) 2006, 2007 Google Inc.
#
# This program is free software; you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation; either version 2 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful, but
# WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the GNU
# General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program; if not, write to the Free Software
# Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA
# 02110-1301, USA.


"""Block device abstraction"""

import re
import time
import errno
import pyparsing as pyp

from ganeti import utils
from ganeti import logger
from ganeti import errors
from ganeti import constants


class BlockDev(object):
  """Block device abstract class.

  A block device can be in the following states:
    - not existing on the system, and by `Create()` it goes into:
    - existing but not setup/not active, and by `Assemble()` goes into:
    - active read-write and by `Open()` it goes into
    - online (=used, or ready for use)

  A device can also be online but read-only, however we are not using
  the readonly state (MD and LV have it, if needed in the future)
  and we are usually looking at this like at a stack, so it's easier
  to conceptualise the transition from not-existing to online and back
  like a linear one.

  The many different states of the device are due to the fact that we
  need to cover many device types:
    - logical volumes are created, lvchange -a y $lv, and used
    - md arrays are created or assembled and used
    - drbd devices are attached to a local disk/remote peer and made primary

  The status of the device can be examined by `GetStatus()`, which
  returns a numerical value, depending on the position in the
  transition stack of the device.

  A block device is identified by three items:
    - the /dev path of the device (dynamic)
    - a unique ID of the device (static)
    - its major/minor pair (dynamic)

  Not all devices implement both the first two as distinct items. LVM
  logical volumes have their unique ID (the pair volume group, logical
  volume name) in a 1-to-1 relation to the dev path. For MD devices,
  the /dev path is dynamic and the unique ID is the UUID generated at
  array creation plus the slave list. For DRBD devices, the /dev path
  is again dynamic and the unique id is the pair (host1, dev1),
  (host2, dev2).

  You can get to a device in two ways:
    - creating the (real) device, which returns you
      an attached instance (lvcreate, mdadm --create)
    - attaching of a python instance to an existing (real) device

  The second point, the attachment to a device, is different
  depending on whether the device is assembled or not. At init() time,
  we search for a device with the same unique_id as us. If found,
  good. It also means that the device is already assembled. If not,
  after assembly we'll have our correct major/minor.

  The children argument may be None (meaning "no children"); all the
  methods implemented here which walk the children accept that.

  """
  STATUS_UNKNOWN = 0
  STATUS_EXISTING = 1
  STATUS_STANDBY = 2
  STATUS_ONLINE = 3

  # human-readable description for each of the status values above
  STATUS_MAP = {
    STATUS_UNKNOWN: "unknown",
    STATUS_EXISTING: "existing",
    STATUS_STANDBY: "ready for use",
    STATUS_ONLINE: "online",
    }

  def __init__(self, unique_id, children):
    """Record the identity of the device.

    Nothing is probed here; dev_path, major and minor start as None
    and are filled in by the subclasses.

    """
    self._children = children
    self.dev_path = None
    self.unique_id = unique_id
    self.major = None
    self.minor = None

  def Assemble(self):
    """Assemble the device from its components.

    If this is a plain block device (e.g. LVM) then assemble does
    nothing, as the LVM has no children and we don't put logical
    volumes offline.

    One guarantee is that after the device has been assembled, it
    knows its major/minor numbers. This allows other devices (usually
    parents) to probe correctly for their children.

    Each child is assembled and then opened, in order. At the first
    child whose `Assemble()` returns a false value, or whose `Open()`
    raises BlockDeviceError, `Shutdown()` is called on all children.

    Returns:
      True if there are no children, otherwise the result of the last
      child `Assemble()` call made (a false value means failure)

    Raises:
      TypeError: if a child is not a BlockDev instance
      errors.BlockDeviceError: re-raised from a child's `Open()`

    """
    # children can be None (e.g. for devices built without any)
    children = self._children or []
    status = True
    for child in children:
      if not isinstance(child, BlockDev):
        raise TypeError("Invalid child passed of type '%s'" % type(child))
      status = child.Assemble()
      if not status:
        break

      try:
        child.Open()
      except errors.BlockDeviceError:
        for dev in children:
          dev.Shutdown()
        raise

    if not status:
      for dev in children:
        dev.Shutdown()
    return status

  def Attach(self):
    """Find a device which matches our config and attach to it.

    """
    raise NotImplementedError

  def Close(self):
    """Notifies that the device will no longer be used for I/O.

    """
    raise NotImplementedError

  @classmethod
  def Create(cls, unique_id, children, size):
    """Create the device.

    If the device cannot be created, it will return None
    instead. Error messages go to the logging system.

    Note that for some devices, the unique_id is used, and for other,
    the children. The idea is that these two, taken together, are
    enough for both creation and assembly (later).

    """
    raise NotImplementedError

  def Remove(self):
    """Remove this device.

    This makes sense only for some of the device types: LV and to a
    lesser degree, md devices. Also note that if the device can't
    attach, the removal can't be completed.

    """
    raise NotImplementedError

  def Rename(self, new_id):
    """Rename this device.

    This may or may not make sense for a given device type.

    """
    raise NotImplementedError

  def GetStatus(self):
    """Return the status of the device.

    """
    raise NotImplementedError

  def Open(self, force=False):
    """Make the device ready for use.

    This makes the device ready for I/O. For now, just the DRBD
    devices need this.

    The force parameter signifies that if the device has any kind of
    --force thing, it should be used, we know what we are doing.

    """
    raise NotImplementedError

  def Shutdown(self):
    """Shut down the device, freeing its children.

    This undoes the `Assemble()` work, except for the child
    assembling; as such, the children on the device are still
    assembled after this call.

    """
    raise NotImplementedError

  def SetSyncSpeed(self, speed):
    """Adjust the sync speed of the mirror.

    In case this is not a mirroring device, this is no-op.

    The request is passed to the children in order; once a child
    returns a false value the remaining children are not called.

    Returns:
      True if there are no children, otherwise the result of the last
      child call made

    """
    result = True
    for child in self._children or []:
      result = result and child.SetSyncSpeed(speed)
    return result

  def GetSyncStatus(self):
    """Returns the sync status of the device.

    If this device is a mirroring device, this function returns the
    status of the mirror.

    Returns:
     (sync_percent, estimated_time, is_degraded, ldisk)

    If sync_percent is None, it means the device is not syncing.

    If estimated_time is None, it means we can't estimate
    the time needed, otherwise it's the time left in seconds.

    If is_degraded is True, it means the device is missing
    redundancy. This is usually a sign that something went wrong in
    the device setup, if sync_percent is None.

    The ldisk parameter represents the degradation of the local
    data. This is only valid for some devices, the rest will always
    return False (not degraded).

    """
    return None, None, False, False

  def CombinedSyncStatus(self):
    """Calculate the mirror status across us and our children.

    The return value is the same as for `GetSyncStatus()` except the
    minimum percent and maximum time are calculated across this
    device and its direct children (each child is asked for its own
    `GetSyncStatus()`), and the two degradation flags are or-ed
    together.

    """
    min_percent, max_time, is_degraded, ldisk = self.GetSyncStatus()
    for child in self._children or []:
      c_percent, c_time, c_degraded, c_ldisk = child.GetSyncStatus()
      # None means "not syncing"/"no estimate", so it never wins over
      # an actual value
      if min_percent is None:
        min_percent = c_percent
      elif c_percent is not None:
        min_percent = min(min_percent, c_percent)
      if max_time is None:
        max_time = c_time
      elif c_time is not None:
        max_time = max(max_time, c_time)
      is_degraded = is_degraded or c_degraded
      ldisk = ldisk or c_ldisk
    return min_percent, max_time, is_degraded, ldisk

  def SetInfo(self, text):
    """Update metadata with info text.

    Only supported for some device types. The base implementation
    just forwards the text to every child.

    """
    for child in self._children or []:
      child.SetInfo(text)

  def __repr__(self):
    return ("<%s: unique_id: %s, children: %s, %s:%s, %s>" %
            (self.__class__, self.unique_id, self._children,
             self.major, self.minor, self.dev_path))


class LogicalVolume(BlockDev):
  """Logical Volume block device.

  The unique_id of such a device is the pair (vg_name, lv_name), and
  the device path is derived from it as /dev/<vg_name>/<lv_name>.

  """
  def __init__(self, unique_id, children):
    """Attaches to a LV device.

    The unique_id is a tuple (vg_name, lv_name)

    Raises:
      ValueError: if unique_id is not a two-element tuple or list

    """
    super(LogicalVolume, self).__init__(unique_id, children)
    if not isinstance(unique_id, (tuple, list)) or len(unique_id) != 2:
      raise ValueError("Invalid configuration data %s" % str(unique_id))
    self._vg_name, self._lv_name = unique_id
    self.dev_path = "/dev/%s/%s" % (self._vg_name, self._lv_name)
    self.Attach()

  @classmethod
  def Create(cls, unique_id, children, size):
    """Create a new logical volume.

    Args:
      unique_id: the pair (vg_name, lv_name)
      children: passed unchanged to the returned instance
      size: the requested size; it is passed to lvcreate with the 'm'
            unit suffix

    Returns:
      a LogicalVolume instance for the new volume

    Raises:
      ValueError: if unique_id is not a two-element tuple or list
      errors.BlockDeviceError: if the PV info can't be computed, there
          is not enough free space or lvcreate fails

    """
    if not isinstance(unique_id, (tuple, list)) or len(unique_id) != 2:
      raise ValueError("Invalid configuration data %s" % str(unique_id))
    vg_name, lv_name = unique_id
    pvs_info = cls.GetPVInfo(vg_name)
    if not pvs_info:
      raise errors.BlockDeviceError("Can't compute PV info for vg %s" %
                                    vg_name)
    # PVs with the most free space first; lvcreate gets them in this order
    pvs_info.sort(reverse=True)

    pvlist = [pv[1] for pv in pvs_info]
    free_size = sum([pv[0] for pv in pvs_info])

    # The size constraint should have been checked from the master before
    # calling the create function.
    if free_size < size:
      raise errors.BlockDeviceError("Not enough free space: required %s,"
                                    " available %s" % (size, free_size))
    result = utils.RunCmd(["lvcreate", "-L%dm" % size, "-n%s" % lv_name,
                           vg_name] + pvlist)
    if result.failed:
      raise errors.BlockDeviceError(result.fail_reason)
    return LogicalVolume(unique_id, children)

  @staticmethod
  def GetPVInfo(vg_name):
    """Get the free space info for PVs in a volume group.

    Args:
      vg_name: the volume group name

    Returns:
      list of (free_space, name) with free_space in mebibytes, or
      None if the pvs command failed or its output can't be parsed

    """
    command = ["pvs", "--noheadings", "--nosuffix", "--units=m",
               "-opv_name,vg_name,pv_free,pv_attr", "--unbuffered",
               "--separator=:"]
    result = utils.RunCmd(command)
    if result.failed:
      logger.Error("Can't get the PV information: %s" % result.fail_reason)
      return None
    data = []
    for line in result.stdout.splitlines():
      fields = line.strip().split(':')
      if len(fields) != 4:
        logger.Error("Can't parse pvs output: line '%s'" % line)
        return None
      pv_name, pv_vg, pv_free, pv_attr = fields
      # skip over pvs from another vg or ones which are not allocatable
      # (startswith also copes with an empty attribute field)
      if pv_vg != vg_name or not pv_attr.startswith('a'):
        continue
      try:
        free_space = float(pv_free)
      except ValueError:
        logger.Error("Can't parse pvs output: line '%s'" % line)
        return None
      data.append((free_space, pv_name))

    return data

  def Remove(self):
    """Remove this logical volume.

    Returns:
      True if the volume does not exist or was removed, False if
      lvremove failed

    """
    # compare against None: minor number 0 is a valid, attached device
    if self.minor is None and not self.Attach():
      # the LV does not exist
      return True
    result = utils.RunCmd(["lvremove", "-f", "%s/%s" %
                           (self._vg_name, self._lv_name)])
    if result.failed:
      logger.Error("Can't lvremove: %s" % result.fail_reason)

    return not result.failed

  def Rename(self, new_id):
    """Rename this logical volume.

    Args:
      new_id: the pair (vg_name, new_lv_name); the volume group must
              be the current one

    Raises:
      errors.ProgrammerError: if new_id is malformed or names another
          volume group
      errors.BlockDeviceError: if lvrename fails

    """
    if not isinstance(new_id, (tuple, list)) or len(new_id) != 2:
      # str() is needed: a bare tuple would be taken as the argument
      # list of the format operator
      raise errors.ProgrammerError("Invalid new logical id '%s'" %
                                   str(new_id))
    new_vg, new_name = new_id
    if new_vg != self._vg_name:
      raise errors.ProgrammerError("Can't move a logical volume across"
                                   " volume groups (from %s to %s)" %
                                   (self._vg_name, new_vg))
    result = utils.RunCmd(["lvrename", new_vg, self._lv_name, new_name])
    if result.failed:
      raise errors.BlockDeviceError("Failed to rename the logical volume: %s" %
                                    result.output)
    self._lv_name = new_name
    self.dev_path = "/dev/%s/%s" % (self._vg_name, self._lv_name)

  def Attach(self):
    """Attach to an existing LV.

    This method will try to see if an existing and active LV exists
    which matches our name. If so, its major/minor will be
    recorded.

    Returns:
      True if the major/minor pair was found in the lvdisplay output,
      False otherwise

    """
    result = utils.RunCmd(["lvdisplay", self.dev_path])
    if result.failed:
      logger.Error("Can't find LV %s: %s, %s" %
                   (self.dev_path, result.fail_reason, result.output))
      return False
    match = re.compile("^ *Block device *([0-9]+):([0-9]+).*$")
    for line in result.stdout.splitlines():
      match_result = match.match(line)
      if match_result:
        self.major = int(match_result.group(1))
        self.minor = int(match_result.group(2))
        return True
    return False

  def Assemble(self):
    """Assemble the device.

    We always run `lvchange -ay` on the LV to ensure it's active before
    use, as there were cases when xenvg was not active after boot
    (also possibly after disk issues).

    Returns:
      True if lvchange succeeded, False otherwise

    """
    result = utils.RunCmd(["lvchange", "-ay", self.dev_path])
    if result.failed:
      logger.Error("Can't activate lv %s: %s" % (self.dev_path, result.output))
    return not result.failed

  def Shutdown(self):
    """Shutdown the device.

    This is a no-op for the LV device type, as we don't deactivate the
    volumes on shutdown.

    """
    return True

  def GetStatus(self):
    """Return the status of the device.

    Logical volumes can be in all four states, although we don't
    deactivate (lvchange -an) them when shutdown, so STATUS_EXISTING
    should not be seen for our devices.

    """
    result = utils.RunCmd(["lvs", "--noheadings", "-olv_attr", self.dev_path])
    if result.failed:
      logger.Error("Can't display lv: %s" % result.fail_reason)
      return self.STATUS_UNKNOWN
    out = result.stdout.strip()
    # format: type/permissions/alloc/fixed_minor/state/open
    if len(out) != 6:
      return self.STATUS_UNKNOWN
    active = (out[4] == "a")
    online = (out[5] == "o")
    if online:
      retval = self.STATUS_ONLINE
    elif active:
      retval = self.STATUS_STANDBY
    else:
      retval = self.STATUS_EXISTING

    return retval

  def GetSyncStatus(self):
    """Returns the sync status of the device.

    If this device is a mirroring device, this function returns the
    status of the mirror.

    Returns:
     (sync_percent, estimated_time, is_degraded, ldisk)

    For logical volumes, sync_percent and estimated_time are always
    None (no recovery in progress, as we don't handle the mirrored LV
    case). The is_degraded parameter has the same value as the ldisk
    parameter.

    For the ldisk parameter, we check if the logical volume has the
    'virtual' type, which means it's not backed by existing storage
    anymore (read from it return I/O error). This happens after a
    physical disk failure and subsequent 'vgreduce --removemissing' on
    the volume group.

    If the lvs command fails or its output is not understood, the
    device is reported as degraded.

    """
    result = utils.RunCmd(["lvs", "--noheadings", "-olv_attr", self.dev_path])
    if result.failed:
      logger.Error("Can't display lv: %s" % result.fail_reason)
      return None, None, True, True
    out = result.stdout.strip()
    # format: type/permissions/alloc/fixed_minor/state/open
    if len(out) != 6:
      logger.Debug("Error in lvs output: attrs=%s, len != 6" % out)
      return None, None, True, True
    ldisk = out[0] == 'v' # virtual volume, i.e. doesn't have
                          # backing storage
    return None, None, ldisk, ldisk

  def Open(self, force=False):
    """Make the device ready for I/O.

    This is a no-op for the LV device type.

    """
    pass

  def Close(self):
    """Notifies that the device will no longer be used for I/O.

    This is a no-op for the LV device type.

    """
    pass

  def Snapshot(self, size):
    """Create a snapshot copy of an lvm block device.

    Any existing snapshot with the target name (our name plus
    ".snap") is removed first.

    Args:
      size: the size of the snapshot; it is passed to lvcreate with
            the 'm' unit suffix

    Returns:
      the name of the snapshot logical volume

    Raises:
      errors.BlockDeviceError: if the PV info can't be computed, no
          single PV has enough free space or lvcreate fails

    """
    snap_name = self._lv_name + ".snap"

    # remove existing snapshot if found
    snap = LogicalVolume((self._vg_name, snap_name), None)
    snap.Remove()

    pvs_info = self.GetPVInfo(self._vg_name)
    if not pvs_info:
      raise errors.BlockDeviceError("Can't compute PV info for vg %s" %
                                    self._vg_name)
    # the check is made against the PV having the most free space
    free_size = max(pvs_info)[0]
    if free_size < size:
      raise errors.BlockDeviceError("Not enough free space: required %s,"
                                    " available %s" % (size, free_size))

    result = utils.RunCmd(["lvcreate", "-L%dm" % size, "-s",
                           "-n%s" % snap_name, self.dev_path])
    if result.failed:
      raise errors.BlockDeviceError("command: %s error: %s" %
                                    (result.cmd, result.fail_reason))

    return snap_name

  def SetInfo(self, text):
    """Update metadata with info text.

    The text is first passed unchanged to the children, then it is
    sanitised and added as a tag on the logical volume.

    Raises:
      errors.BlockDeviceError: if lvchange fails

    """
    BlockDev.SetInfo(self, text)

    # Replace invalid characters
    text = re.sub('^[^A-Za-z0-9_+.]', '_', text)
    text = re.sub('[^-A-Za-z0-9_+.]', '_', text)

    # Only up to 128 characters are allowed
    text = text[:128]

    result = utils.RunCmd(["lvchange", "--addtag", text,
                           self.dev_path])
    if result.failed:
      raise errors.BlockDeviceError("Command: %s error: %s" %
                                    (result.cmd, result.fail_reason))
568 569


Iustin Pop's avatar
Iustin Pop committed
570 571 572 573 574 575 576 577 578 579 580 581 582 583 584 585 586 587 588 589 590 591 592 593 594 595 596 597 598 599 600 601 602 603 604 605 606 607 608 609 610 611 612 613 614 615 616 617 618 619 620 621 622 623 624 625 626 627 628 629 630 631 632
class MDRaid1(BlockDev):
  """raid1 device implemented via md.

  """
  def __init__(self, unique_id, children):
    """Initialise the object and try to attach to a running array.

    The unique_id is what `Attach()` hands to `_FindMDByUUID()`,
    i.e. the UUID of the array.

    """
    super(MDRaid1, self).__init__(unique_id, children)
    # fixed major; presumably the block major number of the md driver
    # (NOTE(review): confirm)
    self.major = 9
    # must come last: it fills in minor/dev_path if the array is running
    self.Attach()

  def Attach(self):
    """Find an array which matches our config and attach to it.

    This tries to find a MD array which has the same UUID as our own.

    """
    minor = self._FindMDByUUID(self.unique_id)
    if minor is not None:
      self._SetFromMinor(minor)
    else:
      self.minor = None
      self.dev_path = None

    return (minor is not None)

  @staticmethod
  def _GetUsedDevs():
    """Compute the list of in-use MD devices.

    It doesn't matter if the used device have other raid level, just
    that they are in use.

    Returns:
      dict mapping the md number (int) to the line of /proc/mdstat
      which describes it

    """
    mdstat = open("/proc/mdstat", "r")
    try:
      # make sure the file is closed even if the read fails
      data = mdstat.readlines()
    finally:
      mdstat.close()

    used_md = {}
    valid_line = re.compile("^md([0-9]+) : .*$")
    for line in data:
      match = valid_line.match(line)
      if match:
        md_no = int(match.group(1))
        used_md[md_no] = line

    return used_md

  @staticmethod
  def _GetDevInfo(minor):
    """Query mdadm for details about /dev/md<minor>.

    Only the "UUID" and "State" lines of the `mdadm -D` output are
    looked at.

    Returns:
      None if the command failed, otherwise a dict which may hold
      "uuid" (first word of the UUID value) and "state" (the State
      value split on ", ")

    """
    result = utils.RunCmd(["mdadm", "-D", "/dev/md%d" % minor])
    if result.failed:
      logger.Error("Can't display md: %s" % result.fail_reason)
      return None

    retval = {}
    for raw_line in result.stdout.splitlines():
      # lines look like "<key> : <value>"
      parts = raw_line.strip().split(" : ", 1)
      key = parts[0]
      if key == "UUID":
        retval["uuid"] = parts[1].split()[0]
      elif key == "State":
        retval["state"] = parts[1].split(", ")
    return retval

  @staticmethod
  def _FindUnusedMinor():
    """Compute an unused MD minor.

    This code assumes that there are 256 minors only.

    """
    used_md = MDRaid1._GetUsedDevs()
    i = 0
    while i < 256:
      if i not in used_md:
        break
      i += 1
    if i == 256:
      logger.Error("Critical: Out of md minor numbers.")
Iustin Pop's avatar
Iustin Pop committed
653
      raise errors.BlockDeviceError("Can't find a free MD minor")
Iustin Pop's avatar
Iustin Pop committed
654 655 656 657 658 659 660 661 662 663 664 665 666 667
    return i

  @classmethod
  def _FindMDByUUID(cls, uuid):
    """Find the minor of an MD array with a given UUID.

    """
    md_list = cls._GetUsedDevs()
    for minor in md_list:
      info = cls._GetDevInfo(minor)
      if info and info["uuid"] == uuid:
        return minor
    return None

668 669 670 671 672 673 674 675 676 677 678 679 680 681 682 683 684 685 686 687 688 689 690 691 692 693 694 695 696 697 698 699 700 701 702 703 704 705 706 707 708 709 710
  @staticmethod
  def _ZeroSuperblock(dev_path):
    """Overwrite with zeroes the places where an MD superblock can live.

    ``mdadm --zero-superblock`` can't be used for this, as in versions
    2.x it fails with the same error code as for a non-writable
    device.

    Superblock locations (negative values are relative to the end of
    the block device):
      - -128k to end for version 0.90 superblock
      - -8k to -12k for version 1.0 superblock (included in the above)
      - 0k to 4k for version 1.1 superblock
      - 4k to 8k for version 1.2 superblock

    Both cases are covered by zeroing two regions:
      - 0k to 128k
      - -128k to end

    This means the device must be at least 128k in size, otherwise
    we'll get I/O errors.

    Note that this function depends on the fact that one can open,
    read and write block devices normally.

    """
    overwrite_size = 128 * 1024
    empty_buf = '\0' * overwrite_size
    # (offset, whence) of each region: the start of the device, then
    # the last overwrite_size bytes (whence 2 is relative to the end)
    regions = ((0, 0), (-overwrite_size, 2))
    fd = open(dev_path, "r+")
    try:
      for offset, whence in regions:
        fd.seek(offset, whence)
        start = fd.tell()
        fd.write(empty_buf)
        end = fd.tell()
        logger.Debug("Zeroed %s from %d to %d" % (dev_path, start, end))
    finally:
      fd.close()

Iustin Pop's avatar
Iustin Pop committed
711 712 713 714 715 716 717 718 719 720 721 722
  @classmethod
  def Create(cls, unique_id, children, size):
    """Create a new MD raid1 array.

    """
    if not isinstance(children, (tuple, list)):
      raise ValueError("Invalid setup data for MDRaid1 dev: %s" %
                       str(children))
    for i in children:
      if not isinstance(i, BlockDev):
        raise ValueError("Invalid member in MDRaid1 dev: %s" % type(i))
    for i in children:
723 724 725 726 727
      try:
        cls._ZeroSuperblock(i.dev_path)
      except EnvironmentError, err:
        logger.Error("Can't zero superblock for %s: %s" %
                     (i.dev_path, str(err)))
Iustin Pop's avatar
Iustin Pop committed
728 729 730 731 732 733 734 735
        return None
    minor = cls._FindUnusedMinor()
    result = utils.RunCmd(["mdadm", "--create", "/dev/md%d" % minor,
                           "--auto=yes", "--force", "-l1",
                           "-n%d" % len(children)] +
                          [dev.dev_path for dev in children])

    if result.failed:
736 737
      logger.Error("Can't create md: %s: %s" % (result.fail_reason,
                                                result.output))
Iustin Pop's avatar
Iustin Pop committed
738 739 740 741 742 743 744 745 746 747 748 749 750 751 752 753
      return None
    info = cls._GetDevInfo(minor)
    if not info or not "uuid" in info:
      logger.Error("Wrong information returned from mdadm -D: %s" % str(info))
      return None
    return MDRaid1(info["uuid"], children)

  def Remove(self):
    """Stub remove function for MD RAID 1 arrays.

    We don't remove the superblock right now. Mark a to do.

    """
    #TODO: maybe zero superblock on child devices?
    return self.Shutdown()

Iustin Pop's avatar
Iustin Pop committed
754 755 756 757 758 759 760
  def Rename(self, new_id):
    """Refuse to rename the device.

    Renaming is not supported for md raid1 devices, so this always
    raises errors.ProgrammerError.

    """
    message = "Can't rename a md raid1 device"
    raise errors.ProgrammerError(message)
Iustin Pop's avatar
Iustin Pop committed
761

762 763
  def AddChildren(self, devices):
    """Add new member(s) to the md raid1.

    The devices are opened and added to the array, then the array is
    grown to the new member count.

    Args:
      devices: list of block devices; each one must have its dev_path
               set

    Raises:
      errors.BlockDeviceError: if we can't attach to the array, a
          device is not initialised or one of the mdadm calls fails

    """
    if self.minor is None and not self.Attach():
      raise errors.BlockDeviceError("Can't attach to device")

    args = ["mdadm", "-a", self.dev_path]
    for dev in devices:
      if dev.dev_path is None:
        raise errors.BlockDeviceError("Child '%s' is not initialised" % dev)
      dev.Open()
      args.append(dev.dev_path)
    result = utils.RunCmd(args)
    if result.failed:
      raise errors.BlockDeviceError("Failed to add new device to array: %s" %
                                    result.output)
    new_len = len(self._children) + len(devices)
    # command line arguments must be strings, so convert the count
    result = utils.RunCmd(["mdadm", "--grow", self.dev_path,
                           "-n", str(new_len)])
    if result.failed:
      raise errors.BlockDeviceError("Can't grow md array: %s" %
                                    result.output)
    # only record the new members once mdadm accepted them
    self._children.extend(devices)
Iustin Pop's avatar
Iustin Pop committed
785

786 787
  def RemoveChildren(self, devices):
    """Remove member(s) from the md raid1.

    The members are marked as failed, removed from the array, and
    then the array is shrunk to the new member count.

    Args:
      devices: list of device paths; each one must be the dev_path of
               one of our children

    Raises:
      errors.BlockDeviceError: if we can't attach to the array, no
          child would be left, a path doesn't match any child or one
          of the mdadm calls fails

    """
    if self.minor is None and not self.Attach():
      raise errors.BlockDeviceError("Can't attach to device")
    new_len = len(self._children) - len(devices)
    if new_len < 1:
      raise errors.BlockDeviceError("Can't reduce to less than one child")
    args = ["mdadm", "-f", self.dev_path]
    orig_devs = []
    for dev in devices:
      args.append(dev)
      # map the path back to the child object, for the bookkeeping below
      for c in self._children:
        if c.dev_path == dev:
          orig_devs.append(c)
          break
      else:
        raise errors.BlockDeviceError("Can't find device '%s' for removal" %
                                      dev)
    result = utils.RunCmd(args)
    if result.failed:
      raise errors.BlockDeviceError("Failed to mark device(s) as failed: %s" %
                                    result.output)

    # it seems here we need a short delay for MD to update its
    # superblocks
    time.sleep(0.5)
    # same device list, but now remove (-r) instead of fail (-f)
    args[1] = "-r"
    result = utils.RunCmd(args)
    if result.failed:
      raise errors.BlockDeviceError("Failed to remove device(s) from array:"
                                    " %s" % result.output)
    # command line arguments must be strings, so convert the count
    result = utils.RunCmd(["mdadm", "--grow", "--force", self.dev_path,
                           "-n", str(new_len)])
    if result.failed:
      raise errors.BlockDeviceError("Can't shrink md array: %s" %
                                    result.output)
    for dev in orig_devs:
      self._children.remove(dev)
Iustin Pop's avatar
Iustin Pop committed
826 827 828 829 830 831 832 833 834 835 836 837 838 839 840 841 842 843 844 845 846 847 848 849 850 851 852 853 854 855 856 857 858 859 860 861 862 863 864 865 866 867 868 869

  def GetStatus(self):
    """Return the status of the device.

    """
    self.Attach()
    if self.minor is None:
      retval = self.STATUS_UNKNOWN
    else:
      retval = self.STATUS_ONLINE
    return retval

  def _SetFromMinor(self, minor):
    """Set our parameters based on the given minor.

    This sets our minor variable and our dev_path.

    """
    self.minor = minor
    self.dev_path = "/dev/md%d" % minor

  def Assemble(self):
    """Assemble the MD device.

    At this point we should have:
      - list of children devices
      - uuid

    The children are assembled first. If an array with our UUID is
    already running we just bind to it, otherwise the array is
    assembled on the first unused minor.

    Returns:
      the (false) result of the children assembly if that failed,
      otherwise True if the array is running and False if mdadm
      could not assemble it

    """
    result = super(MDRaid1, self).Assemble()
    if not result:
      return result
    for minor in self._GetUsedDevs():
      info = self._GetDevInfo(minor)
      # the info dict has no "uuid" key if mdadm printed no UUID line
      if info and "uuid" in info and info["uuid"] == self.unique_id:
        self._SetFromMinor(minor)
        logger.Info("MD array %s already started" % str(self))
        return True
    free_minor = self._FindUnusedMinor()
    result = utils.RunCmd(["mdadm", "-A", "--auto=yes", "--uuid",
                           self.unique_id, "/dev/md%d" % free_minor] +
                          [bdev.dev_path for bdev in self._children])
    if result.failed:
      logger.Error("Can't assemble MD array: %s: %s" %
                   (result.fail_reason, result.output))
      # no array is running for us, so don't keep a stale minor/path
      self.minor = None
      self.dev_path = None
      return False
    # record the device path too, not only the minor: other methods
    # (e.g. AddChildren) use dev_path once the minor is known
    self._SetFromMinor(free_minor)
    return True

  def Shutdown(self):
    """Stop the MD array.

    The array is stopped with 'mdadm --stop', so it is no longer
    available afterwards. An object which is not (and cannot be)
    attached to a device is considered already shut down.

    Returns:
      True on success (or if there was nothing to stop), False if
      mdadm failed

    """
    if self.minor is None:
      if not self.Attach():
        logger.Info("MD object not attached to a device")
        return True

    stop_cmd = ["mdadm", "--stop", "/dev/md%d" % self.minor]
    result = utils.RunCmd(stop_cmd)
    if not result.failed:
      # forget about the device we were bound to
      self.minor = None
      self.dev_path = None
      return True
    logger.Error("Can't stop MD array: %s" % result.fail_reason)
    return False

  def SetSyncSpeed(self, kbytes):
    """Limit the resync speed of the MD array.

    The parent class implementation is invoked first; afterwards the
    sysfs sync_speed_max entry of the array is set to kbytes and
    sync_speed_min to half of that.

    Returns:
      False if we are not attached to a device, otherwise the result
      of the parent class SetSyncSpeed()

    """
    parent_result = super(MDRaid1, self).SetSyncSpeed(kbytes)
    if self.minor is None:
      logger.Error("MD array not attached to a device")
      return False

    # upper limit
    max_file = open("/sys/block/md%d/md/sync_speed_max" % self.minor, "w")
    try:
      max_file.write("%d" % kbytes)
    finally:
      max_file.close()

    # lower limit, half of the maximum
    min_file = open("/sys/block/md%d/md/sync_speed_min" % self.minor, "w")
    try:
      min_file.write("%d" % (kbytes/2))
    finally:
      min_file.close()

    return parent_result

  def GetSyncStatus(self):
    """Returns the sync status of the device.

    Returns:
     (sync_percent, estimated_time, is_degraded, ldisk)

    If sync_percent is None, it means all is ok
    If estimated_time is None, it means we can't estimate
    the time needed, otherwise it's the time left in seconds.

    is_degraded is True unless the state reported by _GetDevInfo()
    consists of exactly one entry which is either "clean" or "active".

    The ldisk parameter is always False for MD devices.

    Raises:
      errors.BlockDeviceError if we cannot attach to the device

    """
    def _ReadSysLine(path):
      """Return the stripped first line of a file, always closing it."""
      fd = open(path)
      try:
        return fd.readline().strip()
      finally:
        fd.close()

    if self.minor is None and not self.Attach():
      raise errors.BlockDeviceError("Can't attach to device in GetSyncStatus")
    dev_info = self._GetDevInfo(self.minor)
    is_clean = ("state" in dev_info and
                len(dev_info["state"]) == 1 and
                dev_info["state"][0] in ("clean", "active"))
    is_degraded = not is_clean
    sys_path = "/sys/block/md%s/md/" % self.minor

    if _ReadSysLine(sys_path + "sync_action") == "idle":
      # no resync in progress
      return None, None, is_degraded, False

    sync_completed = _ReadSysLine(sys_path + "sync_completed").split(" / ")
    if len(sync_completed) != 2:
      # not in the "done / total" form, so no progress is known yet
      return 0, None, is_degraded, False
    sync_done, sync_total = [float(i) for i in sync_completed]
    sync_percent = 100.0*sync_done/sync_total

    sync_speed_k = int(_ReadSysLine(sys_path + "sync_speed"))
    if sync_speed_k == 0:
      time_est = None
    else:
      # NOTE(review): the division by two presumably converts 512-byte
      # sectors to KiB to match the K/sec speed; confirm against the
      # kernel md documentation
      time_est = (sync_total - sync_done) / 2 / sync_speed_k
    return sync_percent, time_est, is_degraded, False
Iustin Pop's avatar
Iustin Pop committed
955 956 957 958 959 960 961 962

  def Open(self, force=False):
    """Make the device ready for I/O.

    Nothing has to be done for the MDRaid1 device type, so the force
    argument is ignored; we could however use the new array_state
    thing from 2.6.18 here.

    """
    return None
Iustin Pop's avatar
Iustin Pop committed
964 965 966 967 968 969 970 971

  def Close(self):
    """Notifies that the device will no longer be used for I/O.

    Nothing has to be done for the MDRaid1 device type; the remark in
    `Open()` applies here too.

    """
    return None
Iustin Pop's avatar
Iustin Pop committed
973 974


975 976
class BaseDRBD(BlockDev):
  """Base DRBD class.

  This class contains a few bits of common functionality between the
  0.7 and 8.x versions of DRBD.

  """
  # matches the first line of /proc/drbd; the last group (the second
  # protocol number) is optional
  _VERSION_RE = re.compile(r"^version: (\d+)\.(\d+)\.(\d+)"
                           r" \(api:(\d+)/proto:(\d+)(?:-(\d+))?\)")

  _DRBD_MAJOR = 147
  _ST_UNCONFIGURED = "Unconfigured"
  _ST_WFCONNECTION = "WFConnection"
  _ST_CONNECTED = "Connected"

  @staticmethod
  def _GetProcData():
    """Return data from /proc/drbd.

    Returns:
      the contents of /proc/drbd as a list of lines

    Raises:
      errors.BlockDeviceError if no data could be read

    """
    stat = open("/proc/drbd", "r")
    try:
      data = stat.read().splitlines()
    finally:
      stat.close()
    if not data:
      raise errors.BlockDeviceError("Can't read any data from /proc/drbd")
    return data

  @staticmethod
  def _MassageProcData(data):
    """Transform the output of _GetProcData into a nicer form.

    Returns:
      a dictionary of minor: joined lines from /proc/drbd for that minor

    """
    lmatch = re.compile("^ *([0-9]+):.*$")
    results = {}
    old_minor = old_line = None
    for line in data:
      lresult = lmatch.match(line)
      if lresult is not None:
        # a new minor starts here, store what we gathered for the
        # previous one
        if old_minor is not None:
          results[old_minor] = old_line
        old_minor = int(lresult.group(1))
        old_line = line
      else:
        # continuation line; lines before the first minor are dropped
        if old_minor is not None:
          old_line += " " + line.strip()
    # add last line
    if old_minor is not None:
      results[old_minor] = old_line
    return results

  @classmethod
  def _GetVersion(cls):
    """Return the DRBD version.

    This will return a dict with keys:
      k_major,
      k_minor,
      k_point,
      api,
      proto,
      proto2 (only on drbd > 8.2.X)

    All values are integers, except for proto2 which is kept as the
    string found in /proc/drbd.

    Raises:
      errors.BlockDeviceError if the version line cannot be parsed

    """
    proc_data = cls._GetProcData()
    first_line = proc_data[0].strip()
    version = cls._VERSION_RE.match(first_line)
    if not version:
      raise errors.BlockDeviceError("Can't parse DRBD version from '%s'" %
                                    first_line)

    values = version.groups()
    retval = {'k_major': int(values[0]),
              'k_minor': int(values[1]),
              'k_point': int(values[2]),
              'api': int(values[3]),
              'proto': int(values[4]),
             }
    if values[5] is not None:
      retval['proto2'] = values[5]

    return retval

  @staticmethod
  def _DevPath(minor):
    """Return the path to a drbd device for a given minor.

    """
    return "/dev/drbd%d" % minor

  @classmethod
  def _GetUsedDevs(cls):
    """Compute the list of used DRBD devices.

    Returns:
      a dictionary of minor: (connection state, /proc/drbd line) for
      all the minors which are not in the unconfigured state

    """
    data = cls._GetProcData()

    used_devs = {}
    valid_line = re.compile("^ *([0-9]+): cs:([^ ]+).*$")
    for line in data:
      match = valid_line.match(line)
      if not match:
        continue
      minor = int(match.group(1))
      state = match.group(2)
      if state == cls._ST_UNCONFIGURED:
        continue
      used_devs[minor] = state, line

    return used_devs

  def _SetFromMinor(self, minor):
    """Set our parameters based on the given minor.

    This sets our minor variable and our dev_path; passing None as
    the minor resets both of them.

    """
    if minor is None:
      self.minor = self.dev_path = None
    else:
      self.minor = minor
      self.dev_path = self._DevPath(minor)

  @staticmethod
  def _CheckMetaSize(meta_device):
    """Check if the given meta device looks like a valid one.

    This currently only checks the size, which must be between 128MiB
    and 160MiB (128MiB plus room for an extra, big, PE on LVM).

    Returns:
      True if the size is acceptable, False otherwise (including when
      the size cannot be determined)

    """
    result = utils.RunCmd(["blockdev", "--getsize", meta_device])
    if result.failed:
      logger.Error("Failed to get device size: %s" % result.fail_reason)
      return False
    try:
      sectors = int(result.stdout)
    except ValueError:
      logger.Error("Invalid output from blockdev: '%s'" % result.stdout)
      return False
    size_bytes = sectors * 512
    # float division, otherwise the fractional part asked for by the
    # %.2f format below is always lost
    size_mib = size_bytes / (1024.0 * 1024.0)
    if size_bytes < 128 * 1024 * 1024: # less than 128MiB
      logger.Error("Meta device too small (%.2fMiB)" % size_mib)
      return False
    if size_bytes > (128 + 32) * 1024 * 1024: # extra (big) PE on LVM
      logger.Error("Meta device too big (%.2fMiB)" % size_mib)
      return False
    return True

  def Rename(self, new_id):
    """Rename a device.

    This is not supported for drbd devices.

    Raises:
      errors.ProgrammerError, always

    """
    raise errors.ProgrammerError("Can't rename a drbd device")

1136 1137

class DRBDev(BaseDRBD):
Iustin Pop's avatar
Iustin Pop committed
1138 1139 1140 1141 1142 1143 1144 1145 1146 1147 1148 1149 1150 1151 1152
  """DRBD block device.

  This implements the local host part of the DRBD device, i.e. it
  doesn't do anything to the supposed peer. If you need a fully
  connected DRBD pair, you need to use this class on both hosts.

  The unique_id for the drbd device is the (local_ip, local_port,
  remote_ip, remote_port) tuple, and it must have two children: the
  data device and the meta_device. The meta device is checked for
  valid size and is zeroed on create.

  """
  def __init__(self, unique_id, children):
    """Initialise the DRBD 0.7 device object.

    Args:
      unique_id: the (local_ip, local_port, remote_ip, remote_port)
                 tuple or list
      children: the two children, data device and meta device

    Raises:
      errors.BlockDeviceError if the kernel DRBD module is not a 0.7 one
      ValueError if unique_id or children have the wrong shape

    """
    super(DRBDev, self).__init__(unique_id, children)
    self.major = self._DRBD_MAJOR
    version = self._GetVersion()
    # this class only handles 0.7: reject the kernel module as soon as
    # either of the two version components differs
    if version['k_major'] != 0 or version['k_minor'] != 7:
      raise errors.BlockDeviceError("Mismatch in DRBD kernel version and"
                                    " requested ganeti usage: kernel is"
                                    " %s.%s, ganeti wants 0.7" %
                                    (version['k_major'], version['k_minor']))
    if len(children) != 2:
      raise ValueError("Invalid configuration data %s" % str(children))
    if not isinstance(unique_id, (tuple, list)) or len(unique_id) != 4:
      raise ValueError("Invalid configuration data %s" % str(unique_id))
    self._lhost, self._lport, self._rhost, self._rport = unique_id
    self.Attach()

  @classmethod
  def _FindUnusedMinor(cls):
    """Return the first unconfigured DRBD minor.

    The minor is taken from the first /proc/drbd line which consists
    only of a minor number and the Unconfigured connection state.

    Raises:
      errors.BlockDeviceError if there is no such line

    """
    unconfigured_re = re.compile("^ *([0-9]+): cs:Unconfigured$")
    for proc_line in cls._GetProcData():
      found = unconfigured_re.match(proc_line)
      if found is not None:
        return int(found.group(1))
    logger.Error("Error: no free drbd minors!")
    raise errors.BlockDeviceError("Can't find a free DRBD minor")
Iustin Pop's avatar
Iustin Pop committed
1180 1181 1182 1183 1184 1185 1186 1187 1188 1189 1190 1191 1192 1193 1194 1195 1196 1197 1198 1199 1200 1201 1202 1203 1204 1205 1206 1207 1208 1209 1210 1211 1212 1213 1214 1215 1216 1217 1218 1219 1220 1221 1222 1223 1224 1225 1226 1227 1228 1229 1230 1231 1232 1233 1234 1235 1236 1237 1238 1239 1240 1241 1242 1243 1244 1245 1246 1247 1248 1249 1250 1251 1252 1253 1254 1255 1256 1257 1258 1259 1260 1261 1262 1263 1264 1265 1266 1267 1268 1269 1270 1271 1272 1273 1274 1275 1276 1277 1278 1279 1280 1281 1282 1283 1284 1285 1286 1287 1288 1289 1290 1291

  @classmethod
  def _GetDevInfo(cls, minor):
    """Get details about a given DRBD minor.

    This parses the output of 'drbdsetup <device> show' and returns a
    dictionary holding, when available, the following keys:
      - local_dev: (major, minor) of the local backing device
      - meta_dev: (major, minor) of the meta device, or the matched
        string when the meta device is "internal"
      - meta_index: the meta index (-1 for an internal meta device)
      - local_addr: (ip, port) of the local endpoint
      - remote_addr: (ip, port) of the remote endpoint

    An empty dictionary is returned if drbdsetup fails or if the
    device is not configured.

    """
    data = {}
    result = utils.RunCmd(["drbdsetup", cls._DevPath(minor), "show"])
    if result.failed:
      logger.Error("Can't display the drbd config: %s" % result.fail_reason)
      return data
    out = result.stdout
    if out == "Not configured\n":
      return data
    # each key is filled in from the first line matching its pattern;
    # a line which matched one pattern is not tried against the others
    for line in out.splitlines():
      if "local_dev" not in data:
        match = re.match("^Lower device: ([0-9]+):([0-9]+) .*$", line)
        if match:
          data["local_dev"] = (int(match.group(1)), int(match.group(2)))
          continue
      if "meta_dev" not in data:
        match = re.match("^Meta device: (([0-9]+):([0-9]+)|internal).*$", line)
        if match:
          if match.group(2) is not None and match.group(3) is not None:
            # matched on the major/minor
            data["meta_dev"] = (int(match.group(2)), int(match.group(3)))
          else:
            # matched on the "internal" string
            data["meta_dev"] = match.group(1)
            # in this case, no meta_index is in the output
            data["meta_index"] = -1
          continue
      if "meta_index" not in data:
        match = re.match("^Meta index: ([0-9]+).*$", line)
        if match:
          data["meta_index"] = int(match.group(1))
          continue
      if "local_addr" not in data:
        match = re.match("^Local address: ([0-9.]+):([0-9]+)$", line)
        if match:
          data["local_addr"] = (match.group(1), int(match.group(2)))
          continue
      if "remote_addr" not in data:
        match = re.match("^Remote address: ([0-9.]+):([0-9]+)$", line)
        if match:
          data["remote_addr"] = (match.group(1), int(match.group(2)))
          continue
    return data

  def _MatchesLocal(self, info):
    """Test if our local config matches with an existing device.

    The parameter should be as returned from `_GetDevInfo()`. This
    method tests if our local backing device is the same as the one in
    the info parameter, in effect testing if we look like the given
    device.

    """
    if not ("local_dev" in info and "meta_dev" in info and
            "meta_index" in info):
      return False

    backend = self._children[0]
    if backend is not None:
      retval = (info["local_dev"] == (backend.major, backend.minor))
    else:
      retval = (info["local_dev"] == (0, 0))
    meta = self._children[1]
    if meta is not None:
      retval = retval and (info["meta_dev"] == (meta.major, meta.minor))
      retval = retval and (info["meta_index"] == 0)
    else:
      retval = retval and (info["meta_dev"] == "internal" and
                           info["meta_index"] == -1)
    return retval

  def _MatchesNet(self, info):
    """Test if our network config matches with an existing device.

    The parameter should be as returned from `_GetDevInfo()`. This
    method tests if our network configuration is the same as the one
    in the info parameter, in effect testing if we look like the given
    device.

    """
    if (((self._lhost is None and not ("local_addr" in info)) and
         (self._rhost is None and not ("remote_addr" in info)))):
      return True

    if self._lhost is None:
      return False

    if not ("local_addr" in info and
            "remote_addr" in info):
      return False

    retval = (info["local_addr"] == (self._lhost, self._lport))
    retval = (retval and
              info["remote_addr"] == (self._rhost, self._rport))
    return retval

  @classmethod
  def _AssembleLocal(cls, minor, backend, meta):
    """Attach the local storage to a DRBD minor.

    This is the first thing that must be done on an unconfigured DRBD
    device, and it must be done only once. The meta device is checked
    with _CheckMetaSize() before anything is run.

    Returns:
      True if the disk was attached, False otherwise

    """
    if not cls._CheckMetaSize(meta):
      return False
    attach_cmd = ["drbdsetup", cls._DevPath(minor), "disk",
                  backend, meta, "0", "-e", "detach"]
    result = utils.RunCmd(attach_cmd)
    if result.failed:
      logger.Error("Can't attach local disk: %s" % result.output)
      return False
    return True

  @classmethod
  def _ShutdownLocal(cls, minor):
    """Detach a DRBD minor from its local storage.

    I/Os will continue to be served from the remote device. If we
    don't have a remote device, this operation will fail.

    Returns:
      True if the detach command succeeded, False otherwise

    """
    detach_cmd = ["drbdsetup", cls._DevPath(minor), "detach"]
    result = utils.RunCmd(detach_cmd)
    if result.failed:
      logger.Error("Can't detach local device: %s" % result.output)
      return False
    return True

  @staticmethod
  def _ShutdownAll(minor):
    """Bring a DRBD minor completely down.

    This will, of course, fail if the device is in use.

    Returns:
      True if the 'down' command succeeded, False otherwise

    """
    down_cmd = ["drbdsetup", DRBDev._DevPath(minor), "down"]
    result = utils.RunCmd(down_cmd)
    if result.failed:
      logger.Error("Can't shutdown drbd device: %s" % result.output)
      return False
    return True

  @classmethod
  def _AssembleNet(cls, minor, net_info, protocol):
    """Set up the network side of a DRBD minor.

    This operation can be, in theory, done multiple times, but there
    have been cases (in lab testing) in which the network part of the
    device had become stuck and couldn't be shut down because activity
    from the new peer (also stuck) triggered a timer re-init and
    needed remote peer interface shutdown in order to clear. So please
    don't change online the net config.

    After the net command has been run, we poll the device (once per
    second, for about ten seconds) until it reports the requested
    local and remote addresses.

    Args:
      minor: the DRBD minor to configure
      net_info: the (lhost, lport, rhost, rport) tuple
      protocol: the protocol argument passed to 'drbdsetup net'

    Returns:
      True if the device shows the new network config, False if the
      command failed or the config didn't show up in time

    """
    lhost, lport, rhost, rport = net_info
    net_cmd = ["drbdsetup", cls._DevPath(minor), "net",
               "%s:%s" % (lhost, lport), "%s:%s" % (rhost, rport),
               protocol]
    result = utils.RunCmd(net_cmd)
    if result.failed:
      logger.Error("Can't setup network for dbrd device: %s" %
                   result.fail_reason)
      return False

    deadline = time.time() + 10
    while time.time() < deadline:
      info = cls._GetDevInfo(minor)
      if ("local_addr" in info and "remote_addr" in info and
          info["local_addr"] == (lhost, lport) and
          info["remote_addr"] == (rhost, rport)):
        return True
      # not (yet) what we asked for, wait a bit and look again
      time.sleep(1)

    logger.Error("Timeout while configuring network")
    return False

  @classmethod
  def _ShutdownNet(cls, minor):
    """Drop the connection of a DRBD minor to its peer.

    This fails if we don't have a local device.

    Returns:
      True if the disconnect command succeeded, False otherwise

    """
    disconnect_cmd = ["drbdsetup", cls._DevPath(minor), "disconnect"]
    result = utils.RunCmd(disconnect_cmd)
    if result.failed:
      logger.Error("Can't shutdown network: %s" % result.output)
      return False
    return True

  def Assemble(self):
    """Assemble the drbd device.

    If we can attach to an already configured minor there is nothing
    else to do. Otherwise, after the parent class Assemble():
      - an unused minor is looked up
      - if we have a data device, the local storage (data and meta
        device) is attached to that minor
      - if the full (local and remote) network information is
        available, the network is configured using protocol "C"; if
        this fails after the local storage was attached, the whole
        minor is brought down again

    Returns:
      True on success, a false value otherwise

    """
    self.Attach()
    if self.minor is not None:
      logger.Info("Already assembled")
      return True

    result = super(DRBDev, self).Assemble()
    if not result:
      return result

    minor = self._FindUnusedMinor()

    local_attached = False
    if self._children[0]:
      if not self._AssembleLocal(minor, self._children[0].dev_path,
                                 self._children[1].dev_path):
        return False
      local_attached = True

    if self._lhost and self._lport and self._rhost and self._rport:
      net_info = (self._lhost, self._lport, self._rhost, self._rport)
      if not self._AssembleNet(minor, net_info, "C"):
        if local_attached:
          # we will ignore failures from this
          logger.Error("net setup failed, tearing down local device")
          self._ShutdownAll(minor)
        return False

    self._SetFromMinor(minor)
    return True

  def Shutdown(self):
    """Bring the DRBD device down.

    An object which is not (and cannot be) attached to a minor is
    considered already shut down.

    Returns:
      True on success, False if the minor could not be brought down

    """
    if self.minor is None:
      if not self.Attach():
        logger.Info("DRBD device not attached to a device during Shutdown")
        return True
    if self._ShutdownAll(self.minor):
      # forget about the minor we were using
      self.minor = None
      self.dev_path = None
      return True
    return False

  def Attach(self):
    """Find a DRBD device which matches our config and attach to it.

    In case of partially attached (local device matches but no network
    setup), we perform the network attach. If successful, we re-test
    the attach if can return success.

    Returns:
      True if a matching minor was found (our minor and dev_path then
      point to it), False otherwise (both are then reset)

    """
    for minor in self._GetUsedDevs():
      info = self._GetDevInfo(minor)
      match_l = self._MatchesLocal(info)
      match_r = self._MatchesNet(info)
      if match_l and match_r:
        break
      # our local storage, but the device has no network config at all:
      # set up the network and re-check against the fresh device info
      if match_l and not match_r and "local_addr" not in info:
        res_r = self._AssembleNet(minor,
                                  (self._lhost, self._lport,
                                   self._rhost, self._rport),
                                  "C")
        if res_r and self._MatchesNet(self._GetDevInfo(minor)):
          break
    else:
      # the loop finished without a break, i.e. nothing matched
      minor = None

    self._SetFromMinor(minor)
    return minor is not None

  def Open(self, force=False):
    """Switch the local device to the primary role.

    If the 'force' parameter is given, '--do-what-I-say' is passed to
    drbdsetup. Since this is a potentially dangerous operation, the
    force flag should be only given after creation, when it actually
    has to be given.

    Returns:
      False if we cannot attach to a device, None otherwise

    Raises:
      errors.BlockDeviceError if the role change fails

    """
    if self.minor is None and not self.Attach():
      logger.Error("DRBD cannot attach to a device during open")
      return False
    extra_args = []
    if force:
      extra_args.append("--do-what-I-say")
    result = utils.RunCmd(["drbdsetup", self.dev_path, "primary"] +
                          extra_args)
    if not result.failed:
      return
    msg = ("Can't make drbd device primary: %s" % result.output)
    logger.Error(msg)
    raise errors.BlockDeviceError(msg)
Iustin Pop's avatar
Iustin Pop committed
1486 1487 1488 1489 1490 1491 1492 1493 1494 1495 1496 1497

  def Close(self):
    """Switch the local device to the secondary role.

    This will, of course, fail if the device is in use.

    Raises:
      errors.BlockDeviceError if we cannot attach to a device or if
      the role change fails

    """
    if self.minor is None:
      if not self.Attach():
        logger.Info("Instance not attached to a device")
        raise errors.BlockDeviceError("Can't find device")
    secondary_cmd = ["drbdsetup", self.dev_path, "secondary"]
    result = utils.RunCmd(secondary_cmd)
    if not result.failed:
      return
    msg = ("Can't switch drbd device to"
           " secondary: %s" % result.output)
    logger.Error(msg)
    raise errors.BlockDeviceError(msg)
Iustin Pop's avatar
Iustin Pop committed
1502 1503 1504 1505 1506 1507 1508 1509 1510 1511 1512 1513 1514 1515 1516 1517 1518 1519 1520

  def SetSyncSpeed(self, kbytes):
    """Change the rate of the DRBD syncer.

    The parent class implementation is invoked first, then the rate
    is passed to 'drbdsetup syncer -r'.

    Returns:
      False if we are not attached to a device or if drbdsetup fails,
      otherwise the result of the parent class SetSyncSpeed()

    """
    children_result = super(DRBDev, self).SetSyncSpeed(kbytes)
    if self.minor is None:
      logger.Info("Instance not attached to a device")
      return False
    syncer_cmd = ["drbdsetup", self.dev_path, "syncer", "-r", "%d" % kbytes]
    result = utils.RunCmd(syncer_cmd)
    if result.failed:
      logger.Error("Can't change syncer rate: %s " % result.fail_reason)
      return False
    return children_result

  def GetSyncStatus(self):
    """Returns the sync status of the device.

    Returns:
     (sync_percent, estimated_time, is_degraded, ldisk)

    The first two values are taken from the "sync'ed" and "finish"
    fields of our /proc/drbd entry; both are None if these fields are
    not present. estimated_time is the time left in seconds.

    is_degraded is True whenever the connection state is not
    "Connected".

    The ldisk value is always returned as False, since the DRBD7
    devices have not been converted.

    Raises:
      errors.BlockDeviceError if we cannot attach to a device or if
      our minor cannot be found in /proc/drbd

    """
    if self.minor is None and not self.Attach():
      raise errors.BlockDeviceError("Can't attach to device in GetSyncStatus")
    proc_info = self._MassageProcData(self._GetProcData())
    if self.minor not in proc_info:
      raise errors.BlockDeviceError("Can't find myself in /proc (minor %d)" %
                                    self.minor)
    line = proc_info[self.minor]

    # the connection state, needed for the degraded flag
    state_match = re.match("^ *[0-9]+: cs:([^ ]+).*$", line)
    if not state_match:
      raise errors.BlockDeviceError("Can't find my data in /proc (minor %d)" %
                                    self.minor)
    is_degraded = state_match.group(1) != "Connected"

    # the progress information, only present during a resync
    sync_match = re.match("^.*sync'ed: *([0-9.]+)%.*"
                          " finish: ([0-9]+):([0-9]+):([0-9]+) .*$", line)
    if not sync_match:
      return None, None, is_degraded, False

    sync_percent = float(sync_match.group(1))
    hours, minutes, seconds = [int(sync_match.group(idx))
                               for idx in (2, 3, 4)]
    est_time = hours * 3600 + minutes * 60 + seconds
    return sync_percent, est_time, is_degraded, False
Iustin Pop's avatar
Iustin Pop committed
1556 1557 1558 1559 1560 1561 1562 1563 1564 1565 1566 1567 1568 1569 1570 1571 1572 1573 1574 1575 1576 1577 1578 1579 1580 1581 1582 1583 1584 1585 1586 1587 1588 1589 1590 1591 1592 1593 1594 1595 1596 1597 1598 1599 1600 1601 1602 1603 1604 1605 1606 1607 1608 1609 1610 1611 1612 1613 1614

  def GetStatus(self):
    """Compute the status of the DRBD device

    Note that DRBD devices don't have the STATUS_EXISTING state.

    Returns:
      STATUS_UNKNOWN if we cannot attach to a device or if our minor
      is not listed in /proc/drbd, STATUS_ONLINE if the local role is
      Primary and STATUS_STANDBY if it is Secondary

    """
    if self.minor is None and not self.Attach():
      return self.STATUS_UNKNOWN

    data = self._GetProcData()
    match = re.compile("^ *%d: cs:[^ ]+ st:(Primary|Secondary)/.*$" %
                       self.minor)
    for line in data:
      mresult = match.match(line)
      if mresult:
        break
    else:
      logger.Error("Can't find myself!")
      return self.STATUS_UNKNOWN

    # the pattern has a single group, holding the local role
    state = mresult.group(1)
    if state == "Primary":
      result = self.STATUS_ONLINE
    else:
      result = self.STATUS_STANDBY

    return result

  @staticmethod
  def _ZeroDevice(device):
    """Zero a device.

    This writes until we get ENOSPC.

    """
    f = open(device, "w")
    buf = "\0" * 1048576
    try:
      while True:
        f.write(buf)
    except IOError, err:
      if err.errno != errno.ENOSPC:
        raise

  @classmethod
  def Create(cls, unique_id, children, size):
    """Create a new DRBD device.

    Since DRBD devices are not created per se, just assembled, this
    function just zeroes the meta device.

    """
    if len(children) != 2:
      raise errors.ProgrammerError("Invalid setup for the drbd device")
    meta = children[1]
    meta.Assemble()
    if not meta.Attach():
      raise errors.BlockDeviceError("Can't attach to meta device")
Iustin Pop's avatar