github.com/rsampaio/docker@v0.7.2-0.20150827203920-fdc73cc3fc31/daemon/graphdriver/devmapper/deviceset.go (about) 1 // +build linux 2 3 package devmapper 4 5 import ( 6 "encoding/json" 7 "errors" 8 "fmt" 9 "io" 10 "io/ioutil" 11 "os" 12 "os/exec" 13 "path" 14 "path/filepath" 15 "strconv" 16 "strings" 17 "sync" 18 "syscall" 19 "time" 20 21 "github.com/Sirupsen/logrus" 22 "github.com/docker/docker/daemon/graphdriver" 23 "github.com/docker/docker/pkg/devicemapper" 24 "github.com/docker/docker/pkg/parsers" 25 "github.com/docker/docker/pkg/units" 26 "github.com/opencontainers/runc/libcontainer/label" 27 ) 28 29 var ( 30 defaultDataLoopbackSize int64 = 100 * 1024 * 1024 * 1024 31 defaultMetaDataLoopbackSize int64 = 2 * 1024 * 1024 * 1024 32 defaultBaseFsSize uint64 = 100 * 1024 * 1024 * 1024 33 defaultThinpBlockSize uint32 = 128 // 64K = 128 512b sectors 34 defaultUdevSyncOverride = false 35 maxDeviceID = 0xffffff // 24 bit, pool limit 36 deviceIDMapSz = (maxDeviceID + 1) / 8 37 // We retry device removal so many a times that even error messages 38 // will fill up console during normal operation. So only log Fatal 39 // messages by default. 40 logLevel = devicemapper.LogLevelFatal 41 driverDeferredRemovalSupport = false 42 enableDeferredRemoval = false 43 ) 44 45 const deviceSetMetaFile string = "deviceset-metadata" 46 const transactionMetaFile string = "transaction-metadata" 47 48 type transaction struct { 49 OpenTransactionID uint64 `json:"open_transaction_id"` 50 DeviceIDHash string `json:"device_hash"` 51 DeviceID int `json:"device_id"` 52 } 53 54 type devInfo struct { 55 Hash string `json:"-"` 56 DeviceID int `json:"device_id"` 57 Size uint64 `json:"size"` 58 TransactionID uint64 `json:"transaction_id"` 59 Initialized bool `json:"initialized"` 60 devices *DeviceSet 61 62 mountCount int 63 mountPath string 64 65 // The global DeviceSet lock guarantees that we serialize all 66 // the calls to libdevmapper (which is not threadsafe), but we 67 // sometimes release that lock while sleeping. In that case 68 // this per-device lock is still held, protecting against 69 // other accesses to the device that we're doing the wait on. 70 // 71 // WARNING: In order to avoid AB-BA deadlocks when releasing 72 // the global lock while holding the per-device locks all 73 // device locks must be acquired *before* the device lock, and 74 // multiple device locks should be acquired parent before child. 75 lock sync.Mutex 76 } 77 78 type metaData struct { 79 Devices map[string]*devInfo `json:"Devices"` 80 devicesLock sync.Mutex // Protects all read/writes to Devices map 81 } 82 83 // DeviceSet holds information about list of devices 84 type DeviceSet struct { 85 metaData `json:"-"` 86 sync.Mutex `json:"-"` // Protects Devices map and serializes calls into libdevmapper 87 root string 88 devicePrefix string 89 TransactionID uint64 `json:"-"` 90 NextDeviceID int `json:"next_device_id"` 91 deviceIDMap []byte 92 93 // Options 94 dataLoopbackSize int64 95 metaDataLoopbackSize int64 96 baseFsSize uint64 97 filesystem string 98 mountOptions string 99 mkfsArgs []string 100 dataDevice string // block or loop dev 101 dataLoopFile string // loopback file, if used 102 metadataDevice string // block or loop dev 103 metadataLoopFile string // loopback file, if used 104 doBlkDiscard bool 105 thinpBlockSize uint32 106 thinPoolDevice string 107 transaction `json:"-"` 108 overrideUdevSyncCheck bool 109 deferredRemove bool // use deferred removal 110 BaseDeviceUUID string //save UUID of base device 111 } 112 113 // DiskUsage contains information about disk usage and is used when reporting Status of a device. 114 type DiskUsage struct { 115 // Used bytes on the disk. 116 Used uint64 117 // Total bytes on the disk. 118 Total uint64 119 // Available bytes on the disk. 120 Available uint64 121 } 122 123 // Status returns the information about the device. 124 type Status struct { 125 // PoolName is the name of the data pool. 126 PoolName string 127 // DataFile is the actual block device for data. 128 DataFile string 129 // DataLoopback loopback file, if used. 130 DataLoopback string 131 // MetadataFile is the actual block device for metadata. 132 MetadataFile string 133 // MetadataLoopback is the loopback file, if used. 134 MetadataLoopback string 135 // Data is the disk used for data. 136 Data DiskUsage 137 // Metadata is the disk used for meta data. 138 Metadata DiskUsage 139 // SectorSize size of the vector. 140 SectorSize uint64 141 // UdevSyncSupported is true if sync is supported. 142 UdevSyncSupported bool 143 // DeferredRemoveEnabled is true then the device is not unmounted. 144 DeferredRemoveEnabled bool 145 } 146 147 // Structure used to export image/container metadata in docker inspect. 148 type deviceMetadata struct { 149 deviceID int 150 deviceSize uint64 // size in bytes 151 deviceName string // Device name as used during activation 152 } 153 154 // DevStatus returns information about device mounted containing its id, size and sector information. 155 type DevStatus struct { 156 // DeviceID is the id of the device. 157 DeviceID int 158 // Size is the size of the filesystem. 159 Size uint64 160 // TransactionID is a unique integer per device set used to identify an operation on the file system, this number is incremental. 161 TransactionID uint64 162 // SizeInSectors indicates the size of the sectors allocated. 163 SizeInSectors uint64 164 // MappedSectors indicates number of mapped sectors. 165 MappedSectors uint64 166 // HighestMappedSector is the pointer to the highest mapped sector. 167 HighestMappedSector uint64 168 } 169 170 func getDevName(name string) string { 171 return "/dev/mapper/" + name 172 } 173 174 func (info *devInfo) Name() string { 175 hash := info.Hash 176 if hash == "" { 177 hash = "base" 178 } 179 return fmt.Sprintf("%s-%s", info.devices.devicePrefix, hash) 180 } 181 182 func (info *devInfo) DevName() string { 183 return getDevName(info.Name()) 184 } 185 186 func (devices *DeviceSet) loopbackDir() string { 187 return path.Join(devices.root, "devicemapper") 188 } 189 190 func (devices *DeviceSet) metadataDir() string { 191 return path.Join(devices.root, "metadata") 192 } 193 194 func (devices *DeviceSet) metadataFile(info *devInfo) string { 195 file := info.Hash 196 if file == "" { 197 file = "base" 198 } 199 return path.Join(devices.metadataDir(), file) 200 } 201 202 func (devices *DeviceSet) transactionMetaFile() string { 203 return path.Join(devices.metadataDir(), transactionMetaFile) 204 } 205 206 func (devices *DeviceSet) deviceSetMetaFile() string { 207 return path.Join(devices.metadataDir(), deviceSetMetaFile) 208 } 209 210 func (devices *DeviceSet) oldMetadataFile() string { 211 return path.Join(devices.loopbackDir(), "json") 212 } 213 214 func (devices *DeviceSet) getPoolName() string { 215 if devices.thinPoolDevice == "" { 216 return devices.devicePrefix + "-pool" 217 } 218 return devices.thinPoolDevice 219 } 220 221 func (devices *DeviceSet) getPoolDevName() string { 222 return getDevName(devices.getPoolName()) 223 } 224 225 func (devices *DeviceSet) hasImage(name string) bool { 226 dirname := devices.loopbackDir() 227 filename := path.Join(dirname, name) 228 229 _, err := os.Stat(filename) 230 return err == nil 231 } 232 233 // ensureImage creates a sparse file of <size> bytes at the path 234 // <root>/devicemapper/<name>. 235 // If the file already exists, it does nothing. 236 // Either way it returns the full path. 237 func (devices *DeviceSet) ensureImage(name string, size int64) (string, error) { 238 dirname := devices.loopbackDir() 239 filename := path.Join(dirname, name) 240 241 if err := os.MkdirAll(dirname, 0700); err != nil { 242 return "", err 243 } 244 245 if _, err := os.Stat(filename); err != nil { 246 if !os.IsNotExist(err) { 247 return "", err 248 } 249 logrus.Debugf("Creating loopback file %s for device-manage use", filename) 250 file, err := os.OpenFile(filename, os.O_RDWR|os.O_CREATE, 0600) 251 if err != nil { 252 return "", err 253 } 254 defer file.Close() 255 256 if err := file.Truncate(size); err != nil { 257 return "", err 258 } 259 } 260 return filename, nil 261 } 262 263 func (devices *DeviceSet) allocateTransactionID() uint64 { 264 devices.OpenTransactionID = devices.TransactionID + 1 265 return devices.OpenTransactionID 266 } 267 268 func (devices *DeviceSet) updatePoolTransactionID() error { 269 if err := devicemapper.SetTransactionId(devices.getPoolDevName(), devices.TransactionID, devices.OpenTransactionID); err != nil { 270 return fmt.Errorf("Error setting devmapper transaction ID: %s", err) 271 } 272 devices.TransactionID = devices.OpenTransactionID 273 return nil 274 } 275 276 func (devices *DeviceSet) removeMetadata(info *devInfo) error { 277 if err := os.RemoveAll(devices.metadataFile(info)); err != nil { 278 return fmt.Errorf("Error removing metadata file %s: %s", devices.metadataFile(info), err) 279 } 280 return nil 281 } 282 283 // Given json data and file path, write it to disk 284 func (devices *DeviceSet) writeMetaFile(jsonData []byte, filePath string) error { 285 tmpFile, err := ioutil.TempFile(devices.metadataDir(), ".tmp") 286 if err != nil { 287 return fmt.Errorf("Error creating metadata file: %s", err) 288 } 289 290 n, err := tmpFile.Write(jsonData) 291 if err != nil { 292 return fmt.Errorf("Error writing metadata to %s: %s", tmpFile.Name(), err) 293 } 294 if n < len(jsonData) { 295 return io.ErrShortWrite 296 } 297 if err := tmpFile.Sync(); err != nil { 298 return fmt.Errorf("Error syncing metadata file %s: %s", tmpFile.Name(), err) 299 } 300 if err := tmpFile.Close(); err != nil { 301 return fmt.Errorf("Error closing metadata file %s: %s", tmpFile.Name(), err) 302 } 303 if err := os.Rename(tmpFile.Name(), filePath); err != nil { 304 return fmt.Errorf("Error committing metadata file %s: %s", tmpFile.Name(), err) 305 } 306 307 return nil 308 } 309 310 func (devices *DeviceSet) saveMetadata(info *devInfo) error { 311 jsonData, err := json.Marshal(info) 312 if err != nil { 313 return fmt.Errorf("Error encoding metadata to json: %s", err) 314 } 315 if err := devices.writeMetaFile(jsonData, devices.metadataFile(info)); err != nil { 316 return err 317 } 318 return nil 319 } 320 321 func (devices *DeviceSet) markDeviceIDUsed(deviceID int) { 322 var mask byte 323 i := deviceID % 8 324 mask = 1 << uint(i) 325 devices.deviceIDMap[deviceID/8] = devices.deviceIDMap[deviceID/8] | mask 326 } 327 328 func (devices *DeviceSet) markDeviceIDFree(deviceID int) { 329 var mask byte 330 i := deviceID % 8 331 mask = ^(1 << uint(i)) 332 devices.deviceIDMap[deviceID/8] = devices.deviceIDMap[deviceID/8] & mask 333 } 334 335 func (devices *DeviceSet) isDeviceIDFree(deviceID int) bool { 336 var mask byte 337 i := deviceID % 8 338 mask = (1 << uint(i)) 339 if (devices.deviceIDMap[deviceID/8] & mask) != 0 { 340 return false 341 } 342 return true 343 } 344 345 func (devices *DeviceSet) lookupDevice(hash string) (*devInfo, error) { 346 devices.devicesLock.Lock() 347 defer devices.devicesLock.Unlock() 348 info := devices.Devices[hash] 349 if info == nil { 350 info = devices.loadMetadata(hash) 351 if info == nil { 352 return nil, fmt.Errorf("Unknown device %s", hash) 353 } 354 355 devices.Devices[hash] = info 356 } 357 return info, nil 358 } 359 360 func (devices *DeviceSet) deviceFileWalkFunction(path string, finfo os.FileInfo) error { 361 362 // Skip some of the meta files which are not device files. 363 if strings.HasSuffix(finfo.Name(), ".migrated") { 364 logrus.Debugf("Skipping file %s", path) 365 return nil 366 } 367 368 if strings.HasPrefix(finfo.Name(), ".") { 369 logrus.Debugf("Skipping file %s", path) 370 return nil 371 } 372 373 if finfo.Name() == deviceSetMetaFile { 374 logrus.Debugf("Skipping file %s", path) 375 return nil 376 } 377 378 logrus.Debugf("Loading data for file %s", path) 379 380 hash := finfo.Name() 381 if hash == "base" { 382 hash = "" 383 } 384 385 dinfo := devices.loadMetadata(hash) 386 if dinfo == nil { 387 return fmt.Errorf("Error loading device metadata file %s", hash) 388 } 389 390 if dinfo.DeviceID > maxDeviceID { 391 logrus.Errorf("Ignoring Invalid DeviceID=%d", dinfo.DeviceID) 392 return nil 393 } 394 395 devices.Lock() 396 devices.markDeviceIDUsed(dinfo.DeviceID) 397 devices.Unlock() 398 399 logrus.Debugf("Added deviceID=%d to DeviceIDMap", dinfo.DeviceID) 400 return nil 401 } 402 403 func (devices *DeviceSet) constructDeviceIDMap() error { 404 logrus.Debugf("[deviceset] constructDeviceIDMap()") 405 defer logrus.Debugf("[deviceset] constructDeviceIDMap() END") 406 407 var scan = func(path string, info os.FileInfo, err error) error { 408 if err != nil { 409 logrus.Debugf("Can't walk the file %s", path) 410 return nil 411 } 412 413 // Skip any directories 414 if info.IsDir() { 415 return nil 416 } 417 418 return devices.deviceFileWalkFunction(path, info) 419 } 420 421 return filepath.Walk(devices.metadataDir(), scan) 422 } 423 424 func (devices *DeviceSet) unregisterDevice(id int, hash string) error { 425 logrus.Debugf("unregisterDevice(%v, %v)", id, hash) 426 info := &devInfo{ 427 Hash: hash, 428 DeviceID: id, 429 } 430 431 devices.devicesLock.Lock() 432 delete(devices.Devices, hash) 433 devices.devicesLock.Unlock() 434 435 if err := devices.removeMetadata(info); err != nil { 436 logrus.Debugf("Error removing metadata: %s", err) 437 return err 438 } 439 440 return nil 441 } 442 443 func (devices *DeviceSet) registerDevice(id int, hash string, size uint64, transactionID uint64) (*devInfo, error) { 444 logrus.Debugf("registerDevice(%v, %v)", id, hash) 445 info := &devInfo{ 446 Hash: hash, 447 DeviceID: id, 448 Size: size, 449 TransactionID: transactionID, 450 Initialized: false, 451 devices: devices, 452 } 453 454 devices.devicesLock.Lock() 455 devices.Devices[hash] = info 456 devices.devicesLock.Unlock() 457 458 if err := devices.saveMetadata(info); err != nil { 459 // Try to remove unused device 460 devices.devicesLock.Lock() 461 delete(devices.Devices, hash) 462 devices.devicesLock.Unlock() 463 return nil, err 464 } 465 466 return info, nil 467 } 468 469 func (devices *DeviceSet) activateDeviceIfNeeded(info *devInfo) error { 470 logrus.Debugf("activateDeviceIfNeeded(%v)", info.Hash) 471 472 // Make sure deferred removal on device is canceled, if one was 473 // scheduled. 474 if err := devices.cancelDeferredRemoval(info); err != nil { 475 return fmt.Errorf("Deivce Deferred Removal Cancellation Failed: %s", err) 476 } 477 478 if devinfo, _ := devicemapper.GetInfo(info.Name()); devinfo != nil && devinfo.Exists != 0 { 479 return nil 480 } 481 482 return devicemapper.ActivateDevice(devices.getPoolDevName(), info.Name(), info.DeviceID, info.Size) 483 } 484 485 func (devices *DeviceSet) createFilesystem(info *devInfo) error { 486 devname := info.DevName() 487 488 args := []string{} 489 for _, arg := range devices.mkfsArgs { 490 args = append(args, arg) 491 } 492 493 args = append(args, devname) 494 495 var err error 496 switch devices.filesystem { 497 case "xfs": 498 err = exec.Command("mkfs.xfs", args...).Run() 499 case "ext4": 500 err = exec.Command("mkfs.ext4", append([]string{"-E", "nodiscard,lazy_itable_init=0,lazy_journal_init=0"}, args...)...).Run() 501 if err != nil { 502 err = exec.Command("mkfs.ext4", append([]string{"-E", "nodiscard,lazy_itable_init=0"}, args...)...).Run() 503 } 504 if err != nil { 505 return err 506 } 507 err = exec.Command("tune2fs", append([]string{"-c", "-1", "-i", "0"}, devname)...).Run() 508 default: 509 err = fmt.Errorf("Unsupported filesystem type %s", devices.filesystem) 510 } 511 if err != nil { 512 return err 513 } 514 515 return nil 516 } 517 518 func (devices *DeviceSet) migrateOldMetaData() error { 519 // Migrate old metadata file 520 jsonData, err := ioutil.ReadFile(devices.oldMetadataFile()) 521 if err != nil && !os.IsNotExist(err) { 522 return err 523 } 524 525 if jsonData != nil { 526 m := metaData{Devices: make(map[string]*devInfo)} 527 528 if err := json.Unmarshal(jsonData, &m); err != nil { 529 return err 530 } 531 532 for hash, info := range m.Devices { 533 info.Hash = hash 534 devices.saveMetadata(info) 535 } 536 if err := os.Rename(devices.oldMetadataFile(), devices.oldMetadataFile()+".migrated"); err != nil { 537 return err 538 } 539 540 } 541 542 return nil 543 } 544 545 func (devices *DeviceSet) initMetaData() error { 546 if err := devices.migrateOldMetaData(); err != nil { 547 return err 548 } 549 550 _, transactionID, _, _, _, _, err := devices.poolStatus() 551 if err != nil { 552 return err 553 } 554 555 devices.TransactionID = transactionID 556 557 if err := devices.constructDeviceIDMap(); err != nil { 558 return err 559 } 560 561 if err := devices.processPendingTransaction(); err != nil { 562 return err 563 } 564 return nil 565 } 566 567 func (devices *DeviceSet) incNextDeviceID() { 568 // IDs are 24bit, so wrap around 569 devices.NextDeviceID = (devices.NextDeviceID + 1) & maxDeviceID 570 } 571 572 func (devices *DeviceSet) getNextFreeDeviceID() (int, error) { 573 devices.incNextDeviceID() 574 for i := 0; i <= maxDeviceID; i++ { 575 if devices.isDeviceIDFree(devices.NextDeviceID) { 576 devices.markDeviceIDUsed(devices.NextDeviceID) 577 return devices.NextDeviceID, nil 578 } 579 devices.incNextDeviceID() 580 } 581 582 return 0, fmt.Errorf("Unable to find a free device ID") 583 } 584 585 func (devices *DeviceSet) createRegisterDevice(hash string) (*devInfo, error) { 586 deviceID, err := devices.getNextFreeDeviceID() 587 if err != nil { 588 return nil, err 589 } 590 591 if err := devices.openTransaction(hash, deviceID); err != nil { 592 logrus.Debugf("Error opening transaction hash = %s deviceID = %d", hash, deviceID) 593 devices.markDeviceIDFree(deviceID) 594 return nil, err 595 } 596 597 for { 598 if err := devicemapper.CreateDevice(devices.getPoolDevName(), deviceID); err != nil { 599 if devicemapper.DeviceIdExists(err) { 600 // Device ID already exists. This should not 601 // happen. Now we have a mechianism to find 602 // a free device ID. So something is not right. 603 // Give a warning and continue. 604 logrus.Errorf("Device ID %d exists in pool but it is supposed to be unused", deviceID) 605 deviceID, err = devices.getNextFreeDeviceID() 606 if err != nil { 607 return nil, err 608 } 609 // Save new device id into transaction 610 devices.refreshTransaction(deviceID) 611 continue 612 } 613 logrus.Debugf("Error creating device: %s", err) 614 devices.markDeviceIDFree(deviceID) 615 return nil, err 616 } 617 break 618 } 619 620 logrus.Debugf("Registering device (id %v) with FS size %v", deviceID, devices.baseFsSize) 621 info, err := devices.registerDevice(deviceID, hash, devices.baseFsSize, devices.OpenTransactionID) 622 if err != nil { 623 _ = devicemapper.DeleteDevice(devices.getPoolDevName(), deviceID) 624 devices.markDeviceIDFree(deviceID) 625 return nil, err 626 } 627 628 if err := devices.closeTransaction(); err != nil { 629 devices.unregisterDevice(deviceID, hash) 630 devicemapper.DeleteDevice(devices.getPoolDevName(), deviceID) 631 devices.markDeviceIDFree(deviceID) 632 return nil, err 633 } 634 return info, nil 635 } 636 637 func (devices *DeviceSet) createRegisterSnapDevice(hash string, baseInfo *devInfo) error { 638 deviceID, err := devices.getNextFreeDeviceID() 639 if err != nil { 640 return err 641 } 642 643 if err := devices.openTransaction(hash, deviceID); err != nil { 644 logrus.Debugf("Error opening transaction hash = %s deviceID = %d", hash, deviceID) 645 devices.markDeviceIDFree(deviceID) 646 return err 647 } 648 649 for { 650 if err := devicemapper.CreateSnapDevice(devices.getPoolDevName(), deviceID, baseInfo.Name(), baseInfo.DeviceID); err != nil { 651 if devicemapper.DeviceIdExists(err) { 652 // Device ID already exists. This should not 653 // happen. Now we have a mechianism to find 654 // a free device ID. So something is not right. 655 // Give a warning and continue. 656 logrus.Errorf("Device ID %d exists in pool but it is supposed to be unused", deviceID) 657 deviceID, err = devices.getNextFreeDeviceID() 658 if err != nil { 659 return err 660 } 661 // Save new device id into transaction 662 devices.refreshTransaction(deviceID) 663 continue 664 } 665 logrus.Debugf("Error creating snap device: %s", err) 666 devices.markDeviceIDFree(deviceID) 667 return err 668 } 669 break 670 } 671 672 if _, err := devices.registerDevice(deviceID, hash, baseInfo.Size, devices.OpenTransactionID); err != nil { 673 devicemapper.DeleteDevice(devices.getPoolDevName(), deviceID) 674 devices.markDeviceIDFree(deviceID) 675 logrus.Debugf("Error registering device: %s", err) 676 return err 677 } 678 679 if err := devices.closeTransaction(); err != nil { 680 devices.unregisterDevice(deviceID, hash) 681 devicemapper.DeleteDevice(devices.getPoolDevName(), deviceID) 682 devices.markDeviceIDFree(deviceID) 683 return err 684 } 685 return nil 686 } 687 688 func (devices *DeviceSet) loadMetadata(hash string) *devInfo { 689 info := &devInfo{Hash: hash, devices: devices} 690 691 jsonData, err := ioutil.ReadFile(devices.metadataFile(info)) 692 if err != nil { 693 return nil 694 } 695 696 if err := json.Unmarshal(jsonData, &info); err != nil { 697 return nil 698 } 699 700 return info 701 } 702 703 func getDeviceUUID(device string) (string, error) { 704 out, err := exec.Command("blkid", "-s", "UUID", "-o", "value", device).Output() 705 if err != nil { 706 logrus.Debugf("Failed to find uuid for device %s:%v", device, err) 707 return "", err 708 } 709 710 uuid := strings.TrimSuffix(string(out), "\n") 711 uuid = strings.TrimSpace(uuid) 712 logrus.Debugf("UUID for device: %s is:%s", device, uuid) 713 return uuid, nil 714 } 715 716 func (devices *DeviceSet) verifyBaseDeviceUUID(baseInfo *devInfo) error { 717 devices.Lock() 718 defer devices.Unlock() 719 720 if err := devices.activateDeviceIfNeeded(baseInfo); err != nil { 721 return err 722 } 723 724 defer devices.deactivateDevice(baseInfo) 725 726 uuid, err := getDeviceUUID(baseInfo.DevName()) 727 if err != nil { 728 return err 729 } 730 731 if devices.BaseDeviceUUID != uuid { 732 return fmt.Errorf("Current Base Device UUID:%s does not match with stored UUID:%s", uuid, devices.BaseDeviceUUID) 733 } 734 735 return nil 736 } 737 738 func (devices *DeviceSet) saveBaseDeviceUUID(baseInfo *devInfo) error { 739 devices.Lock() 740 defer devices.Unlock() 741 742 if err := devices.activateDeviceIfNeeded(baseInfo); err != nil { 743 return err 744 } 745 746 defer devices.deactivateDevice(baseInfo) 747 748 uuid, err := getDeviceUUID(baseInfo.DevName()) 749 if err != nil { 750 return err 751 } 752 753 devices.BaseDeviceUUID = uuid 754 devices.saveDeviceSetMetaData() 755 return nil 756 } 757 758 func (devices *DeviceSet) setupBaseImage() error { 759 oldInfo, _ := devices.lookupDevice("") 760 if oldInfo != nil && oldInfo.Initialized { 761 // If BaseDeviceUUID is nil (upgrade case), save it and 762 // return success. 763 if devices.BaseDeviceUUID == "" { 764 if err := devices.saveBaseDeviceUUID(oldInfo); err != nil { 765 return fmt.Errorf("Could not query and save base device UUID:%v", err) 766 } 767 return nil 768 } 769 770 if err := devices.verifyBaseDeviceUUID(oldInfo); err != nil { 771 return fmt.Errorf("Base Device UUID verification failed. Possibly using a different thin pool then last invocation:%v", err) 772 } 773 return nil 774 } 775 776 if oldInfo != nil && !oldInfo.Initialized { 777 logrus.Debugf("Removing uninitialized base image") 778 if err := devices.DeleteDevice(""); err != nil { 779 return err 780 } 781 } 782 783 if devices.thinPoolDevice != "" && oldInfo == nil { 784 _, transactionID, dataUsed, _, _, _, err := devices.poolStatus() 785 if err != nil { 786 return err 787 } 788 if dataUsed != 0 { 789 return fmt.Errorf("Unable to take ownership of thin-pool (%s) that already has used data blocks", 790 devices.thinPoolDevice) 791 } 792 if transactionID != 0 { 793 return fmt.Errorf("Unable to take ownership of thin-pool (%s) with non-zero transaction ID", 794 devices.thinPoolDevice) 795 } 796 } 797 798 logrus.Debugf("Initializing base device-mapper thin volume") 799 800 // Create initial device 801 info, err := devices.createRegisterDevice("") 802 if err != nil { 803 return err 804 } 805 806 logrus.Debugf("Creating filesystem on base device-mapper thin volume") 807 808 if err := devices.activateDeviceIfNeeded(info); err != nil { 809 return err 810 } 811 812 if err := devices.createFilesystem(info); err != nil { 813 return err 814 } 815 816 info.Initialized = true 817 if err := devices.saveMetadata(info); err != nil { 818 info.Initialized = false 819 return err 820 } 821 822 if err := devices.saveBaseDeviceUUID(info); err != nil { 823 return fmt.Errorf("Could not query and save base device UUID:%v", err) 824 } 825 826 return nil 827 } 828 829 func setCloseOnExec(name string) { 830 if fileInfos, _ := ioutil.ReadDir("/proc/self/fd"); fileInfos != nil { 831 for _, i := range fileInfos { 832 link, _ := os.Readlink(filepath.Join("/proc/self/fd", i.Name())) 833 if link == name { 834 fd, err := strconv.Atoi(i.Name()) 835 if err == nil { 836 syscall.CloseOnExec(fd) 837 } 838 } 839 } 840 } 841 } 842 843 // DMLog implements logging using DevMapperLogger interface. 844 func (devices *DeviceSet) DMLog(level int, file string, line int, dmError int, message string) { 845 // By default libdm sends us all the messages including debug ones. 846 // We need to filter out messages here and figure out which one 847 // should be printed. 848 if level > logLevel { 849 return 850 } 851 852 // FIXME(vbatts) push this back into ./pkg/devicemapper/ 853 if level <= devicemapper.LogLevelErr { 854 logrus.Errorf("libdevmapper(%d): %s:%d (%d) %s", level, file, line, dmError, message) 855 } else if level <= devicemapper.LogLevelInfo { 856 logrus.Infof("libdevmapper(%d): %s:%d (%d) %s", level, file, line, dmError, message) 857 } else { 858 // FIXME(vbatts) push this back into ./pkg/devicemapper/ 859 logrus.Debugf("libdevmapper(%d): %s:%d (%d) %s", level, file, line, dmError, message) 860 } 861 } 862 863 func major(device uint64) uint64 { 864 return (device >> 8) & 0xfff 865 } 866 867 func minor(device uint64) uint64 { 868 return (device & 0xff) | ((device >> 12) & 0xfff00) 869 } 870 871 // ResizePool increases the size of the pool. 872 func (devices *DeviceSet) ResizePool(size int64) error { 873 dirname := devices.loopbackDir() 874 datafilename := path.Join(dirname, "data") 875 if len(devices.dataDevice) > 0 { 876 datafilename = devices.dataDevice 877 } 878 metadatafilename := path.Join(dirname, "metadata") 879 if len(devices.metadataDevice) > 0 { 880 metadatafilename = devices.metadataDevice 881 } 882 883 datafile, err := os.OpenFile(datafilename, os.O_RDWR, 0) 884 if datafile == nil { 885 return err 886 } 887 defer datafile.Close() 888 889 fi, err := datafile.Stat() 890 if fi == nil { 891 return err 892 } 893 894 if fi.Size() > size { 895 return fmt.Errorf("Can't shrink file") 896 } 897 898 dataloopback := devicemapper.FindLoopDeviceFor(datafile) 899 if dataloopback == nil { 900 return fmt.Errorf("Unable to find loopback mount for: %s", datafilename) 901 } 902 defer dataloopback.Close() 903 904 metadatafile, err := os.OpenFile(metadatafilename, os.O_RDWR, 0) 905 if metadatafile == nil { 906 return err 907 } 908 defer metadatafile.Close() 909 910 metadataloopback := devicemapper.FindLoopDeviceFor(metadatafile) 911 if metadataloopback == nil { 912 return fmt.Errorf("Unable to find loopback mount for: %s", metadatafilename) 913 } 914 defer metadataloopback.Close() 915 916 // Grow loopback file 917 if err := datafile.Truncate(size); err != nil { 918 return fmt.Errorf("Unable to grow loopback file: %s", err) 919 } 920 921 // Reload size for loopback device 922 if err := devicemapper.LoopbackSetCapacity(dataloopback); err != nil { 923 return fmt.Errorf("Unable to update loopback capacity: %s", err) 924 } 925 926 // Suspend the pool 927 if err := devicemapper.SuspendDevice(devices.getPoolName()); err != nil { 928 return fmt.Errorf("Unable to suspend pool: %s", err) 929 } 930 931 // Reload with the new block sizes 932 if err := devicemapper.ReloadPool(devices.getPoolName(), dataloopback, metadataloopback, devices.thinpBlockSize); err != nil { 933 return fmt.Errorf("Unable to reload pool: %s", err) 934 } 935 936 // Resume the pool 937 if err := devicemapper.ResumeDevice(devices.getPoolName()); err != nil { 938 return fmt.Errorf("Unable to resume pool: %s", err) 939 } 940 941 return nil 942 } 943 944 func (devices *DeviceSet) loadTransactionMetaData() error { 945 jsonData, err := ioutil.ReadFile(devices.transactionMetaFile()) 946 if err != nil { 947 // There is no active transaction. This will be the case 948 // during upgrade. 949 if os.IsNotExist(err) { 950 devices.OpenTransactionID = devices.TransactionID 951 return nil 952 } 953 return err 954 } 955 956 json.Unmarshal(jsonData, &devices.transaction) 957 return nil 958 } 959 960 func (devices *DeviceSet) saveTransactionMetaData() error { 961 jsonData, err := json.Marshal(&devices.transaction) 962 if err != nil { 963 return fmt.Errorf("Error encoding metadata to json: %s", err) 964 } 965 966 return devices.writeMetaFile(jsonData, devices.transactionMetaFile()) 967 } 968 969 func (devices *DeviceSet) removeTransactionMetaData() error { 970 if err := os.RemoveAll(devices.transactionMetaFile()); err != nil { 971 return err 972 } 973 return nil 974 } 975 976 func (devices *DeviceSet) rollbackTransaction() error { 977 logrus.Debugf("Rolling back open transaction: TransactionID=%d hash=%s device_id=%d", devices.OpenTransactionID, devices.DeviceIDHash, devices.DeviceID) 978 979 // A device id might have already been deleted before transaction 980 // closed. In that case this call will fail. Just leave a message 981 // in case of failure. 982 if err := devicemapper.DeleteDevice(devices.getPoolDevName(), devices.DeviceID); err != nil { 983 logrus.Errorf("Unable to delete device: %s", err) 984 } 985 986 dinfo := &devInfo{Hash: devices.DeviceIDHash} 987 if err := devices.removeMetadata(dinfo); err != nil { 988 logrus.Errorf("Unable to remove metadata: %s", err) 989 } else { 990 devices.markDeviceIDFree(devices.DeviceID) 991 } 992 993 if err := devices.removeTransactionMetaData(); err != nil { 994 logrus.Errorf("Unable to remove transaction meta file %s: %s", devices.transactionMetaFile(), err) 995 } 996 997 return nil 998 } 999 1000 func (devices *DeviceSet) processPendingTransaction() error { 1001 if err := devices.loadTransactionMetaData(); err != nil { 1002 return err 1003 } 1004 1005 // If there was open transaction but pool transaction ID is same 1006 // as open transaction ID, nothing to roll back. 1007 if devices.TransactionID == devices.OpenTransactionID { 1008 return nil 1009 } 1010 1011 // If open transaction ID is less than pool transaction ID, something 1012 // is wrong. Bail out. 1013 if devices.OpenTransactionID < devices.TransactionID { 1014 logrus.Errorf("Open Transaction id %d is less than pool transaction id %d", devices.OpenTransactionID, devices.TransactionID) 1015 return nil 1016 } 1017 1018 // Pool transaction ID is not same as open transaction. There is 1019 // a transaction which was not completed. 1020 if err := devices.rollbackTransaction(); err != nil { 1021 return fmt.Errorf("Rolling back open transaction failed: %s", err) 1022 } 1023 1024 devices.OpenTransactionID = devices.TransactionID 1025 return nil 1026 } 1027 1028 func (devices *DeviceSet) loadDeviceSetMetaData() error { 1029 jsonData, err := ioutil.ReadFile(devices.deviceSetMetaFile()) 1030 if err != nil { 1031 // For backward compatibility return success if file does 1032 // not exist. 1033 if os.IsNotExist(err) { 1034 return nil 1035 } 1036 return err 1037 } 1038 1039 return json.Unmarshal(jsonData, devices) 1040 } 1041 1042 func (devices *DeviceSet) saveDeviceSetMetaData() error { 1043 jsonData, err := json.Marshal(devices) 1044 if err != nil { 1045 return fmt.Errorf("Error encoding metadata to json: %s", err) 1046 } 1047 1048 return devices.writeMetaFile(jsonData, devices.deviceSetMetaFile()) 1049 } 1050 1051 func (devices *DeviceSet) openTransaction(hash string, DeviceID int) error { 1052 devices.allocateTransactionID() 1053 devices.DeviceIDHash = hash 1054 devices.DeviceID = DeviceID 1055 if err := devices.saveTransactionMetaData(); err != nil { 1056 return fmt.Errorf("Error saving transaction metadata: %s", err) 1057 } 1058 return nil 1059 } 1060 1061 func (devices *DeviceSet) refreshTransaction(DeviceID int) error { 1062 devices.DeviceID = DeviceID 1063 if err := devices.saveTransactionMetaData(); err != nil { 1064 return fmt.Errorf("Error saving transaction metadata: %s", err) 1065 } 1066 return nil 1067 } 1068 1069 func (devices *DeviceSet) closeTransaction() error { 1070 if err := devices.updatePoolTransactionID(); err != nil { 1071 logrus.Debugf("Failed to close Transaction") 1072 return err 1073 } 1074 return nil 1075 } 1076 1077 func determineDriverCapabilities(version string) error { 1078 /* 1079 * Driver version 4.27.0 and greater support deferred activation 1080 * feature. 1081 */ 1082 1083 logrus.Debugf("devicemapper: driver version is %s", version) 1084 1085 versionSplit := strings.Split(version, ".") 1086 major, err := strconv.Atoi(versionSplit[0]) 1087 if err != nil { 1088 return graphdriver.ErrNotSupported 1089 } 1090 1091 if major > 4 { 1092 driverDeferredRemovalSupport = true 1093 return nil 1094 } 1095 1096 if major < 4 { 1097 return nil 1098 } 1099 1100 minor, err := strconv.Atoi(versionSplit[1]) 1101 if err != nil { 1102 return graphdriver.ErrNotSupported 1103 } 1104 1105 /* 1106 * If major is 4 and minor is 27, then there is no need to 1107 * check for patch level as it can not be less than 0. 1108 */ 1109 if minor >= 27 { 1110 driverDeferredRemovalSupport = true 1111 return nil 1112 } 1113 1114 return nil 1115 } 1116 1117 // Determine the major and minor number of loopback device 1118 func getDeviceMajorMinor(file *os.File) (uint64, uint64, error) { 1119 stat, err := file.Stat() 1120 if err != nil { 1121 return 0, 0, err 1122 } 1123 1124 dev := stat.Sys().(*syscall.Stat_t).Rdev 1125 majorNum := major(dev) 1126 minorNum := minor(dev) 1127 1128 logrus.Debugf("[devmapper]: Major:Minor for device: %s is:%v:%v", file.Name(), majorNum, minorNum) 1129 return majorNum, minorNum, nil 1130 } 1131 1132 // Given a file which is backing file of a loop back device, find the 1133 // loopback device name and its major/minor number. 1134 func getLoopFileDeviceMajMin(filename string) (string, uint64, uint64, error) { 1135 file, err := os.Open(filename) 1136 if err != nil { 1137 logrus.Debugf("[devmapper]: Failed to open file %s", filename) 1138 return "", 0, 0, err 1139 } 1140 1141 defer file.Close() 1142 loopbackDevice := devicemapper.FindLoopDeviceFor(file) 1143 if loopbackDevice == nil { 1144 return "", 0, 0, fmt.Errorf("[devmapper]: Unable to find loopback mount for: %s", filename) 1145 } 1146 defer loopbackDevice.Close() 1147 1148 Major, Minor, err := getDeviceMajorMinor(loopbackDevice) 1149 if err != nil { 1150 return "", 0, 0, err 1151 } 1152 return loopbackDevice.Name(), Major, Minor, nil 1153 } 1154 1155 // Get the major/minor numbers of thin pool data and metadata devices 1156 func (devices *DeviceSet) getThinPoolDataMetaMajMin() (uint64, uint64, uint64, uint64, error) { 1157 var params, poolDataMajMin, poolMetadataMajMin string 1158 1159 _, _, _, params, err := devicemapper.GetTable(devices.getPoolName()) 1160 if err != nil { 1161 return 0, 0, 0, 0, err 1162 } 1163 1164 if _, err = fmt.Sscanf(params, "%s %s", &poolMetadataMajMin, &poolDataMajMin); err != nil { 1165 return 0, 0, 0, 0, err 1166 } 1167 1168 logrus.Debugf("[devmapper]: poolDataMajMin=%s poolMetaMajMin=%s\n", poolDataMajMin, poolMetadataMajMin) 1169 1170 poolDataMajMinorSplit := strings.Split(poolDataMajMin, ":") 1171 poolDataMajor, err := strconv.ParseUint(poolDataMajMinorSplit[0], 10, 32) 1172 if err != nil { 1173 return 0, 0, 0, 0, err 1174 } 1175 1176 poolDataMinor, err := strconv.ParseUint(poolDataMajMinorSplit[1], 10, 32) 1177 if err != nil { 1178 return 0, 0, 0, 0, err 1179 } 1180 1181 poolMetadataMajMinorSplit := strings.Split(poolMetadataMajMin, ":") 1182 poolMetadataMajor, err := strconv.ParseUint(poolMetadataMajMinorSplit[0], 10, 32) 1183 if err != nil { 1184 return 0, 0, 0, 0, err 1185 } 1186 1187 poolMetadataMinor, err := strconv.ParseUint(poolMetadataMajMinorSplit[1], 10, 32) 1188 if err != nil { 1189 return 0, 0, 0, 0, err 1190 } 1191 1192 return poolDataMajor, poolDataMinor, poolMetadataMajor, poolMetadataMinor, nil 1193 } 1194 1195 func (devices *DeviceSet) loadThinPoolLoopBackInfo() error { 1196 poolDataMajor, poolDataMinor, poolMetadataMajor, poolMetadataMinor, err := devices.getThinPoolDataMetaMajMin() 1197 if err != nil { 1198 return err 1199 } 1200 1201 dirname := devices.loopbackDir() 1202 1203 // data device has not been passed in. So there should be a data file 1204 // which is being mounted as loop device. 1205 if devices.dataDevice == "" { 1206 datafilename := path.Join(dirname, "data") 1207 dataLoopDevice, dataMajor, dataMinor, err := getLoopFileDeviceMajMin(datafilename) 1208 if err != nil { 1209 return err 1210 } 1211 1212 // Compare the two 1213 if poolDataMajor == dataMajor && poolDataMinor == dataMinor { 1214 devices.dataDevice = dataLoopDevice 1215 devices.dataLoopFile = datafilename 1216 } 1217 1218 } 1219 1220 // metadata device has not been passed in. So there should be a 1221 // metadata file which is being mounted as loop device. 1222 if devices.metadataDevice == "" { 1223 metadatafilename := path.Join(dirname, "metadata") 1224 metadataLoopDevice, metadataMajor, metadataMinor, err := getLoopFileDeviceMajMin(metadatafilename) 1225 if err != nil { 1226 return err 1227 } 1228 if poolMetadataMajor == metadataMajor && poolMetadataMinor == metadataMinor { 1229 devices.metadataDevice = metadataLoopDevice 1230 devices.metadataLoopFile = metadatafilename 1231 } 1232 } 1233 1234 return nil 1235 } 1236 1237 func (devices *DeviceSet) initDevmapper(doInit bool) error { 1238 // give ourselves to libdm as a log handler 1239 devicemapper.LogInit(devices) 1240 1241 version, err := devicemapper.GetDriverVersion() 1242 if err != nil { 1243 // Can't even get driver version, assume not supported 1244 return graphdriver.ErrNotSupported 1245 } 1246 1247 if err := determineDriverCapabilities(version); err != nil { 1248 return graphdriver.ErrNotSupported 1249 } 1250 1251 // If user asked for deferred removal and both library and driver 1252 // supports deferred removal use it. 1253 if enableDeferredRemoval && driverDeferredRemovalSupport && devicemapper.LibraryDeferredRemovalSupport == true { 1254 logrus.Debugf("devmapper: Deferred removal support enabled.") 1255 devices.deferredRemove = true 1256 } 1257 1258 // https://github.com/docker/docker/issues/4036 1259 if supported := devicemapper.UdevSetSyncSupport(true); !supported { 1260 logrus.Warn("Udev sync is not supported. This will lead to unexpected behavior, data loss and errors. For more information, see https://docs.docker.com/reference/commandline/daemon/#daemon-storage-driver-option") 1261 } 1262 1263 if err := os.MkdirAll(devices.metadataDir(), 0700); err != nil { 1264 return err 1265 } 1266 1267 // Set the device prefix from the device id and inode of the docker root dir 1268 1269 st, err := os.Stat(devices.root) 1270 if err != nil { 1271 return fmt.Errorf("Error looking up dir %s: %s", devices.root, err) 1272 } 1273 sysSt := st.Sys().(*syscall.Stat_t) 1274 // "reg-" stands for "regular file". 1275 // In the future we might use "dev-" for "device file", etc. 1276 // docker-maj,min[-inode] stands for: 1277 // - Managed by docker 1278 // - The target of this device is at major <maj> and minor <min> 1279 // - If <inode> is defined, use that file inside the device as a loopback image. Otherwise use the device itself. 1280 devices.devicePrefix = fmt.Sprintf("docker-%d:%d-%d", major(sysSt.Dev), minor(sysSt.Dev), sysSt.Ino) 1281 logrus.Debugf("Generated prefix: %s", devices.devicePrefix) 1282 1283 // Check for the existence of the thin-pool device 1284 logrus.Debugf("Checking for existence of the pool '%s'", devices.getPoolName()) 1285 info, err := devicemapper.GetInfo(devices.getPoolName()) 1286 if info == nil { 1287 logrus.Debugf("Error device devicemapper.GetInfo: %s", err) 1288 return err 1289 } 1290 1291 // It seems libdevmapper opens this without O_CLOEXEC, and go exec will not close files 1292 // that are not Close-on-exec, and lxc-start will die if it inherits any unexpected files, 1293 // so we add this badhack to make sure it closes itself 1294 setCloseOnExec("/dev/mapper/control") 1295 1296 // Make sure the sparse images exist in <root>/devicemapper/data and 1297 // <root>/devicemapper/metadata 1298 1299 createdLoopback := false 1300 1301 // If the pool doesn't exist, create it 1302 if info.Exists == 0 && devices.thinPoolDevice == "" { 1303 logrus.Debugf("Pool doesn't exist. Creating it.") 1304 1305 var ( 1306 dataFile *os.File 1307 metadataFile *os.File 1308 ) 1309 1310 if devices.dataDevice == "" { 1311 // Make sure the sparse images exist in <root>/devicemapper/data 1312 1313 hasData := devices.hasImage("data") 1314 1315 if !doInit && !hasData { 1316 return errors.New("Loopback data file not found") 1317 } 1318 1319 if !hasData { 1320 createdLoopback = true 1321 } 1322 1323 data, err := devices.ensureImage("data", devices.dataLoopbackSize) 1324 if err != nil { 1325 logrus.Debugf("Error device ensureImage (data): %s", err) 1326 return err 1327 } 1328 1329 dataFile, err = devicemapper.AttachLoopDevice(data) 1330 if err != nil { 1331 return err 1332 } 1333 devices.dataLoopFile = data 1334 devices.dataDevice = dataFile.Name() 1335 } else { 1336 dataFile, err = os.OpenFile(devices.dataDevice, os.O_RDWR, 0600) 1337 if err != nil { 1338 return err 1339 } 1340 } 1341 defer dataFile.Close() 1342 1343 if devices.metadataDevice == "" { 1344 // Make sure the sparse images exist in <root>/devicemapper/metadata 1345 1346 hasMetadata := devices.hasImage("metadata") 1347 1348 if !doInit && !hasMetadata { 1349 return errors.New("Loopback metadata file not found") 1350 } 1351 1352 if !hasMetadata { 1353 createdLoopback = true 1354 } 1355 1356 metadata, err := devices.ensureImage("metadata", devices.metaDataLoopbackSize) 1357 if err != nil { 1358 logrus.Debugf("Error device ensureImage (metadata): %s", err) 1359 return err 1360 } 1361 1362 metadataFile, err = devicemapper.AttachLoopDevice(metadata) 1363 if err != nil { 1364 return err 1365 } 1366 devices.metadataLoopFile = metadata 1367 devices.metadataDevice = metadataFile.Name() 1368 } else { 1369 metadataFile, err = os.OpenFile(devices.metadataDevice, os.O_RDWR, 0600) 1370 if err != nil { 1371 return err 1372 } 1373 } 1374 defer metadataFile.Close() 1375 1376 if err := devicemapper.CreatePool(devices.getPoolName(), dataFile, metadataFile, devices.thinpBlockSize); err != nil { 1377 return err 1378 } 1379 } 1380 1381 // Pool already exists and caller did not pass us a pool. That means 1382 // we probably created pool earlier and could not remove it as some 1383 // containers were still using it. Detect some of the properties of 1384 // pool, like is it using loop devices. 1385 if info.Exists != 0 && devices.thinPoolDevice == "" { 1386 if err := devices.loadThinPoolLoopBackInfo(); err != nil { 1387 logrus.Debugf("Failed to load thin pool loopback device information:%v", err) 1388 return err 1389 } 1390 } 1391 1392 // If we didn't just create the data or metadata image, we need to 1393 // load the transaction id and migrate old metadata 1394 if !createdLoopback { 1395 if err := devices.initMetaData(); err != nil { 1396 return err 1397 } 1398 } 1399 1400 // Right now this loads only NextDeviceID. If there is more metadata 1401 // down the line, we might have to move it earlier. 1402 if err := devices.loadDeviceSetMetaData(); err != nil { 1403 return err 1404 } 1405 1406 // Setup the base image 1407 if doInit { 1408 if err := devices.setupBaseImage(); err != nil { 1409 logrus.Debugf("Error device setupBaseImage: %s", err) 1410 return err 1411 } 1412 } 1413 1414 return nil 1415 } 1416 1417 // AddDevice adds a device and registers in the hash. 1418 func (devices *DeviceSet) AddDevice(hash, baseHash string) error { 1419 logrus.Debugf("[deviceset] AddDevice(hash=%s basehash=%s)", hash, baseHash) 1420 defer logrus.Debugf("[deviceset] AddDevice(hash=%s basehash=%s) END", hash, baseHash) 1421 1422 baseInfo, err := devices.lookupDevice(baseHash) 1423 if err != nil { 1424 return err 1425 } 1426 1427 baseInfo.lock.Lock() 1428 defer baseInfo.lock.Unlock() 1429 1430 devices.Lock() 1431 defer devices.Unlock() 1432 1433 if info, _ := devices.lookupDevice(hash); info != nil { 1434 return fmt.Errorf("device %s already exists", hash) 1435 } 1436 1437 if err := devices.createRegisterSnapDevice(hash, baseInfo); err != nil { 1438 return err 1439 } 1440 1441 return nil 1442 } 1443 1444 func (devices *DeviceSet) deleteDevice(info *devInfo) error { 1445 if devices.doBlkDiscard { 1446 // This is a workaround for the kernel not discarding block so 1447 // on the thin pool when we remove a thinp device, so we do it 1448 // manually 1449 if err := devices.activateDeviceIfNeeded(info); err == nil { 1450 if err := devicemapper.BlockDeviceDiscard(info.DevName()); err != nil { 1451 logrus.Debugf("Error discarding block on device: %s (ignoring)", err) 1452 } 1453 } 1454 } 1455 1456 devinfo, _ := devicemapper.GetInfo(info.Name()) 1457 if devinfo != nil && devinfo.Exists != 0 { 1458 if err := devices.removeDevice(info.Name()); err != nil { 1459 logrus.Debugf("Error removing device: %s", err) 1460 return err 1461 } 1462 } 1463 1464 if err := devices.openTransaction(info.Hash, info.DeviceID); err != nil { 1465 logrus.Debugf("Error opening transaction hash = %s deviceID = %d", "", info.DeviceID) 1466 return err 1467 } 1468 1469 if err := devicemapper.DeleteDevice(devices.getPoolDevName(), info.DeviceID); err != nil { 1470 logrus.Debugf("Error deleting device: %s", err) 1471 return err 1472 } 1473 1474 if err := devices.unregisterDevice(info.DeviceID, info.Hash); err != nil { 1475 return err 1476 } 1477 1478 if err := devices.closeTransaction(); err != nil { 1479 return err 1480 } 1481 1482 devices.markDeviceIDFree(info.DeviceID) 1483 1484 return nil 1485 } 1486 1487 // DeleteDevice deletes a device from the hash. 1488 func (devices *DeviceSet) DeleteDevice(hash string) error { 1489 info, err := devices.lookupDevice(hash) 1490 if err != nil { 1491 return err 1492 } 1493 1494 info.lock.Lock() 1495 defer info.lock.Unlock() 1496 1497 devices.Lock() 1498 defer devices.Unlock() 1499 1500 return devices.deleteDevice(info) 1501 } 1502 1503 func (devices *DeviceSet) deactivatePool() error { 1504 logrus.Debugf("[devmapper] deactivatePool()") 1505 defer logrus.Debugf("[devmapper] deactivatePool END") 1506 devname := devices.getPoolDevName() 1507 1508 devinfo, err := devicemapper.GetInfo(devname) 1509 if err != nil { 1510 return err 1511 } 1512 1513 if devinfo.Exists == 0 { 1514 return nil 1515 } 1516 if err := devicemapper.RemoveDevice(devname); err != nil { 1517 return err 1518 } 1519 1520 if d, err := devicemapper.GetDeps(devname); err == nil { 1521 logrus.Warnf("[devmapper] device %s still has %d active dependents", devname, d.Count) 1522 } 1523 1524 return nil 1525 } 1526 1527 func (devices *DeviceSet) deactivateDevice(info *devInfo) error { 1528 logrus.Debugf("[devmapper] deactivateDevice(%s)", info.Hash) 1529 defer logrus.Debugf("[devmapper] deactivateDevice END(%s)", info.Hash) 1530 1531 devinfo, err := devicemapper.GetInfo(info.Name()) 1532 if err != nil { 1533 return err 1534 } 1535 1536 if devinfo.Exists == 0 { 1537 return nil 1538 } 1539 1540 if devices.deferredRemove { 1541 if err := devicemapper.RemoveDeviceDeferred(info.Name()); err != nil { 1542 return err 1543 } 1544 } else { 1545 if err := devices.removeDevice(info.Name()); err != nil { 1546 return err 1547 } 1548 } 1549 return nil 1550 } 1551 1552 // Issues the underlying dm remove operation. 1553 func (devices *DeviceSet) removeDevice(devname string) error { 1554 var err error 1555 1556 logrus.Debugf("[devmapper] removeDevice START(%s)", devname) 1557 defer logrus.Debugf("[devmapper] removeDevice END(%s)", devname) 1558 1559 for i := 0; i < 200; i++ { 1560 err = devicemapper.RemoveDevice(devname) 1561 if err == nil { 1562 break 1563 } 1564 if err != devicemapper.ErrBusy { 1565 return err 1566 } 1567 1568 // If we see EBUSY it may be a transient error, 1569 // sleep a bit a retry a few times. 1570 devices.Unlock() 1571 time.Sleep(100 * time.Millisecond) 1572 devices.Lock() 1573 } 1574 1575 return err 1576 } 1577 1578 func (devices *DeviceSet) cancelDeferredRemoval(info *devInfo) error { 1579 if !devices.deferredRemove { 1580 return nil 1581 } 1582 1583 logrus.Debugf("[devmapper] cancelDeferredRemoval START(%s)", info.Name()) 1584 defer logrus.Debugf("[devmapper] cancelDeferredRemoval END(%s)", info.Name()) 1585 1586 devinfo, err := devicemapper.GetInfoWithDeferred(info.Name()) 1587 1588 if devinfo != nil && devinfo.DeferredRemove == 0 { 1589 return nil 1590 } 1591 1592 // Cancel deferred remove 1593 for i := 0; i < 100; i++ { 1594 err = devicemapper.CancelDeferredRemove(info.Name()) 1595 if err == nil { 1596 break 1597 } 1598 1599 if err == devicemapper.ErrEnxio { 1600 // Device is probably already gone. Return success. 1601 return nil 1602 } 1603 1604 if err != devicemapper.ErrBusy { 1605 return err 1606 } 1607 1608 // If we see EBUSY it may be a transient error, 1609 // sleep a bit a retry a few times. 1610 devices.Unlock() 1611 time.Sleep(100 * time.Millisecond) 1612 devices.Lock() 1613 } 1614 return err 1615 } 1616 1617 // Shutdown shuts down the device by unmounting the root. 1618 func (devices *DeviceSet) Shutdown() error { 1619 logrus.Debugf("[deviceset %s] Shutdown()", devices.devicePrefix) 1620 logrus.Debugf("[devmapper] Shutting down DeviceSet: %s", devices.root) 1621 defer logrus.Debugf("[deviceset %s] Shutdown() END", devices.devicePrefix) 1622 1623 var devs []*devInfo 1624 1625 devices.devicesLock.Lock() 1626 for _, info := range devices.Devices { 1627 devs = append(devs, info) 1628 } 1629 devices.devicesLock.Unlock() 1630 1631 for _, info := range devs { 1632 info.lock.Lock() 1633 if info.mountCount > 0 { 1634 // We use MNT_DETACH here in case it is still busy in some running 1635 // container. This means it'll go away from the global scope directly, 1636 // and the device will be released when that container dies. 1637 if err := syscall.Unmount(info.mountPath, syscall.MNT_DETACH); err != nil { 1638 logrus.Debugf("Shutdown unmounting %s, error: %s", info.mountPath, err) 1639 } 1640 1641 devices.Lock() 1642 if err := devices.deactivateDevice(info); err != nil { 1643 logrus.Debugf("Shutdown deactivate %s , error: %s", info.Hash, err) 1644 } 1645 devices.Unlock() 1646 } 1647 info.lock.Unlock() 1648 } 1649 1650 info, _ := devices.lookupDevice("") 1651 if info != nil { 1652 info.lock.Lock() 1653 devices.Lock() 1654 if err := devices.deactivateDevice(info); err != nil { 1655 logrus.Debugf("Shutdown deactivate base , error: %s", err) 1656 } 1657 devices.Unlock() 1658 info.lock.Unlock() 1659 } 1660 1661 devices.Lock() 1662 if devices.thinPoolDevice == "" { 1663 if err := devices.deactivatePool(); err != nil { 1664 logrus.Debugf("Shutdown deactivate pool , error: %s", err) 1665 } 1666 } 1667 1668 devices.saveDeviceSetMetaData() 1669 devices.Unlock() 1670 1671 return nil 1672 } 1673 1674 // MountDevice mounts the device if not already mounted. 1675 func (devices *DeviceSet) MountDevice(hash, path, mountLabel string) error { 1676 info, err := devices.lookupDevice(hash) 1677 if err != nil { 1678 return err 1679 } 1680 1681 info.lock.Lock() 1682 defer info.lock.Unlock() 1683 1684 devices.Lock() 1685 defer devices.Unlock() 1686 1687 if info.mountCount > 0 { 1688 if path != info.mountPath { 1689 return fmt.Errorf("Trying to mount devmapper device in multiple places (%s, %s)", info.mountPath, path) 1690 } 1691 1692 info.mountCount++ 1693 return nil 1694 } 1695 1696 if err := devices.activateDeviceIfNeeded(info); err != nil { 1697 return fmt.Errorf("Error activating devmapper device for '%s': %s", hash, err) 1698 } 1699 1700 fstype, err := ProbeFsType(info.DevName()) 1701 if err != nil { 1702 return err 1703 } 1704 1705 options := "" 1706 1707 if fstype == "xfs" { 1708 // XFS needs nouuid or it can't mount filesystems with the same fs 1709 options = joinMountOptions(options, "nouuid") 1710 } 1711 1712 options = joinMountOptions(options, devices.mountOptions) 1713 options = joinMountOptions(options, label.FormatMountLabel("", mountLabel)) 1714 1715 if err := syscall.Mount(info.DevName(), path, fstype, syscall.MS_MGC_VAL, options); err != nil { 1716 return fmt.Errorf("Error mounting '%s' on '%s': %s", info.DevName(), path, err) 1717 } 1718 1719 info.mountCount = 1 1720 info.mountPath = path 1721 1722 return nil 1723 } 1724 1725 // UnmountDevice unmounts the device and removes it from hash. 1726 func (devices *DeviceSet) UnmountDevice(hash string) error { 1727 logrus.Debugf("[devmapper] UnmountDevice(hash=%s)", hash) 1728 defer logrus.Debugf("[devmapper] UnmountDevice(hash=%s) END", hash) 1729 1730 info, err := devices.lookupDevice(hash) 1731 if err != nil { 1732 return err 1733 } 1734 1735 info.lock.Lock() 1736 defer info.lock.Unlock() 1737 1738 devices.Lock() 1739 defer devices.Unlock() 1740 1741 if info.mountCount == 0 { 1742 return fmt.Errorf("UnmountDevice: device not-mounted id %s", hash) 1743 } 1744 1745 info.mountCount-- 1746 if info.mountCount > 0 { 1747 return nil 1748 } 1749 1750 logrus.Debugf("[devmapper] Unmount(%s)", info.mountPath) 1751 if err := syscall.Unmount(info.mountPath, syscall.MNT_DETACH); err != nil { 1752 return err 1753 } 1754 logrus.Debugf("[devmapper] Unmount done") 1755 1756 if err := devices.deactivateDevice(info); err != nil { 1757 return err 1758 } 1759 1760 info.mountPath = "" 1761 1762 return nil 1763 } 1764 1765 // HasDevice returns true if the device is in the hash and mounted. 1766 func (devices *DeviceSet) HasDevice(hash string) bool { 1767 devices.Lock() 1768 defer devices.Unlock() 1769 1770 info, _ := devices.lookupDevice(hash) 1771 return info != nil 1772 } 1773 1774 // HasActivatedDevice return true if the device exists. 1775 func (devices *DeviceSet) HasActivatedDevice(hash string) bool { 1776 info, _ := devices.lookupDevice(hash) 1777 if info == nil { 1778 return false 1779 } 1780 1781 info.lock.Lock() 1782 defer info.lock.Unlock() 1783 1784 devices.Lock() 1785 defer devices.Unlock() 1786 1787 devinfo, _ := devicemapper.GetInfo(info.Name()) 1788 return devinfo != nil && devinfo.Exists != 0 1789 } 1790 1791 // List returns a list of device ids. 1792 func (devices *DeviceSet) List() []string { 1793 devices.Lock() 1794 defer devices.Unlock() 1795 1796 devices.devicesLock.Lock() 1797 ids := make([]string, len(devices.Devices)) 1798 i := 0 1799 for k := range devices.Devices { 1800 ids[i] = k 1801 i++ 1802 } 1803 devices.devicesLock.Unlock() 1804 1805 return ids 1806 } 1807 1808 func (devices *DeviceSet) deviceStatus(devName string) (sizeInSectors, mappedSectors, highestMappedSector uint64, err error) { 1809 var params string 1810 _, sizeInSectors, _, params, err = devicemapper.GetStatus(devName) 1811 if err != nil { 1812 return 1813 } 1814 if _, err = fmt.Sscanf(params, "%d %d", &mappedSectors, &highestMappedSector); err == nil { 1815 return 1816 } 1817 return 1818 } 1819 1820 // GetDeviceStatus provides size, mapped sectors 1821 func (devices *DeviceSet) GetDeviceStatus(hash string) (*DevStatus, error) { 1822 info, err := devices.lookupDevice(hash) 1823 if err != nil { 1824 return nil, err 1825 } 1826 1827 info.lock.Lock() 1828 defer info.lock.Unlock() 1829 1830 devices.Lock() 1831 defer devices.Unlock() 1832 1833 status := &DevStatus{ 1834 DeviceID: info.DeviceID, 1835 Size: info.Size, 1836 TransactionID: info.TransactionID, 1837 } 1838 1839 if err := devices.activateDeviceIfNeeded(info); err != nil { 1840 return nil, fmt.Errorf("Error activating devmapper device for '%s': %s", hash, err) 1841 } 1842 1843 sizeInSectors, mappedSectors, highestMappedSector, err := devices.deviceStatus(info.DevName()) 1844 1845 if err != nil { 1846 return nil, err 1847 } 1848 1849 status.SizeInSectors = sizeInSectors 1850 status.MappedSectors = mappedSectors 1851 status.HighestMappedSector = highestMappedSector 1852 1853 return status, nil 1854 } 1855 1856 func (devices *DeviceSet) poolStatus() (totalSizeInSectors, transactionID, dataUsed, dataTotal, metadataUsed, metadataTotal uint64, err error) { 1857 var params string 1858 if _, totalSizeInSectors, _, params, err = devicemapper.GetStatus(devices.getPoolName()); err == nil { 1859 _, err = fmt.Sscanf(params, "%d %d/%d %d/%d", &transactionID, &metadataUsed, &metadataTotal, &dataUsed, &dataTotal) 1860 } 1861 return 1862 } 1863 1864 // DataDevicePath returns the path to the data storage for this deviceset, 1865 // regardless of loopback or block device 1866 func (devices *DeviceSet) DataDevicePath() string { 1867 return devices.dataDevice 1868 } 1869 1870 // MetadataDevicePath returns the path to the metadata storage for this deviceset, 1871 // regardless of loopback or block device 1872 func (devices *DeviceSet) MetadataDevicePath() string { 1873 return devices.metadataDevice 1874 } 1875 1876 func (devices *DeviceSet) getUnderlyingAvailableSpace(loopFile string) (uint64, error) { 1877 buf := new(syscall.Statfs_t) 1878 if err := syscall.Statfs(loopFile, buf); err != nil { 1879 logrus.Warnf("Couldn't stat loopfile filesystem %v: %v", loopFile, err) 1880 return 0, err 1881 } 1882 return buf.Bfree * uint64(buf.Bsize), nil 1883 } 1884 1885 func (devices *DeviceSet) isRealFile(loopFile string) (bool, error) { 1886 if loopFile != "" { 1887 fi, err := os.Stat(loopFile) 1888 if err != nil { 1889 logrus.Warnf("Couldn't stat loopfile %v: %v", loopFile, err) 1890 return false, err 1891 } 1892 return fi.Mode().IsRegular(), nil 1893 } 1894 return false, nil 1895 } 1896 1897 // Status returns the current status of this deviceset 1898 func (devices *DeviceSet) Status() *Status { 1899 devices.Lock() 1900 defer devices.Unlock() 1901 1902 status := &Status{} 1903 1904 status.PoolName = devices.getPoolName() 1905 status.DataFile = devices.DataDevicePath() 1906 status.DataLoopback = devices.dataLoopFile 1907 status.MetadataFile = devices.MetadataDevicePath() 1908 status.MetadataLoopback = devices.metadataLoopFile 1909 status.UdevSyncSupported = devicemapper.UdevSyncSupported() 1910 status.DeferredRemoveEnabled = devices.deferredRemove 1911 1912 totalSizeInSectors, _, dataUsed, dataTotal, metadataUsed, metadataTotal, err := devices.poolStatus() 1913 if err == nil { 1914 // Convert from blocks to bytes 1915 blockSizeInSectors := totalSizeInSectors / dataTotal 1916 1917 status.Data.Used = dataUsed * blockSizeInSectors * 512 1918 status.Data.Total = dataTotal * blockSizeInSectors * 512 1919 status.Data.Available = status.Data.Total - status.Data.Used 1920 1921 // metadata blocks are always 4k 1922 status.Metadata.Used = metadataUsed * 4096 1923 status.Metadata.Total = metadataTotal * 4096 1924 status.Metadata.Available = status.Metadata.Total - status.Metadata.Used 1925 1926 status.SectorSize = blockSizeInSectors * 512 1927 1928 if check, _ := devices.isRealFile(devices.dataLoopFile); check { 1929 actualSpace, err := devices.getUnderlyingAvailableSpace(devices.dataLoopFile) 1930 if err == nil && actualSpace < status.Data.Available { 1931 status.Data.Available = actualSpace 1932 } 1933 } 1934 1935 if check, _ := devices.isRealFile(devices.metadataLoopFile); check { 1936 actualSpace, err := devices.getUnderlyingAvailableSpace(devices.metadataLoopFile) 1937 if err == nil && actualSpace < status.Metadata.Available { 1938 status.Metadata.Available = actualSpace 1939 } 1940 } 1941 } 1942 1943 return status 1944 } 1945 1946 // Status returns the current status of this deviceset 1947 func (devices *DeviceSet) exportDeviceMetadata(hash string) (*deviceMetadata, error) { 1948 info, err := devices.lookupDevice(hash) 1949 if err != nil { 1950 return nil, err 1951 } 1952 1953 info.lock.Lock() 1954 defer info.lock.Unlock() 1955 1956 metadata := &deviceMetadata{info.DeviceID, info.Size, info.Name()} 1957 return metadata, nil 1958 } 1959 1960 // NewDeviceSet creates the device set based on the options provided. 1961 func NewDeviceSet(root string, doInit bool, options []string) (*DeviceSet, error) { 1962 devicemapper.SetDevDir("/dev") 1963 1964 devices := &DeviceSet{ 1965 root: root, 1966 metaData: metaData{Devices: make(map[string]*devInfo)}, 1967 dataLoopbackSize: defaultDataLoopbackSize, 1968 metaDataLoopbackSize: defaultMetaDataLoopbackSize, 1969 baseFsSize: defaultBaseFsSize, 1970 overrideUdevSyncCheck: defaultUdevSyncOverride, 1971 filesystem: "ext4", 1972 doBlkDiscard: true, 1973 thinpBlockSize: defaultThinpBlockSize, 1974 deviceIDMap: make([]byte, deviceIDMapSz), 1975 } 1976 1977 foundBlkDiscard := false 1978 for _, option := range options { 1979 key, val, err := parsers.ParseKeyValueOpt(option) 1980 if err != nil { 1981 return nil, err 1982 } 1983 key = strings.ToLower(key) 1984 switch key { 1985 case "dm.basesize": 1986 size, err := units.RAMInBytes(val) 1987 if err != nil { 1988 return nil, err 1989 } 1990 devices.baseFsSize = uint64(size) 1991 case "dm.loopdatasize": 1992 size, err := units.RAMInBytes(val) 1993 if err != nil { 1994 return nil, err 1995 } 1996 devices.dataLoopbackSize = size 1997 case "dm.loopmetadatasize": 1998 size, err := units.RAMInBytes(val) 1999 if err != nil { 2000 return nil, err 2001 } 2002 devices.metaDataLoopbackSize = size 2003 case "dm.fs": 2004 if val != "ext4" && val != "xfs" { 2005 return nil, fmt.Errorf("Unsupported filesystem %s\n", val) 2006 } 2007 devices.filesystem = val 2008 case "dm.mkfsarg": 2009 devices.mkfsArgs = append(devices.mkfsArgs, val) 2010 case "dm.mountopt": 2011 devices.mountOptions = joinMountOptions(devices.mountOptions, val) 2012 case "dm.metadatadev": 2013 devices.metadataDevice = val 2014 case "dm.datadev": 2015 devices.dataDevice = val 2016 case "dm.thinpooldev": 2017 devices.thinPoolDevice = strings.TrimPrefix(val, "/dev/mapper/") 2018 case "dm.blkdiscard": 2019 foundBlkDiscard = true 2020 devices.doBlkDiscard, err = strconv.ParseBool(val) 2021 if err != nil { 2022 return nil, err 2023 } 2024 case "dm.blocksize": 2025 size, err := units.RAMInBytes(val) 2026 if err != nil { 2027 return nil, err 2028 } 2029 // convert to 512b sectors 2030 devices.thinpBlockSize = uint32(size) >> 9 2031 case "dm.override_udev_sync_check": 2032 devices.overrideUdevSyncCheck, err = strconv.ParseBool(val) 2033 if err != nil { 2034 return nil, err 2035 } 2036 2037 case "dm.use_deferred_removal": 2038 enableDeferredRemoval, err = strconv.ParseBool(val) 2039 if err != nil { 2040 return nil, err 2041 } 2042 2043 default: 2044 return nil, fmt.Errorf("Unknown option %s\n", key) 2045 } 2046 } 2047 2048 // By default, don't do blk discard hack on raw devices, its rarely useful and is expensive 2049 if !foundBlkDiscard && (devices.dataDevice != "" || devices.thinPoolDevice != "") { 2050 devices.doBlkDiscard = false 2051 } 2052 2053 if err := devices.initDevmapper(doInit); err != nil { 2054 return nil, err 2055 } 2056 2057 return devices, nil 2058 }