github.com/walkingsparrow/docker@v1.4.2-0.20151218153551-b708a2249bfa/daemon/graphdriver/devmapper/deviceset.go (about) 1 // +build linux 2 3 package devmapper 4 5 import ( 6 "bufio" 7 "encoding/json" 8 "errors" 9 "fmt" 10 "io" 11 "io/ioutil" 12 "os" 13 "os/exec" 14 "path" 15 "path/filepath" 16 "strconv" 17 "strings" 18 "sync" 19 "syscall" 20 "time" 21 22 "github.com/Sirupsen/logrus" 23 24 "github.com/docker/docker/daemon/graphdriver" 25 "github.com/docker/docker/pkg/devicemapper" 26 "github.com/docker/docker/pkg/idtools" 27 "github.com/docker/docker/pkg/mount" 28 "github.com/docker/docker/pkg/parsers" 29 "github.com/docker/go-units" 30 31 "github.com/opencontainers/runc/libcontainer/label" 32 ) 33 34 var ( 35 defaultDataLoopbackSize int64 = 100 * 1024 * 1024 * 1024 36 defaultMetaDataLoopbackSize int64 = 2 * 1024 * 1024 * 1024 37 defaultBaseFsSize uint64 = 100 * 1024 * 1024 * 1024 38 defaultThinpBlockSize uint32 = 128 // 64K = 128 512b sectors 39 defaultUdevSyncOverride = false 40 maxDeviceID = 0xffffff // 24 bit, pool limit 41 deviceIDMapSz = (maxDeviceID + 1) / 8 42 // We retry device removal so many a times that even error messages 43 // will fill up console during normal operation. So only log Fatal 44 // messages by default. 45 logLevel = devicemapper.LogLevelFatal 46 driverDeferredRemovalSupport = false 47 enableDeferredRemoval = false 48 enableDeferredDeletion = false 49 ) 50 51 const deviceSetMetaFile string = "deviceset-metadata" 52 const transactionMetaFile string = "transaction-metadata" 53 54 type transaction struct { 55 OpenTransactionID uint64 `json:"open_transaction_id"` 56 DeviceIDHash string `json:"device_hash"` 57 DeviceID int `json:"device_id"` 58 } 59 60 type devInfo struct { 61 Hash string `json:"-"` 62 DeviceID int `json:"device_id"` 63 Size uint64 `json:"size"` 64 TransactionID uint64 `json:"transaction_id"` 65 Initialized bool `json:"initialized"` 66 Deleted bool `json:"deleted"` 67 devices *DeviceSet 68 69 mountCount int 70 mountPath string 71 72 // The global DeviceSet lock guarantees that we serialize all 73 // the calls to libdevmapper (which is not threadsafe), but we 74 // sometimes release that lock while sleeping. In that case 75 // this per-device lock is still held, protecting against 76 // other accesses to the device that we're doing the wait on. 77 // 78 // WARNING: In order to avoid AB-BA deadlocks when releasing 79 // the global lock while holding the per-device locks all 80 // device locks must be acquired *before* the device lock, and 81 // multiple device locks should be acquired parent before child. 82 lock sync.Mutex 83 } 84 85 type metaData struct { 86 Devices map[string]*devInfo `json:"Devices"` 87 } 88 89 // DeviceSet holds information about list of devices 90 type DeviceSet struct { 91 metaData `json:"-"` 92 sync.Mutex `json:"-"` // Protects all fields of DeviceSet and serializes calls into libdevmapper 93 root string 94 devicePrefix string 95 TransactionID uint64 `json:"-"` 96 NextDeviceID int `json:"next_device_id"` 97 deviceIDMap []byte 98 99 // Options 100 dataLoopbackSize int64 101 metaDataLoopbackSize int64 102 baseFsSize uint64 103 filesystem string 104 mountOptions string 105 mkfsArgs []string 106 dataDevice string // block or loop dev 107 dataLoopFile string // loopback file, if used 108 metadataDevice string // block or loop dev 109 metadataLoopFile string // loopback file, if used 110 doBlkDiscard bool 111 thinpBlockSize uint32 112 thinPoolDevice string 113 transaction `json:"-"` 114 overrideUdevSyncCheck bool 115 deferredRemove bool // use deferred removal 116 deferredDelete bool // use deferred deletion 117 BaseDeviceUUID string // save UUID of base device 118 BaseDeviceFilesystem string // save filesystem of base device 119 nrDeletedDevices uint // number of deleted devices 120 deletionWorkerTicker *time.Ticker 121 uidMaps []idtools.IDMap 122 gidMaps []idtools.IDMap 123 } 124 125 // DiskUsage contains information about disk usage and is used when reporting Status of a device. 126 type DiskUsage struct { 127 // Used bytes on the disk. 128 Used uint64 129 // Total bytes on the disk. 130 Total uint64 131 // Available bytes on the disk. 132 Available uint64 133 } 134 135 // Status returns the information about the device. 136 type Status struct { 137 // PoolName is the name of the data pool. 138 PoolName string 139 // DataFile is the actual block device for data. 140 DataFile string 141 // DataLoopback loopback file, if used. 142 DataLoopback string 143 // MetadataFile is the actual block device for metadata. 144 MetadataFile string 145 // MetadataLoopback is the loopback file, if used. 146 MetadataLoopback string 147 // Data is the disk used for data. 148 Data DiskUsage 149 // Metadata is the disk used for meta data. 150 Metadata DiskUsage 151 // BaseDeviceSize is base size of container and image 152 BaseDeviceSize uint64 153 // BaseDeviceFS is backing filesystem. 154 BaseDeviceFS string 155 // SectorSize size of the vector. 156 SectorSize uint64 157 // UdevSyncSupported is true if sync is supported. 158 UdevSyncSupported bool 159 // DeferredRemoveEnabled is true then the device is not unmounted. 160 DeferredRemoveEnabled bool 161 // True if deferred deletion is enabled. This is different from 162 // deferred removal. "removal" means that device mapper device is 163 // deactivated. Thin device is still in thin pool and can be activated 164 // again. But "deletion" means that thin device will be deleted from 165 // thin pool and it can't be activated again. 166 DeferredDeleteEnabled bool 167 DeferredDeletedDeviceCount uint 168 } 169 170 // Structure used to export image/container metadata in docker inspect. 171 type deviceMetadata struct { 172 deviceID int 173 deviceSize uint64 // size in bytes 174 deviceName string // Device name as used during activation 175 } 176 177 // DevStatus returns information about device mounted containing its id, size and sector information. 178 type DevStatus struct { 179 // DeviceID is the id of the device. 180 DeviceID int 181 // Size is the size of the filesystem. 182 Size uint64 183 // TransactionID is a unique integer per device set used to identify an operation on the file system, this number is incremental. 184 TransactionID uint64 185 // SizeInSectors indicates the size of the sectors allocated. 186 SizeInSectors uint64 187 // MappedSectors indicates number of mapped sectors. 188 MappedSectors uint64 189 // HighestMappedSector is the pointer to the highest mapped sector. 190 HighestMappedSector uint64 191 } 192 193 func getDevName(name string) string { 194 return "/dev/mapper/" + name 195 } 196 197 func (info *devInfo) Name() string { 198 hash := info.Hash 199 if hash == "" { 200 hash = "base" 201 } 202 return fmt.Sprintf("%s-%s", info.devices.devicePrefix, hash) 203 } 204 205 func (info *devInfo) DevName() string { 206 return getDevName(info.Name()) 207 } 208 209 func (devices *DeviceSet) loopbackDir() string { 210 return path.Join(devices.root, "devicemapper") 211 } 212 213 func (devices *DeviceSet) metadataDir() string { 214 return path.Join(devices.root, "metadata") 215 } 216 217 func (devices *DeviceSet) metadataFile(info *devInfo) string { 218 file := info.Hash 219 if file == "" { 220 file = "base" 221 } 222 return path.Join(devices.metadataDir(), file) 223 } 224 225 func (devices *DeviceSet) transactionMetaFile() string { 226 return path.Join(devices.metadataDir(), transactionMetaFile) 227 } 228 229 func (devices *DeviceSet) deviceSetMetaFile() string { 230 return path.Join(devices.metadataDir(), deviceSetMetaFile) 231 } 232 233 func (devices *DeviceSet) oldMetadataFile() string { 234 return path.Join(devices.loopbackDir(), "json") 235 } 236 237 func (devices *DeviceSet) getPoolName() string { 238 if devices.thinPoolDevice == "" { 239 return devices.devicePrefix + "-pool" 240 } 241 return devices.thinPoolDevice 242 } 243 244 func (devices *DeviceSet) getPoolDevName() string { 245 return getDevName(devices.getPoolName()) 246 } 247 248 func (devices *DeviceSet) hasImage(name string) bool { 249 dirname := devices.loopbackDir() 250 filename := path.Join(dirname, name) 251 252 _, err := os.Stat(filename) 253 return err == nil 254 } 255 256 // ensureImage creates a sparse file of <size> bytes at the path 257 // <root>/devicemapper/<name>. 258 // If the file already exists and new size is larger than its current size, it grows to the new size. 259 // Either way it returns the full path. 260 func (devices *DeviceSet) ensureImage(name string, size int64) (string, error) { 261 dirname := devices.loopbackDir() 262 filename := path.Join(dirname, name) 263 264 uid, gid, err := idtools.GetRootUIDGID(devices.uidMaps, devices.gidMaps) 265 if err != nil { 266 return "", err 267 } 268 if err := idtools.MkdirAllAs(dirname, 0700, uid, gid); err != nil && !os.IsExist(err) { 269 return "", err 270 } 271 272 if fi, err := os.Stat(filename); err != nil { 273 if !os.IsNotExist(err) { 274 return "", err 275 } 276 logrus.Debugf("devmapper: Creating loopback file %s for device-manage use", filename) 277 file, err := os.OpenFile(filename, os.O_RDWR|os.O_CREATE, 0600) 278 if err != nil { 279 return "", err 280 } 281 defer file.Close() 282 283 if err := file.Truncate(size); err != nil { 284 return "", err 285 } 286 } else { 287 if fi.Size() < size { 288 file, err := os.OpenFile(filename, os.O_RDWR|os.O_CREATE, 0600) 289 if err != nil { 290 return "", err 291 } 292 defer file.Close() 293 if err := file.Truncate(size); err != nil { 294 return "", fmt.Errorf("devmapper: Unable to grow loopback file %s: %v", filename, err) 295 } 296 } else if fi.Size() > size { 297 logrus.Warnf("devmapper: Can't shrink loopback file %s", filename) 298 } 299 } 300 return filename, nil 301 } 302 303 func (devices *DeviceSet) allocateTransactionID() uint64 { 304 devices.OpenTransactionID = devices.TransactionID + 1 305 return devices.OpenTransactionID 306 } 307 308 func (devices *DeviceSet) updatePoolTransactionID() error { 309 if err := devicemapper.SetTransactionID(devices.getPoolDevName(), devices.TransactionID, devices.OpenTransactionID); err != nil { 310 return fmt.Errorf("devmapper: Error setting devmapper transaction ID: %s", err) 311 } 312 devices.TransactionID = devices.OpenTransactionID 313 return nil 314 } 315 316 func (devices *DeviceSet) removeMetadata(info *devInfo) error { 317 if err := os.RemoveAll(devices.metadataFile(info)); err != nil { 318 return fmt.Errorf("devmapper: Error removing metadata file %s: %s", devices.metadataFile(info), err) 319 } 320 return nil 321 } 322 323 // Given json data and file path, write it to disk 324 func (devices *DeviceSet) writeMetaFile(jsonData []byte, filePath string) error { 325 tmpFile, err := ioutil.TempFile(devices.metadataDir(), ".tmp") 326 if err != nil { 327 return fmt.Errorf("devmapper: Error creating metadata file: %s", err) 328 } 329 330 n, err := tmpFile.Write(jsonData) 331 if err != nil { 332 return fmt.Errorf("devmapper: Error writing metadata to %s: %s", tmpFile.Name(), err) 333 } 334 if n < len(jsonData) { 335 return io.ErrShortWrite 336 } 337 if err := tmpFile.Sync(); err != nil { 338 return fmt.Errorf("devmapper: Error syncing metadata file %s: %s", tmpFile.Name(), err) 339 } 340 if err := tmpFile.Close(); err != nil { 341 return fmt.Errorf("devmapper: Error closing metadata file %s: %s", tmpFile.Name(), err) 342 } 343 if err := os.Rename(tmpFile.Name(), filePath); err != nil { 344 return fmt.Errorf("devmapper: Error committing metadata file %s: %s", tmpFile.Name(), err) 345 } 346 347 return nil 348 } 349 350 func (devices *DeviceSet) saveMetadata(info *devInfo) error { 351 jsonData, err := json.Marshal(info) 352 if err != nil { 353 return fmt.Errorf("devmapper: Error encoding metadata to json: %s", err) 354 } 355 if err := devices.writeMetaFile(jsonData, devices.metadataFile(info)); err != nil { 356 return err 357 } 358 return nil 359 } 360 361 func (devices *DeviceSet) markDeviceIDUsed(deviceID int) { 362 var mask byte 363 i := deviceID % 8 364 mask = 1 << uint(i) 365 devices.deviceIDMap[deviceID/8] = devices.deviceIDMap[deviceID/8] | mask 366 } 367 368 func (devices *DeviceSet) markDeviceIDFree(deviceID int) { 369 var mask byte 370 i := deviceID % 8 371 mask = ^(1 << uint(i)) 372 devices.deviceIDMap[deviceID/8] = devices.deviceIDMap[deviceID/8] & mask 373 } 374 375 func (devices *DeviceSet) isDeviceIDFree(deviceID int) bool { 376 var mask byte 377 i := deviceID % 8 378 mask = (1 << uint(i)) 379 if (devices.deviceIDMap[deviceID/8] & mask) != 0 { 380 return false 381 } 382 return true 383 } 384 385 // Should be called with devices.Lock() held. 386 func (devices *DeviceSet) lookupDevice(hash string) (*devInfo, error) { 387 info := devices.Devices[hash] 388 if info == nil { 389 info = devices.loadMetadata(hash) 390 if info == nil { 391 return nil, fmt.Errorf("devmapper: Unknown device %s", hash) 392 } 393 394 devices.Devices[hash] = info 395 } 396 return info, nil 397 } 398 399 func (devices *DeviceSet) lookupDeviceWithLock(hash string) (*devInfo, error) { 400 devices.Lock() 401 defer devices.Unlock() 402 info, err := devices.lookupDevice(hash) 403 return info, err 404 } 405 406 // This function relies on that device hash map has been loaded in advance. 407 // Should be called with devices.Lock() held. 408 func (devices *DeviceSet) constructDeviceIDMap() { 409 logrus.Debugf("devmapper: constructDeviceIDMap()") 410 defer logrus.Debugf("devmapper: constructDeviceIDMap() END") 411 412 for _, info := range devices.Devices { 413 devices.markDeviceIDUsed(info.DeviceID) 414 logrus.Debugf("devmapper: Added deviceId=%d to DeviceIdMap", info.DeviceID) 415 } 416 } 417 418 func (devices *DeviceSet) deviceFileWalkFunction(path string, finfo os.FileInfo) error { 419 420 // Skip some of the meta files which are not device files. 421 if strings.HasSuffix(finfo.Name(), ".migrated") { 422 logrus.Debugf("devmapper: Skipping file %s", path) 423 return nil 424 } 425 426 if strings.HasPrefix(finfo.Name(), ".") { 427 logrus.Debugf("devmapper: Skipping file %s", path) 428 return nil 429 } 430 431 if finfo.Name() == deviceSetMetaFile { 432 logrus.Debugf("devmapper: Skipping file %s", path) 433 return nil 434 } 435 436 if finfo.Name() == transactionMetaFile { 437 logrus.Debugf("devmapper: Skipping file %s", path) 438 return nil 439 } 440 441 logrus.Debugf("devmapper: Loading data for file %s", path) 442 443 hash := finfo.Name() 444 if hash == "base" { 445 hash = "" 446 } 447 448 // Include deleted devices also as cleanup delete device logic 449 // will go through it and see if there are any deleted devices. 450 if _, err := devices.lookupDevice(hash); err != nil { 451 return fmt.Errorf("devmapper: Error looking up device %s:%v", hash, err) 452 } 453 454 return nil 455 } 456 457 func (devices *DeviceSet) loadDeviceFilesOnStart() error { 458 logrus.Debugf("devmapper: loadDeviceFilesOnStart()") 459 defer logrus.Debugf("devmapper: loadDeviceFilesOnStart() END") 460 461 var scan = func(path string, info os.FileInfo, err error) error { 462 if err != nil { 463 logrus.Debugf("devmapper: Can't walk the file %s", path) 464 return nil 465 } 466 467 // Skip any directories 468 if info.IsDir() { 469 return nil 470 } 471 472 return devices.deviceFileWalkFunction(path, info) 473 } 474 475 return filepath.Walk(devices.metadataDir(), scan) 476 } 477 478 // Should be called with devices.Lock() held. 479 func (devices *DeviceSet) unregisterDevice(id int, hash string) error { 480 logrus.Debugf("devmapper: unregisterDevice(%v, %v)", id, hash) 481 info := &devInfo{ 482 Hash: hash, 483 DeviceID: id, 484 } 485 486 delete(devices.Devices, hash) 487 488 if err := devices.removeMetadata(info); err != nil { 489 logrus.Debugf("devmapper: Error removing metadata: %s", err) 490 return err 491 } 492 493 return nil 494 } 495 496 // Should be called with devices.Lock() held. 497 func (devices *DeviceSet) registerDevice(id int, hash string, size uint64, transactionID uint64) (*devInfo, error) { 498 logrus.Debugf("devmapper: registerDevice(%v, %v)", id, hash) 499 info := &devInfo{ 500 Hash: hash, 501 DeviceID: id, 502 Size: size, 503 TransactionID: transactionID, 504 Initialized: false, 505 devices: devices, 506 } 507 508 devices.Devices[hash] = info 509 510 if err := devices.saveMetadata(info); err != nil { 511 // Try to remove unused device 512 delete(devices.Devices, hash) 513 return nil, err 514 } 515 516 return info, nil 517 } 518 519 func (devices *DeviceSet) activateDeviceIfNeeded(info *devInfo, ignoreDeleted bool) error { 520 logrus.Debugf("devmapper: activateDeviceIfNeeded(%v)", info.Hash) 521 522 if info.Deleted && !ignoreDeleted { 523 return fmt.Errorf("devmapper: Can't activate device %v as it is marked for deletion", info.Hash) 524 } 525 526 // Make sure deferred removal on device is canceled, if one was 527 // scheduled. 528 if err := devices.cancelDeferredRemoval(info); err != nil { 529 return fmt.Errorf("devmapper: Device Deferred Removal Cancellation Failed: %s", err) 530 } 531 532 if devinfo, _ := devicemapper.GetInfo(info.Name()); devinfo != nil && devinfo.Exists != 0 { 533 return nil 534 } 535 536 return devicemapper.ActivateDevice(devices.getPoolDevName(), info.Name(), info.DeviceID, info.Size) 537 } 538 539 // Return true only if kernel supports xfs and mkfs.xfs is available 540 func xfsSupported() bool { 541 // Make sure mkfs.xfs is available 542 if _, err := exec.LookPath("mkfs.xfs"); err != nil { 543 return false 544 } 545 546 // Check if kernel supports xfs filesystem or not. 547 exec.Command("modprobe", "xfs").Run() 548 549 f, err := os.Open("/proc/filesystems") 550 if err != nil { 551 logrus.Warnf("devmapper: Could not check if xfs is supported: %v", err) 552 return false 553 } 554 defer f.Close() 555 556 s := bufio.NewScanner(f) 557 for s.Scan() { 558 if strings.HasSuffix(s.Text(), "\txfs") { 559 return true 560 } 561 } 562 563 if err := s.Err(); err != nil { 564 logrus.Warnf("devmapper: Could not check if xfs is supported: %v", err) 565 } 566 return false 567 } 568 569 func determineDefaultFS() string { 570 if xfsSupported() { 571 return "xfs" 572 } 573 574 logrus.Warn("devmapper: XFS is not supported in your system. Either the kernel doesnt support it or mkfs.xfs is not in your PATH. Defaulting to ext4 filesystem") 575 return "ext4" 576 } 577 578 func (devices *DeviceSet) createFilesystem(info *devInfo) (err error) { 579 devname := info.DevName() 580 581 args := []string{} 582 for _, arg := range devices.mkfsArgs { 583 args = append(args, arg) 584 } 585 586 args = append(args, devname) 587 588 if devices.filesystem == "" { 589 devices.filesystem = determineDefaultFS() 590 } 591 if err := devices.saveBaseDeviceFilesystem(devices.filesystem); err != nil { 592 return err 593 } 594 595 logrus.Infof("devmapper: Creating filesystem %s on device %s", devices.filesystem, info.Name()) 596 defer func() { 597 if err != nil { 598 logrus.Infof("devmapper: Error while creating filesystem %s on device %s: %v", devices.filesystem, info.Name(), err) 599 } else { 600 logrus.Infof("devmapper: Successfully created filesystem %s on device %s", devices.filesystem, info.Name()) 601 } 602 }() 603 604 switch devices.filesystem { 605 case "xfs": 606 err = exec.Command("mkfs.xfs", args...).Run() 607 case "ext4": 608 err = exec.Command("mkfs.ext4", append([]string{"-E", "nodiscard,lazy_itable_init=0,lazy_journal_init=0"}, args...)...).Run() 609 if err != nil { 610 err = exec.Command("mkfs.ext4", append([]string{"-E", "nodiscard,lazy_itable_init=0"}, args...)...).Run() 611 } 612 if err != nil { 613 return err 614 } 615 err = exec.Command("tune2fs", append([]string{"-c", "-1", "-i", "0"}, devname)...).Run() 616 default: 617 err = fmt.Errorf("devmapper: Unsupported filesystem type %s", devices.filesystem) 618 } 619 return 620 } 621 622 func (devices *DeviceSet) migrateOldMetaData() error { 623 // Migrate old metadata file 624 jsonData, err := ioutil.ReadFile(devices.oldMetadataFile()) 625 if err != nil && !os.IsNotExist(err) { 626 return err 627 } 628 629 if jsonData != nil { 630 m := metaData{Devices: make(map[string]*devInfo)} 631 632 if err := json.Unmarshal(jsonData, &m); err != nil { 633 return err 634 } 635 636 for hash, info := range m.Devices { 637 info.Hash = hash 638 devices.saveMetadata(info) 639 } 640 if err := os.Rename(devices.oldMetadataFile(), devices.oldMetadataFile()+".migrated"); err != nil { 641 return err 642 } 643 644 } 645 646 return nil 647 } 648 649 // Cleanup deleted devices. It assumes that all the devices have been 650 // loaded in the hash table. 651 func (devices *DeviceSet) cleanupDeletedDevices() error { 652 devices.Lock() 653 654 // If there are no deleted devices, there is nothing to do. 655 if devices.nrDeletedDevices == 0 { 656 devices.Unlock() 657 return nil 658 } 659 660 var deletedDevices []*devInfo 661 662 for _, info := range devices.Devices { 663 if !info.Deleted { 664 continue 665 } 666 logrus.Debugf("devmapper: Found deleted device %s.", info.Hash) 667 deletedDevices = append(deletedDevices, info) 668 } 669 670 // Delete the deleted devices. DeleteDevice() first takes the info lock 671 // and then devices.Lock(). So drop it to avoid deadlock. 672 devices.Unlock() 673 674 for _, info := range deletedDevices { 675 // This will again try deferred deletion. 676 if err := devices.DeleteDevice(info.Hash, false); err != nil { 677 logrus.Warnf("devmapper: Deletion of device %s, device_id=%v failed:%v", info.Hash, info.DeviceID, err) 678 } 679 } 680 681 return nil 682 } 683 684 func (devices *DeviceSet) countDeletedDevices() { 685 for _, info := range devices.Devices { 686 if !info.Deleted { 687 continue 688 } 689 devices.nrDeletedDevices++ 690 } 691 } 692 693 func (devices *DeviceSet) startDeviceDeletionWorker() { 694 // Deferred deletion is not enabled. Don't do anything. 695 if !devices.deferredDelete { 696 return 697 } 698 699 logrus.Debugf("devmapper: Worker to cleanup deleted devices started") 700 for range devices.deletionWorkerTicker.C { 701 devices.cleanupDeletedDevices() 702 } 703 } 704 705 func (devices *DeviceSet) initMetaData() error { 706 devices.Lock() 707 defer devices.Unlock() 708 709 if err := devices.migrateOldMetaData(); err != nil { 710 return err 711 } 712 713 _, transactionID, _, _, _, _, err := devices.poolStatus() 714 if err != nil { 715 return err 716 } 717 718 devices.TransactionID = transactionID 719 720 if err := devices.loadDeviceFilesOnStart(); err != nil { 721 return fmt.Errorf("devmapper: Failed to load device files:%v", err) 722 } 723 724 devices.constructDeviceIDMap() 725 devices.countDeletedDevices() 726 727 if err := devices.processPendingTransaction(); err != nil { 728 return err 729 } 730 731 // Start a goroutine to cleanup Deleted Devices 732 go devices.startDeviceDeletionWorker() 733 return nil 734 } 735 736 func (devices *DeviceSet) incNextDeviceID() { 737 // IDs are 24bit, so wrap around 738 devices.NextDeviceID = (devices.NextDeviceID + 1) & maxDeviceID 739 } 740 741 func (devices *DeviceSet) getNextFreeDeviceID() (int, error) { 742 devices.incNextDeviceID() 743 for i := 0; i <= maxDeviceID; i++ { 744 if devices.isDeviceIDFree(devices.NextDeviceID) { 745 devices.markDeviceIDUsed(devices.NextDeviceID) 746 return devices.NextDeviceID, nil 747 } 748 devices.incNextDeviceID() 749 } 750 751 return 0, fmt.Errorf("devmapper: Unable to find a free device ID") 752 } 753 754 func (devices *DeviceSet) createRegisterDevice(hash string) (*devInfo, error) { 755 devices.Lock() 756 defer devices.Unlock() 757 758 deviceID, err := devices.getNextFreeDeviceID() 759 if err != nil { 760 return nil, err 761 } 762 763 if err := devices.openTransaction(hash, deviceID); err != nil { 764 logrus.Debugf("devmapper: Error opening transaction hash = %s deviceID = %d", hash, deviceID) 765 devices.markDeviceIDFree(deviceID) 766 return nil, err 767 } 768 769 for { 770 if err := devicemapper.CreateDevice(devices.getPoolDevName(), deviceID); err != nil { 771 if devicemapper.DeviceIDExists(err) { 772 // Device ID already exists. This should not 773 // happen. Now we have a mechanism to find 774 // a free device ID. So something is not right. 775 // Give a warning and continue. 776 logrus.Errorf("devmapper: Device ID %d exists in pool but it is supposed to be unused", deviceID) 777 deviceID, err = devices.getNextFreeDeviceID() 778 if err != nil { 779 return nil, err 780 } 781 // Save new device id into transaction 782 devices.refreshTransaction(deviceID) 783 continue 784 } 785 logrus.Debugf("devmapper: Error creating device: %s", err) 786 devices.markDeviceIDFree(deviceID) 787 return nil, err 788 } 789 break 790 } 791 792 logrus.Debugf("devmapper: Registering device (id %v) with FS size %v", deviceID, devices.baseFsSize) 793 info, err := devices.registerDevice(deviceID, hash, devices.baseFsSize, devices.OpenTransactionID) 794 if err != nil { 795 _ = devicemapper.DeleteDevice(devices.getPoolDevName(), deviceID) 796 devices.markDeviceIDFree(deviceID) 797 return nil, err 798 } 799 800 if err := devices.closeTransaction(); err != nil { 801 devices.unregisterDevice(deviceID, hash) 802 devicemapper.DeleteDevice(devices.getPoolDevName(), deviceID) 803 devices.markDeviceIDFree(deviceID) 804 return nil, err 805 } 806 return info, nil 807 } 808 809 func (devices *DeviceSet) createRegisterSnapDevice(hash string, baseInfo *devInfo) error { 810 deviceID, err := devices.getNextFreeDeviceID() 811 if err != nil { 812 return err 813 } 814 815 if err := devices.openTransaction(hash, deviceID); err != nil { 816 logrus.Debugf("devmapper: Error opening transaction hash = %s deviceID = %d", hash, deviceID) 817 devices.markDeviceIDFree(deviceID) 818 return err 819 } 820 821 for { 822 if err := devicemapper.CreateSnapDevice(devices.getPoolDevName(), deviceID, baseInfo.Name(), baseInfo.DeviceID); err != nil { 823 if devicemapper.DeviceIDExists(err) { 824 // Device ID already exists. This should not 825 // happen. Now we have a mechanism to find 826 // a free device ID. So something is not right. 827 // Give a warning and continue. 828 logrus.Errorf("devmapper: Device ID %d exists in pool but it is supposed to be unused", deviceID) 829 deviceID, err = devices.getNextFreeDeviceID() 830 if err != nil { 831 return err 832 } 833 // Save new device id into transaction 834 devices.refreshTransaction(deviceID) 835 continue 836 } 837 logrus.Debugf("devmapper: Error creating snap device: %s", err) 838 devices.markDeviceIDFree(deviceID) 839 return err 840 } 841 break 842 } 843 844 if _, err := devices.registerDevice(deviceID, hash, baseInfo.Size, devices.OpenTransactionID); err != nil { 845 devicemapper.DeleteDevice(devices.getPoolDevName(), deviceID) 846 devices.markDeviceIDFree(deviceID) 847 logrus.Debugf("devmapper: Error registering device: %s", err) 848 return err 849 } 850 851 if err := devices.closeTransaction(); err != nil { 852 devices.unregisterDevice(deviceID, hash) 853 devicemapper.DeleteDevice(devices.getPoolDevName(), deviceID) 854 devices.markDeviceIDFree(deviceID) 855 return err 856 } 857 return nil 858 } 859 860 func (devices *DeviceSet) loadMetadata(hash string) *devInfo { 861 info := &devInfo{Hash: hash, devices: devices} 862 863 jsonData, err := ioutil.ReadFile(devices.metadataFile(info)) 864 if err != nil { 865 return nil 866 } 867 868 if err := json.Unmarshal(jsonData, &info); err != nil { 869 return nil 870 } 871 872 if info.DeviceID > maxDeviceID { 873 logrus.Errorf("devmapper: Ignoring Invalid DeviceId=%d", info.DeviceID) 874 return nil 875 } 876 877 return info 878 } 879 880 func getDeviceUUID(device string) (string, error) { 881 out, err := exec.Command("blkid", "-s", "UUID", "-o", "value", device).Output() 882 if err != nil { 883 return "", fmt.Errorf("devmapper: Failed to find uuid for device %s:%v", device, err) 884 } 885 886 uuid := strings.TrimSuffix(string(out), "\n") 887 uuid = strings.TrimSpace(uuid) 888 logrus.Debugf("devmapper: UUID for device: %s is:%s", device, uuid) 889 return uuid, nil 890 } 891 892 func (devices *DeviceSet) getBaseDeviceSize() uint64 { 893 info, _ := devices.lookupDevice("") 894 if info == nil { 895 return 0 896 } 897 return info.Size 898 } 899 900 func (devices *DeviceSet) getBaseDeviceFS() string { 901 return devices.BaseDeviceFilesystem 902 } 903 904 func (devices *DeviceSet) verifyBaseDeviceUUIDFS(baseInfo *devInfo) error { 905 devices.Lock() 906 defer devices.Unlock() 907 908 if err := devices.activateDeviceIfNeeded(baseInfo, false); err != nil { 909 return err 910 } 911 defer devices.deactivateDevice(baseInfo) 912 913 uuid, err := getDeviceUUID(baseInfo.DevName()) 914 if err != nil { 915 return err 916 } 917 918 if devices.BaseDeviceUUID != uuid { 919 return fmt.Errorf("devmapper: Current Base Device UUID:%s does not match with stored UUID:%s. Possibly using a different thin pool than last invocation", uuid, devices.BaseDeviceUUID) 920 } 921 922 if devices.BaseDeviceFilesystem == "" { 923 fsType, err := ProbeFsType(baseInfo.DevName()) 924 if err != nil { 925 return err 926 } 927 if err := devices.saveBaseDeviceFilesystem(fsType); err != nil { 928 return err 929 } 930 } 931 932 // If user specified a filesystem using dm.fs option and current 933 // file system of base image is not same, warn user that dm.fs 934 // will be ignored. 935 if devices.BaseDeviceFilesystem != devices.filesystem { 936 logrus.Warnf("devmapper: Base device already exists and has filesystem %s on it. User specified filesystem %s will be ignored.", devices.BaseDeviceFilesystem, devices.filesystem) 937 devices.filesystem = devices.BaseDeviceFilesystem 938 } 939 return nil 940 } 941 942 func (devices *DeviceSet) saveBaseDeviceFilesystem(fs string) error { 943 devices.BaseDeviceFilesystem = fs 944 return devices.saveDeviceSetMetaData() 945 } 946 947 func (devices *DeviceSet) saveBaseDeviceUUID(baseInfo *devInfo) error { 948 devices.Lock() 949 defer devices.Unlock() 950 951 if err := devices.activateDeviceIfNeeded(baseInfo, false); err != nil { 952 return err 953 } 954 defer devices.deactivateDevice(baseInfo) 955 956 uuid, err := getDeviceUUID(baseInfo.DevName()) 957 if err != nil { 958 return err 959 } 960 961 devices.BaseDeviceUUID = uuid 962 return devices.saveDeviceSetMetaData() 963 } 964 965 func (devices *DeviceSet) createBaseImage() error { 966 logrus.Debugf("devmapper: Initializing base device-mapper thin volume") 967 968 // Create initial device 969 info, err := devices.createRegisterDevice("") 970 if err != nil { 971 return err 972 } 973 974 logrus.Debugf("devmapper: Creating filesystem on base device-mapper thin volume") 975 976 if err := devices.activateDeviceIfNeeded(info, false); err != nil { 977 return err 978 } 979 980 if err := devices.createFilesystem(info); err != nil { 981 return err 982 } 983 984 info.Initialized = true 985 if err := devices.saveMetadata(info); err != nil { 986 info.Initialized = false 987 return err 988 } 989 990 if err := devices.saveBaseDeviceUUID(info); err != nil { 991 return fmt.Errorf("devmapper: Could not query and save base device UUID:%v", err) 992 } 993 994 return nil 995 } 996 997 // Returns if thin pool device exists or not. If device exists, also makes 998 // sure it is a thin pool device and not some other type of device. 999 func (devices *DeviceSet) thinPoolExists(thinPoolDevice string) (bool, error) { 1000 logrus.Debugf("devmapper: Checking for existence of the pool %s", thinPoolDevice) 1001 1002 info, err := devicemapper.GetInfo(thinPoolDevice) 1003 if err != nil { 1004 return false, fmt.Errorf("devmapper: GetInfo() on device %s failed: %v", thinPoolDevice, err) 1005 } 1006 1007 // Device does not exist. 1008 if info.Exists == 0 { 1009 return false, nil 1010 } 1011 1012 _, _, deviceType, _, err := devicemapper.GetStatus(thinPoolDevice) 1013 if err != nil { 1014 return false, fmt.Errorf("devmapper: GetStatus() on device %s failed: %v", thinPoolDevice, err) 1015 } 1016 1017 if deviceType != "thin-pool" { 1018 return false, fmt.Errorf("devmapper: Device %s is not a thin pool", thinPoolDevice) 1019 } 1020 1021 return true, nil 1022 } 1023 1024 func (devices *DeviceSet) checkThinPool() error { 1025 _, transactionID, dataUsed, _, _, _, err := devices.poolStatus() 1026 if err != nil { 1027 return err 1028 } 1029 if dataUsed != 0 { 1030 return fmt.Errorf("devmapper: Unable to take ownership of thin-pool (%s) that already has used data blocks", 1031 devices.thinPoolDevice) 1032 } 1033 if transactionID != 0 { 1034 return fmt.Errorf("devmapper: Unable to take ownership of thin-pool (%s) with non-zero transaction ID", 1035 devices.thinPoolDevice) 1036 } 1037 return nil 1038 } 1039 1040 // Base image is initialized properly. Either save UUID for first time (for 1041 // upgrade case or verify UUID. 1042 func (devices *DeviceSet) setupVerifyBaseImageUUIDFS(baseInfo *devInfo) error { 1043 // If BaseDeviceUUID is nil (upgrade case), save it and return success. 1044 if devices.BaseDeviceUUID == "" { 1045 if err := devices.saveBaseDeviceUUID(baseInfo); err != nil { 1046 return fmt.Errorf("devmapper: Could not query and save base device UUID:%v", err) 1047 } 1048 return nil 1049 } 1050 1051 if err := devices.verifyBaseDeviceUUIDFS(baseInfo); err != nil { 1052 return fmt.Errorf("devmapper: Base Device UUID and Filesystem verification failed.%v", err) 1053 } 1054 1055 return nil 1056 } 1057 1058 func (devices *DeviceSet) setupBaseImage() error { 1059 oldInfo, _ := devices.lookupDeviceWithLock("") 1060 1061 // base image already exists. If it is initialized properly, do UUID 1062 // verification and return. Otherwise remove image and set it up 1063 // fresh. 1064 1065 if oldInfo != nil { 1066 if oldInfo.Initialized && !oldInfo.Deleted { 1067 if err := devices.setupVerifyBaseImageUUIDFS(oldInfo); err != nil { 1068 return err 1069 } 1070 1071 if devices.baseFsSize != defaultBaseFsSize && devices.baseFsSize != devices.getBaseDeviceSize() { 1072 logrus.Warnf("devmapper: Base device is already initialized to size %s, new value of base device size %s will not take effect", 1073 units.HumanSize(float64(devices.getBaseDeviceSize())), units.HumanSize(float64(devices.baseFsSize))) 1074 } 1075 1076 return nil 1077 } 1078 1079 logrus.Debugf("devmapper: Removing uninitialized base image") 1080 // If previous base device is in deferred delete state, 1081 // that needs to be cleaned up first. So don't try 1082 // deferred deletion. 1083 if err := devices.DeleteDevice("", true); err != nil { 1084 return err 1085 } 1086 } 1087 1088 // If we are setting up base image for the first time, make sure 1089 // thin pool is empty. 1090 if devices.thinPoolDevice != "" && oldInfo == nil { 1091 if err := devices.checkThinPool(); err != nil { 1092 return err 1093 } 1094 } 1095 1096 // Create new base image device 1097 if err := devices.createBaseImage(); err != nil { 1098 return err 1099 } 1100 1101 return nil 1102 } 1103 1104 func setCloseOnExec(name string) { 1105 if fileInfos, _ := ioutil.ReadDir("/proc/self/fd"); fileInfos != nil { 1106 for _, i := range fileInfos { 1107 link, _ := os.Readlink(filepath.Join("/proc/self/fd", i.Name())) 1108 if link == name { 1109 fd, err := strconv.Atoi(i.Name()) 1110 if err == nil { 1111 syscall.CloseOnExec(fd) 1112 } 1113 } 1114 } 1115 } 1116 } 1117 1118 // DMLog implements logging using DevMapperLogger interface. 1119 func (devices *DeviceSet) DMLog(level int, file string, line int, dmError int, message string) { 1120 // By default libdm sends us all the messages including debug ones. 1121 // We need to filter out messages here and figure out which one 1122 // should be printed. 1123 if level > logLevel { 1124 return 1125 } 1126 1127 // FIXME(vbatts) push this back into ./pkg/devicemapper/ 1128 if level <= devicemapper.LogLevelErr { 1129 logrus.Errorf("libdevmapper(%d): %s:%d (%d) %s", level, file, line, dmError, message) 1130 } else if level <= devicemapper.LogLevelInfo { 1131 logrus.Infof("libdevmapper(%d): %s:%d (%d) %s", level, file, line, dmError, message) 1132 } else { 1133 // FIXME(vbatts) push this back into ./pkg/devicemapper/ 1134 logrus.Debugf("libdevmapper(%d): %s:%d (%d) %s", level, file, line, dmError, message) 1135 } 1136 } 1137 1138 func major(device uint64) uint64 { 1139 return (device >> 8) & 0xfff 1140 } 1141 1142 func minor(device uint64) uint64 { 1143 return (device & 0xff) | ((device >> 12) & 0xfff00) 1144 } 1145 1146 // ResizePool increases the size of the pool. 1147 func (devices *DeviceSet) ResizePool(size int64) error { 1148 dirname := devices.loopbackDir() 1149 datafilename := path.Join(dirname, "data") 1150 if len(devices.dataDevice) > 0 { 1151 datafilename = devices.dataDevice 1152 } 1153 metadatafilename := path.Join(dirname, "metadata") 1154 if len(devices.metadataDevice) > 0 { 1155 metadatafilename = devices.metadataDevice 1156 } 1157 1158 datafile, err := os.OpenFile(datafilename, os.O_RDWR, 0) 1159 if datafile == nil { 1160 return err 1161 } 1162 defer datafile.Close() 1163 1164 fi, err := datafile.Stat() 1165 if fi == nil { 1166 return err 1167 } 1168 1169 if fi.Size() > size { 1170 return fmt.Errorf("devmapper: Can't shrink file") 1171 } 1172 1173 dataloopback := devicemapper.FindLoopDeviceFor(datafile) 1174 if dataloopback == nil { 1175 return fmt.Errorf("devmapper: Unable to find loopback mount for: %s", datafilename) 1176 } 1177 defer dataloopback.Close() 1178 1179 metadatafile, err := os.OpenFile(metadatafilename, os.O_RDWR, 0) 1180 if metadatafile == nil { 1181 return err 1182 } 1183 defer metadatafile.Close() 1184 1185 metadataloopback := devicemapper.FindLoopDeviceFor(metadatafile) 1186 if metadataloopback == nil { 1187 return fmt.Errorf("devmapper: Unable to find loopback mount for: %s", metadatafilename) 1188 } 1189 defer metadataloopback.Close() 1190 1191 // Grow loopback file 1192 if err := datafile.Truncate(size); err != nil { 1193 return fmt.Errorf("devmapper: Unable to grow loopback file: %s", err) 1194 } 1195 1196 // Reload size for loopback device 1197 if err := devicemapper.LoopbackSetCapacity(dataloopback); err != nil { 1198 return fmt.Errorf("devmapper: Unable to update loopback capacity: %s", err) 1199 } 1200 1201 // Suspend the pool 1202 if err := devicemapper.SuspendDevice(devices.getPoolName()); err != nil { 1203 return fmt.Errorf("devmapper: Unable to suspend pool: %s", err) 1204 } 1205 1206 // Reload with the new block sizes 1207 if err := devicemapper.ReloadPool(devices.getPoolName(), dataloopback, metadataloopback, devices.thinpBlockSize); err != nil { 1208 return fmt.Errorf("devmapper: Unable to reload pool: %s", err) 1209 } 1210 1211 // Resume the pool 1212 if err := devicemapper.ResumeDevice(devices.getPoolName()); err != nil { 1213 return fmt.Errorf("devmapper: Unable to resume pool: %s", err) 1214 } 1215 1216 return nil 1217 } 1218 1219 func (devices *DeviceSet) loadTransactionMetaData() error { 1220 jsonData, err := ioutil.ReadFile(devices.transactionMetaFile()) 1221 if err != nil { 1222 // There is no active transaction. This will be the case 1223 // during upgrade. 1224 if os.IsNotExist(err) { 1225 devices.OpenTransactionID = devices.TransactionID 1226 return nil 1227 } 1228 return err 1229 } 1230 1231 json.Unmarshal(jsonData, &devices.transaction) 1232 return nil 1233 } 1234 1235 func (devices *DeviceSet) saveTransactionMetaData() error { 1236 jsonData, err := json.Marshal(&devices.transaction) 1237 if err != nil { 1238 return fmt.Errorf("devmapper: Error encoding metadata to json: %s", err) 1239 } 1240 1241 return devices.writeMetaFile(jsonData, devices.transactionMetaFile()) 1242 } 1243 1244 func (devices *DeviceSet) removeTransactionMetaData() error { 1245 if err := os.RemoveAll(devices.transactionMetaFile()); err != nil { 1246 return err 1247 } 1248 return nil 1249 } 1250 1251 func (devices *DeviceSet) rollbackTransaction() error { 1252 logrus.Debugf("devmapper: Rolling back open transaction: TransactionID=%d hash=%s device_id=%d", devices.OpenTransactionID, devices.DeviceIDHash, devices.DeviceID) 1253 1254 // A device id might have already been deleted before transaction 1255 // closed. In that case this call will fail. Just leave a message 1256 // in case of failure. 1257 if err := devicemapper.DeleteDevice(devices.getPoolDevName(), devices.DeviceID); err != nil { 1258 logrus.Errorf("devmapper: Unable to delete device: %s", err) 1259 } 1260 1261 dinfo := &devInfo{Hash: devices.DeviceIDHash} 1262 if err := devices.removeMetadata(dinfo); err != nil { 1263 logrus.Errorf("devmapper: Unable to remove metadata: %s", err) 1264 } else { 1265 devices.markDeviceIDFree(devices.DeviceID) 1266 } 1267 1268 if err := devices.removeTransactionMetaData(); err != nil { 1269 logrus.Errorf("devmapper: Unable to remove transaction meta file %s: %s", devices.transactionMetaFile(), err) 1270 } 1271 1272 return nil 1273 } 1274 1275 func (devices *DeviceSet) processPendingTransaction() error { 1276 if err := devices.loadTransactionMetaData(); err != nil { 1277 return err 1278 } 1279 1280 // If there was open transaction but pool transaction ID is same 1281 // as open transaction ID, nothing to roll back. 1282 if devices.TransactionID == devices.OpenTransactionID { 1283 return nil 1284 } 1285 1286 // If open transaction ID is less than pool transaction ID, something 1287 // is wrong. Bail out. 1288 if devices.OpenTransactionID < devices.TransactionID { 1289 logrus.Errorf("devmapper: Open Transaction id %d is less than pool transaction id %d", devices.OpenTransactionID, devices.TransactionID) 1290 return nil 1291 } 1292 1293 // Pool transaction ID is not same as open transaction. There is 1294 // a transaction which was not completed. 1295 if err := devices.rollbackTransaction(); err != nil { 1296 return fmt.Errorf("devmapper: Rolling back open transaction failed: %s", err) 1297 } 1298 1299 devices.OpenTransactionID = devices.TransactionID 1300 return nil 1301 } 1302 1303 func (devices *DeviceSet) loadDeviceSetMetaData() error { 1304 jsonData, err := ioutil.ReadFile(devices.deviceSetMetaFile()) 1305 if err != nil { 1306 // For backward compatibility return success if file does 1307 // not exist. 1308 if os.IsNotExist(err) { 1309 return nil 1310 } 1311 return err 1312 } 1313 1314 return json.Unmarshal(jsonData, devices) 1315 } 1316 1317 func (devices *DeviceSet) saveDeviceSetMetaData() error { 1318 jsonData, err := json.Marshal(devices) 1319 if err != nil { 1320 return fmt.Errorf("devmapper: Error encoding metadata to json: %s", err) 1321 } 1322 1323 return devices.writeMetaFile(jsonData, devices.deviceSetMetaFile()) 1324 } 1325 1326 func (devices *DeviceSet) openTransaction(hash string, DeviceID int) error { 1327 devices.allocateTransactionID() 1328 devices.DeviceIDHash = hash 1329 devices.DeviceID = DeviceID 1330 if err := devices.saveTransactionMetaData(); err != nil { 1331 return fmt.Errorf("devmapper: Error saving transaction metadata: %s", err) 1332 } 1333 return nil 1334 } 1335 1336 func (devices *DeviceSet) refreshTransaction(DeviceID int) error { 1337 devices.DeviceID = DeviceID 1338 if err := devices.saveTransactionMetaData(); err != nil { 1339 return fmt.Errorf("devmapper: Error saving transaction metadata: %s", err) 1340 } 1341 return nil 1342 } 1343 1344 func (devices *DeviceSet) closeTransaction() error { 1345 if err := devices.updatePoolTransactionID(); err != nil { 1346 logrus.Debugf("devmapper: Failed to close Transaction") 1347 return err 1348 } 1349 return nil 1350 } 1351 1352 func determineDriverCapabilities(version string) error { 1353 /* 1354 * Driver version 4.27.0 and greater support deferred activation 1355 * feature. 1356 */ 1357 1358 logrus.Debugf("devicemapper: driver version is %s", version) 1359 1360 versionSplit := strings.Split(version, ".") 1361 major, err := strconv.Atoi(versionSplit[0]) 1362 if err != nil { 1363 return graphdriver.ErrNotSupported 1364 } 1365 1366 if major > 4 { 1367 driverDeferredRemovalSupport = true 1368 return nil 1369 } 1370 1371 if major < 4 { 1372 return nil 1373 } 1374 1375 minor, err := strconv.Atoi(versionSplit[1]) 1376 if err != nil { 1377 return graphdriver.ErrNotSupported 1378 } 1379 1380 /* 1381 * If major is 4 and minor is 27, then there is no need to 1382 * check for patch level as it can not be less than 0. 1383 */ 1384 if minor >= 27 { 1385 driverDeferredRemovalSupport = true 1386 return nil 1387 } 1388 1389 return nil 1390 } 1391 1392 // Determine the major and minor number of loopback device 1393 func getDeviceMajorMinor(file *os.File) (uint64, uint64, error) { 1394 stat, err := file.Stat() 1395 if err != nil { 1396 return 0, 0, err 1397 } 1398 1399 dev := stat.Sys().(*syscall.Stat_t).Rdev 1400 majorNum := major(dev) 1401 minorNum := minor(dev) 1402 1403 logrus.Debugf("devmapper: Major:Minor for device: %s is:%v:%v", file.Name(), majorNum, minorNum) 1404 return majorNum, minorNum, nil 1405 } 1406 1407 // Given a file which is backing file of a loop back device, find the 1408 // loopback device name and its major/minor number. 1409 func getLoopFileDeviceMajMin(filename string) (string, uint64, uint64, error) { 1410 file, err := os.Open(filename) 1411 if err != nil { 1412 logrus.Debugf("devmapper: Failed to open file %s", filename) 1413 return "", 0, 0, err 1414 } 1415 1416 defer file.Close() 1417 loopbackDevice := devicemapper.FindLoopDeviceFor(file) 1418 if loopbackDevice == nil { 1419 return "", 0, 0, fmt.Errorf("devmapper: Unable to find loopback mount for: %s", filename) 1420 } 1421 defer loopbackDevice.Close() 1422 1423 Major, Minor, err := getDeviceMajorMinor(loopbackDevice) 1424 if err != nil { 1425 return "", 0, 0, err 1426 } 1427 return loopbackDevice.Name(), Major, Minor, nil 1428 } 1429 1430 // Get the major/minor numbers of thin pool data and metadata devices 1431 func (devices *DeviceSet) getThinPoolDataMetaMajMin() (uint64, uint64, uint64, uint64, error) { 1432 var params, poolDataMajMin, poolMetadataMajMin string 1433 1434 _, _, _, params, err := devicemapper.GetTable(devices.getPoolName()) 1435 if err != nil { 1436 return 0, 0, 0, 0, err 1437 } 1438 1439 if _, err = fmt.Sscanf(params, "%s %s", &poolMetadataMajMin, &poolDataMajMin); err != nil { 1440 return 0, 0, 0, 0, err 1441 } 1442 1443 logrus.Debugf("devmapper: poolDataMajMin=%s poolMetaMajMin=%s\n", poolDataMajMin, poolMetadataMajMin) 1444 1445 poolDataMajMinorSplit := strings.Split(poolDataMajMin, ":") 1446 poolDataMajor, err := strconv.ParseUint(poolDataMajMinorSplit[0], 10, 32) 1447 if err != nil { 1448 return 0, 0, 0, 0, err 1449 } 1450 1451 poolDataMinor, err := strconv.ParseUint(poolDataMajMinorSplit[1], 10, 32) 1452 if err != nil { 1453 return 0, 0, 0, 0, err 1454 } 1455 1456 poolMetadataMajMinorSplit := strings.Split(poolMetadataMajMin, ":") 1457 poolMetadataMajor, err := strconv.ParseUint(poolMetadataMajMinorSplit[0], 10, 32) 1458 if err != nil { 1459 return 0, 0, 0, 0, err 1460 } 1461 1462 poolMetadataMinor, err := strconv.ParseUint(poolMetadataMajMinorSplit[1], 10, 32) 1463 if err != nil { 1464 return 0, 0, 0, 0, err 1465 } 1466 1467 return poolDataMajor, poolDataMinor, poolMetadataMajor, poolMetadataMinor, nil 1468 } 1469 1470 func (devices *DeviceSet) loadThinPoolLoopBackInfo() error { 1471 poolDataMajor, poolDataMinor, poolMetadataMajor, poolMetadataMinor, err := devices.getThinPoolDataMetaMajMin() 1472 if err != nil { 1473 return err 1474 } 1475 1476 dirname := devices.loopbackDir() 1477 1478 // data device has not been passed in. So there should be a data file 1479 // which is being mounted as loop device. 1480 if devices.dataDevice == "" { 1481 datafilename := path.Join(dirname, "data") 1482 dataLoopDevice, dataMajor, dataMinor, err := getLoopFileDeviceMajMin(datafilename) 1483 if err != nil { 1484 return err 1485 } 1486 1487 // Compare the two 1488 if poolDataMajor == dataMajor && poolDataMinor == dataMinor { 1489 devices.dataDevice = dataLoopDevice 1490 devices.dataLoopFile = datafilename 1491 } 1492 1493 } 1494 1495 // metadata device has not been passed in. So there should be a 1496 // metadata file which is being mounted as loop device. 1497 if devices.metadataDevice == "" { 1498 metadatafilename := path.Join(dirname, "metadata") 1499 metadataLoopDevice, metadataMajor, metadataMinor, err := getLoopFileDeviceMajMin(metadatafilename) 1500 if err != nil { 1501 return err 1502 } 1503 if poolMetadataMajor == metadataMajor && poolMetadataMinor == metadataMinor { 1504 devices.metadataDevice = metadataLoopDevice 1505 devices.metadataLoopFile = metadatafilename 1506 } 1507 } 1508 1509 return nil 1510 } 1511 1512 func (devices *DeviceSet) initDevmapper(doInit bool) error { 1513 // give ourselves to libdm as a log handler 1514 devicemapper.LogInit(devices) 1515 1516 version, err := devicemapper.GetDriverVersion() 1517 if err != nil { 1518 // Can't even get driver version, assume not supported 1519 return graphdriver.ErrNotSupported 1520 } 1521 1522 if err := determineDriverCapabilities(version); err != nil { 1523 return graphdriver.ErrNotSupported 1524 } 1525 1526 // If user asked for deferred removal then check both libdm library 1527 // and kernel driver support deferred removal otherwise error out. 1528 if enableDeferredRemoval { 1529 if !driverDeferredRemovalSupport { 1530 return fmt.Errorf("devmapper: Deferred removal can not be enabled as kernel does not support it") 1531 } 1532 if !devicemapper.LibraryDeferredRemovalSupport { 1533 return fmt.Errorf("devmapper: Deferred removal can not be enabled as libdm does not support it") 1534 } 1535 logrus.Debugf("devmapper: Deferred removal support enabled.") 1536 devices.deferredRemove = true 1537 } 1538 1539 if enableDeferredDeletion { 1540 if !devices.deferredRemove { 1541 return fmt.Errorf("devmapper: Deferred deletion can not be enabled as deferred removal is not enabled. Enable deferred removal using --storage-opt dm.use_deferred_removal=true parameter") 1542 } 1543 logrus.Debugf("devmapper: Deferred deletion support enabled.") 1544 devices.deferredDelete = true 1545 } 1546 1547 // https://github.com/docker/docker/issues/4036 1548 if supported := devicemapper.UdevSetSyncSupport(true); !supported { 1549 logrus.Warn("devmapper: Udev sync is not supported. This will lead to unexpected behavior, data loss and errors. For more information, see https://docs.docker.com/reference/commandline/daemon/#daemon-storage-driver-option") 1550 } 1551 1552 //create the root dir of the devmapper driver ownership to match this 1553 //daemon's remapped root uid/gid so containers can start properly 1554 uid, gid, err := idtools.GetRootUIDGID(devices.uidMaps, devices.gidMaps) 1555 if err != nil { 1556 return err 1557 } 1558 if err := idtools.MkdirAs(devices.root, 0700, uid, gid); err != nil && !os.IsExist(err) { 1559 return err 1560 } 1561 if err := os.MkdirAll(devices.metadataDir(), 0700); err != nil && !os.IsExist(err) { 1562 return err 1563 } 1564 1565 // Set the device prefix from the device id and inode of the docker root dir 1566 1567 st, err := os.Stat(devices.root) 1568 if err != nil { 1569 return fmt.Errorf("devmapper: Error looking up dir %s: %s", devices.root, err) 1570 } 1571 sysSt := st.Sys().(*syscall.Stat_t) 1572 // "reg-" stands for "regular file". 1573 // In the future we might use "dev-" for "device file", etc. 1574 // docker-maj,min[-inode] stands for: 1575 // - Managed by docker 1576 // - The target of this device is at major <maj> and minor <min> 1577 // - If <inode> is defined, use that file inside the device as a loopback image. Otherwise use the device itself. 1578 devices.devicePrefix = fmt.Sprintf("docker-%d:%d-%d", major(sysSt.Dev), minor(sysSt.Dev), sysSt.Ino) 1579 logrus.Debugf("devmapper: Generated prefix: %s", devices.devicePrefix) 1580 1581 // Check for the existence of the thin-pool device 1582 poolExists, err := devices.thinPoolExists(devices.getPoolName()) 1583 if err != nil { 1584 return err 1585 } 1586 1587 // It seems libdevmapper opens this without O_CLOEXEC, and go exec will not close files 1588 // that are not Close-on-exec, 1589 // so we add this badhack to make sure it closes itself 1590 setCloseOnExec("/dev/mapper/control") 1591 1592 // Make sure the sparse images exist in <root>/devicemapper/data and 1593 // <root>/devicemapper/metadata 1594 1595 createdLoopback := false 1596 1597 // If the pool doesn't exist, create it 1598 if !poolExists && devices.thinPoolDevice == "" { 1599 logrus.Debugf("devmapper: Pool doesn't exist. Creating it.") 1600 1601 var ( 1602 dataFile *os.File 1603 metadataFile *os.File 1604 ) 1605 1606 if devices.dataDevice == "" { 1607 // Make sure the sparse images exist in <root>/devicemapper/data 1608 1609 hasData := devices.hasImage("data") 1610 1611 if !doInit && !hasData { 1612 return errors.New("Loopback data file not found") 1613 } 1614 1615 if !hasData { 1616 createdLoopback = true 1617 } 1618 1619 data, err := devices.ensureImage("data", devices.dataLoopbackSize) 1620 if err != nil { 1621 logrus.Debugf("devmapper: Error device ensureImage (data): %s", err) 1622 return err 1623 } 1624 1625 dataFile, err = devicemapper.AttachLoopDevice(data) 1626 if err != nil { 1627 return err 1628 } 1629 devices.dataLoopFile = data 1630 devices.dataDevice = dataFile.Name() 1631 } else { 1632 dataFile, err = os.OpenFile(devices.dataDevice, os.O_RDWR, 0600) 1633 if err != nil { 1634 return err 1635 } 1636 } 1637 defer dataFile.Close() 1638 1639 if devices.metadataDevice == "" { 1640 // Make sure the sparse images exist in <root>/devicemapper/metadata 1641 1642 hasMetadata := devices.hasImage("metadata") 1643 1644 if !doInit && !hasMetadata { 1645 return errors.New("Loopback metadata file not found") 1646 } 1647 1648 if !hasMetadata { 1649 createdLoopback = true 1650 } 1651 1652 metadata, err := devices.ensureImage("metadata", devices.metaDataLoopbackSize) 1653 if err != nil { 1654 logrus.Debugf("devmapper: Error device ensureImage (metadata): %s", err) 1655 return err 1656 } 1657 1658 metadataFile, err = devicemapper.AttachLoopDevice(metadata) 1659 if err != nil { 1660 return err 1661 } 1662 devices.metadataLoopFile = metadata 1663 devices.metadataDevice = metadataFile.Name() 1664 } else { 1665 metadataFile, err = os.OpenFile(devices.metadataDevice, os.O_RDWR, 0600) 1666 if err != nil { 1667 return err 1668 } 1669 } 1670 defer metadataFile.Close() 1671 1672 if err := devicemapper.CreatePool(devices.getPoolName(), dataFile, metadataFile, devices.thinpBlockSize); err != nil { 1673 return err 1674 } 1675 } 1676 1677 // Pool already exists and caller did not pass us a pool. That means 1678 // we probably created pool earlier and could not remove it as some 1679 // containers were still using it. Detect some of the properties of 1680 // pool, like is it using loop devices. 1681 if poolExists && devices.thinPoolDevice == "" { 1682 if err := devices.loadThinPoolLoopBackInfo(); err != nil { 1683 logrus.Debugf("devmapper: Failed to load thin pool loopback device information:%v", err) 1684 return err 1685 } 1686 } 1687 1688 // If we didn't just create the data or metadata image, we need to 1689 // load the transaction id and migrate old metadata 1690 if !createdLoopback { 1691 if err := devices.initMetaData(); err != nil { 1692 return err 1693 } 1694 } 1695 1696 if devices.thinPoolDevice == "" { 1697 if devices.metadataLoopFile != "" || devices.dataLoopFile != "" { 1698 logrus.Warnf("devmapper: Usage of loopback devices is strongly discouraged for production use. Please use `--storage-opt dm.thinpooldev` or use `man docker` to refer to dm.thinpooldev section.") 1699 } 1700 } 1701 1702 // Right now this loads only NextDeviceID. If there is more metadata 1703 // down the line, we might have to move it earlier. 1704 if err := devices.loadDeviceSetMetaData(); err != nil { 1705 return err 1706 } 1707 1708 // Setup the base image 1709 if doInit { 1710 if err := devices.setupBaseImage(); err != nil { 1711 logrus.Debugf("devmapper: Error device setupBaseImage: %s", err) 1712 return err 1713 } 1714 } 1715 1716 return nil 1717 } 1718 1719 // AddDevice adds a device and registers in the hash. 1720 func (devices *DeviceSet) AddDevice(hash, baseHash string) error { 1721 logrus.Debugf("devmapper: AddDevice(hash=%s basehash=%s)", hash, baseHash) 1722 defer logrus.Debugf("devmapper: AddDevice(hash=%s basehash=%s) END", hash, baseHash) 1723 1724 // If a deleted device exists, return error. 1725 baseInfo, err := devices.lookupDeviceWithLock(baseHash) 1726 if err != nil { 1727 return err 1728 } 1729 1730 if baseInfo.Deleted { 1731 return fmt.Errorf("devmapper: Base device %v has been marked for deferred deletion", baseInfo.Hash) 1732 } 1733 1734 baseInfo.lock.Lock() 1735 defer baseInfo.lock.Unlock() 1736 1737 devices.Lock() 1738 defer devices.Unlock() 1739 1740 // Also include deleted devices in case hash of new device is 1741 // same as one of the deleted devices. 1742 if info, _ := devices.lookupDevice(hash); info != nil { 1743 return fmt.Errorf("devmapper: device %s already exists. Deleted=%v", hash, info.Deleted) 1744 } 1745 1746 if err := devices.createRegisterSnapDevice(hash, baseInfo); err != nil { 1747 return err 1748 } 1749 1750 return nil 1751 } 1752 1753 func (devices *DeviceSet) markForDeferredDeletion(info *devInfo) error { 1754 // If device is already in deleted state, there is nothing to be done. 1755 if info.Deleted { 1756 return nil 1757 } 1758 1759 logrus.Debugf("devmapper: Marking device %s for deferred deletion.", info.Hash) 1760 1761 info.Deleted = true 1762 1763 // save device metadata to reflect deleted state. 1764 if err := devices.saveMetadata(info); err != nil { 1765 info.Deleted = false 1766 return err 1767 } 1768 1769 devices.nrDeletedDevices++ 1770 return nil 1771 } 1772 1773 // Should be called with devices.Lock() held. 1774 func (devices *DeviceSet) deleteTransaction(info *devInfo, syncDelete bool) error { 1775 if err := devices.openTransaction(info.Hash, info.DeviceID); err != nil { 1776 logrus.Debugf("devmapper: Error opening transaction hash = %s deviceId = %d", "", info.DeviceID) 1777 return err 1778 } 1779 1780 defer devices.closeTransaction() 1781 1782 err := devicemapper.DeleteDevice(devices.getPoolDevName(), info.DeviceID) 1783 if err != nil { 1784 // If syncDelete is true, we want to return error. If deferred 1785 // deletion is not enabled, we return an error. If error is 1786 // something other then EBUSY, return an error. 1787 if syncDelete || !devices.deferredDelete || err != devicemapper.ErrBusy { 1788 logrus.Debugf("devmapper: Error deleting device: %s", err) 1789 return err 1790 } 1791 } 1792 1793 if err == nil { 1794 if err := devices.unregisterDevice(info.DeviceID, info.Hash); err != nil { 1795 return err 1796 } 1797 // If device was already in deferred delete state that means 1798 // deletion was being tried again later. Reduce the deleted 1799 // device count. 1800 if info.Deleted { 1801 devices.nrDeletedDevices-- 1802 } 1803 } else { 1804 if err := devices.markForDeferredDeletion(info); err != nil { 1805 return err 1806 } 1807 } 1808 1809 return nil 1810 } 1811 1812 // Issue discard only if device open count is zero. 1813 func (devices *DeviceSet) issueDiscard(info *devInfo) error { 1814 logrus.Debugf("devmapper: issueDiscard(device: %s). START", info.Hash) 1815 defer logrus.Debugf("devmapper: issueDiscard(device: %s). END", info.Hash) 1816 // This is a workaround for the kernel not discarding block so 1817 // on the thin pool when we remove a thinp device, so we do it 1818 // manually. 1819 // Even if device is deferred deleted, activate it and issue 1820 // discards. 1821 if err := devices.activateDeviceIfNeeded(info, true); err != nil { 1822 return err 1823 } 1824 1825 devinfo, err := devicemapper.GetInfo(info.Name()) 1826 if err != nil { 1827 return err 1828 } 1829 1830 if devinfo.OpenCount != 0 { 1831 logrus.Debugf("devmapper: Device: %s is in use. OpenCount=%d. Not issuing discards.", info.Hash, devinfo.OpenCount) 1832 return nil 1833 } 1834 1835 if err := devicemapper.BlockDeviceDiscard(info.DevName()); err != nil { 1836 logrus.Debugf("devmapper: Error discarding block on device: %s (ignoring)", err) 1837 } 1838 return nil 1839 } 1840 1841 // Should be called with devices.Lock() held. 1842 func (devices *DeviceSet) deleteDevice(info *devInfo, syncDelete bool) error { 1843 if devices.doBlkDiscard { 1844 devices.issueDiscard(info) 1845 } 1846 1847 // Try to deactivate device in case it is active. 1848 if err := devices.deactivateDevice(info); err != nil { 1849 logrus.Debugf("devmapper: Error deactivating device: %s", err) 1850 return err 1851 } 1852 1853 if err := devices.deleteTransaction(info, syncDelete); err != nil { 1854 return err 1855 } 1856 1857 devices.markDeviceIDFree(info.DeviceID) 1858 1859 return nil 1860 } 1861 1862 // DeleteDevice will return success if device has been marked for deferred 1863 // removal. If one wants to override that and want DeleteDevice() to fail if 1864 // device was busy and could not be deleted, set syncDelete=true. 1865 func (devices *DeviceSet) DeleteDevice(hash string, syncDelete bool) error { 1866 logrus.Debugf("devmapper: DeleteDevice(hash=%v syncDelete=%v) START", hash, syncDelete) 1867 defer logrus.Debugf("devmapper: DeleteDevice(hash=%v syncDelete=%v) END", hash, syncDelete) 1868 info, err := devices.lookupDeviceWithLock(hash) 1869 if err != nil { 1870 return err 1871 } 1872 1873 info.lock.Lock() 1874 defer info.lock.Unlock() 1875 1876 devices.Lock() 1877 defer devices.Unlock() 1878 1879 // If mountcount is not zero, that means devices is still in use 1880 // or has not been Put() properly. Fail device deletion. 1881 1882 if info.mountCount != 0 { 1883 return fmt.Errorf("devmapper: Can't delete device %v as it is still mounted. mntCount=%v", info.Hash, info.mountCount) 1884 } 1885 1886 return devices.deleteDevice(info, syncDelete) 1887 } 1888 1889 func (devices *DeviceSet) deactivatePool() error { 1890 logrus.Debugf("devmapper: deactivatePool()") 1891 defer logrus.Debugf("devmapper: deactivatePool END") 1892 devname := devices.getPoolDevName() 1893 1894 devinfo, err := devicemapper.GetInfo(devname) 1895 if err != nil { 1896 return err 1897 } 1898 1899 if devinfo.Exists == 0 { 1900 return nil 1901 } 1902 if err := devicemapper.RemoveDevice(devname); err != nil { 1903 return err 1904 } 1905 1906 if d, err := devicemapper.GetDeps(devname); err == nil { 1907 logrus.Warnf("devmapper: device %s still has %d active dependents", devname, d.Count) 1908 } 1909 1910 return nil 1911 } 1912 1913 func (devices *DeviceSet) deactivateDevice(info *devInfo) error { 1914 logrus.Debugf("devmapper: deactivateDevice(%s)", info.Hash) 1915 defer logrus.Debugf("devmapper: deactivateDevice END(%s)", info.Hash) 1916 1917 devinfo, err := devicemapper.GetInfo(info.Name()) 1918 if err != nil { 1919 return err 1920 } 1921 1922 if devinfo.Exists == 0 { 1923 return nil 1924 } 1925 1926 if devices.deferredRemove { 1927 if err := devicemapper.RemoveDeviceDeferred(info.Name()); err != nil { 1928 return err 1929 } 1930 } else { 1931 if err := devices.removeDevice(info.Name()); err != nil { 1932 return err 1933 } 1934 } 1935 return nil 1936 } 1937 1938 // Issues the underlying dm remove operation. 1939 func (devices *DeviceSet) removeDevice(devname string) error { 1940 var err error 1941 1942 logrus.Debugf("devmapper: removeDevice START(%s)", devname) 1943 defer logrus.Debugf("devmapper: removeDevice END(%s)", devname) 1944 1945 for i := 0; i < 200; i++ { 1946 err = devicemapper.RemoveDevice(devname) 1947 if err == nil { 1948 break 1949 } 1950 if err != devicemapper.ErrBusy { 1951 return err 1952 } 1953 1954 // If we see EBUSY it may be a transient error, 1955 // sleep a bit a retry a few times. 1956 devices.Unlock() 1957 time.Sleep(100 * time.Millisecond) 1958 devices.Lock() 1959 } 1960 1961 return err 1962 } 1963 1964 func (devices *DeviceSet) cancelDeferredRemoval(info *devInfo) error { 1965 if !devices.deferredRemove { 1966 return nil 1967 } 1968 1969 logrus.Debugf("devmapper: cancelDeferredRemoval START(%s)", info.Name()) 1970 defer logrus.Debugf("devmapper: cancelDeferredRemoval END(%s)", info.Name()) 1971 1972 devinfo, err := devicemapper.GetInfoWithDeferred(info.Name()) 1973 1974 if devinfo != nil && devinfo.DeferredRemove == 0 { 1975 return nil 1976 } 1977 1978 // Cancel deferred remove 1979 for i := 0; i < 100; i++ { 1980 err = devicemapper.CancelDeferredRemove(info.Name()) 1981 if err == nil { 1982 break 1983 } 1984 1985 if err == devicemapper.ErrEnxio { 1986 // Device is probably already gone. Return success. 1987 return nil 1988 } 1989 1990 if err != devicemapper.ErrBusy { 1991 return err 1992 } 1993 1994 // If we see EBUSY it may be a transient error, 1995 // sleep a bit a retry a few times. 1996 devices.Unlock() 1997 time.Sleep(100 * time.Millisecond) 1998 devices.Lock() 1999 } 2000 return err 2001 } 2002 2003 // Shutdown shuts down the device by unmounting the root. 2004 func (devices *DeviceSet) Shutdown() error { 2005 logrus.Debugf("devmapper: [deviceset %s] Shutdown()", devices.devicePrefix) 2006 logrus.Debugf("devmapper: Shutting down DeviceSet: %s", devices.root) 2007 defer logrus.Debugf("devmapper: [deviceset %s] Shutdown() END", devices.devicePrefix) 2008 2009 var devs []*devInfo 2010 2011 // Stop deletion worker. This should start delivering new events to 2012 // ticker channel. That means no new instance of cleanupDeletedDevice() 2013 // will run after this call. If one instance is already running at 2014 // the time of the call, it must be holding devices.Lock() and 2015 // we will block on this lock till cleanup function exits. 2016 devices.deletionWorkerTicker.Stop() 2017 2018 devices.Lock() 2019 // Save DeviceSet Metadata first. Docker kills all threads if they 2020 // don't finish in certain time. It is possible that Shutdown() 2021 // routine does not finish in time as we loop trying to deactivate 2022 // some devices while these are busy. In that case shutdown() routine 2023 // will be killed and we will not get a chance to save deviceset 2024 // metadata. Hence save this early before trying to deactivate devices. 2025 devices.saveDeviceSetMetaData() 2026 2027 for _, info := range devices.Devices { 2028 devs = append(devs, info) 2029 } 2030 devices.Unlock() 2031 2032 for _, info := range devs { 2033 info.lock.Lock() 2034 if info.mountCount > 0 { 2035 // We use MNT_DETACH here in case it is still busy in some running 2036 // container. This means it'll go away from the global scope directly, 2037 // and the device will be released when that container dies. 2038 if err := syscall.Unmount(info.mountPath, syscall.MNT_DETACH); err != nil { 2039 logrus.Debugf("devmapper: Shutdown unmounting %s, error: %s", info.mountPath, err) 2040 } 2041 2042 devices.Lock() 2043 if err := devices.deactivateDevice(info); err != nil { 2044 logrus.Debugf("devmapper: Shutdown deactivate %s , error: %s", info.Hash, err) 2045 } 2046 devices.Unlock() 2047 } 2048 info.lock.Unlock() 2049 } 2050 2051 info, _ := devices.lookupDeviceWithLock("") 2052 if info != nil { 2053 info.lock.Lock() 2054 devices.Lock() 2055 if err := devices.deactivateDevice(info); err != nil { 2056 logrus.Debugf("devmapper: Shutdown deactivate base , error: %s", err) 2057 } 2058 devices.Unlock() 2059 info.lock.Unlock() 2060 } 2061 2062 devices.Lock() 2063 if devices.thinPoolDevice == "" { 2064 if err := devices.deactivatePool(); err != nil { 2065 logrus.Debugf("devmapper: Shutdown deactivate pool , error: %s", err) 2066 } 2067 } 2068 devices.Unlock() 2069 2070 return nil 2071 } 2072 2073 // MountDevice mounts the device if not already mounted. 2074 func (devices *DeviceSet) MountDevice(hash, path, mountLabel string) error { 2075 info, err := devices.lookupDeviceWithLock(hash) 2076 if err != nil { 2077 return err 2078 } 2079 2080 if info.Deleted { 2081 return fmt.Errorf("devmapper: Can't mount device %v as it has been marked for deferred deletion", info.Hash) 2082 } 2083 2084 info.lock.Lock() 2085 defer info.lock.Unlock() 2086 2087 devices.Lock() 2088 defer devices.Unlock() 2089 2090 if info.mountCount > 0 { 2091 if path != info.mountPath { 2092 return fmt.Errorf("devmapper: Trying to mount devmapper device in multiple places (%s, %s)", info.mountPath, path) 2093 } 2094 2095 info.mountCount++ 2096 return nil 2097 } 2098 2099 if err := devices.activateDeviceIfNeeded(info, false); err != nil { 2100 return fmt.Errorf("devmapper: Error activating devmapper device for '%s': %s", hash, err) 2101 } 2102 2103 fstype, err := ProbeFsType(info.DevName()) 2104 if err != nil { 2105 return err 2106 } 2107 2108 options := "" 2109 2110 if fstype == "xfs" { 2111 // XFS needs nouuid or it can't mount filesystems with the same fs 2112 options = joinMountOptions(options, "nouuid") 2113 } 2114 2115 options = joinMountOptions(options, devices.mountOptions) 2116 options = joinMountOptions(options, label.FormatMountLabel("", mountLabel)) 2117 2118 if err := mount.Mount(info.DevName(), path, fstype, options); err != nil { 2119 return fmt.Errorf("devmapper: Error mounting '%s' on '%s': %s", info.DevName(), path, err) 2120 } 2121 2122 info.mountCount = 1 2123 info.mountPath = path 2124 2125 return nil 2126 } 2127 2128 // UnmountDevice unmounts the device and removes it from hash. 2129 func (devices *DeviceSet) UnmountDevice(hash, mountPath string) error { 2130 logrus.Debugf("devmapper: UnmountDevice(hash=%s)", hash) 2131 defer logrus.Debugf("devmapper: UnmountDevice(hash=%s) END", hash) 2132 2133 info, err := devices.lookupDeviceWithLock(hash) 2134 if err != nil { 2135 return err 2136 } 2137 2138 info.lock.Lock() 2139 defer info.lock.Unlock() 2140 2141 devices.Lock() 2142 defer devices.Unlock() 2143 2144 // If there are running containers when daemon crashes, during daemon 2145 // restarting, it will kill running containers and will finally call 2146 // Put() without calling Get(). So info.MountCount may become negative. 2147 // if info.mountCount goes negative, we do the unmount and assign 2148 // it to 0. 2149 2150 info.mountCount-- 2151 if info.mountCount > 0 { 2152 return nil 2153 } else if info.mountCount < 0 { 2154 logrus.Warnf("devmapper: Mount count of device went negative. Put() called without matching Get(). Resetting count to 0") 2155 info.mountCount = 0 2156 } 2157 2158 logrus.Debugf("devmapper: Unmount(%s)", mountPath) 2159 if err := syscall.Unmount(mountPath, syscall.MNT_DETACH); err != nil { 2160 return err 2161 } 2162 logrus.Debugf("devmapper: Unmount done") 2163 2164 if err := devices.deactivateDevice(info); err != nil { 2165 return err 2166 } 2167 2168 info.mountPath = "" 2169 2170 return nil 2171 } 2172 2173 // HasDevice returns true if the device metadata exists. 2174 func (devices *DeviceSet) HasDevice(hash string) bool { 2175 info, _ := devices.lookupDeviceWithLock(hash) 2176 return info != nil 2177 } 2178 2179 // List returns a list of device ids. 2180 func (devices *DeviceSet) List() []string { 2181 devices.Lock() 2182 defer devices.Unlock() 2183 2184 ids := make([]string, len(devices.Devices)) 2185 i := 0 2186 for k := range devices.Devices { 2187 ids[i] = k 2188 i++ 2189 } 2190 return ids 2191 } 2192 2193 func (devices *DeviceSet) deviceStatus(devName string) (sizeInSectors, mappedSectors, highestMappedSector uint64, err error) { 2194 var params string 2195 _, sizeInSectors, _, params, err = devicemapper.GetStatus(devName) 2196 if err != nil { 2197 return 2198 } 2199 if _, err = fmt.Sscanf(params, "%d %d", &mappedSectors, &highestMappedSector); err == nil { 2200 return 2201 } 2202 return 2203 } 2204 2205 // GetDeviceStatus provides size, mapped sectors 2206 func (devices *DeviceSet) GetDeviceStatus(hash string) (*DevStatus, error) { 2207 info, err := devices.lookupDeviceWithLock(hash) 2208 if err != nil { 2209 return nil, err 2210 } 2211 2212 info.lock.Lock() 2213 defer info.lock.Unlock() 2214 2215 devices.Lock() 2216 defer devices.Unlock() 2217 2218 status := &DevStatus{ 2219 DeviceID: info.DeviceID, 2220 Size: info.Size, 2221 TransactionID: info.TransactionID, 2222 } 2223 2224 if err := devices.activateDeviceIfNeeded(info, false); err != nil { 2225 return nil, fmt.Errorf("devmapper: Error activating devmapper device for '%s': %s", hash, err) 2226 } 2227 2228 sizeInSectors, mappedSectors, highestMappedSector, err := devices.deviceStatus(info.DevName()) 2229 2230 if err != nil { 2231 return nil, err 2232 } 2233 2234 status.SizeInSectors = sizeInSectors 2235 status.MappedSectors = mappedSectors 2236 status.HighestMappedSector = highestMappedSector 2237 2238 return status, nil 2239 } 2240 2241 func (devices *DeviceSet) poolStatus() (totalSizeInSectors, transactionID, dataUsed, dataTotal, metadataUsed, metadataTotal uint64, err error) { 2242 var params string 2243 if _, totalSizeInSectors, _, params, err = devicemapper.GetStatus(devices.getPoolName()); err == nil { 2244 _, err = fmt.Sscanf(params, "%d %d/%d %d/%d", &transactionID, &metadataUsed, &metadataTotal, &dataUsed, &dataTotal) 2245 } 2246 return 2247 } 2248 2249 // DataDevicePath returns the path to the data storage for this deviceset, 2250 // regardless of loopback or block device 2251 func (devices *DeviceSet) DataDevicePath() string { 2252 return devices.dataDevice 2253 } 2254 2255 // MetadataDevicePath returns the path to the metadata storage for this deviceset, 2256 // regardless of loopback or block device 2257 func (devices *DeviceSet) MetadataDevicePath() string { 2258 return devices.metadataDevice 2259 } 2260 2261 func (devices *DeviceSet) getUnderlyingAvailableSpace(loopFile string) (uint64, error) { 2262 buf := new(syscall.Statfs_t) 2263 if err := syscall.Statfs(loopFile, buf); err != nil { 2264 logrus.Warnf("devmapper: Couldn't stat loopfile filesystem %v: %v", loopFile, err) 2265 return 0, err 2266 } 2267 return buf.Bfree * uint64(buf.Bsize), nil 2268 } 2269 2270 func (devices *DeviceSet) isRealFile(loopFile string) (bool, error) { 2271 if loopFile != "" { 2272 fi, err := os.Stat(loopFile) 2273 if err != nil { 2274 logrus.Warnf("devmapper: Couldn't stat loopfile %v: %v", loopFile, err) 2275 return false, err 2276 } 2277 return fi.Mode().IsRegular(), nil 2278 } 2279 return false, nil 2280 } 2281 2282 // Status returns the current status of this deviceset 2283 func (devices *DeviceSet) Status() *Status { 2284 devices.Lock() 2285 defer devices.Unlock() 2286 2287 status := &Status{} 2288 2289 status.PoolName = devices.getPoolName() 2290 status.DataFile = devices.DataDevicePath() 2291 status.DataLoopback = devices.dataLoopFile 2292 status.MetadataFile = devices.MetadataDevicePath() 2293 status.MetadataLoopback = devices.metadataLoopFile 2294 status.UdevSyncSupported = devicemapper.UdevSyncSupported() 2295 status.DeferredRemoveEnabled = devices.deferredRemove 2296 status.DeferredDeleteEnabled = devices.deferredDelete 2297 status.DeferredDeletedDeviceCount = devices.nrDeletedDevices 2298 status.BaseDeviceSize = devices.getBaseDeviceSize() 2299 status.BaseDeviceFS = devices.getBaseDeviceFS() 2300 2301 totalSizeInSectors, _, dataUsed, dataTotal, metadataUsed, metadataTotal, err := devices.poolStatus() 2302 if err == nil { 2303 // Convert from blocks to bytes 2304 blockSizeInSectors := totalSizeInSectors / dataTotal 2305 2306 status.Data.Used = dataUsed * blockSizeInSectors * 512 2307 status.Data.Total = dataTotal * blockSizeInSectors * 512 2308 status.Data.Available = status.Data.Total - status.Data.Used 2309 2310 // metadata blocks are always 4k 2311 status.Metadata.Used = metadataUsed * 4096 2312 status.Metadata.Total = metadataTotal * 4096 2313 status.Metadata.Available = status.Metadata.Total - status.Metadata.Used 2314 2315 status.SectorSize = blockSizeInSectors * 512 2316 2317 if check, _ := devices.isRealFile(devices.dataLoopFile); check { 2318 actualSpace, err := devices.getUnderlyingAvailableSpace(devices.dataLoopFile) 2319 if err == nil && actualSpace < status.Data.Available { 2320 status.Data.Available = actualSpace 2321 } 2322 } 2323 2324 if check, _ := devices.isRealFile(devices.metadataLoopFile); check { 2325 actualSpace, err := devices.getUnderlyingAvailableSpace(devices.metadataLoopFile) 2326 if err == nil && actualSpace < status.Metadata.Available { 2327 status.Metadata.Available = actualSpace 2328 } 2329 } 2330 } 2331 2332 return status 2333 } 2334 2335 // Status returns the current status of this deviceset 2336 func (devices *DeviceSet) exportDeviceMetadata(hash string) (*deviceMetadata, error) { 2337 info, err := devices.lookupDeviceWithLock(hash) 2338 if err != nil { 2339 return nil, err 2340 } 2341 2342 info.lock.Lock() 2343 defer info.lock.Unlock() 2344 2345 metadata := &deviceMetadata{info.DeviceID, info.Size, info.Name()} 2346 return metadata, nil 2347 } 2348 2349 // NewDeviceSet creates the device set based on the options provided. 2350 func NewDeviceSet(root string, doInit bool, options []string, uidMaps, gidMaps []idtools.IDMap) (*DeviceSet, error) { 2351 devicemapper.SetDevDir("/dev") 2352 2353 devices := &DeviceSet{ 2354 root: root, 2355 metaData: metaData{Devices: make(map[string]*devInfo)}, 2356 dataLoopbackSize: defaultDataLoopbackSize, 2357 metaDataLoopbackSize: defaultMetaDataLoopbackSize, 2358 baseFsSize: defaultBaseFsSize, 2359 overrideUdevSyncCheck: defaultUdevSyncOverride, 2360 doBlkDiscard: true, 2361 thinpBlockSize: defaultThinpBlockSize, 2362 deviceIDMap: make([]byte, deviceIDMapSz), 2363 deletionWorkerTicker: time.NewTicker(time.Second * 30), 2364 uidMaps: uidMaps, 2365 gidMaps: gidMaps, 2366 } 2367 2368 foundBlkDiscard := false 2369 for _, option := range options { 2370 key, val, err := parsers.ParseKeyValueOpt(option) 2371 if err != nil { 2372 return nil, err 2373 } 2374 key = strings.ToLower(key) 2375 switch key { 2376 case "dm.basesize": 2377 size, err := units.RAMInBytes(val) 2378 if err != nil { 2379 return nil, err 2380 } 2381 devices.baseFsSize = uint64(size) 2382 case "dm.loopdatasize": 2383 size, err := units.RAMInBytes(val) 2384 if err != nil { 2385 return nil, err 2386 } 2387 devices.dataLoopbackSize = size 2388 case "dm.loopmetadatasize": 2389 size, err := units.RAMInBytes(val) 2390 if err != nil { 2391 return nil, err 2392 } 2393 devices.metaDataLoopbackSize = size 2394 case "dm.fs": 2395 if val != "ext4" && val != "xfs" { 2396 return nil, fmt.Errorf("devmapper: Unsupported filesystem %s\n", val) 2397 } 2398 devices.filesystem = val 2399 case "dm.mkfsarg": 2400 devices.mkfsArgs = append(devices.mkfsArgs, val) 2401 case "dm.mountopt": 2402 devices.mountOptions = joinMountOptions(devices.mountOptions, val) 2403 case "dm.metadatadev": 2404 devices.metadataDevice = val 2405 case "dm.datadev": 2406 devices.dataDevice = val 2407 case "dm.thinpooldev": 2408 devices.thinPoolDevice = strings.TrimPrefix(val, "/dev/mapper/") 2409 case "dm.blkdiscard": 2410 foundBlkDiscard = true 2411 devices.doBlkDiscard, err = strconv.ParseBool(val) 2412 if err != nil { 2413 return nil, err 2414 } 2415 case "dm.blocksize": 2416 size, err := units.RAMInBytes(val) 2417 if err != nil { 2418 return nil, err 2419 } 2420 // convert to 512b sectors 2421 devices.thinpBlockSize = uint32(size) >> 9 2422 case "dm.override_udev_sync_check": 2423 devices.overrideUdevSyncCheck, err = strconv.ParseBool(val) 2424 if err != nil { 2425 return nil, err 2426 } 2427 2428 case "dm.use_deferred_removal": 2429 enableDeferredRemoval, err = strconv.ParseBool(val) 2430 if err != nil { 2431 return nil, err 2432 } 2433 2434 case "dm.use_deferred_deletion": 2435 enableDeferredDeletion, err = strconv.ParseBool(val) 2436 if err != nil { 2437 return nil, err 2438 } 2439 2440 default: 2441 return nil, fmt.Errorf("devmapper: Unknown option %s\n", key) 2442 } 2443 } 2444 2445 // By default, don't do blk discard hack on raw devices, its rarely useful and is expensive 2446 if !foundBlkDiscard && (devices.dataDevice != "" || devices.thinPoolDevice != "") { 2447 devices.doBlkDiscard = false 2448 } 2449 2450 if err := devices.initDevmapper(doInit); err != nil { 2451 return nil, err 2452 } 2453 2454 return devices, nil 2455 }