// Source: github.com/chenchun/docker@v1.3.2-0.20150629222414-20467faf132b/daemon/graphdriver/devmapper/deviceset.go

// +build linux

package devmapper

import (
	"encoding/json"
	"errors"
	"fmt"
	"io"
	"io/ioutil"
	"os"
	"os/exec"
	"path"
	"path/filepath"
	"strconv"
	"strings"
	"sync"
	"syscall"
	"time"

	"github.com/Sirupsen/logrus"
	"github.com/docker/docker/daemon/graphdriver"
	"github.com/docker/docker/pkg/devicemapper"
	"github.com/docker/docker/pkg/parsers"
	"github.com/docker/docker/pkg/units"
	"github.com/docker/libcontainer/label"
)

// Package-level defaults, limits and feature switches of the devicemapper
// driver. They are variables (not constants), so other code may override them.
var (
	// 100 GiB, expressed in bytes.
	DefaultDataLoopbackSize int64 = 100 * 1024 * 1024 * 1024
	// 2 GiB, expressed in bytes.
	DefaultMetaDataLoopbackSize int64 = 2 * 1024 * 1024 * 1024
	// 10 GiB, expressed in bytes.
	DefaultBaseFsSize       uint64 = 10 * 1024 * 1024 * 1024
	DefaultThinpBlockSize   uint32 = 128 // 64K = 128 512b sectors
	DefaultUdevSyncOverride bool   = false
	MaxDeviceId             int    = 0xffffff // 24 bit, pool limit
	// Size in bytes of a bitmap holding one bit per possible device id.
	DeviceIdMapSz int = (MaxDeviceId + 1) / 8
	// We retry device removal so many times that even error messages
	// would fill up the console during normal operation. So only log Fatal
	// messages by default.
	DMLogLevel                   int  = devicemapper.LogLevelFatal
	DriverDeferredRemovalSupport bool = false
	EnableDeferredRemoval        bool = false
)

// File names (inside the metadata directory) of the device-set wide metadata
// and of the open-transaction record.
const deviceSetMetaFile string = "deviceset-metadata"
const transactionMetaFile string = "transaction-metadata"

// Transaction is the JSON-serialized record of the currently open
// transaction: its id plus the hash and device id it concerns.
type Transaction struct {
	OpenTransactionId uint64 `json:"open_transaction_id"`
	DeviceIdHash      string `json:"device_hash"`
	DeviceId          int    `json:"device_id"`
}

// DevInfo is the per-device metadata record. Hash is excluded from JSON
// (`json:"-"`); the unexported fields are never serialized.
type DevInfo struct {
	Hash          string `json:"-"`
	DeviceId      int    `json:"device_id"`
	Size          uint64 `json:"size"`
	TransactionId uint64 `json:"transaction_id"`
	Initialized   bool   `json:"initialized"`
	devices       *DeviceSet

	mountCount int
	mountPath  string

	// The global DeviceSet lock guarantees that we serialize all
	// the calls to libdevmapper (which is not threadsafe), but we
	// sometimes release that lock while sleeping. In that case
	// this per-device lock is still held, protecting against
	// other accesses to the device that we're doing the wait on.
	//
	// WARNING: In order to avoid AB-BA deadlocks when releasing
	// the global lock while holding the per-device locks all
	// device locks must be acquired *before* the device lock, and
	// multiple device locks should be acquired parent before child.
	//
	// NOTE(review): the wording "all device locks ... before the device
	// lock" is ambiguous; presumably one of the two refers to the global
	// DeviceSet lock — confirm the intended order before relying on it.
	lock sync.Mutex
}

// MetaData holds the in-memory map of known devices, keyed by hash.
type MetaData struct {
	Devices     map[string]*DevInfo `json:"Devices"`
	devicesLock sync.Mutex          // Protects all read/writes to Devices map
}

// DeviceSet is the driver state for one thin pool. Only NextDeviceId and
// BaseDeviceUUID are exported without a `json:"-"` tag, so they are the only
// fields written when the DeviceSet itself is marshalled to JSON.
type DeviceSet struct {
	MetaData      `json:"-"`
	sync.Mutex    `json:"-"` // Protects Devices map and serializes calls into libdevmapper
	root          string
	devicePrefix  string
	TransactionId uint64 `json:"-"`
	NextDeviceId  int    `json:"next_device_id"`
	deviceIdMap   []byte

	// Options
	dataLoopbackSize      int64
	metaDataLoopbackSize  int64
	baseFsSize            uint64
	filesystem            string
	mountOptions          string
	mkfsArgs              []string
	dataDevice            string // block or loop dev
	dataLoopFile          string // loopback file, if used
	metadataDevice        string // block or loop dev
	metadataLoopFile      string // loopback file, if used
	doBlkDiscard          bool
	thinpBlockSize        uint32
	thinPoolDevice        string
	Transaction           `json:"-"`
	overrideUdevSyncCheck bool
	deferredRemove        bool   // use deferred removal
	BaseDeviceUUID        string // save UUID of base device
}

// DiskUsage groups used/total/available figures for one device.
type DiskUsage struct {
	Used      uint64
	Total     uint64
	Available uint64
}

// Status is a snapshot of pool-level information.
type Status struct {
	PoolName              string
	DataFile              string // actual block device for data
	DataLoopback          string // loopback file, if used
	MetadataFile          string // actual block device for metadata
	MetadataLoopback      string // loopback file, if used
	Data                  DiskUsage
	Metadata              DiskUsage
	SectorSize            uint64
	UdevSyncSupported     bool
	DeferredRemoveEnabled bool
}

// Structure used to export image/container metadata in docker inspect.
132 type DeviceMetadata struct { 133 deviceId int 134 deviceSize uint64 // size in bytes 135 deviceName string // Device name as used during activation 136 } 137 138 type DevStatus struct { 139 DeviceId int 140 Size uint64 141 TransactionId uint64 142 SizeInSectors uint64 143 MappedSectors uint64 144 HighestMappedSector uint64 145 } 146 147 func getDevName(name string) string { 148 return "/dev/mapper/" + name 149 } 150 151 func (info *DevInfo) Name() string { 152 hash := info.Hash 153 if hash == "" { 154 hash = "base" 155 } 156 return fmt.Sprintf("%s-%s", info.devices.devicePrefix, hash) 157 } 158 159 func (info *DevInfo) DevName() string { 160 return getDevName(info.Name()) 161 } 162 163 func (devices *DeviceSet) loopbackDir() string { 164 return path.Join(devices.root, "devicemapper") 165 } 166 167 func (devices *DeviceSet) metadataDir() string { 168 return path.Join(devices.root, "metadata") 169 } 170 171 func (devices *DeviceSet) metadataFile(info *DevInfo) string { 172 file := info.Hash 173 if file == "" { 174 file = "base" 175 } 176 return path.Join(devices.metadataDir(), file) 177 } 178 179 func (devices *DeviceSet) transactionMetaFile() string { 180 return path.Join(devices.metadataDir(), transactionMetaFile) 181 } 182 183 func (devices *DeviceSet) deviceSetMetaFile() string { 184 return path.Join(devices.metadataDir(), deviceSetMetaFile) 185 } 186 187 func (devices *DeviceSet) oldMetadataFile() string { 188 return path.Join(devices.loopbackDir(), "json") 189 } 190 191 func (devices *DeviceSet) getPoolName() string { 192 if devices.thinPoolDevice == "" { 193 return devices.devicePrefix + "-pool" 194 } 195 return devices.thinPoolDevice 196 } 197 198 func (devices *DeviceSet) getPoolDevName() string { 199 return getDevName(devices.getPoolName()) 200 } 201 202 func (devices *DeviceSet) hasImage(name string) bool { 203 dirname := devices.loopbackDir() 204 filename := path.Join(dirname, name) 205 206 _, err := os.Stat(filename) 207 return err == nil 208 } 209 
210 // ensureImage creates a sparse file of <size> bytes at the path 211 // <root>/devicemapper/<name>. 212 // If the file already exists, it does nothing. 213 // Either way it returns the full path. 214 func (devices *DeviceSet) ensureImage(name string, size int64) (string, error) { 215 dirname := devices.loopbackDir() 216 filename := path.Join(dirname, name) 217 218 if err := os.MkdirAll(dirname, 0700); err != nil && !os.IsExist(err) { 219 return "", err 220 } 221 222 if _, err := os.Stat(filename); err != nil { 223 if !os.IsNotExist(err) { 224 return "", err 225 } 226 logrus.Debugf("Creating loopback file %s for device-manage use", filename) 227 file, err := os.OpenFile(filename, os.O_RDWR|os.O_CREATE, 0600) 228 if err != nil { 229 return "", err 230 } 231 defer file.Close() 232 233 if err := file.Truncate(size); err != nil { 234 return "", err 235 } 236 } 237 return filename, nil 238 } 239 240 func (devices *DeviceSet) allocateTransactionId() uint64 { 241 devices.OpenTransactionId = devices.TransactionId + 1 242 return devices.OpenTransactionId 243 } 244 245 func (devices *DeviceSet) updatePoolTransactionId() error { 246 if err := devicemapper.SetTransactionId(devices.getPoolDevName(), devices.TransactionId, devices.OpenTransactionId); err != nil { 247 return fmt.Errorf("Error setting devmapper transaction ID: %s", err) 248 } 249 devices.TransactionId = devices.OpenTransactionId 250 return nil 251 } 252 253 func (devices *DeviceSet) removeMetadata(info *DevInfo) error { 254 if err := os.RemoveAll(devices.metadataFile(info)); err != nil { 255 return fmt.Errorf("Error removing metadata file %s: %s", devices.metadataFile(info), err) 256 } 257 return nil 258 } 259 260 // Given json data and file path, write it to disk 261 func (devices *DeviceSet) writeMetaFile(jsonData []byte, filePath string) error { 262 tmpFile, err := ioutil.TempFile(devices.metadataDir(), ".tmp") 263 if err != nil { 264 return fmt.Errorf("Error creating metadata file: %s", err) 265 } 266 267 
n, err := tmpFile.Write(jsonData) 268 if err != nil { 269 return fmt.Errorf("Error writing metadata to %s: %s", tmpFile.Name(), err) 270 } 271 if n < len(jsonData) { 272 return io.ErrShortWrite 273 } 274 if err := tmpFile.Sync(); err != nil { 275 return fmt.Errorf("Error syncing metadata file %s: %s", tmpFile.Name(), err) 276 } 277 if err := tmpFile.Close(); err != nil { 278 return fmt.Errorf("Error closing metadata file %s: %s", tmpFile.Name(), err) 279 } 280 if err := os.Rename(tmpFile.Name(), filePath); err != nil { 281 return fmt.Errorf("Error committing metadata file %s: %s", tmpFile.Name(), err) 282 } 283 284 return nil 285 } 286 287 func (devices *DeviceSet) saveMetadata(info *DevInfo) error { 288 jsonData, err := json.Marshal(info) 289 if err != nil { 290 return fmt.Errorf("Error encoding metadata to json: %s", err) 291 } 292 if err := devices.writeMetaFile(jsonData, devices.metadataFile(info)); err != nil { 293 return err 294 } 295 return nil 296 } 297 298 func (devices *DeviceSet) markDeviceIdUsed(deviceId int) { 299 var mask byte 300 i := deviceId % 8 301 mask = 1 << uint(i) 302 devices.deviceIdMap[deviceId/8] = devices.deviceIdMap[deviceId/8] | mask 303 } 304 305 func (devices *DeviceSet) markDeviceIdFree(deviceId int) { 306 var mask byte 307 i := deviceId % 8 308 mask = ^(1 << uint(i)) 309 devices.deviceIdMap[deviceId/8] = devices.deviceIdMap[deviceId/8] & mask 310 } 311 312 func (devices *DeviceSet) isDeviceIdFree(deviceId int) bool { 313 var mask byte 314 i := deviceId % 8 315 mask = (1 << uint(i)) 316 if (devices.deviceIdMap[deviceId/8] & mask) != 0 { 317 return false 318 } 319 return true 320 } 321 322 func (devices *DeviceSet) lookupDevice(hash string) (*DevInfo, error) { 323 devices.devicesLock.Lock() 324 defer devices.devicesLock.Unlock() 325 info := devices.Devices[hash] 326 if info == nil { 327 info = devices.loadMetadata(hash) 328 if info == nil { 329 return nil, fmt.Errorf("Unknown device %s", hash) 330 } 331 332 devices.Devices[hash] = info 
333 } 334 return info, nil 335 } 336 337 func (devices *DeviceSet) deviceFileWalkFunction(path string, finfo os.FileInfo) error { 338 339 // Skip some of the meta files which are not device files. 340 if strings.HasSuffix(finfo.Name(), ".migrated") { 341 logrus.Debugf("Skipping file %s", path) 342 return nil 343 } 344 345 if strings.HasPrefix(finfo.Name(), ".") { 346 logrus.Debugf("Skipping file %s", path) 347 return nil 348 } 349 350 if finfo.Name() == deviceSetMetaFile { 351 logrus.Debugf("Skipping file %s", path) 352 return nil 353 } 354 355 logrus.Debugf("Loading data for file %s", path) 356 357 hash := finfo.Name() 358 if hash == "base" { 359 hash = "" 360 } 361 362 dinfo := devices.loadMetadata(hash) 363 if dinfo == nil { 364 return fmt.Errorf("Error loading device metadata file %s", hash) 365 } 366 367 if dinfo.DeviceId > MaxDeviceId { 368 logrus.Errorf("Ignoring Invalid DeviceId=%d", dinfo.DeviceId) 369 return nil 370 } 371 372 devices.Lock() 373 devices.markDeviceIdUsed(dinfo.DeviceId) 374 devices.Unlock() 375 376 logrus.Debugf("Added deviceId=%d to DeviceIdMap", dinfo.DeviceId) 377 return nil 378 } 379 380 func (devices *DeviceSet) constructDeviceIdMap() error { 381 logrus.Debugf("[deviceset] constructDeviceIdMap()") 382 defer logrus.Debugf("[deviceset] constructDeviceIdMap() END") 383 384 var scan = func(path string, info os.FileInfo, err error) error { 385 if err != nil { 386 logrus.Debugf("Can't walk the file %s", path) 387 return nil 388 } 389 390 // Skip any directories 391 if info.IsDir() { 392 return nil 393 } 394 395 return devices.deviceFileWalkFunction(path, info) 396 } 397 398 return filepath.Walk(devices.metadataDir(), scan) 399 } 400 401 func (devices *DeviceSet) unregisterDevice(id int, hash string) error { 402 logrus.Debugf("unregisterDevice(%v, %v)", id, hash) 403 info := &DevInfo{ 404 Hash: hash, 405 DeviceId: id, 406 } 407 408 devices.devicesLock.Lock() 409 delete(devices.Devices, hash) 410 devices.devicesLock.Unlock() 411 412 if err := 
devices.removeMetadata(info); err != nil { 413 logrus.Debugf("Error removing metadata: %s", err) 414 return err 415 } 416 417 return nil 418 } 419 420 func (devices *DeviceSet) registerDevice(id int, hash string, size uint64, transactionId uint64) (*DevInfo, error) { 421 logrus.Debugf("registerDevice(%v, %v)", id, hash) 422 info := &DevInfo{ 423 Hash: hash, 424 DeviceId: id, 425 Size: size, 426 TransactionId: transactionId, 427 Initialized: false, 428 devices: devices, 429 } 430 431 devices.devicesLock.Lock() 432 devices.Devices[hash] = info 433 devices.devicesLock.Unlock() 434 435 if err := devices.saveMetadata(info); err != nil { 436 // Try to remove unused device 437 devices.devicesLock.Lock() 438 delete(devices.Devices, hash) 439 devices.devicesLock.Unlock() 440 return nil, err 441 } 442 443 return info, nil 444 } 445 446 func (devices *DeviceSet) activateDeviceIfNeeded(info *DevInfo) error { 447 logrus.Debugf("activateDeviceIfNeeded(%v)", info.Hash) 448 449 // Make sure deferred removal on device is canceled, if one was 450 // scheduled. 
451 if err := devices.cancelDeferredRemoval(info); err != nil { 452 return fmt.Errorf("Deivce Deferred Removal Cancellation Failed: %s", err) 453 } 454 455 if devinfo, _ := devicemapper.GetInfo(info.Name()); devinfo != nil && devinfo.Exists != 0 { 456 return nil 457 } 458 459 return devicemapper.ActivateDevice(devices.getPoolDevName(), info.Name(), info.DeviceId, info.Size) 460 } 461 462 func (devices *DeviceSet) createFilesystem(info *DevInfo) error { 463 devname := info.DevName() 464 465 args := []string{} 466 for _, arg := range devices.mkfsArgs { 467 args = append(args, arg) 468 } 469 470 args = append(args, devname) 471 472 var err error 473 switch devices.filesystem { 474 case "xfs": 475 err = exec.Command("mkfs.xfs", args...).Run() 476 case "ext4": 477 err = exec.Command("mkfs.ext4", append([]string{"-E", "nodiscard,lazy_itable_init=0,lazy_journal_init=0"}, args...)...).Run() 478 if err != nil { 479 err = exec.Command("mkfs.ext4", append([]string{"-E", "nodiscard,lazy_itable_init=0"}, args...)...).Run() 480 } 481 if err != nil { 482 return err 483 } 484 err = exec.Command("tune2fs", append([]string{"-c", "-1", "-i", "0"}, devname)...).Run() 485 default: 486 err = fmt.Errorf("Unsupported filesystem type %s", devices.filesystem) 487 } 488 if err != nil { 489 return err 490 } 491 492 return nil 493 } 494 495 func (devices *DeviceSet) migrateOldMetaData() error { 496 // Migrate old metadata file 497 jsonData, err := ioutil.ReadFile(devices.oldMetadataFile()) 498 if err != nil && !os.IsNotExist(err) { 499 return err 500 } 501 502 if jsonData != nil { 503 m := MetaData{Devices: make(map[string]*DevInfo)} 504 505 if err := json.Unmarshal(jsonData, &m); err != nil { 506 return err 507 } 508 509 for hash, info := range m.Devices { 510 info.Hash = hash 511 devices.saveMetadata(info) 512 } 513 if err := os.Rename(devices.oldMetadataFile(), devices.oldMetadataFile()+".migrated"); err != nil { 514 return err 515 } 516 517 } 518 519 return nil 520 } 521 522 func (devices 
*DeviceSet) initMetaData() error { 523 if err := devices.migrateOldMetaData(); err != nil { 524 return err 525 } 526 527 _, transactionId, _, _, _, _, err := devices.poolStatus() 528 if err != nil { 529 return err 530 } 531 532 devices.TransactionId = transactionId 533 534 if err := devices.constructDeviceIdMap(); err != nil { 535 return err 536 } 537 538 if err := devices.processPendingTransaction(); err != nil { 539 return err 540 } 541 return nil 542 } 543 544 func (devices *DeviceSet) incNextDeviceId() { 545 // Ids are 24bit, so wrap around 546 devices.NextDeviceId = (devices.NextDeviceId + 1) & MaxDeviceId 547 } 548 549 func (devices *DeviceSet) getNextFreeDeviceId() (int, error) { 550 devices.incNextDeviceId() 551 for i := 0; i <= MaxDeviceId; i++ { 552 if devices.isDeviceIdFree(devices.NextDeviceId) { 553 devices.markDeviceIdUsed(devices.NextDeviceId) 554 return devices.NextDeviceId, nil 555 } 556 devices.incNextDeviceId() 557 } 558 559 return 0, fmt.Errorf("Unable to find a free device Id") 560 } 561 562 func (devices *DeviceSet) createRegisterDevice(hash string) (*DevInfo, error) { 563 deviceId, err := devices.getNextFreeDeviceId() 564 if err != nil { 565 return nil, err 566 } 567 568 if err := devices.openTransaction(hash, deviceId); err != nil { 569 logrus.Debugf("Error opening transaction hash = %s deviceId = %d", hash, deviceId) 570 devices.markDeviceIdFree(deviceId) 571 return nil, err 572 } 573 574 for { 575 if err := devicemapper.CreateDevice(devices.getPoolDevName(), deviceId); err != nil { 576 if devicemapper.DeviceIdExists(err) { 577 // Device Id already exists. This should not 578 // happen. Now we have a mechianism to find 579 // a free device Id. So something is not right. 580 // Give a warning and continue. 
581 logrus.Errorf("Device Id %d exists in pool but it is supposed to be unused", deviceId) 582 deviceId, err = devices.getNextFreeDeviceId() 583 if err != nil { 584 return nil, err 585 } 586 // Save new device id into transaction 587 devices.refreshTransaction(deviceId) 588 continue 589 } 590 logrus.Debugf("Error creating device: %s", err) 591 devices.markDeviceIdFree(deviceId) 592 return nil, err 593 } 594 break 595 } 596 597 logrus.Debugf("Registering device (id %v) with FS size %v", deviceId, devices.baseFsSize) 598 info, err := devices.registerDevice(deviceId, hash, devices.baseFsSize, devices.OpenTransactionId) 599 if err != nil { 600 _ = devicemapper.DeleteDevice(devices.getPoolDevName(), deviceId) 601 devices.markDeviceIdFree(deviceId) 602 return nil, err 603 } 604 605 if err := devices.closeTransaction(); err != nil { 606 devices.unregisterDevice(deviceId, hash) 607 devicemapper.DeleteDevice(devices.getPoolDevName(), deviceId) 608 devices.markDeviceIdFree(deviceId) 609 return nil, err 610 } 611 return info, nil 612 } 613 614 func (devices *DeviceSet) createRegisterSnapDevice(hash string, baseInfo *DevInfo) error { 615 deviceId, err := devices.getNextFreeDeviceId() 616 if err != nil { 617 return err 618 } 619 620 if err := devices.openTransaction(hash, deviceId); err != nil { 621 logrus.Debugf("Error opening transaction hash = %s deviceId = %d", hash, deviceId) 622 devices.markDeviceIdFree(deviceId) 623 return err 624 } 625 626 for { 627 if err := devicemapper.CreateSnapDevice(devices.getPoolDevName(), deviceId, baseInfo.Name(), baseInfo.DeviceId); err != nil { 628 if devicemapper.DeviceIdExists(err) { 629 // Device Id already exists. This should not 630 // happen. Now we have a mechianism to find 631 // a free device Id. So something is not right. 632 // Give a warning and continue. 
633 logrus.Errorf("Device Id %d exists in pool but it is supposed to be unused", deviceId) 634 deviceId, err = devices.getNextFreeDeviceId() 635 if err != nil { 636 return err 637 } 638 // Save new device id into transaction 639 devices.refreshTransaction(deviceId) 640 continue 641 } 642 logrus.Debugf("Error creating snap device: %s", err) 643 devices.markDeviceIdFree(deviceId) 644 return err 645 } 646 break 647 } 648 649 if _, err := devices.registerDevice(deviceId, hash, baseInfo.Size, devices.OpenTransactionId); err != nil { 650 devicemapper.DeleteDevice(devices.getPoolDevName(), deviceId) 651 devices.markDeviceIdFree(deviceId) 652 logrus.Debugf("Error registering device: %s", err) 653 return err 654 } 655 656 if err := devices.closeTransaction(); err != nil { 657 devices.unregisterDevice(deviceId, hash) 658 devicemapper.DeleteDevice(devices.getPoolDevName(), deviceId) 659 devices.markDeviceIdFree(deviceId) 660 return err 661 } 662 return nil 663 } 664 665 func (devices *DeviceSet) loadMetadata(hash string) *DevInfo { 666 info := &DevInfo{Hash: hash, devices: devices} 667 668 jsonData, err := ioutil.ReadFile(devices.metadataFile(info)) 669 if err != nil { 670 return nil 671 } 672 673 if err := json.Unmarshal(jsonData, &info); err != nil { 674 return nil 675 } 676 677 return info 678 } 679 680 func getDeviceUUID(device string) (string, error) { 681 out, err := exec.Command("blkid", "-s", "UUID", "-o", "value", device).Output() 682 if err != nil { 683 logrus.Debugf("Failed to find uuid for device %s:%v", device, err) 684 return "", err 685 } 686 687 uuid := strings.TrimSuffix(string(out), "\n") 688 uuid = strings.TrimSpace(uuid) 689 logrus.Debugf("UUID for device: %s is:%s", device, uuid) 690 return uuid, nil 691 } 692 693 func (devices *DeviceSet) verifyBaseDeviceUUID(baseInfo *DevInfo) error { 694 if err := devices.activateDeviceIfNeeded(baseInfo); err != nil { 695 return err 696 } 697 698 defer devices.deactivateDevice(baseInfo) 699 700 uuid, err := 
getDeviceUUID(baseInfo.DevName()) 701 if err != nil { 702 return err 703 } 704 705 if devices.BaseDeviceUUID != uuid { 706 return fmt.Errorf("Current Base Device UUID:%s does not match with stored UUID:%s", uuid, devices.BaseDeviceUUID) 707 } 708 709 return nil 710 } 711 712 func (devices *DeviceSet) saveBaseDeviceUUID(baseInfo *DevInfo) error { 713 if err := devices.activateDeviceIfNeeded(baseInfo); err != nil { 714 return err 715 } 716 717 defer devices.deactivateDevice(baseInfo) 718 719 uuid, err := getDeviceUUID(baseInfo.DevName()) 720 if err != nil { 721 return err 722 } 723 724 devices.BaseDeviceUUID = uuid 725 devices.saveDeviceSetMetaData() 726 return nil 727 } 728 729 func (devices *DeviceSet) setupBaseImage() error { 730 oldInfo, _ := devices.lookupDevice("") 731 if oldInfo != nil && oldInfo.Initialized { 732 // If BaseDeviceUUID is nil (upgrade case), save it and 733 // return success. 734 if devices.BaseDeviceUUID == "" { 735 if err := devices.saveBaseDeviceUUID(oldInfo); err != nil { 736 return fmt.Errorf("Could not query and save base device UUID:%v", err) 737 } 738 return nil 739 } 740 741 if err := devices.verifyBaseDeviceUUID(oldInfo); err != nil { 742 return fmt.Errorf("Base Device UUID verification failed. 
Possibly using a different thin pool then last invocation:%v", err) 743 } 744 return nil 745 } 746 747 if oldInfo != nil && !oldInfo.Initialized { 748 logrus.Debugf("Removing uninitialized base image") 749 if err := devices.DeleteDevice(""); err != nil { 750 return err 751 } 752 } 753 754 if devices.thinPoolDevice != "" && oldInfo == nil { 755 _, transactionId, dataUsed, _, _, _, err := devices.poolStatus() 756 if err != nil { 757 return err 758 } 759 if dataUsed != 0 { 760 return fmt.Errorf("Unable to take ownership of thin-pool (%s) that already has used data blocks", 761 devices.thinPoolDevice) 762 } 763 if transactionId != 0 { 764 return fmt.Errorf("Unable to take ownership of thin-pool (%s) with non-zero transaction Id", 765 devices.thinPoolDevice) 766 } 767 } 768 769 logrus.Debugf("Initializing base device-mapper thin volume") 770 771 // Create initial device 772 info, err := devices.createRegisterDevice("") 773 if err != nil { 774 return err 775 } 776 777 logrus.Debugf("Creating filesystem on base device-mapper thin volume") 778 779 if err := devices.activateDeviceIfNeeded(info); err != nil { 780 return err 781 } 782 783 if err := devices.createFilesystem(info); err != nil { 784 return err 785 } 786 787 info.Initialized = true 788 if err := devices.saveMetadata(info); err != nil { 789 info.Initialized = false 790 return err 791 } 792 793 if err := devices.saveBaseDeviceUUID(info); err != nil { 794 return fmt.Errorf("Could not query and save base device UUID:%v", err) 795 } 796 797 return nil 798 } 799 800 func setCloseOnExec(name string) { 801 if fileInfos, _ := ioutil.ReadDir("/proc/self/fd"); fileInfos != nil { 802 for _, i := range fileInfos { 803 link, _ := os.Readlink(filepath.Join("/proc/self/fd", i.Name())) 804 if link == name { 805 fd, err := strconv.Atoi(i.Name()) 806 if err == nil { 807 syscall.CloseOnExec(fd) 808 } 809 } 810 } 811 } 812 } 813 814 func (devices *DeviceSet) DMLog(level int, file string, line int, dmError int, message string) { 815 
// By default libdm sends us all the messages including debug ones. 816 // We need to filter out messages here and figure out which one 817 // should be printed. 818 if level > DMLogLevel { 819 return 820 } 821 822 // FIXME(vbatts) push this back into ./pkg/devicemapper/ 823 if level <= devicemapper.LogLevelErr { 824 logrus.Errorf("libdevmapper(%d): %s:%d (%d) %s", level, file, line, dmError, message) 825 } else if level <= devicemapper.LogLevelInfo { 826 logrus.Infof("libdevmapper(%d): %s:%d (%d) %s", level, file, line, dmError, message) 827 } else { 828 // FIXME(vbatts) push this back into ./pkg/devicemapper/ 829 logrus.Debugf("libdevmapper(%d): %s:%d (%d) %s", level, file, line, dmError, message) 830 } 831 } 832 833 func major(device uint64) uint64 { 834 return (device >> 8) & 0xfff 835 } 836 837 func minor(device uint64) uint64 { 838 return (device & 0xff) | ((device >> 12) & 0xfff00) 839 } 840 841 func (devices *DeviceSet) ResizePool(size int64) error { 842 dirname := devices.loopbackDir() 843 datafilename := path.Join(dirname, "data") 844 if len(devices.dataDevice) > 0 { 845 datafilename = devices.dataDevice 846 } 847 metadatafilename := path.Join(dirname, "metadata") 848 if len(devices.metadataDevice) > 0 { 849 metadatafilename = devices.metadataDevice 850 } 851 852 datafile, err := os.OpenFile(datafilename, os.O_RDWR, 0) 853 if datafile == nil { 854 return err 855 } 856 defer datafile.Close() 857 858 fi, err := datafile.Stat() 859 if fi == nil { 860 return err 861 } 862 863 if fi.Size() > size { 864 return fmt.Errorf("Can't shrink file") 865 } 866 867 dataloopback := devicemapper.FindLoopDeviceFor(datafile) 868 if dataloopback == nil { 869 return fmt.Errorf("Unable to find loopback mount for: %s", datafilename) 870 } 871 defer dataloopback.Close() 872 873 metadatafile, err := os.OpenFile(metadatafilename, os.O_RDWR, 0) 874 if metadatafile == nil { 875 return err 876 } 877 defer metadatafile.Close() 878 879 metadataloopback := 
devicemapper.FindLoopDeviceFor(metadatafile) 880 if metadataloopback == nil { 881 return fmt.Errorf("Unable to find loopback mount for: %s", metadatafilename) 882 } 883 defer metadataloopback.Close() 884 885 // Grow loopback file 886 if err := datafile.Truncate(size); err != nil { 887 return fmt.Errorf("Unable to grow loopback file: %s", err) 888 } 889 890 // Reload size for loopback device 891 if err := devicemapper.LoopbackSetCapacity(dataloopback); err != nil { 892 return fmt.Errorf("Unable to update loopback capacity: %s", err) 893 } 894 895 // Suspend the pool 896 if err := devicemapper.SuspendDevice(devices.getPoolName()); err != nil { 897 return fmt.Errorf("Unable to suspend pool: %s", err) 898 } 899 900 // Reload with the new block sizes 901 if err := devicemapper.ReloadPool(devices.getPoolName(), dataloopback, metadataloopback, devices.thinpBlockSize); err != nil { 902 return fmt.Errorf("Unable to reload pool: %s", err) 903 } 904 905 // Resume the pool 906 if err := devicemapper.ResumeDevice(devices.getPoolName()); err != nil { 907 return fmt.Errorf("Unable to resume pool: %s", err) 908 } 909 910 return nil 911 } 912 913 func (devices *DeviceSet) loadTransactionMetaData() error { 914 jsonData, err := ioutil.ReadFile(devices.transactionMetaFile()) 915 if err != nil { 916 // There is no active transaction. This will be the case 917 // during upgrade. 
918 if os.IsNotExist(err) { 919 devices.OpenTransactionId = devices.TransactionId 920 return nil 921 } 922 return err 923 } 924 925 json.Unmarshal(jsonData, &devices.Transaction) 926 return nil 927 } 928 929 func (devices *DeviceSet) saveTransactionMetaData() error { 930 jsonData, err := json.Marshal(&devices.Transaction) 931 if err != nil { 932 return fmt.Errorf("Error encoding metadata to json: %s", err) 933 } 934 935 return devices.writeMetaFile(jsonData, devices.transactionMetaFile()) 936 } 937 938 func (devices *DeviceSet) removeTransactionMetaData() error { 939 if err := os.RemoveAll(devices.transactionMetaFile()); err != nil { 940 return err 941 } 942 return nil 943 } 944 945 func (devices *DeviceSet) rollbackTransaction() error { 946 logrus.Debugf("Rolling back open transaction: TransactionId=%d hash=%s device_id=%d", devices.OpenTransactionId, devices.DeviceIdHash, devices.DeviceId) 947 948 // A device id might have already been deleted before transaction 949 // closed. In that case this call will fail. Just leave a message 950 // in case of failure. 951 if err := devicemapper.DeleteDevice(devices.getPoolDevName(), devices.DeviceId); err != nil { 952 logrus.Errorf("Unable to delete device: %s", err) 953 } 954 955 dinfo := &DevInfo{Hash: devices.DeviceIdHash} 956 if err := devices.removeMetadata(dinfo); err != nil { 957 logrus.Errorf("Unable to remove metadata: %s", err) 958 } else { 959 devices.markDeviceIdFree(devices.DeviceId) 960 } 961 962 if err := devices.removeTransactionMetaData(); err != nil { 963 logrus.Errorf("Unable to remove transaction meta file %s: %s", devices.transactionMetaFile(), err) 964 } 965 966 return nil 967 } 968 969 func (devices *DeviceSet) processPendingTransaction() error { 970 if err := devices.loadTransactionMetaData(); err != nil { 971 return err 972 } 973 974 // If there was open transaction but pool transaction Id is same 975 // as open transaction Id, nothing to roll back. 
976 if devices.TransactionId == devices.OpenTransactionId { 977 return nil 978 } 979 980 // If open transaction Id is less than pool transaction Id, something 981 // is wrong. Bail out. 982 if devices.OpenTransactionId < devices.TransactionId { 983 logrus.Errorf("Open Transaction id %d is less than pool transaction id %d", devices.OpenTransactionId, devices.TransactionId) 984 return nil 985 } 986 987 // Pool transaction Id is not same as open transaction. There is 988 // a transaction which was not completed. 989 if err := devices.rollbackTransaction(); err != nil { 990 return fmt.Errorf("Rolling back open transaction failed: %s", err) 991 } 992 993 devices.OpenTransactionId = devices.TransactionId 994 return nil 995 }

// loadDeviceSetMetaData reads the deviceset metadata file and unmarshals
// its JSON content into devices. A missing file is not an error.
func (devices *DeviceSet) loadDeviceSetMetaData() error {
	jsonData, err := ioutil.ReadFile(devices.deviceSetMetaFile())
	if err != nil {
		// For backward compatibility return success if file does
		// not exist.
		if os.IsNotExist(err) {
			return nil
		}
		return err
	}

	return json.Unmarshal(jsonData, devices)
}

// saveDeviceSetMetaData marshals devices to JSON and writes the result to
// the deviceset metadata file.
func (devices *DeviceSet) saveDeviceSetMetaData() error {
	jsonData, err := json.Marshal(devices)
	if err != nil {
		return fmt.Errorf("Error encoding metadata to json: %s", err)
	}

	return devices.writeMetaFile(jsonData, devices.deviceSetMetaFile())
}

// openTransaction allocates a new transaction id, records the device hash
// and device id the transaction operates on, and persists the transaction
// metadata.
func (devices *DeviceSet) openTransaction(hash string, DeviceId int) error {
	devices.allocateTransactionId()
	devices.DeviceIdHash = hash
	devices.DeviceId = DeviceId
	if err := devices.saveTransactionMetaData(); err != nil {
		return fmt.Errorf("Error saving transaction metadata: %s", err)
	}
	return nil
}

// refreshTransaction updates the device id of the currently recorded
// transaction and persists the transaction metadata again.
func (devices *DeviceSet) refreshTransaction(DeviceId int) error {
	devices.DeviceId = DeviceId
	if err := devices.saveTransactionMetaData(); err != nil {
		return fmt.Errorf("Error saving transaction metadata: %s", err)
	}
	return nil
}

// closeTransaction completes the open transaction by updating the pool
// transaction id.
func (devices *DeviceSet) closeTransaction() error {
	if err := devices.updatePoolTransactionId(); err != nil {
		logrus.Debugf("Failed to close Transaction")
		return err
	}
	return nil
}

// determineDriverCapabilities parses the device-mapper driver version
// string ("major.minor.patch") and sets DriverDeferredRemovalSupport when
// the driver is version 4.27.0 or newer.
//
// It returns graphdriver.ErrNotSupported when the major component is not a
// number, or when the major component is 4 and the minor component is
// missing or not a number.
func determineDriverCapabilities(version string) error {
	/*
	 * Driver version 4.27.0 and greater support deferred removal
	 * feature.
	 */

	logrus.Debugf("devicemapper: driver version is %s", version)

	versionSplit := strings.Split(version, ".")
	major, err := strconv.Atoi(versionSplit[0])
	if err != nil {
		return graphdriver.ErrNotSupported
	}

	if major > 4 {
		DriverDeferredRemovalSupport = true
		return nil
	}

	if major < 4 {
		return nil
	}

	// The minor component is only needed for major == 4. A version string
	// without one cannot be evaluated; treat it like any other unparsable
	// version instead of indexing past the end of the slice.
	if len(versionSplit) < 2 {
		return graphdriver.ErrNotSupported
	}

	minor, err := strconv.Atoi(versionSplit[1])
	if err != nil {
		return graphdriver.ErrNotSupported
	}

	/*
	 * If major is 4 and minor is 27, then there is no need to
	 * check for patch level as it can not be less than 0.
	 */
	if minor >= 27 {
		DriverDeferredRemovalSupport = true
		return nil
	}

	return nil
}

// initDevmapper prepares the DeviceSet for use: it registers devices as the
// libdm log handler, checks driver capabilities and udev sync support,
// creates the metadata directory, derives the device name prefix from the
// root directory, creates the thin pool (and its loopback files) if it does
// not exist and no external thin pool was configured, loads the persisted
// metadata and, when doInit is true, sets up the base image.
//
// When doInit is false, missing loopback files are reported as an error
// instead of being created.
func (devices *DeviceSet) initDevmapper(doInit bool) error {
	// give ourselves to libdm as a log handler
	devicemapper.LogInit(devices)

	version, err := devicemapper.GetDriverVersion()
	if err != nil {
		// Can't even get driver version, assume not supported
		return graphdriver.ErrNotSupported
	}

	if err := determineDriverCapabilities(version); err != nil {
		return graphdriver.ErrNotSupported
	}

	// If user asked for deferred removal and both library and driver
	// supports deferred removal use it.
	if EnableDeferredRemoval && DriverDeferredRemovalSupport && devicemapper.LibraryDeferredRemovalSupport {
		logrus.Debugf("devmapper: Deferred removal support enabled.")
		devices.deferredRemove = true
	}

	// https://github.com/docker/docker/issues/4036
	if supported := devicemapper.UdevSetSyncSupport(true); !supported {
		logrus.Errorf("Udev sync is not supported. This will lead to unexpected behavior, data loss and errors. For more information, see https://docs.docker.com/reference/commandline/cli/#daemon-storage-driver-option")
		if !devices.overrideUdevSyncCheck {
			return graphdriver.ErrNotSupported
		}
	}

	if err := os.MkdirAll(devices.metadataDir(), 0700); err != nil && !os.IsExist(err) {
		return err
	}

	// Set the device prefix from the device id and inode of the docker root dir

	st, err := os.Stat(devices.root)
	if err != nil {
		return fmt.Errorf("Error looking up dir %s: %s", devices.root, err)
	}
	sysSt := st.Sys().(*syscall.Stat_t)
	// "reg-" stands for "regular file".
	// In the future we might use "dev-" for "device file", etc.
	// docker-maj,min[-inode] stands for:
	//	- Managed by docker
	//	- The target of this device is at major <maj> and minor <min>
	//	- If <inode> is defined, use that file inside the device as a loopback image. Otherwise use the device itself.
	devices.devicePrefix = fmt.Sprintf("docker-%d:%d-%d", major(sysSt.Dev), minor(sysSt.Dev), sysSt.Ino)
	logrus.Debugf("Generated prefix: %s", devices.devicePrefix)

	// Check for the existence of the thin-pool device
	logrus.Debugf("Checking for existence of the pool '%s'", devices.getPoolName())
	info, err := devicemapper.GetInfo(devices.getPoolName())
	if info == nil {
		logrus.Debugf("Error device devicemapper.GetInfo: %s", err)
		return err
	}

	// It seems libdevmapper opens this without O_CLOEXEC, and go exec will not close files
	// that are not Close-on-exec, and lxc-start will die if it inherits any unexpected files,
	// so we add this badhack to make sure it closes itself
	setCloseOnExec("/dev/mapper/control")

	// Make sure the sparse images exist in <root>/devicemapper/data and
	// <root>/devicemapper/metadata

	createdLoopback := false

	// If the pool doesn't exist, create it
	if info.Exists == 0 && devices.thinPoolDevice == "" {
		logrus.Debugf("Pool doesn't exist. Creating it.")

		var (
			dataFile     *os.File
			metadataFile *os.File
		)

		if devices.dataDevice == "" {
			// Make sure the sparse images exist in <root>/devicemapper/data

			hasData := devices.hasImage("data")

			if !doInit && !hasData {
				return errors.New("Loopback data file not found")
			}

			if !hasData {
				createdLoopback = true
			}

			data, err := devices.ensureImage("data", devices.dataLoopbackSize)
			if err != nil {
				logrus.Debugf("Error device ensureImage (data): %s", err)
				return err
			}

			dataFile, err = devicemapper.AttachLoopDevice(data)
			if err != nil {
				return err
			}
			devices.dataLoopFile = data
			devices.dataDevice = dataFile.Name()
		} else {
			dataFile, err = os.OpenFile(devices.dataDevice, os.O_RDWR, 0600)
			if err != nil {
				return err
			}
		}
		defer dataFile.Close()

		if devices.metadataDevice == "" {
			// Make sure the sparse images exist in <root>/devicemapper/metadata

			hasMetadata := devices.hasImage("metadata")

			if !doInit && !hasMetadata {
				return errors.New("Loopback metadata file not found")
			}

			if !hasMetadata {
				createdLoopback = true
			}

			metadata, err := devices.ensureImage("metadata", devices.metaDataLoopbackSize)
			if err != nil {
				logrus.Debugf("Error device ensureImage (metadata): %s", err)
				return err
			}

			metadataFile, err = devicemapper.AttachLoopDevice(metadata)
			if err != nil {
				return err
			}
			devices.metadataLoopFile = metadata
			devices.metadataDevice = metadataFile.Name()
		} else {
			metadataFile, err = os.OpenFile(devices.metadataDevice, os.O_RDWR, 0600)
			if err != nil {
				return err
			}
		}
		defer metadataFile.Close()

		if err := devicemapper.CreatePool(devices.getPoolName(), dataFile, metadataFile, devices.thinpBlockSize); err != nil {
			return err
		}
	}

	// If we didn't just create the data or metadata image, we need to
	// load the transaction id and migrate old metadata
	if !createdLoopback {
		if err := devices.initMetaData(); err != nil {
			return err
		}
	}

	// Right now this loads only NextDeviceId. If there is more metadata
	// down the line, we might have to move it earlier.
	if err := devices.loadDeviceSetMetaData(); err != nil {
		return err
	}

	// Setup the base image
	if doInit {
		if err := devices.setupBaseImage(); err != nil {
			logrus.Debugf("Error device setupBaseImage: %s", err)
			return err
		}
	}

	return nil
}

// AddDevice creates and registers a new snapshot device named hash on top
// of the existing device baseHash. It fails if baseHash is unknown or if a
// device named hash already exists.
func (devices *DeviceSet) AddDevice(hash, baseHash string) error {
	logrus.Debugf("[deviceset] AddDevice(hash=%s basehash=%s)", hash, baseHash)
	defer logrus.Debugf("[deviceset] AddDevice(hash=%s basehash=%s) END", hash, baseHash)

	baseInfo, err := devices.lookupDevice(baseHash)
	if err != nil {
		return err
	}

	// Per-device lock first, then the global lock.
	baseInfo.lock.Lock()
	defer baseInfo.lock.Unlock()

	devices.Lock()
	defer devices.Unlock()

	if info, _ := devices.lookupDevice(hash); info != nil {
		return fmt.Errorf("device %s already exists", hash)
	}

	if err := devices.createRegisterSnapDevice(hash, baseInfo); err != nil {
		return err
	}

	return nil
}

// deleteDevice removes the active dm device for info (if any), then deletes
// the thin device from the pool inside a transaction, unregisters it and
// marks its device id as free. When doBlkDiscard is set, the device's
// blocks are discarded first on a best-effort basis.
func (devices *DeviceSet) deleteDevice(info *DevInfo) error {
	if devices.doBlkDiscard {
		// This is a workaround for the kernel not discarding blocks on
		// the thin pool when we remove a thinp device, so we do it
		// manually
		if err := devices.activateDeviceIfNeeded(info); err == nil {
			if err := devicemapper.BlockDeviceDiscard(info.DevName()); err != nil {
				logrus.Debugf("Error discarding block on device: %s (ignoring)", err)
			}
		}
	}

	devinfo, _ := devicemapper.GetInfo(info.Name())
	if devinfo != nil && devinfo.Exists != 0 {
		if err := devices.removeDevice(info.Name()); err != nil {
			logrus.Debugf("Error removing device: %s", err)
			return err
		}
	}

	if err := devices.openTransaction(info.Hash, info.DeviceId); err != nil {
		logrus.Debugf("Error opening transaction hash = %s deviceId = %d", info.Hash, info.DeviceId)
		return err
	}

	if err := devicemapper.DeleteDevice(devices.getPoolDevName(), info.DeviceId); err != nil {
		logrus.Debugf("Error deleting device: %s", err)
		return err
	}

	if err := devices.unregisterDevice(info.DeviceId, info.Hash); err != nil {
		return err
	}

	if err := devices.closeTransaction(); err != nil {
		return err
	}

	devices.markDeviceIdFree(info.DeviceId)

	return nil
}

// DeleteDevice looks up the device named hash and deletes it while holding
// both the per-device lock and the global DeviceSet lock.
func (devices *DeviceSet) DeleteDevice(hash string) error {
	info, err := devices.lookupDevice(hash)
	if err != nil {
		return err
	}

	info.lock.Lock()
	defer info.lock.Unlock()

	devices.Lock()
	defer devices.Unlock()

	return devices.deleteDevice(info)
}

// deactivatePool removes the thin-pool dm device if it currently exists.
func (devices *DeviceSet) deactivatePool() error {
	logrus.Debugf("[devmapper] deactivatePool()")
	defer logrus.Debugf("[devmapper] deactivatePool END")
	devname := devices.getPoolDevName()

	devinfo, err := devicemapper.GetInfo(devname)
	if err != nil {
		return err
	}
	if d, err := devicemapper.GetDeps(devname); err == nil {
		// Access to more Debug output
		logrus.Debugf("[devmapper] devicemapper.GetDeps() %s: %#v", devname, d)
	}
	if devinfo.Exists != 0 {
		return devicemapper.RemoveDevice(devname)
	}

	return nil
}

// deactivateDevice removes the dm device backing info if it exists, using
// deferred removal when that is enabled and a retried synchronous removal
// otherwise.
func (devices *DeviceSet) deactivateDevice(info *DevInfo) error {
	logrus.Debugf("[devmapper] deactivateDevice(%s)", info.Hash)
	defer logrus.Debugf("[devmapper] deactivateDevice END(%s)", info.Hash)

	devinfo, err := devicemapper.GetInfo(info.Name())
	if err != nil {
		return err
	}

	if devinfo.Exists == 0 {
		return nil
	}

	if devices.deferredRemove {
		if err := devicemapper.RemoveDeviceDeferred(info.Name()); err != nil {
			return err
		}
	} else {
		if err := devices.removeDevice(info.Name()); err != nil {
			return err
		}
	}
	return nil
}

// removeDevice issues the underlying dm remove operation, retrying up to
// 200 times with a 100ms pause while the device reports ErrBusy. Any other
// error is returned immediately.
//
// The DeviceSet lock must be held by the caller: it is released for the
// duration of each pause and re-acquired afterwards.
func (devices *DeviceSet) removeDevice(devname string) error {
	var err error

	logrus.Debugf("[devmapper] removeDevice START(%s)", devname)
	defer logrus.Debugf("[devmapper] removeDevice END(%s)", devname)

	for i := 0; i < 200; i++ {
		err = devicemapper.RemoveDevice(devname)
		if err == nil {
			break
		}
		if err != devicemapper.ErrBusy {
			return err
		}

		// If we see EBUSY it may be a transient error,
		// sleep a bit a retry a few times.
		devices.Unlock()
		time.Sleep(100 * time.Millisecond)
		devices.Lock()
	}

	return err
}

// cancelDeferredRemoval cancels a pending deferred removal of the dm device
// backing info. It is a no-op when deferred removal is disabled or when the
// device has no deferred removal scheduled. The cancel is retried up to 100
// times with a 100ms pause while the device reports ErrBusy; ErrEnxio is
// treated as success.
//
// The DeviceSet lock must be held by the caller: it is released for the
// duration of each pause and re-acquired afterwards.
func (devices *DeviceSet) cancelDeferredRemoval(info *DevInfo) error {
	if !devices.deferredRemove {
		return nil
	}

	logrus.Debugf("[devmapper] cancelDeferredRemoval START(%s)", info.Name())
	defer logrus.Debugf("[devmapper] cancelDeferredRemoval END(%s)", info.Name())

	devinfo, err := devicemapper.GetInfoWithDeferred(info.Name())

	if devinfo != nil && devinfo.DeferredRemove == 0 {
		return nil
	}

	// Cancel deferred remove
	for i := 0; i < 100; i++ {
		err = devicemapper.CancelDeferredRemove(info.Name())
		if err == nil {
			break
		}

		if err == devicemapper.ErrEnxio {
			// Device is probably already gone. Return success.
			return nil
		}

		if err != devicemapper.ErrBusy {
			return err
		}

		// If we see EBUSY it may be a transient error,
		// sleep a bit a retry a few times.
		devices.Unlock()
		time.Sleep(100 * time.Millisecond)
		devices.Lock()
	}
	return err
}

// Shutdown lazily unmounts and deactivates every mounted device,
// deactivates the base device, deactivates the pool when it is managed by
// this DeviceSet (no external thin pool configured) and saves the deviceset
// metadata. Failures are logged at debug level; Shutdown always returns nil.
func (devices *DeviceSet) Shutdown() error {
	logrus.Debugf("[deviceset %s] Shutdown()", devices.devicePrefix)
	logrus.Debugf("[devmapper] Shutting down DeviceSet: %s", devices.root)
	defer logrus.Debugf("[deviceset %s] Shutdown() END", devices.devicePrefix)

	var devs []*DevInfo

	// Snapshot the device list so the map lock is not held while
	// unmounting and deactivating.
	devices.devicesLock.Lock()
	for _, info := range devices.Devices {
		devs = append(devs, info)
	}
	devices.devicesLock.Unlock()

	for _, info := range devs {
		info.lock.Lock()
		if info.mountCount > 0 {
			// We use MNT_DETACH here in case it is still busy in some running
			// container. This means it'll go away from the global scope directly,
			// and the device will be released when that container dies.
			if err := syscall.Unmount(info.mountPath, syscall.MNT_DETACH); err != nil {
				logrus.Debugf("Shutdown unmounting %s, error: %s", info.mountPath, err)
			}

			devices.Lock()
			if err := devices.deactivateDevice(info); err != nil {
				logrus.Debugf("Shutdown deactivate %s , error: %s", info.Hash, err)
			}
			devices.Unlock()
		}
		info.lock.Unlock()
	}

	// The base device is registered under the empty hash.
	info, _ := devices.lookupDevice("")
	if info != nil {
		info.lock.Lock()
		devices.Lock()
		if err := devices.deactivateDevice(info); err != nil {
			logrus.Debugf("Shutdown deactivate base , error: %s", err)
		}
		devices.Unlock()
		info.lock.Unlock()
	}

	devices.Lock()
	if devices.thinPoolDevice == "" {
		if err := devices.deactivatePool(); err != nil {
			logrus.Debugf("Shutdown deactivate pool , error: %s", err)
		}
	}

	// Best effort, like the rest of Shutdown, but do not hide the failure.
	if err := devices.saveDeviceSetMetaData(); err != nil {
		logrus.Debugf("Shutdown saving deviceset metadata , error: %s", err)
	}
	devices.Unlock()

	return nil
}

// MountDevice activates the device named hash and mounts it on path with
// the given mount label. If the device is already mounted on the same path
// only its mount count is incremented; mounting it on a different path is
// an error.
func (devices *DeviceSet) MountDevice(hash, path, mountLabel string) error {
	info, err := devices.lookupDevice(hash)
	if err != nil {
		return err
	}

	info.lock.Lock()
	defer info.lock.Unlock()

	devices.Lock()
	defer devices.Unlock()

	if info.mountCount > 0 {
		if path != info.mountPath {
			return fmt.Errorf("Trying to mount devmapper device in multiple places (%s, %s)", info.mountPath, path)
		}

		info.mountCount++
		return nil
	}

	if err := devices.activateDeviceIfNeeded(info); err != nil {
		return fmt.Errorf("Error activating devmapper device for '%s': %s", hash, err)
	}

	var flags uintptr = syscall.MS_MGC_VAL

	fstype, err := ProbeFsType(info.DevName())
	if err != nil {
		return err
	}

	options := ""

	if fstype == "xfs" {
		// XFS needs nouuid or it can't mount filesystems with the same fs
		options = joinMountOptions(options, "nouuid")
	}

	options = joinMountOptions(options, devices.mountOptions)
	options = joinMountOptions(options, label.FormatMountLabel("", mountLabel))

	if err := syscall.Mount(info.DevName(), path, fstype, flags, options); err != nil {
		return fmt.Errorf("Error mounting '%s' on '%s': %s", info.DevName(), path, err)
	}

	info.mountCount = 1
	info.mountPath = path

	return nil
}

// UnmountDevice decrements the mount count of the device named hash and,
// when it reaches zero, lazily unmounts it and deactivates the device. It
// is an error to unmount a device whose mount count is already zero.
func (devices *DeviceSet) UnmountDevice(hash string) error {
	logrus.Debugf("[devmapper] UnmountDevice(hash=%s)", hash)
	defer logrus.Debugf("[devmapper] UnmountDevice(hash=%s) END", hash)

	info, err := devices.lookupDevice(hash)
	if err != nil {
		return err
	}

	info.lock.Lock()
	defer info.lock.Unlock()

	devices.Lock()
	defer devices.Unlock()

	if info.mountCount == 0 {
		return fmt.Errorf("UnmountDevice: device not-mounted id %s", hash)
	}

	info.mountCount--
	if info.mountCount > 0 {
		return nil
	}

	logrus.Debugf("[devmapper] Unmount(%s)", info.mountPath)
	if err := syscall.Unmount(info.mountPath, syscall.MNT_DETACH); err != nil {
		return err
	}
	logrus.Debugf("[devmapper] Unmount done")

	if err := devices.deactivateDevice(info); err != nil {
		return err
	}

	info.mountPath = ""

	return nil
}

// HasDevice reports whether a device named hash is known to the DeviceSet.
func (devices *DeviceSet) HasDevice(hash string) bool {
	devices.Lock()
	defer devices.Unlock()

	info, _ := devices.lookupDevice(hash)
	return info != nil
}

// HasActivatedDevice reports whether the device named hash is known and its
// dm device currently exists.
func (devices *DeviceSet) HasActivatedDevice(hash string) bool {
	info, _ := devices.lookupDevice(hash)
	if info == nil {
		return false
	}

	info.lock.Lock()
	defer info.lock.Unlock()

	devices.Lock()
	defer devices.Unlock()

	devinfo, _ := devicemapper.GetInfo(info.Name())
	return devinfo != nil && devinfo.Exists != 0
}

// List returns the hashes of all devices in the DeviceSet, in map iteration
// (i.e. unspecified) order.
func (devices *DeviceSet) List() []string {
	devices.Lock()
	defer devices.Unlock()

	devices.devicesLock.Lock()
	ids := make([]string, len(devices.Devices))
	i := 0
	for k := range devices.Devices {
		ids[i] = k
		i++
	}
	devices.devicesLock.Unlock()

	return ids
}

// deviceStatus queries the dm status of devName and returns its size in
// sectors together with the two leading integers of the status parameters,
// which are scanned as the mapped sector count and the highest mapped
// sector.
func (devices *DeviceSet) deviceStatus(devName string) (sizeInSectors, mappedSectors, highestMappedSector uint64, err error) {
	var params string
	_, sizeInSectors, _, params, err = devicemapper.GetStatus(devName)
	if err != nil {
		return sizeInSectors, mappedSectors, highestMappedSector, err
	}
	_, err = fmt.Sscanf(params, "%d %d", &mappedSectors, &highestMappedSector)
	return sizeInSectors, mappedSectors, highestMappedSector, err
}

// GetDeviceStatus activates the device named hash if needed and returns its
// recorded id, size and transaction id together with the sector statistics
// reported by device-mapper.
func (devices *DeviceSet) GetDeviceStatus(hash string) (*DevStatus, error) {
	info, err := devices.lookupDevice(hash)
	if err != nil {
		return nil, err
	}

	info.lock.Lock()
	defer info.lock.Unlock()

	devices.Lock()
	defer devices.Unlock()

	status := &DevStatus{
		DeviceId:      info.DeviceId,
		Size:          info.Size,
		TransactionId: info.TransactionId,
	}

	if err := devices.activateDeviceIfNeeded(info); err != nil {
		return nil, fmt.Errorf("Error activating devmapper device for '%s': %s", hash, err)
	}

	sizeInSectors, mappedSectors, highestMappedSector, err := devices.deviceStatus(info.DevName())

	if err != nil {
		return nil, err
	}

	status.SizeInSectors = sizeInSectors
	status.MappedSectors = mappedSectors
	status.HighestMappedSector = highestMappedSector

	return status, nil
}

// poolStatus queries the dm status of the thin pool and scans its
// parameters as "<transaction id> <metadata used>/<metadata total>
// <data used>/<data total>".
func (devices *DeviceSet) poolStatus() (totalSizeInSectors, transactionId, dataUsed, dataTotal, metadataUsed, metadataTotal uint64, err error) {
	var params string
	if _, totalSizeInSectors, _, params, err = devicemapper.GetStatus(devices.getPoolName()); err == nil {
		_, err = fmt.Sscanf(params, "%d %d/%d %d/%d", &transactionId, &metadataUsed, &metadataTotal, &dataUsed, &dataTotal)
	}
	return
}

// DataDevicePath returns the path to the data storage for this deviceset,
// regardless of loopback or block device
func (devices *DeviceSet) DataDevicePath() string {
	return devices.dataDevice
}

// MetadataDevicePath returns the path to the metadata storage for this deviceset,
// regardless of loopback or block device
func (devices *DeviceSet) MetadataDevicePath() string {
	return devices.metadataDevice
}

// getUnderlyingAvailableSpace returns the number of free bytes (free blocks
// times block size, as reported by statfs) on the filesystem that holds
// loopFile.
func (devices *DeviceSet) getUnderlyingAvailableSpace(loopFile string) (uint64, error) {
	buf := new(syscall.Statfs_t)
	if err := syscall.Statfs(loopFile, buf); err != nil {
		logrus.Warnf("Couldn't stat loopfile filesystem %v: %v", loopFile, err)
		return 0, err
	}
	return buf.Bfree * uint64(buf.Bsize), nil
}

// isRealFile reports whether loopFile names a regular file. An empty path
// yields (false, nil).
func (devices *DeviceSet) isRealFile(loopFile string) (bool, error) {
	if loopFile != "" {
		fi, err := os.Stat(loopFile)
		if err != nil {
			logrus.Warnf("Couldn't stat loopfile %v: %v", loopFile, err)
			return false, err
		}
		return fi.Mode().IsRegular(), nil
	}
	return false, nil
}

// Status returns the current status of this deviceset
func (devices *DeviceSet) Status() *Status {
	devices.Lock()
	defer devices.Unlock()

	status := &Status{}

	status.PoolName = devices.getPoolName()
	status.DataFile = devices.DataDevicePath()
	status.DataLoopback = devices.dataLoopFile
	status.MetadataFile = devices.MetadataDevicePath()
	status.MetadataLoopback = devices.metadataLoopFile
	status.UdevSyncSupported = devicemapper.UdevSyncSupported()
	status.DeferredRemoveEnabled = devices.deferredRemove

	totalSizeInSectors, _, dataUsed, dataTotal, metadataUsed, metadataTotal, err := devices.poolStatus()
	// dataTotal is the divisor below; a pool reporting zero data blocks
	// would otherwise cause an integer division by zero panic.
	if err == nil && dataTotal > 0 {
		// Convert from blocks to bytes
		blockSizeInSectors := totalSizeInSectors / dataTotal

		status.Data.Used = dataUsed * blockSizeInSectors * 512
		status.Data.Total = dataTotal * blockSizeInSectors * 512
		status.Data.Available = status.Data.Total - status.Data.Used

		// metadata blocks are always 4k
		status.Metadata.Used = metadataUsed * 4096
		status.Metadata.Total = metadataTotal * 4096
		status.Metadata.Available = status.Metadata.Total - status.Metadata.Used

		status.SectorSize = blockSizeInSectors * 512

		// When backed by a regular (loopback) file, the space actually
		// available is capped by the free space of the filesystem that
		// holds the file.
		if check, _ := devices.isRealFile(devices.dataLoopFile); check {
			actualSpace, err := devices.getUnderlyingAvailableSpace(devices.dataLoopFile)
			if err == nil && actualSpace < status.Data.Available {
				status.Data.Available = actualSpace
			}
		}

		if check, _ := devices.isRealFile(devices.metadataLoopFile); check {
			actualSpace, err := devices.getUnderlyingAvailableSpace(devices.metadataLoopFile)
			if err == nil && actualSpace < status.Metadata.Available {
				status.Metadata.Available = actualSpace
			}
		}
	}

	return status
}

// Status returns the current status of this deviceset 1777 func (devices *DeviceSet) ExportDeviceMetadata(hash string) (*DeviceMetadata, error) { 1778 info, err := devices.lookupDevice(hash) 1779 if err != nil { 1780 return nil, err 1781 } 1782 1783 info.lock.Lock() 1784 defer info.lock.Unlock() 1785 1786 metadata := &DeviceMetadata{info.DeviceId, info.Size, info.Name()} 1787 return metadata, nil 1788 } 1789 1790 func NewDeviceSet(root string, doInit bool, options []string) (*DeviceSet, error) { 1791 devicemapper.SetDevDir("/dev") 1792 1793 devices := &DeviceSet{ 1794 root: root, 1795 MetaData: MetaData{Devices: make(map[string]*DevInfo)}, 1796 dataLoopbackSize: DefaultDataLoopbackSize, 1797 metaDataLoopbackSize: DefaultMetaDataLoopbackSize, 1798 baseFsSize: DefaultBaseFsSize, 1799 overrideUdevSyncCheck: DefaultUdevSyncOverride, 1800 filesystem: "ext4", 1801 doBlkDiscard: true, 1802 thinpBlockSize: DefaultThinpBlockSize, 1803 deviceIdMap: make([]byte, DeviceIdMapSz), 1804 } 1805 1806 foundBlkDiscard := false 1807 for _, option := range options { 1808 key, val, err := parsers.ParseKeyValueOpt(option) 1809 if err != nil { 1810 return nil, err 1811 } 1812 key = strings.ToLower(key) 1813 switch key { 1814 case "dm.basesize": 1815 size, err := units.RAMInBytes(val) 1816 if err != nil { 1817 return nil, err 1818 } 1819 devices.baseFsSize = uint64(size) 1820 case "dm.loopdatasize": 1821 size, err := units.RAMInBytes(val) 1822 if err != nil { 1823 return nil, err 1824 } 1825 devices.dataLoopbackSize = size 1826 case "dm.loopmetadatasize": 1827 size, err := units.RAMInBytes(val) 1828 if err != nil { 1829 return nil, err 1830 } 1831 devices.metaDataLoopbackSize = size 1832 case "dm.fs": 1833 if val != "ext4" && val != "xfs" { 1834 return nil, fmt.Errorf("Unsupported filesystem %s\n", val) 1835 } 1836 devices.filesystem = val 1837 case "dm.mkfsarg": 1838 devices.mkfsArgs = append(devices.mkfsArgs, val) 1839 case "dm.mountopt": 1840 devices.mountOptions = 
joinMountOptions(devices.mountOptions, val) 1841 case "dm.metadatadev": 1842 devices.metadataDevice = val 1843 case "dm.datadev": 1844 devices.dataDevice = val 1845 case "dm.thinpooldev": 1846 devices.thinPoolDevice = strings.TrimPrefix(val, "/dev/mapper/") 1847 case "dm.blkdiscard": 1848 foundBlkDiscard = true 1849 devices.doBlkDiscard, err = strconv.ParseBool(val) 1850 if err != nil { 1851 return nil, err 1852 } 1853 case "dm.blocksize": 1854 size, err := units.RAMInBytes(val) 1855 if err != nil { 1856 return nil, err 1857 } 1858 // convert to 512b sectors 1859 devices.thinpBlockSize = uint32(size) >> 9 1860 case "dm.override_udev_sync_check": 1861 devices.overrideUdevSyncCheck, err = strconv.ParseBool(val) 1862 if err != nil { 1863 return nil, err 1864 } 1865 1866 case "dm.use_deferred_removal": 1867 EnableDeferredRemoval, err = strconv.ParseBool(val) 1868 if err != nil { 1869 return nil, err 1870 } 1871 1872 default: 1873 return nil, fmt.Errorf("Unknown option %s\n", key) 1874 } 1875 } 1876 1877 // By default, don't do blk discard hack on raw devices, its rarely useful and is expensive 1878 if !foundBlkDiscard && (devices.dataDevice != "" || devices.thinPoolDevice != "") { 1879 devices.doBlkDiscard = false 1880 } 1881 1882 if err := devices.initDevmapper(doInit); err != nil { 1883 return nil, err 1884 } 1885 1886 return devices, nil 1887 }