github.com/keybase/client/go@v0.0.0-20241007131713-f10651d043c8/lru/disk_lru.go (about)

     1  package lru
     2  
     3  import (
     4  	"container/list"
     5  	json "encoding/json"
     6  	"errors"
     7  	"fmt"
     8  	"os"
     9  	"path/filepath"
    10  	"sync"
    11  	"time"
    12  
    13  	"github.com/keybase/client/go/libkb"
    14  	context "golang.org/x/net/context"
    15  )
    16  
    17  type Pathable struct {
    18  	Path string
    19  }
    20  
    21  type DiskLRUEntry struct {
    22  	Key          string
    23  	Value        interface{}
    24  	Ctime        time.Time
    25  	LastAccessed time.Time
    26  }
    27  
    28  type diskLRUIndexMarshaled struct {
    29  	Version   int
    30  	EntryKeys []string
    31  }
    32  
    33  type diskLRUIndex struct {
    34  	sync.Mutex
    35  	Version     int
    36  	EntryKeys   *list.List
    37  	entryKeyMap map[string]*list.Element
    38  	dirty       bool
    39  }
    40  
    41  func newDiskLRUIndex(version int) *diskLRUIndex {
    42  	return &diskLRUIndex{
    43  		EntryKeys:   list.New(),
    44  		Version:     version,
    45  		entryKeyMap: make(map[string]*list.Element),
    46  	}
    47  }
    48  
    49  func (d *diskLRUIndex) exists(key string) *list.Element {
    50  	return d.entryKeyMap[key]
    51  }
    52  
    53  func (d *diskLRUIndex) Exists(key string) bool {
    54  	d.Lock()
    55  	defer d.Unlock()
    56  	return (d.exists(key) != nil)
    57  }
    58  
    59  func (d *diskLRUIndex) remove(key string) {
    60  	if el, ok := d.entryKeyMap[key]; ok {
    61  		d.EntryKeys.Remove(el)
    62  		delete(d.entryKeyMap, key)
    63  	}
    64  }
    65  
    66  func (d *diskLRUIndex) Remove(key string) {
    67  	d.Lock()
    68  	defer d.Unlock()
    69  	d.dirty = true
    70  	d.remove(key)
    71  }
    72  
    73  func (d *diskLRUIndex) put(key string) {
    74  	d.entryKeyMap[key] = d.EntryKeys.PushFront(key)
    75  }
    76  
    77  func (d *diskLRUIndex) Put(key string) {
    78  	d.Lock()
    79  	defer d.Unlock()
    80  	d.dirty = true
    81  	if d.exists(key) != nil {
    82  		d.remove(key)
    83  	}
    84  	d.put(key)
    85  }
    86  
    87  func (d *diskLRUIndex) IsDirty() bool {
    88  	d.Lock()
    89  	defer d.Unlock()
    90  	return d.dirty
    91  }
    92  
    93  func (d *diskLRUIndex) ClearDirty() {
    94  	d.Lock()
    95  	defer d.Unlock()
    96  	d.dirty = false
    97  }
    98  
    99  func (d *diskLRUIndex) Marshal() diskLRUIndexMarshaled {
   100  	var m diskLRUIndexMarshaled
   101  	m.Version = d.Version
   102  	for e := d.EntryKeys.Front(); e != nil; e = e.Next() {
   103  		m.EntryKeys = append(m.EntryKeys, e.Value.(string))
   104  	}
   105  	return m
   106  }
   107  
   108  func (d *diskLRUIndex) Unmarshal(m diskLRUIndexMarshaled) {
   109  	d.EntryKeys = list.New()
   110  	d.Version = m.Version
   111  	d.entryKeyMap = make(map[string]*list.Element)
   112  	for _, k := range m.EntryKeys {
   113  		d.entryKeyMap[k] = d.EntryKeys.PushBack(k)
   114  	}
   115  }
   116  
   117  func (d *diskLRUIndex) Size() int {
   118  	d.Lock()
   119  	defer d.Unlock()
   120  	return d.EntryKeys.Len()
   121  }
   122  
   123  func (d *diskLRUIndex) OldestKey() (string, error) {
   124  	d.Lock()
   125  	defer d.Unlock()
   126  	if d.EntryKeys.Len() == 0 {
   127  		return "", errors.New("index is empty")
   128  	}
   129  	return d.EntryKeys.Back().Value.(string), nil
   130  }
   131  
   132  // DiskLRU maintains a cache of files on the disk in a LRU manner.
   133  type DiskLRU struct {
   134  	sync.Mutex
   135  
   136  	index   *diskLRUIndex
   137  	name    string
   138  	version int
   139  	maxSize int
   140  
   141  	lastFlush     time.Time
   142  	flushDuration time.Duration
   143  
   144  	// testing
   145  	flushCh chan struct{}
   146  }
   147  
   148  func NewDiskLRU(name string, version, maxSize int) *DiskLRU {
   149  	return &DiskLRU{
   150  		name:          name,
   151  		version:       version,
   152  		maxSize:       maxSize,
   153  		flushDuration: time.Minute,
   154  	}
   155  }
   156  
   157  func (d *DiskLRU) MaxSize() int {
   158  	d.Lock()
   159  	defer d.Unlock()
   160  	return d.maxSize
   161  }
   162  
   163  func (d *DiskLRU) debug(ctx context.Context, lctx libkb.LRUContext, msg string, args ...interface{}) {
   164  	lctx.GetLog().CDebugf(ctx, fmt.Sprintf("DiskLRU: %s(%d): ", d.name, d.version)+msg, args...)
   165  }
   166  
   167  func (d *DiskLRU) indexKey() libkb.DbKey {
   168  	return libkb.DbKey{
   169  		Typ: libkb.DBDiskLRUIndex,
   170  		Key: fmt.Sprintf("%s:%d", d.name, d.version),
   171  	}
   172  }
   173  
   174  func (d *DiskLRU) entryKey(key string) libkb.DbKey {
   175  	return libkb.DbKey{
   176  		Typ: libkb.DBDiskLRUEntries,
   177  		Key: fmt.Sprintf("%s:%d:%s", d.name, d.version, key),
   178  	}
   179  }
   180  
   181  func (d *DiskLRU) readIndex(ctx context.Context, lctx libkb.LRUContext) (res *diskLRUIndex, err error) {
   182  	// Check memory and stash if we read with no error
   183  	if d.index != nil {
   184  		return d.index, nil
   185  	}
   186  	defer func() {
   187  		if err == nil && res != nil {
   188  			d.index = res
   189  		}
   190  	}()
   191  
   192  	// Grab from the disk if we miss on memory
   193  	var marshalIndex diskLRUIndexMarshaled
   194  	res = new(diskLRUIndex)
   195  	found, err := lctx.GetKVStore().GetInto(&marshalIndex, d.indexKey())
   196  	if err != nil {
   197  		return nil, err
   198  	}
   199  	if !found {
   200  		return newDiskLRUIndex(d.version), nil
   201  	}
   202  	res.Unmarshal(marshalIndex)
   203  	return res, nil
   204  }
   205  
   206  func (d *DiskLRU) writeIndex(ctx context.Context, lctx libkb.LRUContext, index *diskLRUIndex,
   207  	forceFlush bool) error {
   208  	if forceFlush || lctx.GetClock().Now().Sub(d.lastFlush) > d.flushDuration {
   209  		marshalIndex := index.Marshal()
   210  		if err := lctx.GetKVStore().PutObj(d.indexKey(), nil, marshalIndex); err != nil {
   211  			return err
   212  		}
   213  		d.lastFlush = lctx.GetClock().Now()
   214  		index.ClearDirty()
   215  		if d.flushCh != nil {
   216  			d.flushCh <- struct{}{}
   217  		}
   218  	}
   219  	return nil
   220  }
   221  
   222  func (d *DiskLRU) readEntry(ctx context.Context, lctx libkb.LRUContext, key string) (found bool, res DiskLRUEntry, err error) {
   223  	found, err = lctx.GetKVStore().GetInto(&res, d.entryKey(key))
   224  	if err != nil {
   225  		return false, res, err
   226  	}
   227  	return found, res, nil
   228  }
   229  
   230  func (d *DiskLRU) accessEntry(ctx context.Context, lctx libkb.LRUContext, index *diskLRUIndex,
   231  	entry *DiskLRUEntry) error {
   232  	// Promote the key in the index
   233  	index.Put(entry.Key)
   234  	// Write out the entry with new accessed time
   235  	entry.LastAccessed = lctx.GetClock().Now()
   236  	return lctx.GetKVStore().PutObj(d.entryKey(entry.Key), nil, entry)
   237  }
   238  
   239  func (d *DiskLRU) Get(ctx context.Context, lctx libkb.LRUContext, key string) (found bool, res DiskLRUEntry, err error) {
   240  	d.Lock()
   241  	defer d.Unlock()
   242  
   243  	var index *diskLRUIndex
   244  	defer func() {
   245  		// Commit the index
   246  		if err == nil && index != nil && index.IsDirty() {
   247  			err := d.writeIndex(ctx, lctx, index, false)
   248  			if err != nil {
   249  				d.debug(ctx, lctx, "Get: error writing index: %+v", err)
   250  			}
   251  		}
   252  	}()
   253  
   254  	// Grab entry index
   255  	index, err = d.readIndex(ctx, lctx)
   256  	if err != nil {
   257  		return found, res, err
   258  	}
   259  	// Check for a straight up miss
   260  	if !index.Exists(key) {
   261  		return false, res, nil
   262  	}
   263  	// Read entry
   264  	found, res, err = d.readEntry(ctx, lctx, key)
   265  	if err != nil {
   266  		return found, res, err
   267  	}
   268  	if !found {
   269  		// remove from index
   270  		index.Remove(key)
   271  		return false, res, nil
   272  	}
   273  	// update last accessed time for the entry
   274  	if err = d.accessEntry(ctx, lctx, index, &res); err != nil {
   275  		return found, res, err
   276  	}
   277  
   278  	return true, res, nil
   279  }
   280  
   281  func (d *DiskLRU) removeEntry(ctx context.Context, lctx libkb.LRUContext, index *diskLRUIndex, key string) error {
   282  	index.Remove(key)
   283  	return lctx.GetKVStore().Delete(d.entryKey(key))
   284  }
   285  
   286  func (d *DiskLRU) addEntry(ctx context.Context, lctx libkb.LRUContext, index *diskLRUIndex, key string,
   287  	value interface{}) (evicted *DiskLRUEntry, err error) {
   288  
   289  	// Add the new item
   290  	index.Put(key)
   291  	item := DiskLRUEntry{
   292  		Key:          key,
   293  		Value:        value,
   294  		Ctime:        lctx.GetClock().Now(),
   295  		LastAccessed: lctx.GetClock().Now(),
   296  	}
   297  	if err = lctx.GetKVStore().PutObj(d.entryKey(key), nil, item); err != nil {
   298  		return nil, err
   299  	}
   300  
   301  	if index.Size() > d.maxSize {
   302  		// Evict the oldest item
   303  		var found bool
   304  		var lastItem DiskLRUEntry
   305  		lastKey, err := index.OldestKey()
   306  		if err == nil {
   307  			d.debug(ctx, lctx, "evicting: %s", lastKey)
   308  			found, lastItem, err = d.readEntry(ctx, lctx, lastKey)
   309  			if err != nil {
   310  				return nil, err
   311  			}
   312  			if found {
   313  				evicted = &lastItem
   314  				d.debug(ctx, lctx, "addEntry: evicting item: key: %s", lastKey)
   315  			}
   316  			if err = d.removeEntry(ctx, lctx, index, lastKey); err != nil {
   317  				return nil, err
   318  			}
   319  		} else {
   320  			d.debug(ctx, lctx, "addEntry: failed to find oldest key, check cache config")
   321  		}
   322  	}
   323  
   324  	return evicted, nil
   325  }
   326  
   327  func (d *DiskLRU) Put(ctx context.Context, lctx libkb.LRUContext, key string, value interface{}) (evicted *DiskLRUEntry, err error) {
   328  	d.Lock()
   329  	defer d.Unlock()
   330  
   331  	var index *diskLRUIndex
   332  	defer func() {
   333  		// Commit the index
   334  		if err == nil && index != nil && index.IsDirty() {
   335  			err = d.writeIndex(ctx, lctx, index, true)
   336  		}
   337  	}()
   338  
   339  	// Grab entry index
   340  	index, err = d.readIndex(ctx, lctx)
   341  	if err != nil {
   342  		return nil, err
   343  	}
   344  	// Remove existing entry from the index (we don't need to remove entry off the disk, since we will
   345  	// overwrite it with new stuff)
   346  	if index.Exists(key) {
   347  		index.Remove(key)
   348  	}
   349  	// Add the item
   350  	return d.addEntry(ctx, lctx, index, key, value)
   351  }
   352  
   353  func (d *DiskLRU) Remove(ctx context.Context, lctx libkb.LRUContext, key string) (err error) {
   354  	d.Lock()
   355  	defer d.Unlock()
   356  	var index *diskLRUIndex
   357  	defer func() {
   358  		// Commit the index
   359  		if err == nil && index != nil && index.IsDirty() {
   360  			err := d.writeIndex(ctx, lctx, index, false)
   361  			if err != nil {
   362  				d.debug(ctx, lctx, "Get: error writing index: %+v", err)
   363  			}
   364  
   365  		}
   366  	}()
   367  	// Grab entry index
   368  	index, err = d.readIndex(ctx, lctx)
   369  	if err != nil {
   370  		return err
   371  	}
   372  	return d.removeEntry(ctx, lctx, index, key)
   373  }
   374  
   375  func (d *DiskLRU) ClearMemory(ctx context.Context, lctx libkb.LRUContext) {
   376  	d.Lock()
   377  	defer d.Unlock()
   378  	d.flush(ctx, lctx)
   379  	d.index = nil
   380  }
   381  
   382  func (d *DiskLRU) flush(ctx context.Context, lctx libkb.LRUContext) error {
   383  	if d.index != nil {
   384  		return d.writeIndex(ctx, lctx, d.index, true)
   385  	}
   386  	return nil
   387  }
   388  
   389  func (d *DiskLRU) Flush(ctx context.Context, lctx libkb.LRUContext) error {
   390  	d.Lock()
   391  	defer d.Unlock()
   392  	return d.flush(ctx, lctx)
   393  }
   394  
   395  func (d *DiskLRU) Size(ctx context.Context, lctx libkb.LRUContext) (int, error) {
   396  	d.Lock()
   397  	defer d.Unlock()
   398  	index, err := d.readIndex(ctx, lctx)
   399  	if err != nil {
   400  		return 0, err
   401  	}
   402  	return index.Size(), nil
   403  }
   404  
   405  func (d *DiskLRU) allValuesLocked(ctx context.Context, lctx libkb.LRUContext) (entries []DiskLRUEntry, err error) {
   406  	var index *diskLRUIndex
   407  	defer func() {
   408  		// Commit the index
   409  		if err == nil && index != nil && index.IsDirty() {
   410  			err := d.writeIndex(ctx, lctx, index, false)
   411  			if err != nil {
   412  				d.debug(ctx, lctx, "Get: error writing index: %+v", err)
   413  			}
   414  		}
   415  	}()
   416  
   417  	// Grab entry index
   418  	index, err = d.readIndex(ctx, lctx)
   419  	if err != nil {
   420  		return nil, err
   421  	}
   422  	for key := range index.entryKeyMap {
   423  		found, res, err := d.readEntry(ctx, lctx, key)
   424  		switch {
   425  		case err != nil:
   426  			return nil, err
   427  		case !found:
   428  			index.Remove(key)
   429  		default:
   430  			entries = append(entries, res)
   431  		}
   432  	}
   433  	return entries, nil
   434  }
   435  
   436  func (d *DiskLRU) CleanOutOfSync(mctx libkb.MetaContext, cacheDir string) error {
   437  	_, err := d.cleanOutOfSync(mctx, cacheDir, 0)
   438  	return err
   439  }
   440  
   441  func (d *DiskLRU) getPath(entry DiskLRUEntry) (res string, ok bool) {
   442  	if res, ok = entry.Value.(string); ok {
   443  		return res, ok
   444  	}
   445  	if _, ok = entry.Value.(map[string]interface{}); ok {
   446  		var pathable Pathable
   447  		jstr, _ := json.Marshal(entry.Value)
   448  		_ = json.Unmarshal(jstr, &pathable)
   449  		path := pathable.Path
   450  		if len(path) == 0 {
   451  			return "", false
   452  		}
   453  		return path, true
   454  	}
   455  	return "", false
   456  }
   457  
   458  func (d *DiskLRU) cleanOutOfSync(mctx libkb.MetaContext, cacheDir string, batchSize int) (completed bool, err error) {
   459  	defer mctx.Trace("cleanOutOfSync", &err)()
   460  	d.Lock()
   461  	defer d.Unlock()
   462  
   463  	// clear our inmemory cache without flushing to disk to force a new read
   464  	d.index = nil
   465  
   466  	// reverse map of filepaths to lru keys
   467  	cacheRevMap := map[string]string{}
   468  	allVals, err := d.allValuesLocked(mctx.Ctx(), mctx.G())
   469  	if err != nil {
   470  		return false, err
   471  	}
   472  	for _, entry := range allVals {
   473  		path, ok := d.getPath(entry)
   474  		if !ok {
   475  			continue
   476  		}
   477  		// normalize the filepath in case the abs path to of the cacheDir
   478  		// changed.
   479  		path = filepath.Join(cacheDir, filepath.Base(path))
   480  		cacheRevMap[path] = entry.Key
   481  	}
   482  
   483  	files, err := filepath.Glob(filepath.Join(cacheDir, "*"))
   484  	if err != nil {
   485  		return false, err
   486  	}
   487  
   488  	d.debug(mctx.Ctx(), mctx.G(), "Clean: found %d files in %s, %d in cache",
   489  		len(files), cacheDir, len(cacheRevMap))
   490  	removed := 0
   491  	for _, v := range files {
   492  		if _, ok := cacheRevMap[v]; !ok {
   493  			if err := os.Remove(v); err != nil {
   494  				d.debug(mctx.Ctx(), mctx.G(), "Clean: failed to delete file %q: %s", v, err)
   495  			}
   496  			removed++
   497  			if batchSize > 0 && removed > batchSize {
   498  				d.debug(mctx.Ctx(), mctx.G(), "Clean: Aborting clean, reached batch size %d", batchSize)
   499  				return false, nil
   500  			}
   501  		}
   502  	}
   503  	return true, nil
   504  }
   505  
   506  // CleanOutOfSyncWithDelay runs the LRU clean function after the `delay` duration. If
   507  // the service crashes it's possible that temporarily files get stranded on
   508  // disk before they can get recorded in the LRU. Callers can run this in the
   509  // background to prevent leaking space.  We delay to keep off the critical path
   510  // to start up.
   511  func CleanOutOfSyncWithDelay(mctx libkb.MetaContext, d *DiskLRU, cacheDir string, delay time.Duration) {
   512  
   513  	mctx.Debug("CleanOutOfSyncWithDelay: cleaning %s in %v", cacheDir, delay)
   514  	select {
   515  	case <-mctx.Ctx().Done():
   516  		mctx.Debug("CleanOutOfSyncWithDelay: cancelled before initial delay finished")
   517  		return
   518  	case <-time.After(delay):
   519  	}
   520  
   521  	defer mctx.Trace("CleanOutOfSyncWithDelay", nil)()
   522  
   523  	// Batch deletions so we don't hog the lock.
   524  	batchSize := 1000
   525  
   526  	batchDelay := 10 * time.Millisecond
   527  	if mctx.G().IsMobileAppType() {
   528  		batchDelay = 25 * time.Millisecond
   529  	}
   530  	for {
   531  		select {
   532  		case <-mctx.Ctx().Done():
   533  			mctx.Debug("CleanOutOfSyncWithDelay: cancelled")
   534  			return
   535  		default:
   536  		}
   537  		if completed, err := d.cleanOutOfSync(mctx, cacheDir, batchSize); err != nil {
   538  			mctx.Debug("unable to run clean: %v", err)
   539  			break
   540  		} else if completed {
   541  			break
   542  		}
   543  		// Keep out of a tight loop with a short sleep.
   544  		time.Sleep(batchDelay)
   545  	}
   546  	size, err := d.Size(mctx.Ctx(), mctx.G())
   547  	if err != nil {
   548  		mctx.Debug("unable to get diskLRU size: %v", err)
   549  	}
   550  	mctx.Debug("lru current size: %d, max size: %d", size, d.MaxSize())
   551  }