github.com/m3db/m3@v1.5.0/src/query/functions/utils/heap.go (about) 1 // Copyright (c) 2018 Uber Technologies, Inc. 2 // 3 // Permission is hereby granted, free of charge, to any person obtaining a copy 4 // of this software and associated documentation files (the "Software"), to deal 5 // in the Software without restriction, including without limitation the rights 6 // to use, copy, modify, merge, publish, distribute, sublicense, and/or sell 7 // copies of the Software, and to permit persons to whom the Software is 8 // furnished to do so, subject to the following conditions: 9 // 10 // The above copyright notice and this permission notice shall be included in 11 // all copies or substantial portions of the Software. 12 // 13 // THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR 14 // IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, 15 // FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE 16 // AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER 17 // LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, 18 // OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN 19 // THE SOFTWARE. 20 21 package utils 22 23 import ( 24 "container/heap" 25 "math" 26 "sort" 27 ) 28 29 // ValueIndexPair is a pair of float value and index at which it exists 30 type ValueIndexPair struct { 31 Val float64 32 Index int 33 } 34 35 type lessFn func(ValueIndexPair, ValueIndexPair) bool 36 37 func maxHeapLess(i, j ValueIndexPair) bool { 38 if equalWithNaNs(i.Val, j.Val) { 39 return i.Index > j.Index 40 } 41 return i.Val < j.Val || lesserIfNaNs(i.Val, j.Val) 42 } 43 44 func minHeapLess(i, j ValueIndexPair) bool { 45 if equalWithNaNs(i.Val, j.Val) { 46 return i.Index > j.Index 47 } 48 return i.Val > j.Val || lesserIfNaNs(i.Val, j.Val) 49 } 50 51 // Compares two floats for equality with NaNs taken into account. 52 func equalWithNaNs(i,j float64) bool { 53 return i == j || math.IsNaN(i) && math.IsNaN(j) 54 } 55 56 // Compares NaNs. 57 // Basically, we do not want to add NaNs to the heap when it has reached it's cap so this fn should be used to prevent this. 58 func lesserIfNaNs(i,j float64) bool { 59 return math.IsNaN(i) && !math.IsNaN(j) 60 } 61 62 // Compares two float64 values which one is lesser with NaNs. NaNs are always sorted away. 63 func LesserWithNaNs(i, j float64) bool { 64 return i < j || math.IsNaN(j) && !math.IsNaN(i) 65 } 66 67 // Compares two float64 values which one is greater with NaNs. NaNs are always sorted away. 68 func GreaterWithNaNs(i, j float64) bool { 69 return i > j || math.IsNaN(j) && !math.IsNaN(i) 70 } 71 72 // FloatHeap is a heap that can be given a maximum size 73 type FloatHeap struct { 74 isMaxHeap bool 75 capacity int 76 floatHeap *floatHeap 77 } 78 79 // NewFloatHeap builds a new FloatHeap based on first parameter 80 // and a capacity given by second parameter. Zero and negative 81 // values for maxSize provide an unbounded FloatHeap 82 func NewFloatHeap(isMaxHeap bool, capacity int) FloatHeap { 83 var less lessFn 84 if isMaxHeap { 85 less = maxHeapLess 86 } else { 87 less = minHeapLess 88 } 89 90 if capacity < 1 { 91 capacity = 0 92 } 93 94 floatHeap := &floatHeap{ 95 heap: make([]ValueIndexPair, 0, capacity), 96 less: less, 97 } 98 99 heap.Init(floatHeap) 100 return FloatHeap{ 101 isMaxHeap: isMaxHeap, 102 capacity: capacity, 103 floatHeap: floatHeap, 104 } 105 } 106 107 // Push pushes a value and index pair to the heap 108 func (fh *FloatHeap) Push(value float64, index int) { 109 h := fh.floatHeap 110 // If capacity is zero or negative, allow infinite size heap 111 if fh.capacity > 0 { 112 // At max size, drop or replace incoming value. 113 // Otherwise, continue as normal 114 if len(h.heap) >= fh.capacity { 115 peek := h.heap[0] 116 // Compare incoming value with current top of heap. 117 // Decide if to replace the current top, or to drop incoming 118 // value as appropriate for this min/max heap 119 // 120 // If values are equal, do not add incoming value regardless 121 // 122 // NB(arnikola): unfortunately, can't just replace first 123 // element as it may not respect internal order. Need to 124 // run heap.Fix() to rectify this 125 if (fh.isMaxHeap && GreaterWithNaNs(value, peek.Val)) || 126 (!fh.isMaxHeap && LesserWithNaNs(value, peek.Val)) { 127 h.heap[0] = ValueIndexPair{ 128 Val: value, 129 Index: index, 130 } 131 132 heap.Fix(h, 0) 133 } 134 135 return 136 } 137 138 // Otherwise, fallthrough 139 } 140 141 heap.Push(h, ValueIndexPair{ 142 Val: value, 143 Index: index, 144 }) 145 } 146 147 // Len returns the current length of the heap 148 func (fh *FloatHeap) Len() int { 149 return fh.floatHeap.Len() 150 } 151 152 // Cap returns the capacity of the heap 153 func (fh *FloatHeap) Cap() int { 154 return fh.capacity 155 } 156 157 // Reset resets the heap 158 func (fh *FloatHeap) Reset() { 159 fh.floatHeap.heap = fh.floatHeap.heap[:0] 160 } 161 162 // Flush flushes the float heap and resets it. Does not guarantee order. 163 func (fh *FloatHeap) Flush() []ValueIndexPair { 164 values := fh.floatHeap.heap 165 fh.Reset() 166 return values 167 } 168 169 // OrderedFlush flushes the float heap and returns values in order. 170 func (fh *FloatHeap) OrderedFlush() []ValueIndexPair { 171 flushed := fh.Flush() 172 sort.Slice(flushed, func(i, j int) bool { 173 return !fh.floatHeap.less(flushed[i], flushed[j]) //reverse sort 174 }) 175 return flushed 176 } 177 178 // Peek reveals the top value of the heap without mutating the heap. 179 func (fh *FloatHeap) Peek() (ValueIndexPair, bool) { 180 h := fh.floatHeap.heap 181 if len(h) == 0 { 182 return ValueIndexPair{}, false 183 } 184 return h[0], true 185 } 186 187 // floatHeap is a heap that can be given a maximum size 188 type floatHeap struct { 189 less lessFn 190 heap []ValueIndexPair 191 } 192 193 // Assert that floatHeap is a heap.Interface 194 var _ heap.Interface = (*floatHeap)(nil) 195 196 // Len gives the length of items in the heap 197 func (h *floatHeap) Len() int { 198 return len(h.heap) 199 } 200 201 // Less is true if value of i is less than value of j 202 func (h *floatHeap) Less(i, j int) bool { 203 return h.less(h.heap[i], h.heap[j]) 204 } 205 206 // Swap swaps values at these indices 207 func (h *floatHeap) Swap(i, j int) { 208 h.heap[i], h.heap[j] = h.heap[j], h.heap[i] 209 } 210 211 // Push pushes a ValueIndexPair to the FloatMaxHeap 212 func (h *floatHeap) Push(x interface{}) { 213 pair := x.(ValueIndexPair) 214 h.heap = append(h.heap, pair) 215 } 216 217 // Pop pops a ValueIndexPair from the FloatMaxHeap 218 func (h *floatHeap) Pop() interface{} { 219 old := h.heap 220 n := len(old) 221 tail := old[n-1] 222 h.heap = old[:n-1] 223 return tail 224 }