golang.org/x/exp@v0.0.0-20240506185415-9bf2ced13842/slices/zsortanyfunc.go

golang.org/x/exp@v0.0.0-20240506185415-9bf2ced13842/slices/zsortanyfunc.go (about)

     1  // Code generated by gen_sort_variants.go; DO NOT EDIT.
     2  
     3  // Copyright 2022 The Go Authors. All rights reserved.
     4  // Use of this source code is governed by a BSD-style
     5  // license that can be found in the LICENSE file.
     6  
     7  package slices
     8  
     9  // insertionSortCmpFunc sorts data[a:b] using insertion sort.
    10  func insertionSortCmpFunc[E any](data []E, a, b int, cmp func(a, b E) int) {
    11  	for i := a + 1; i < b; i++ {
    12  		for j := i; j > a && (cmp(data[j], data[j-1]) < 0); j-- {
    13  			data[j], data[j-1] = data[j-1], data[j]
    14  		}
    15  	}
    16  }
    17  
    18  // siftDownCmpFunc implements the heap property on data[lo:hi].
    19  // first is an offset into the array where the root of the heap lies.
    20  func siftDownCmpFunc[E any](data []E, lo, hi, first int, cmp func(a, b E) int) {
    21  	root := lo
    22  	for {
    23  		child := 2*root + 1
    24  		if child >= hi {
    25  			break
    26  		}
    27  		if child+1 < hi && (cmp(data[first+child], data[first+child+1]) < 0) {
    28  			child++
    29  		}
    30  		if !(cmp(data[first+root], data[first+child]) < 0) {
    31  			return
    32  		}
    33  		data[first+root], data[first+child] = data[first+child], data[first+root]
    34  		root = child
    35  	}
    36  }
    37  
    38  func heapSortCmpFunc[E any](data []E, a, b int, cmp func(a, b E) int) {
    39  	first := a
    40  	lo := 0
    41  	hi := b - a
    42  
    43  	// Build heap with greatest element at top.
    44  	for i := (hi - 1) / 2; i >= 0; i-- {
    45  		siftDownCmpFunc(data, i, hi, first, cmp)
    46  	}
    47  
    48  	// Pop elements, largest first, into end of data.
    49  	for i := hi - 1; i >= 0; i-- {
    50  		data[first], data[first+i] = data[first+i], data[first]
    51  		siftDownCmpFunc(data, lo, i, first, cmp)
    52  	}
    53  }
    54  
    55  // pdqsortCmpFunc sorts data[a:b].
    56  // The algorithm based on pattern-defeating quicksort(pdqsort), but without the optimizations from BlockQuicksort.
    57  // pdqsort paper: https://arxiv.org/pdf/2106.05123.pdf
    58  // C++ implementation: https://github.com/orlp/pdqsort
    59  // Rust implementation: https://docs.rs/pdqsort/latest/pdqsort/
    60  // limit is the number of allowed bad (very unbalanced) pivots before falling back to heapsort.
    61  func pdqsortCmpFunc[E any](data []E, a, b, limit int, cmp func(a, b E) int) {
    62  	const maxInsertion = 12
    63  
    64  	var (
    65  		wasBalanced    = true // whether the last partitioning was reasonably balanced
    66  		wasPartitioned = true // whether the slice was already partitioned
    67  	)
    68  
    69  	for {
    70  		length := b - a
    71  
    72  		if length <= maxInsertion {
    73  			insertionSortCmpFunc(data, a, b, cmp)
    74  			return
    75  		}
    76  
    77  		// Fall back to heapsort if too many bad choices were made.
    78  		if limit == 0 {
    79  			heapSortCmpFunc(data, a, b, cmp)
    80  			return
    81  		}
    82  
    83  		// If the last partitioning was imbalanced, we need to breaking patterns.
    84  		if !wasBalanced {
    85  			breakPatternsCmpFunc(data, a, b, cmp)
    86  			limit--
    87  		}
    88  
    89  		pivot, hint := choosePivotCmpFunc(data, a, b, cmp)
    90  		if hint == decreasingHint {
    91  			reverseRangeCmpFunc(data, a, b, cmp)
    92  			// The chosen pivot was pivot-a elements after the start of the array.
    93  			// After reversing it is pivot-a elements before the end of the array.
    94  			// The idea came from Rust's implementation.
    95  			pivot = (b - 1) - (pivot - a)
    96  			hint = increasingHint
    97  		}
    98  
    99  		// The slice is likely already sorted.
   100  		if wasBalanced && wasPartitioned && hint == increasingHint {
   101  			if partialInsertionSortCmpFunc(data, a, b, cmp) {
   102  				return
   103  			}
   104  		}
   105  
   106  		// Probably the slice contains many duplicate elements, partition the slice into
   107  		// elements equal to and elements greater than the pivot.
   108  		if a > 0 && !(cmp(data[a-1], data[pivot]) < 0) {
   109  			mid := partitionEqualCmpFunc(data, a, b, pivot, cmp)
   110  			a = mid
   111  			continue
   112  		}
   113  
   114  		mid, alreadyPartitioned := partitionCmpFunc(data, a, b, pivot, cmp)
   115  		wasPartitioned = alreadyPartitioned
   116  
   117  		leftLen, rightLen := mid-a, b-mid
   118  		balanceThreshold := length / 8
   119  		if leftLen < rightLen {
   120  			wasBalanced = leftLen >= balanceThreshold
   121  			pdqsortCmpFunc(data, a, mid, limit, cmp)
   122  			a = mid + 1
   123  		} else {
   124  			wasBalanced = rightLen >= balanceThreshold
   125  			pdqsortCmpFunc(data, mid+1, b, limit, cmp)
   126  			b = mid
   127  		}
   128  	}
   129  }
   130  
   131  // partitionCmpFunc does one quicksort partition.
   132  // Let p = data[pivot]
   133  // Moves elements in data[a:b] around, so that data[i]<p and data[j]>=p for i<newpivot and j>newpivot.
   134  // On return, data[newpivot] = p
   135  func partitionCmpFunc[E any](data []E, a, b, pivot int, cmp func(a, b E) int) (newpivot int, alreadyPartitioned bool) {
   136  	data[a], data[pivot] = data[pivot], data[a]
   137  	i, j := a+1, b-1 // i and j are inclusive of the elements remaining to be partitioned
   138  
   139  	for i <= j && (cmp(data[i], data[a]) < 0) {
   140  		i++
   141  	}
   142  	for i <= j && !(cmp(data[j], data[a]) < 0) {
   143  		j--
   144  	}
   145  	if i > j {
   146  		data[j], data[a] = data[a], data[j]
   147  		return j, true
   148  	}
   149  	data[i], data[j] = data[j], data[i]
   150  	i++
   151  	j--
   152  
   153  	for {
   154  		for i <= j && (cmp(data[i], data[a]) < 0) {
   155  			i++
   156  		}
   157  		for i <= j && !(cmp(data[j], data[a]) < 0) {
   158  			j--
   159  		}
   160  		if i > j {
   161  			break
   162  		}
   163  		data[i], data[j] = data[j], data[i]
   164  		i++
   165  		j--
   166  	}
   167  	data[j], data[a] = data[a], data[j]
   168  	return j, false
   169  }
   170  
   171  // partitionEqualCmpFunc partitions data[a:b] into elements equal to data[pivot] followed by elements greater than data[pivot].
   172  // It assumed that data[a:b] does not contain elements smaller than the data[pivot].
   173  func partitionEqualCmpFunc[E any](data []E, a, b, pivot int, cmp func(a, b E) int) (newpivot int) {
   174  	data[a], data[pivot] = data[pivot], data[a]
   175  	i, j := a+1, b-1 // i and j are inclusive of the elements remaining to be partitioned
   176  
   177  	for {
   178  		for i <= j && !(cmp(data[a], data[i]) < 0) {
   179  			i++
   180  		}
   181  		for i <= j && (cmp(data[a], data[j]) < 0) {
   182  			j--
   183  		}
   184  		if i > j {
   185  			break
   186  		}
   187  		data[i], data[j] = data[j], data[i]
   188  		i++
   189  		j--
   190  	}
   191  	return i
   192  }
   193  
   194  // partialInsertionSortCmpFunc partially sorts a slice, returns true if the slice is sorted at the end.
   195  func partialInsertionSortCmpFunc[E any](data []E, a, b int, cmp func(a, b E) int) bool {
   196  	const (
   197  		maxSteps         = 5  // maximum number of adjacent out-of-order pairs that will get shifted
   198  		shortestShifting = 50 // don't shift any elements on short arrays
   199  	)
   200  	i := a + 1
   201  	for j := 0; j < maxSteps; j++ {
   202  		for i < b && !(cmp(data[i], data[i-1]) < 0) {
   203  			i++
   204  		}
   205  
   206  		if i == b {
   207  			return true
   208  		}
   209  
   210  		if b-a < shortestShifting {
   211  			return false
   212  		}
   213  
   214  		data[i], data[i-1] = data[i-1], data[i]
   215  
   216  		// Shift the smaller one to the left.
   217  		if i-a >= 2 {
   218  			for j := i - 1; j >= 1; j-- {
   219  				if !(cmp(data[j], data[j-1]) < 0) {
   220  					break
   221  				}
   222  				data[j], data[j-1] = data[j-1], data[j]
   223  			}
   224  		}
   225  		// Shift the greater one to the right.
   226  		if b-i >= 2 {
   227  			for j := i + 1; j < b; j++ {
   228  				if !(cmp(data[j], data[j-1]) < 0) {
   229  					break
   230  				}
   231  				data[j], data[j-1] = data[j-1], data[j]
   232  			}
   233  		}
   234  	}
   235  	return false
   236  }
   237  
   238  // breakPatternsCmpFunc scatters some elements around in an attempt to break some patterns
   239  // that might cause imbalanced partitions in quicksort.
   240  func breakPatternsCmpFunc[E any](data []E, a, b int, cmp func(a, b E) int) {
   241  	length := b - a
   242  	if length >= 8 {
   243  		random := xorshift(length)
   244  		modulus := nextPowerOfTwo(length)
   245  
   246  		for idx := a + (length/4)*2 - 1; idx <= a+(length/4)*2+1; idx++ {
   247  			other := int(uint(random.Next()) & (modulus - 1))
   248  			if other >= length {
   249  				other -= length
   250  			}
   251  			data[idx], data[a+other] = data[a+other], data[idx]
   252  		}
   253  	}
   254  }
   255  
   256  // choosePivotCmpFunc chooses a pivot in data[a:b].
   257  //
   258  // [0,8): chooses a static pivot.
   259  // [8,shortestNinther): uses the simple median-of-three method.
   260  // [shortestNinther,∞): uses the Tukey ninther method.
   261  func choosePivotCmpFunc[E any](data []E, a, b int, cmp func(a, b E) int) (pivot int, hint sortedHint) {
   262  	const (
   263  		shortestNinther = 50
   264  		maxSwaps        = 4 * 3
   265  	)
   266  
   267  	l := b - a
   268  
   269  	var (
   270  		swaps int
   271  		i     = a + l/4*1
   272  		j     = a + l/4*2
   273  		k     = a + l/4*3
   274  	)
   275  
   276  	if l >= 8 {
   277  		if l >= shortestNinther {
   278  			// Tukey ninther method, the idea came from Rust's implementation.
   279  			i = medianAdjacentCmpFunc(data, i, &swaps, cmp)
   280  			j = medianAdjacentCmpFunc(data, j, &swaps, cmp)
   281  			k = medianAdjacentCmpFunc(data, k, &swaps, cmp)
   282  		}
   283  		// Find the median among i, j, k and stores it into j.
   284  		j = medianCmpFunc(data, i, j, k, &swaps, cmp)
   285  	}
   286  
   287  	switch swaps {
   288  	case 0:
   289  		return j, increasingHint
   290  	case maxSwaps:
   291  		return j, decreasingHint
   292  	default:
   293  		return j, unknownHint
   294  	}
   295  }
   296  
   297  // order2CmpFunc returns x,y where data[x] <= data[y], where x,y=a,b or x,y=b,a.
   298  func order2CmpFunc[E any](data []E, a, b int, swaps *int, cmp func(a, b E) int) (int, int) {
   299  	if cmp(data[b], data[a]) < 0 {
   300  		*swaps++
   301  		return b, a
   302  	}
   303  	return a, b
   304  }
   305  
   306  // medianCmpFunc returns x where data[x] is the median of data[a],data[b],data[c], where x is a, b, or c.
   307  func medianCmpFunc[E any](data []E, a, b, c int, swaps *int, cmp func(a, b E) int) int {
   308  	a, b = order2CmpFunc(data, a, b, swaps, cmp)
   309  	b, c = order2CmpFunc(data, b, c, swaps, cmp)
   310  	a, b = order2CmpFunc(data, a, b, swaps, cmp)
   311  	return b
   312  }
   313  
   314  // medianAdjacentCmpFunc finds the median of data[a - 1], data[a], data[a + 1] and stores the index into a.
   315  func medianAdjacentCmpFunc[E any](data []E, a int, swaps *int, cmp func(a, b E) int) int {
   316  	return medianCmpFunc(data, a-1, a, a+1, swaps, cmp)
   317  }
   318  
   319  func reverseRangeCmpFunc[E any](data []E, a, b int, cmp func(a, b E) int) {
   320  	i := a
   321  	j := b - 1
   322  	for i < j {
   323  		data[i], data[j] = data[j], data[i]
   324  		i++
   325  		j--
   326  	}
   327  }
   328  
   329  func swapRangeCmpFunc[E any](data []E, a, b, n int, cmp func(a, b E) int) {
   330  	for i := 0; i < n; i++ {
   331  		data[a+i], data[b+i] = data[b+i], data[a+i]
   332  	}
   333  }
   334  
   335  func stableCmpFunc[E any](data []E, n int, cmp func(a, b E) int) {
   336  	blockSize := 20 // must be > 0
   337  	a, b := 0, blockSize
   338  	for b <= n {
   339  		insertionSortCmpFunc(data, a, b, cmp)
   340  		a = b
   341  		b += blockSize
   342  	}
   343  	insertionSortCmpFunc(data, a, n, cmp)
   344  
   345  	for blockSize < n {
   346  		a, b = 0, 2*blockSize
   347  		for b <= n {
   348  			symMergeCmpFunc(data, a, a+blockSize, b, cmp)
   349  			a = b
   350  			b += 2 * blockSize
   351  		}
   352  		if m := a + blockSize; m < n {
   353  			symMergeCmpFunc(data, a, m, n, cmp)
   354  		}
   355  		blockSize *= 2
   356  	}
   357  }
   358  
   359  // symMergeCmpFunc merges the two sorted subsequences data[a:m] and data[m:b] using
   360  // the SymMerge algorithm from Pok-Son Kim and Arne Kutzner, "Stable Minimum
   361  // Storage Merging by Symmetric Comparisons", in Susanne Albers and Tomasz
   362  // Radzik, editors, Algorithms - ESA 2004, volume 3221 of Lecture Notes in
   363  // Computer Science, pages 714-723. Springer, 2004.
   364  //
   365  // Let M = m-a and N = b-n. Wolog M < N.
   366  // The recursion depth is bound by ceil(log(N+M)).
   367  // The algorithm needs O(M*log(N/M + 1)) calls to data.Less.
   368  // The algorithm needs O((M+N)*log(M)) calls to data.Swap.
   369  //
   370  // The paper gives O((M+N)*log(M)) as the number of assignments assuming a
   371  // rotation algorithm which uses O(M+N+gcd(M+N)) assignments. The argumentation
   372  // in the paper carries through for Swap operations, especially as the block
   373  // swapping rotate uses only O(M+N) Swaps.
   374  //
   375  // symMerge assumes non-degenerate arguments: a < m && m < b.
   376  // Having the caller check this condition eliminates many leaf recursion calls,
   377  // which improves performance.
   378  func symMergeCmpFunc[E any](data []E, a, m, b int, cmp func(a, b E) int) {
   379  	// Avoid unnecessary recursions of symMerge
   380  	// by direct insertion of data[a] into data[m:b]
   381  	// if data[a:m] only contains one element.
   382  	if m-a == 1 {
   383  		// Use binary search to find the lowest index i
   384  		// such that data[i] >= data[a] for m <= i < b.
   385  		// Exit the search loop with i == b in case no such index exists.
   386  		i := m
   387  		j := b
   388  		for i < j {
   389  			h := int(uint(i+j) >> 1)
   390  			if cmp(data[h], data[a]) < 0 {
   391  				i = h + 1
   392  			} else {
   393  				j = h
   394  			}
   395  		}
   396  		// Swap values until data[a] reaches the position before i.
   397  		for k := a; k < i-1; k++ {
   398  			data[k], data[k+1] = data[k+1], data[k]
   399  		}
   400  		return
   401  	}
   402  
   403  	// Avoid unnecessary recursions of symMerge
   404  	// by direct insertion of data[m] into data[a:m]
   405  	// if data[m:b] only contains one element.
   406  	if b-m == 1 {
   407  		// Use binary search to find the lowest index i
   408  		// such that data[i] > data[m] for a <= i < m.
   409  		// Exit the search loop with i == m in case no such index exists.
   410  		i := a
   411  		j := m
   412  		for i < j {
   413  			h := int(uint(i+j) >> 1)
   414  			if !(cmp(data[m], data[h]) < 0) {
   415  				i = h + 1
   416  			} else {
   417  				j = h
   418  			}
   419  		}
   420  		// Swap values until data[m] reaches the position i.
   421  		for k := m; k > i; k-- {
   422  			data[k], data[k-1] = data[k-1], data[k]
   423  		}
   424  		return
   425  	}
   426  
   427  	mid := int(uint(a+b) >> 1)
   428  	n := mid + m
   429  	var start, r int
   430  	if m > mid {
   431  		start = n - b
   432  		r = mid
   433  	} else {
   434  		start = a
   435  		r = m
   436  	}
   437  	p := n - 1
   438  
   439  	for start < r {
   440  		c := int(uint(start+r) >> 1)
   441  		if !(cmp(data[p-c], data[c]) < 0) {
   442  			start = c + 1
   443  		} else {
   444  			r = c
   445  		}
   446  	}
   447  
   448  	end := n - start
   449  	if start < m && m < end {
   450  		rotateCmpFunc(data, start, m, end, cmp)
   451  	}
   452  	if a < start && start < mid {
   453  		symMergeCmpFunc(data, a, start, mid, cmp)
   454  	}
   455  	if mid < end && end < b {
   456  		symMergeCmpFunc(data, mid, end, b, cmp)
   457  	}
   458  }
   459  
   460  // rotateCmpFunc rotates two consecutive blocks u = data[a:m] and v = data[m:b] in data:
   461  // Data of the form 'x u v y' is changed to 'x v u y'.
   462  // rotate performs at most b-a many calls to data.Swap,
   463  // and it assumes non-degenerate arguments: a < m && m < b.
   464  func rotateCmpFunc[E any](data []E, a, m, b int, cmp func(a, b E) int) {
   465  	i := m - a
   466  	j := b - m
   467  
   468  	for i != j {
   469  		if i > j {
   470  			swapRangeCmpFunc(data, m-i, m, j, cmp)
   471  			i -= j
   472  		} else {
   473  			swapRangeCmpFunc(data, m-i, m+j-i, i, cmp)
   474  			j -= i
   475  		}
   476  	}
   477  	// i == j
   478  	swapRangeCmpFunc(data, m-i, m, i, cmp)
   479  }