Skip to content

Commit 22a2bdf

Browse files
committedOct 3, 2016
sort: add Slice, SliceStable, and SliceIsSorted
Add helpers for sorting slices. Slice sorts slices: sort.Slice(s, func(i, j int) bool { if s[i].Foo != s[j].Foo { return s[i].Foo < s[j].Foo } return s[i].Bar < s[j].Bar }) SliceStable is the same, but does a stable sort. SliceIsSorted reports whether a slice is already sorted. Fixes #16721 Change-Id: I346530af1c5dee148ea9be85946fe08f23ae53e7 Reviewed-on: https://go-review.googlesource.com/27321 Run-TryBot: Brad Fitzpatrick <[email protected]> TryBot-Result: Gobot Gobot <[email protected]> Reviewed-by: Russ Cox <[email protected]>
1 parent 003a598 commit 22a2bdf

File tree

6 files changed

+518
-25
lines changed

6 files changed

+518
-25
lines changed
 

‎src/cmd/dist/deps.go

+6-6
Original file line numberDiff line numberDiff line change
@@ -7,7 +7,7 @@ var builddeps = map[string][]string{
77
"bytes": {"errors", "internal/race", "io", "runtime", "runtime/internal/atomic", "runtime/internal/sys", "sync", "sync/atomic", "unicode", "unicode/utf8"},
88
"compress/flate": {"bufio", "bytes", "errors", "fmt", "internal/race", "internal/syscall/windows", "internal/syscall/windows/registry", "internal/syscall/windows/sysdll", "io", "math", "os", "reflect", "runtime", "runtime/internal/atomic", "runtime/internal/sys", "sort", "strconv", "sync", "sync/atomic", "syscall", "time", "unicode", "unicode/utf16", "unicode/utf8"},
99
"compress/zlib": {"bufio", "bytes", "compress/flate", "errors", "fmt", "hash", "hash/adler32", "internal/race", "internal/syscall/windows", "internal/syscall/windows/registry", "internal/syscall/windows/sysdll", "io", "math", "os", "reflect", "runtime", "runtime/internal/atomic", "runtime/internal/sys", "sort", "strconv", "sync", "sync/atomic", "syscall", "time", "unicode", "unicode/utf16", "unicode/utf8"},
10-
"container/heap": {"runtime", "runtime/internal/atomic", "runtime/internal/sys", "sort"},
10+
"container/heap": {"errors", "internal/race", "math", "reflect", "runtime", "runtime/internal/atomic", "runtime/internal/sys", "sort", "strconv", "sync", "sync/atomic", "unicode/utf8"},
1111
"context": {"errors", "fmt", "internal/race", "internal/syscall/windows", "internal/syscall/windows/registry", "internal/syscall/windows/sysdll", "io", "math", "os", "reflect", "runtime", "runtime/internal/atomic", "runtime/internal/sys", "strconv", "sync", "sync/atomic", "syscall", "time", "unicode/utf16", "unicode/utf8"},
1212
"crypto": {"errors", "hash", "internal/race", "io", "math", "runtime", "runtime/internal/atomic", "runtime/internal/sys", "strconv", "sync", "sync/atomic", "unicode/utf8"},
1313
"crypto/sha1": {"crypto", "errors", "hash", "internal/race", "io", "math", "runtime", "runtime/internal/atomic", "runtime/internal/sys", "strconv", "sync", "sync/atomic", "unicode/utf8"},
@@ -35,22 +35,22 @@ var builddeps = map[string][]string{
3535
"internal/syscall/windows/registry": {"errors", "internal/race", "internal/syscall/windows/sysdll", "io", "runtime", "runtime/internal/atomic", "runtime/internal/sys", "sync", "sync/atomic", "syscall", "unicode/utf16"},
3636
"internal/syscall/windows/sysdll": {"runtime", "runtime/internal/atomic", "runtime/internal/sys"},
3737
"io": {"errors", "internal/race", "runtime", "runtime/internal/atomic", "runtime/internal/sys", "sync", "sync/atomic"},
38-
"io/ioutil": {"bytes", "errors", "internal/race", "internal/syscall/windows", "internal/syscall/windows/registry", "internal/syscall/windows/sysdll", "io", "math", "os", "path/filepath", "runtime", "runtime/internal/atomic", "runtime/internal/sys", "sort", "strconv", "strings", "sync", "sync/atomic", "syscall", "time", "unicode", "unicode/utf16", "unicode/utf8"},
38+
"io/ioutil": {"bytes", "errors", "internal/race", "internal/syscall/windows", "internal/syscall/windows/registry", "internal/syscall/windows/sysdll", "io", "math", "os", "path/filepath", "reflect", "runtime", "runtime/internal/atomic", "runtime/internal/sys", "sort", "strconv", "strings", "sync", "sync/atomic", "syscall", "time", "unicode", "unicode/utf16", "unicode/utf8"},
3939
"log": {"errors", "fmt", "internal/race", "internal/syscall/windows", "internal/syscall/windows/registry", "internal/syscall/windows/sysdll", "io", "math", "os", "reflect", "runtime", "runtime/internal/atomic", "runtime/internal/sys", "strconv", "sync", "sync/atomic", "syscall", "time", "unicode/utf16", "unicode/utf8"},
4040
"math": {"runtime", "runtime/internal/atomic", "runtime/internal/sys"},
4141
"net/url": {"bytes", "errors", "fmt", "internal/race", "internal/syscall/windows", "internal/syscall/windows/registry", "internal/syscall/windows/sysdll", "io", "math", "os", "reflect", "runtime", "runtime/internal/atomic", "runtime/internal/sys", "sort", "strconv", "strings", "sync", "sync/atomic", "syscall", "time", "unicode", "unicode/utf16", "unicode/utf8"},
4242
"os": {"errors", "internal/race", "internal/syscall/windows", "internal/syscall/windows/registry", "internal/syscall/windows/sysdll", "io", "runtime", "runtime/internal/atomic", "runtime/internal/sys", "sync", "sync/atomic", "syscall", "time", "unicode/utf16", "unicode/utf8"},
4343
"os/exec": {"bytes", "context", "errors", "fmt", "internal/race", "internal/syscall/windows", "internal/syscall/windows/registry", "internal/syscall/windows/sysdll", "io", "math", "os", "path/filepath", "reflect", "runtime", "runtime/internal/atomic", "runtime/internal/sys", "sort", "strconv", "strings", "sync", "sync/atomic", "syscall", "time", "unicode", "unicode/utf16", "unicode/utf8"},
4444
"os/signal": {"errors", "internal/race", "internal/syscall/windows", "internal/syscall/windows/registry", "internal/syscall/windows/sysdll", "io", "os", "runtime", "runtime/internal/atomic", "runtime/internal/sys", "sync", "sync/atomic", "syscall", "time", "unicode/utf16", "unicode/utf8"},
4545
"path": {"errors", "internal/race", "io", "runtime", "runtime/internal/atomic", "runtime/internal/sys", "strings", "sync", "sync/atomic", "unicode", "unicode/utf8"},
46-
"path/filepath": {"errors", "internal/race", "internal/syscall/windows", "internal/syscall/windows/registry", "internal/syscall/windows/sysdll", "io", "os", "runtime", "runtime/internal/atomic", "runtime/internal/sys", "sort", "strings", "sync", "sync/atomic", "syscall", "time", "unicode", "unicode/utf16", "unicode/utf8"},
46+
"path/filepath": {"errors", "internal/race", "internal/syscall/windows", "internal/syscall/windows/registry", "internal/syscall/windows/sysdll", "io", "math", "os", "reflect", "runtime", "runtime/internal/atomic", "runtime/internal/sys", "sort", "strconv", "strings", "sync", "sync/atomic", "syscall", "time", "unicode", "unicode/utf16", "unicode/utf8"},
4747
"reflect": {"errors", "internal/race", "math", "runtime", "runtime/internal/atomic", "runtime/internal/sys", "strconv", "sync", "sync/atomic", "unicode/utf8"},
48-
"regexp": {"bytes", "errors", "internal/race", "io", "math", "regexp/syntax", "runtime", "runtime/internal/atomic", "runtime/internal/sys", "sort", "strconv", "strings", "sync", "sync/atomic", "unicode", "unicode/utf8"},
49-
"regexp/syntax": {"bytes", "errors", "internal/race", "io", "math", "runtime", "runtime/internal/atomic", "runtime/internal/sys", "sort", "strconv", "strings", "sync", "sync/atomic", "unicode", "unicode/utf8"},
48+
"regexp": {"bytes", "errors", "internal/race", "io", "math", "reflect", "regexp/syntax", "runtime", "runtime/internal/atomic", "runtime/internal/sys", "sort", "strconv", "strings", "sync", "sync/atomic", "unicode", "unicode/utf8"},
49+
"regexp/syntax": {"bytes", "errors", "internal/race", "io", "math", "reflect", "runtime", "runtime/internal/atomic", "runtime/internal/sys", "sort", "strconv", "strings", "sync", "sync/atomic", "unicode", "unicode/utf8"},
5050
"runtime": {"runtime/internal/atomic", "runtime/internal/sys"},
5151
"runtime/internal/atomic": {"runtime/internal/sys"},
5252
"runtime/internal/sys": {},
53-
"sort": {"runtime", "runtime/internal/atomic", "runtime/internal/sys"},
53+
"sort": {"errors", "internal/race", "math", "reflect", "runtime", "runtime/internal/atomic", "runtime/internal/sys", "strconv", "sync", "sync/atomic", "unicode/utf8"},
5454
"strconv": {"errors", "math", "runtime", "runtime/internal/atomic", "runtime/internal/sys", "unicode/utf8"},
5555
"strings": {"errors", "internal/race", "io", "runtime", "runtime/internal/atomic", "runtime/internal/sys", "sync", "sync/atomic", "unicode", "unicode/utf8"},
5656
"sync": {"internal/race", "runtime", "runtime/internal/atomic", "runtime/internal/sys", "sync/atomic"},

‎src/go/build/deps_test.go

+1-1
Original file line numberDiff line numberDiff line change
@@ -59,7 +59,6 @@ var pkgDeps = map[string][]string{
5959
"math": {"unsafe"},
6060
"math/cmplx": {"math"},
6161
"math/rand": {"L0", "math"},
62-
"sort": {},
6362
"strconv": {"L0", "unicode/utf8", "math"},
6463
"unicode/utf16": {},
6564
"unicode/utf8": {},
@@ -109,6 +108,7 @@ var pkgDeps = map[string][]string{
109108
"image/color": {"L2"}, // interfaces
110109
"image/color/palette": {"L2", "image/color"},
111110
"reflect": {"L2"},
111+
"sort": {"reflect"},
112112

113113
"L3": {
114114
"L2",

‎src/sort/genzfunc.go

+122
Original file line numberDiff line numberDiff line change
@@ -0,0 +1,122 @@
1+
// Copyright 2016 The Go Authors. All rights reserved.
2+
// Use of this source code is governed by a BSD-style
3+
// license that can be found in the LICENSE file.
4+
5+
// +build ignore
6+
7+
// This program is run via "go generate" (via a directive in sort.go)
8+
// to generate zfuncversion.go.
9+
//
10+
// It copies sort.go to zfuncversion.go, only retaining funcs which
11+
// take a "data Interface" parameter, and renaming each to have a
12+
// "_func" suffix and taking a "data lessSwap" instead. It then rewrites
13+
// each internal function call to the appropriate _func variants.
14+
15+
package main
16+
17+
import (
18+
"bytes"
19+
"go/ast"
20+
"go/format"
21+
"go/parser"
22+
"go/token"
23+
"io/ioutil"
24+
"log"
25+
"regexp"
26+
)
27+
28+
var fset = token.NewFileSet()
29+
30+
func main() {
31+
af, err := parser.ParseFile(fset, "sort.go", nil, 0)
32+
if err != nil {
33+
log.Fatal(err)
34+
}
35+
af.Doc = nil
36+
af.Imports = nil
37+
af.Comments = nil
38+
39+
var newDecl []ast.Decl
40+
for _, d := range af.Decls {
41+
fd, ok := d.(*ast.FuncDecl)
42+
if !ok {
43+
continue
44+
}
45+
if fd.Recv != nil || fd.Name.IsExported() {
46+
continue
47+
}
48+
typ := fd.Type
49+
if len(typ.Params.List) < 1 {
50+
continue
51+
}
52+
arg0 := typ.Params.List[0]
53+
arg0Name := arg0.Names[0].Name
54+
arg0Type := arg0.Type.(*ast.Ident)
55+
if arg0Name != "data" || arg0Type.Name != "Interface" {
56+
continue
57+
}
58+
arg0Type.Name = "lessSwap"
59+
60+
newDecl = append(newDecl, fd)
61+
}
62+
af.Decls = newDecl
63+
ast.Walk(visitFunc(rewriteCalls), af)
64+
65+
var out bytes.Buffer
66+
if err := format.Node(&out, fset, af); err != nil {
67+
log.Fatalf("format.Node: %v", err)
68+
}
69+
70+
// Get rid of blank lines after removal of comments.
71+
src := regexp.MustCompile(`\n{2,}`).ReplaceAll(out.Bytes(), []byte("\n"))
72+
73+
// Add comments to each func, for the lost reader.
74+
// This is so much easier than adding comments via the AST
75+
// and trying to get position info correct.
76+
src = regexp.MustCompile(`(?m)^func (\w+)`).ReplaceAll(src, []byte("\n// Auto-generated variant of sort.go:$1\nfunc ${1}_func"))
77+
78+
// Final gofmt.
79+
src, err = format.Source(src)
80+
if err != nil {
81+
log.Fatalf("format.Source: %v on\n%s", err, src)
82+
}
83+
84+
out.Reset()
85+
out.WriteString(`// DO NOT EDIT; AUTO-GENERATED from sort.go using genzfunc.go
86+
87+
// Copyright 2016 The Go Authors. All rights reserved.
88+
// Use of this source code is governed by a BSD-style
89+
// license that can be found in the LICENSE file.
90+
91+
`)
92+
out.Write(src)
93+
94+
const target = "zfuncversion.go"
95+
if err := ioutil.WriteFile(target, out.Bytes(), 0644); err != nil {
96+
log.Fatal(err)
97+
}
98+
}
99+
100+
type visitFunc func(ast.Node) ast.Visitor
101+
102+
func (f visitFunc) Visit(n ast.Node) ast.Visitor { return f(n) }
103+
104+
func rewriteCalls(n ast.Node) ast.Visitor {
105+
ce, ok := n.(*ast.CallExpr)
106+
if ok {
107+
rewriteCall(ce)
108+
}
109+
return visitFunc(rewriteCalls)
110+
}
111+
112+
func rewriteCall(ce *ast.CallExpr) {
113+
ident, ok := ce.Fun.(*ast.Ident)
114+
if !ok {
115+
// e.g. skip SelectorExpr (data.Less(..) calls)
116+
return
117+
}
118+
if len(ce.Args) < 1 {
119+
return
120+
}
121+
ident.Name += "_func"
122+
}

‎src/sort/sort.go

+62-6
Original file line numberDiff line numberDiff line change
@@ -2,10 +2,14 @@
22
// Use of this source code is governed by a BSD-style
33
// license that can be found in the LICENSE file.
44

5+
//go:generate go run genzfunc.go
6+
57
// Package sort provides primitives for sorting slices and user-defined
68
// collections.
79
package sort
810

11+
import "reflect"
12+
913
// A type, typically a collection, that satisfies sort.Interface can be
1014
// sorted by the routines in this package. The methods require that the
1115
// elements of the collection be enumerated by an integer index.
@@ -212,14 +216,63 @@ func quickSort(data Interface, a, b, maxDepth int) {
212216
// It makes one call to data.Len to determine n, and O(n*log(n)) calls to
213217
// data.Less and data.Swap. The sort is not guaranteed to be stable.
214218
func Sort(data Interface) {
215-
// Switch to heapsort if depth of 2*ceil(lg(n+1)) is reached.
216219
n := data.Len()
217-
maxDepth := 0
220+
quickSort(data, 0, n, maxDepth(n))
221+
}
222+
223+
// maxDepth returns a threshold at which quicksort should switch
224+
// to heapsort. It returns 2*ceil(lg(n+1)).
225+
func maxDepth(n int) int {
226+
var depth int
218227
for i := n; i > 0; i >>= 1 {
219-
maxDepth++
228+
depth++
229+
}
230+
return depth * 2
231+
}
232+
233+
// lessSwap is a pair of Less and Swap function for use with the
234+
// auto-generated func-optimized variant of sort.go in
235+
// zfuncversion.go.
236+
type lessSwap struct {
237+
Less func(i, j int) bool
238+
Swap func(i, j int)
239+
}
240+
241+
// Slice sorts the provided slice given the provided less function.
242+
//
243+
// The sort is not guaranteed to be stable. For a stable sort, use
244+
// SliceStable.
245+
//
246+
// The function panics if the provided interface is not a slice.
247+
func Slice(slice interface{}, less func(i, j int) bool) {
248+
rv := reflect.ValueOf(slice)
249+
swap := reflect.Swapper(slice)
250+
length := rv.Len()
251+
quickSort_func(lessSwap{less, swap}, 0, length, maxDepth(length))
252+
}
253+
254+
// SliceStable sorts the provided slice given the provided less
255+
// function while keeping the original order of equal elements.
256+
//
257+
// The function panics if the provided interface is not a slice.
258+
func SliceStable(slice interface{}, less func(i, j int) bool) {
259+
rv := reflect.ValueOf(slice)
260+
swap := reflect.Swapper(slice)
261+
stable_func(lessSwap{less, swap}, rv.Len())
262+
}
263+
264+
// SliceIsSorted tests whether a slice is sorted.
265+
//
266+
// The function panics if the provided interface is not a slice.
267+
func SliceIsSorted(slice interface{}, less func(i, j int) bool) bool {
268+
rv := reflect.ValueOf(slice)
269+
n := rv.Len()
270+
for i := n - 1; i > 0; i-- {
271+
if less(i, i-1) {
272+
return false
273+
}
220274
}
221-
maxDepth *= 2
222-
quickSort(data, 0, n, maxDepth)
275+
return true
223276
}
224277

225278
type reverse struct {
@@ -337,7 +390,10 @@ func StringsAreSorted(a []string) bool { return IsSorted(StringSlice(a)) }
337390
// It makes one call to data.Len to determine n, O(n*log(n)) calls to
338391
// data.Less and O(n*log(n)*log(n)) calls to data.Swap.
339392
func Stable(data Interface) {
340-
n := data.Len()
393+
stable(data, data.Len())
394+
}
395+
396+
func stable(data Interface, n int) {
341397
blockSize := 20 // must be > 0
342398
a, b := 0, blockSize
343399
for b <= n {

‎src/sort/sort_test.go

+62-12
Original file line numberDiff line numberDiff line change
@@ -76,6 +76,17 @@ func TestStrings(t *testing.T) {
7676
}
7777
}
7878

79+
func TestSlice(t *testing.T) {
80+
data := strings
81+
Slice(data[:], func(i, j int) bool {
82+
return data[i] < data[j]
83+
})
84+
if !SliceIsSorted(data[:], func(i, j int) bool { return data[i] < data[j] }) {
85+
t.Errorf("sorted %v", strings)
86+
t.Errorf(" got %v", data)
87+
}
88+
}
89+
7990
func TestSortLarge_Random(t *testing.T) {
8091
n := 1000000
8192
if testing.Short() {
@@ -150,24 +161,46 @@ func TestNonDeterministicComparison(t *testing.T) {
150161

151162
func BenchmarkSortString1K(b *testing.B) {
152163
b.StopTimer()
164+
unsorted := make([]string, 1<<10)
165+
for i := range unsorted {
166+
unsorted[i] = strconv.Itoa(i ^ 0x2cc)
167+
}
168+
data := make([]string, len(unsorted))
169+
153170
for i := 0; i < b.N; i++ {
154-
data := make([]string, 1<<10)
155-
for i := 0; i < len(data); i++ {
156-
data[i] = strconv.Itoa(i ^ 0x2cc)
157-
}
171+
copy(data, unsorted)
158172
b.StartTimer()
159173
Strings(data)
160174
b.StopTimer()
161175
}
162176
}
163177

178+
func BenchmarkSortString1K_Slice(b *testing.B) {
179+
b.StopTimer()
180+
unsorted := make([]string, 1<<10)
181+
for i := range unsorted {
182+
unsorted[i] = strconv.Itoa(i ^ 0x2cc)
183+
}
184+
data := make([]string, len(unsorted))
185+
186+
for i := 0; i < b.N; i++ {
187+
copy(data, unsorted)
188+
b.StartTimer()
189+
Slice(data, func(i, j int) bool { return data[i] < data[j] })
190+
b.StopTimer()
191+
}
192+
}
193+
164194
func BenchmarkStableString1K(b *testing.B) {
165195
b.StopTimer()
196+
unsorted := make([]string, 1<<10)
197+
for i := 0; i < len(data); i++ {
198+
unsorted[i] = strconv.Itoa(i ^ 0x2cc)
199+
}
200+
data := make([]string, len(unsorted))
201+
166202
for i := 0; i < b.N; i++ {
167-
data := make([]string, 1<<10)
168-
for i := 0; i < len(data); i++ {
169-
data[i] = strconv.Itoa(i ^ 0x2cc)
170-
}
203+
copy(data, unsorted)
171204
b.StartTimer()
172205
Stable(StringSlice(data))
173206
b.StopTimer()
@@ -189,17 +222,34 @@ func BenchmarkSortInt1K(b *testing.B) {
189222

190223
func BenchmarkStableInt1K(b *testing.B) {
191224
b.StopTimer()
225+
unsorted := make([]int, 1<<10)
226+
for i := range unsorted {
227+
unsorted[i] = i ^ 0x2cc
228+
}
229+
data := make([]int, len(unsorted))
192230
for i := 0; i < b.N; i++ {
193-
data := make([]int, 1<<10)
194-
for i := 0; i < len(data); i++ {
195-
data[i] = i ^ 0x2cc
196-
}
231+
copy(data, unsorted)
197232
b.StartTimer()
198233
Stable(IntSlice(data))
199234
b.StopTimer()
200235
}
201236
}
202237

238+
func BenchmarkStableInt1K_Slice(b *testing.B) {
239+
b.StopTimer()
240+
unsorted := make([]int, 1<<10)
241+
for i := range unsorted {
242+
unsorted[i] = i ^ 0x2cc
243+
}
244+
data := make([]int, len(unsorted))
245+
for i := 0; i < b.N; i++ {
246+
copy(data, unsorted)
247+
b.StartTimer()
248+
Slice(data, func(i, j int) bool { return data[i] < data[j] })
249+
b.StopTimer()
250+
}
251+
}
252+
203253
func BenchmarkSortInt64K(b *testing.B) {
204254
b.StopTimer()
205255
for i := 0; i < b.N; i++ {

0 commit comments

Comments
 (0)