]> Cypherpunks repositories - gostls13.git/commitdiff
cmd/compile: schedule values with no in-block uses later
authorKeith Randall <khr@golang.org>
Wed, 1 Feb 2023 16:31:03 +0000 (08:31 -0800)
committerKeith Randall <khr@google.com>
Wed, 1 Feb 2023 18:41:07 +0000 (18:41 +0000)
When scheduling a block, deprioritize values whose results aren't used
until subsequent blocks.

For #58166, this has the effect of pushing the induction variable increment
to the end of the block, past all the other uses of the pre-incremented value.

Do this only with optimizations on. Debuggers have a preference for values
in source code order, which this CL can degrade.

Fixes #58166
Fixes #57976

Change-Id: I40d5885c661b142443c6d4702294c8abe8026c4f
Reviewed-on: https://go-review.googlesource.com/c/go/+/463751
Run-TryBot: Keith Randall <khr@golang.org>
Reviewed-by: David Chase <drchase@google.com>
Reviewed-by: Keith Randall <khr@google.com>
TryBot-Result: Gopher Robot <gobot@golang.org>

src/cmd/compile/internal/ssa/schedule.go
test/codegen/issue58166.go [new file with mode: 0644]

index 4cd60d714c9ed1d10d4505ab35288901ea8f31f1..c291e5c13f0079955693f09a61594a8b0b86be30 100644 (file)
@@ -25,8 +25,9 @@ const (
 )
 
 type ValHeap struct {
-       a     []*Value
-       score []int8
+       a           []*Value
+       score       []int8
+       inBlockUses []bool
 }
 
 func (h ValHeap) Len() int      { return len(h.a) }
@@ -56,6 +57,12 @@ func (h ValHeap) Less(i, j int) bool {
        // Note: only scores are required for correct scheduling.
        // Everything else is just heuristics.
 
+       ix := h.inBlockUses[x.ID]
+       iy := h.inBlockUses[y.ID]
+       if ix != iy {
+               return ix // values with in-block uses come earlier
+       }
+
        if x.Pos != y.Pos { // Favor in-order line stepping
                if x.Block == x.Block.Func.Entry && x.Pos.IsStmt() != y.Pos.IsStmt() {
                        // In the entry block, put statement-marked instructions earlier.
@@ -110,6 +117,23 @@ func schedule(f *Func) {
        nextMem := f.Cache.allocValueSlice(f.NumValues())
        defer f.Cache.freeValueSlice(nextMem)
 
+       // inBlockUses records whether a value is used in the block
+       // in which it lives. (block control values don't count as uses.)
+       inBlockUses := f.Cache.allocBoolSlice(f.NumValues())
+       defer f.Cache.freeBoolSlice(inBlockUses)
+       if f.Config.optimize {
+               for _, b := range f.Blocks {
+                       for _, v := range b.Values {
+                               for _, a := range v.Args {
+                                       if a.Block == b {
+                                               inBlockUses[a.ID] = true
+                                       }
+                               }
+                       }
+               }
+       }
+       priq.inBlockUses = inBlockUses
+
        for _, b := range f.Blocks {
                // Compute score. Larger numbers are scheduled closer to the end of the block.
                for _, v := range b.Values {
diff --git a/test/codegen/issue58166.go b/test/codegen/issue58166.go
new file mode 100644 (file)
index 0000000..8be5aac
--- /dev/null
@@ -0,0 +1,23 @@
+// asmcheck
+
+// Copyright 2023 The Go Authors. All rights reserved.
+// Use of this source code is governed by a BSD-style
+// license that can be found in the LICENSE file.
+
+package p
+
+func dgemmSerialNotNot(m, n, k int, a []float64, lda int, b []float64, ldb int, c []float64, ldc int, alpha float64) {
+       for i := 0; i < m; i++ {
+               ctmp := c[i*ldc : i*ldc+n]
+               for l, v := range a[i*lda : i*lda+k] {
+                       tmp := alpha * v
+                       if tmp != 0 {
+                               x := b[l*ldb : l*ldb+n]
+                               // amd64:"INCQ"
+                               for i, v := range x {
+                                       ctmp[i] += tmp * v
+                               }
+                       }
+               }
+       }
+}