cmd/compile: optimize liveness in stackalloc
The stackalloc code needs to run a liveness pass to build the
interference graph between stack slots. Because the values that we need
liveness over are so sparse, we can optimize the analysis by using a
path exploration algorithm rather than an iterative dataflow one.
In local testing, this cuts 74.05 ms of CPU time off a build of cmd/compile.
diff --git a/src/cmd/compile/internal/ssa/stackalloc.go b/src/cmd/compile/internal/ssa/stackalloc.go
index 11ffe5b..eabdba3 100644
--- a/src/cmd/compile/internal/ssa/stackalloc.go
+++ b/src/cmd/compile/internal/ssa/stackalloc.go
@@ -56,10 +56,36 @@
}
type stackValState struct {
- typ *types.Type
- spill *Value
- needSlot bool
- isArg bool
+ typ *types.Type
+ spill *Value
+ needSlot bool
+ isArg bool
+ defBlock ID
+ useBlocks []stackUseBlock
+}
+
+// addUseBlock adds a block to the set of blocks that use this value.
+// The no-duplicates property of the set is only loosely enforced: we
+// append a block only if it differs from the last block appended.
+// Because values are added block by block (barring phi-nodes), this
+// approximates a set. Duplicates in useBlocks are harmless; the
+// liveness analysis will simply run right through them again.
+func (sv *stackValState) addUseBlock(b *Block, liveout bool) {
+ entry := stackUseBlock{
+ b: b,
+ liveout: liveout,
+ }
+ if sv.useBlocks == nil || sv.useBlocks[len(sv.useBlocks)-1] != entry {
+ sv.useBlocks = append(sv.useBlocks, stackUseBlock{
+ b: b,
+ liveout: liveout,
+ })
+ }
+}
+
+type stackUseBlock struct {
+ b *Block
+ liveout bool
}
// stackalloc allocates storage in the stack frame for
@@ -99,6 +125,7 @@
s.values[v.ID].typ = v.Type
s.values[v.ID].needSlot = !v.Type.IsMemory() && !v.Type.IsVoid() && !v.Type.IsFlags() && f.getHome(v.ID) == nil && !v.rematerializeable() && !v.OnWasmStack
s.values[v.ID].isArg = hasAnyArgOp(v)
+ s.values[v.ID].defBlock = b.ID
if f.pass.debug > stackDebug && s.values[v.ID].needSlot {
fmt.Printf("%s needs a stack slot\n", v)
}
@@ -291,80 +318,83 @@
// computeLive computes a map from block ID to a list of
// stack-slot-needing value IDs live at the end of that block.
-// TODO: this could be quadratic if lots of variables are live across lots of
-// basic blocks. Figure out a way to make this function (or, more precisely, the user
-// of this function) require only linear size & time.
+//
+// Because values using stack slots are few and far in between
+// (compared to the set of all values), we use a path exploration
+// algorithm to calculate liveness here.
func (s *stackAllocState) computeLive(spillLive [][]ID) {
- s.live = make([][]ID, s.f.NumBlocks())
- var phis []*Value
- live := s.f.newSparseSet(s.f.NumValues())
- defer s.f.retSparseSet(live)
- t := s.f.newSparseSet(s.f.NumValues())
- defer s.f.retSparseSet(t)
-
- // Instead of iterating over f.Blocks, iterate over their postordering.
- // Liveness information flows backward, so starting at the end
- // increases the probability that we will stabilize quickly.
- po := s.f.postorder()
- for {
- changed := false
- for _, b := range po {
- // Start with known live values at the end of the block
- live.clear()
- live.addAll(s.live[b.ID])
-
- // Propagate backwards to the start of the block
- phis = phis[:0]
- for i := len(b.Values) - 1; i >= 0; i-- {
- v := b.Values[i]
- live.remove(v.ID)
- if v.Op == OpPhi {
- // Save phi for later.
- // Note: its args might need a stack slot even though
- // the phi itself doesn't. So don't use needSlot.
- if !v.Type.IsMemory() && !v.Type.IsVoid() {
- phis = append(phis, v)
- }
- continue
- }
- for _, a := range v.Args {
- if s.values[a.ID].needSlot {
- live.add(a.ID)
- }
- }
- }
-
- // for each predecessor of b, expand its list of live-at-end values
- // invariant: s contains the values live at the start of b (excluding phi inputs)
- for i, e := range b.Preds {
- p := e.b
- t.clear()
- t.addAll(s.live[p.ID])
- t.addAll(live.contents())
- t.addAll(spillLive[p.ID])
- for _, v := range phis {
- a := v.Args[i]
- if s.values[a.ID].needSlot {
- t.add(a.ID)
- }
- if spill := s.values[a.ID].spill; spill != nil {
- //TODO: remove? Subsumed by SpillUse?
- t.add(spill.ID)
- }
- }
- if t.size() == len(s.live[p.ID]) {
- continue
- }
- // grow p's live set
- s.live[p.ID] = append(s.live[p.ID][:0], t.contents()...)
- changed = true
- }
+ f := s.f
+ for _, b := range f.Blocks {
+ for _, spillvid := range spillLive[b.ID] {
+ val := &s.values[spillvid]
+ val.addUseBlock(b, true)
}
-
- if !changed {
- break
+ for _, v := range b.Values {
+ for i, a := range v.Args {
+ val := &s.values[a.ID]
+ useBlock := b
+ forceLiveout := false
+ if v.Op == OpPhi {
+ useBlock = b.Preds[i].b
+ forceLiveout = true
+ if spill := val.spill; spill != nil {
+ s.values[spill.ID].addUseBlock(useBlock, true)
+ }
+ }
+ if !val.needSlot {
+ continue
+ }
+ val.addUseBlock(useBlock, forceLiveout)
+ }
}
}
+
+ s.live = make([][]ID, f.NumBlocks())
+ push := func(bid, vid ID) {
+ l := s.live[bid]
+ if l == nil || l[len(l)-1] != vid {
+ l = append(l, vid)
+ }
+ s.live[bid] = l
+ }
+ // TODO: If we can help along the interference graph by calculating livein sets,
+ // we can do so trivially by turning this sparse set into an array of arrays
+ // and checking the top for the current value instead of inclusion in the sparse set.
+ seen := f.newSparseSet(f.NumBlocks())
+ defer f.retSparseSet(seen)
+ // Instead of pruning out duplicate blocks when we build the useBlocks
+ // or when we add them to the queue, rely on the seen set to stop considering
+ // them. This is slightly faster than building the work queues as sets.
+ //
+ // However, this means that the queue can grow larger than the number of blocks.
+ // hence, we cannot use allocBlockSlice.
+ bqueue := make([]*Block, 0, f.NumBlocks())
+ for vid, v := range s.values {
+ if !v.needSlot {
+ continue
+ }
+ seen.clear()
+ bqueue = bqueue[:0]
+ for _, b := range v.useBlocks {
+ if b.liveout {
+ push(b.b.ID, ID(vid))
+ }
+ bqueue = append(bqueue, b.b)
+ }
+ for len(bqueue) > 0 {
+ work := bqueue[len(bqueue)-1]
+ bqueue = bqueue[:len(bqueue)-1]
+ if seen.contains(work.ID) || work.ID == v.defBlock {
+ continue
+ }
+ seen.add(work.ID)
+ for _, e := range work.Preds {
+ push(e.b.ID, ID(vid))
+ bqueue = append(bqueue, e.b)
+ }
+ }
+ }
+
if s.f.pass.debug > stackDebug {
for _, b := range s.f.Blocks {
fmt.Printf("stacklive %s %v\n", b, s.live[b.ID])
| Inspect html for hidden footers to help with email filtering. To unsubscribe visit settings. |
| Commit-Queue | +1 |
| Inspect html for hidden footers to help with email filtering. To unsubscribe visit settings. |
| Inspect html for hidden footers to help with email filtering. To unsubscribe visit settings. |
// The set property is loosely enforced. We append a block if the"The set property" you mean here is the no duplicates property, you should make that clear.
// Because values using stack slots are few and far inbetweenThis comment should probably go inside the body, as it relates to the implementation (not needed by callers).
//TODO: remove? Subsumed by SpillUse?Keep this TODO?
s.live[bid] = lThis can go inside the `if`.
push(b.b.ID, ID(vid))This case means we might have duplicates in s.live, right?
That's new behavior, might be worth checking that that is still ok. (It probably is, we just call `addAll` on it?)
| Inspect html for hidden footers to help with email filtering. To unsubscribe visit settings. |
| Inspect html for hidden footers to help with email filtering. To unsubscribe visit settings. |
| Commit-Queue | +1 |
// The set property is loosely enforced. We append a block if the"The set property" you mean here is the no duplicates property, you should make that clear.
Wrote a better comment 😊
// Because values using stack slots are few and far inbetweenThis comment should probably go inside the body, as it relates to the implementation (not needed by callers).
Done
//TODO: remove? Subsumed by SpillUse?Daniel MorsingKeep this TODO?
Done
This can go inside the `if`.
Done
This case means we might have duplicates in s.live, right?
That's new behavior, might be worth checking that that is still ok. (It probably is, we just call `addAll` on it?)
That's the neat thing about doing this value by value. Because we are iterating over the values in the outer loop, we either find the top of the stack for a given block to already have the value (the `l[len(l)-1] != vid` check in `push`) or we see that it's missing and push it.
| Inspect html for hidden footers to help with email filtering. To unsubscribe visit settings. |
| Auto-Submit | +1 |
| Code-Review | +2 |
push(b.b.ID, ID(vid))Daniel MorsingThis case means we might have duplicates in s.live, right?
That's new behavior, might be worth checking that that is still ok. (It probably is, we just call `addAll` on it?)
That's the neat thing about doing this value by value. Because we are iterating over the values in the outer loop, we either find the top of the stack for a given block to already have the value (the `l[len(l)-1] != vid` check in `push`) or we see that it's missing and push it.
I see, there may be duplicate blocks in the queue, but we never get duplicate values in any block's list.
| Inspect html for hidden footers to help with email filtering. To unsubscribe visit settings. |
| Inspect html for hidden footers to help with email filtering. To unsubscribe visit settings. |
| Code-Review | +1 |
| Inspect html for hidden footers to help with email filtering. To unsubscribe visit settings. |
cmd/compile: optimize liveness in stackalloc
The stackalloc code needs to run a liveness pass to build the
interference graph between stack slots. Because the values that we need
liveness over are so sparse, we can optimize the analysis by using a path
exploration algorithm rather than an iterative dataflow one.
In local testing, this cuts 74.05 ms of CPU time off a build of cmd/compile.
| Inspect html for hidden footers to help with email filtering. To unsubscribe visit settings. |