tetratelabs · evacchi · Nov 28, 2023 · Nov 28, 2023 · Nov 28, 2023 · Nov 28, 2023
@@ -1732,27 +1732,30 @@ func (i *Instruction) InsertlaneData() (x, y Value, index byte, l VecLane) {
 }
 
 // AsFadd initializes this instruction as a floating-point addition instruction with OpcodeFadd.
-func (i *Instruction) AsFadd(x, y Value) {
+func (i *Instruction) AsFadd(x, y Value) *Instruction {
 	i.opcode = OpcodeFadd
 	i.v = x
 	i.v2 = y
 	i.typ = x.Type()
+	return i
 }
 
 // AsFsub initializes this instruction as a floating-point subtraction instruction with OpcodeFsub.
-func (i *Instruction) AsFsub(x, y Value) {
+func (i *Instruction) AsFsub(x, y Value) *Instruction {
 	i.opcode = OpcodeFsub
 	i.v = x
 	i.v2 = y
 	i.typ = x.Type()
+	return i
 }
 
 // AsFmul initializes this instruction as a floating-point multiplication instruction with OpcodeFmul.
-func (i *Instruction) AsFmul(x, y Value) {
+func (i *Instruction) AsFmul(x, y Value) *Instruction {
 	i.opcode = OpcodeFmul
 	i.v = x
 	i.v2 = y
 	i.typ = x.Type()
+	return i
 }
 
 // AsFdiv initializes this instruction as a floating-point division instruction with OpcodeFdiv.

@@ -2,6 +2,7 @@ package ssa
 
 import (
 	"fmt"
+	"math"
 	"sort"
 
 	"github.com/tetratelabs/wazero/internal/engine/wazevo/wazevoapi"
@@ -17,8 +18,11 @@ func (b *builder) RunPasses() {
 	passSortSuccessors(b)
 	passDeadBlockEliminationOpt(b)
 	passRedundantPhiEliminationOpt(b)
-	// The result of passCalculateImmediateDominators will be used by various passes below.
+	// The results of passCalculateImmediateDominators and passCollectValueIdToInstructionMapping
+	// will be used by various passes below.
 	passCalculateImmediateDominators(b)
+	passCollectValueIdToInstructionMapping(b)
+
 	passNopInstElimination(b)
 
 	// TODO: implement either conversion of irreducible CFG into reducible one, or irreducible CFG detection where we panic.
@@ -33,6 +37,8 @@ func (b *builder) RunPasses() {
 	// 	Arithmetic simplifications.
 	// 	and more!
 
+	passConstFoldingOpt(b)
+
 	// passDeadCodeEliminationOpt could be more accurate if we do this after other optimizations.
 	passDeadCodeEliminationOpt(b)
 	b.donePasses = true
@@ -174,9 +180,6 @@ func passDeadCodeEliminationOpt(b *builder) {
 	if nvid >= len(b.valueRefCounts) {
 		b.valueRefCounts = append(b.valueRefCounts, make([]int, b.nextValueID)...)
 	}
-	if nvid >= len(b.valueIDToInstruction) {
-		b.valueIDToInstruction = append(b.valueIDToInstruction, make([]*Instruction, b.nextValueID)...)
-	}
 
 	// First, we gather all the instructions with side effects.
 	liveInstructions := b.instStack[:0]
@@ -195,14 +198,6 @@ func passDeadCodeEliminationOpt(b *builder) {
 				// The strict side effect should create different instruction groups.
 				gid++
 			}
-
-			r1, rs := cur.Returns()
-			if r1.Valid() {
-				b.valueIDToInstruction[r1.ID()] = cur
-			}
-			for _, r := range rs {
-				b.valueIDToInstruction[r.ID()] = cur
-			}
 		}
 	}
 
@@ -309,26 +304,13 @@ func (b *builder) clearBlkVisited() {
 
 // passNopInstElimination eliminates the instructions which is essentially a no-op.
 func passNopInstElimination(b *builder) {
-	if int(b.nextValueID) >= len(b.valueIDToInstruction) {
-		b.valueIDToInstruction = append(b.valueIDToInstruction, make([]*Instruction, b.nextValueID)...)
-	}
-
 	for blk := b.blockIteratorBegin(); blk != nil; blk = b.blockIteratorNext() {
 		for cur := blk.rootInstr; cur != nil; cur = cur.next {
-			r1, rs := cur.Returns()
-			if r1.Valid() {
-				b.valueIDToInstruction[r1.ID()] = cur
-			}
-			for _, r := range rs {
-				b.valueIDToInstruction[r.ID()] = cur
-			}
-		}
-	}
-
-	for blk := b.blockIteratorBegin(); blk != nil; blk = b.blockIteratorNext() {
-		for cur := blk.rootInstr; cur != nil; cur = cur.next {
-			switch cur.Opcode() {
+			op := cur.Opcode()
+			switch op {
 			// TODO: add more logics here.
+			// Amount := (Const $someValue)
+			// (Shift X, Amount) where Amount == X.Type().Bits() => X
 			case OpcodeIshl, OpcodeSshr, OpcodeUshr:
 				x, amount := cur.Arg2()
 				definingInst := b.valueIDToInstruction[amount.ID()]
@@ -348,6 +330,138 @@ func passNopInstElimination(b *builder) {
 						b.alias(cur.Return(), x)
 					}
 				}
+			// Z := Const 0
+			// (Iadd X, Z) => X
+			// (Iadd Z, Y) => Y
+			case OpcodeIadd:
+				x, y := cur.Arg2()
+				definingInst := b.valueIDToInstruction[y.ID()]
+				if definingInst == nil {
+					if definingInst = b.valueIDToInstruction[x.ID()]; definingInst == nil {
+						continue
+					} else {
+						x = y
+					}
+				}
+				if definingInst.Constant() && definingInst.ConstantVal() == 0 {
+					b.alias(cur.Return(), x)
+				}
+			}
+		}
+	}
+}
+
+func passCollectValueIdToInstructionMapping(b *builder) {
+	if int(b.nextValueID) >= len(b.valueIDToInstruction) {
+		b.valueIDToInstruction = append(b.valueIDToInstruction, make([]*Instruction, b.nextValueID)...)
+	}
+
+	for blk := b.blockIteratorBegin(); blk != nil; blk = b.blockIteratorNext() {
+		for cur := blk.rootInstr; cur != nil; cur = cur.next {
+			r1, rs := cur.Returns()
+			if r1.Valid() {
+				b.valueIDToInstruction[r1.ID()] = cur
+			}
+			for _, r := range rs {
+				b.valueIDToInstruction[r.ID()] = cur
+			}
+		}
+	}
+}
+
+// passConstFoldingOpt scans all instructions for arithmetic operations over constants,
+// and replaces them with a const of their result.
+func passConstFoldingOpt(b *builder) {
+	for blk := b.blockIteratorBegin(); blk != nil; blk = b.blockIteratorNext() {
+		for cur := blk.rootInstr; cur != nil; cur = cur.next {
+			// The fixed point is reached through a simple iteration over the list of instructions.
+			// Note: Instead of just an unbounded loop with a flag, we may also add an upper bound to the number of iterations.
+			isFixedPoint := false
+			for !isFixedPoint {
+				isFixedPoint = true
+				op := cur.Opcode()
+				switch op {
+				// X := Const xc
+				// Y := Const yc
+				// - (Iadd X, Y) => Const (xc + yc); likewise Isub => Const (xc - yc) and Imul => Const (xc * yc).
+				case OpcodeIadd, OpcodeIsub, OpcodeImul:
+					x, y := cur.Arg2()
+					xDef := b.valueIDToInstruction[x.ID()]
+					yDef := b.valueIDToInstruction[y.ID()]
+					if xDef == nil || yDef == nil {
+						// If either operand has no recorded defining instruction (e.g. it is a parameter), there is nothing to fold.
+						continue
+					}
+					if xDef.Constant() && yDef.Constant() {
+						isFixedPoint = false
+						// Mutate the instruction to an Iconst.
+						cur.opcode = OpcodeIconst
+						// Clear the references to operands.
+						cur.v, cur.v2 = ValueInvalid, ValueInvalid
+						// We assume all the types are consistent.
+						if x.Type().Bits() == 64 {
+							xc, yc := int64(xDef.ConstantVal()), int64(yDef.ConstantVal())
+							switch op {
+							case OpcodeIadd:
+								cur.u1 = uint64(xc + yc)
+							case OpcodeIsub:
+								cur.u1 = uint64(xc - yc)
+							case OpcodeImul:
+								cur.u1 = uint64(xc * yc)
+							}
+						} else {
+							xc, yc := int32(xDef.ConstantVal()), int32(yDef.ConstantVal())
+							switch op {
+							case OpcodeIadd:
+								cur.u1 = uint64(xc + yc)
+							case OpcodeIsub:
+								cur.u1 = uint64(xc - yc)
+							case OpcodeImul:
+								cur.u1 = uint64(xc * yc)
+							}
+						}
+					}
+				case OpcodeFadd, OpcodeFsub, OpcodeFmul:
+					x, y := cur.Arg2()
+					xDef := b.valueIDToInstruction[x.ID()]
+					yDef := b.valueIDToInstruction[y.ID()]
+					if xDef == nil || yDef == nil {
+						// If either operand has no recorded defining instruction (e.g. it is a parameter), there is nothing to fold.
+						continue
+					}
+					if xDef.Constant() && yDef.Constant() {
+						isFixedPoint = false
+						// Mutate the instruction to an F64const or F32const (chosen below from the operand bit width).
+						// Clear the references to operands.
+						cur.v, cur.v2 = ValueInvalid, ValueInvalid
+						// We assume all the types are consistent.
+						if x.Type().Bits() == 64 {
+							cur.opcode = OpcodeF64const
+							yc := math.Float64frombits(yDef.ConstantVal())
+							xc := math.Float64frombits(xDef.ConstantVal())
+							switch op {
+							case OpcodeFadd:
+								cur.u1 = math.Float64bits(xc + yc)
+							case OpcodeFsub:
+								cur.u1 = math.Float64bits(xc - yc)
+							case OpcodeFmul:
+								cur.u1 = math.Float64bits(xc * yc)
+							}
+						} else {
+							cur.opcode = OpcodeF32const
+							yc := math.Float32frombits(uint32(yDef.ConstantVal()))
+							xc := math.Float32frombits(uint32(xDef.ConstantVal()))
+							switch op {
+							case OpcodeFadd:
+								cur.u1 = uint64(math.Float32bits(xc + yc))
+							case OpcodeFsub:
+								cur.u1 = uint64(math.Float32bits(xc - yc))
+							case OpcodeFmul:
+								cur.u1 = uint64(math.Float32bits(xc * yc))
+							}
+						}
+					}
+				}
 			}
 		}
 	}