Last active
June 11, 2024 21:18
-
-
Save evanw/58a8a5b8b4a1da32fcdcfbf9da87c82a to your computer and use it in GitHub Desktop.
Example "stackify" algorithm for turning SSA into WASM
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
// This code demonstrates a simplified "stackification" algorithm to turn | |
// instructions in a basic block back into a tree. This is useful when | |
// generating WebAssembly code from assembly instructions in SSA form. | |
// | |
// It's the algorithm used by LLVM's WebAssembly backend, viewable here: | |
// https://github.com/llvm-mirror/llvm/blob/master/lib/Target/WebAssembly/WebAssemblyRegStackify.cpp | |
type InsKind = | |
'Add' | | |
'LocalSet' | | |
'LocalGet'; | |
interface Ins { | |
kind: InsKind; | |
// arg >= 0 means "index of previous instruction" | |
// arg < 0 means "~arg is a constant value" | |
args: number[]; | |
} | |
interface Tree { | |
kind: InsKind; | |
children: (number | string | Tree)[]; | |
} | |
function stackify(block: Ins[]): void { | |
function recoverTree(): [Tree, boolean] { | |
const ins = block[index]; | |
const children: (number | string | Tree)[] = []; | |
let stopped = false; | |
for (let j = ins.args.length - 1; j >= 0; j--) { | |
const arg = ins.args[j]; | |
// Is this a constant? If so, add it directly | |
if (arg < 0) { | |
children.unshift(~arg); | |
} | |
// If this argument is a single-use value immediately before this | |
// instruction and we haven't hit any problems yet, recover it too. | |
else if (uses[arg] === 1 && arg === index - 1 && !stopped) { | |
index--; | |
const [childTree, childStopped] = recoverTree(); | |
children.unshift(childTree); | |
if (childStopped) stopped = true; | |
} | |
// Otherwise we've hit a match failure and will have to pop all the way | |
// back up the DFS call stack and generate another tree. That tree will | |
// be referenced from here. | |
else { | |
children.unshift(`tree${arg}`); | |
stopped = true; | |
} | |
} | |
return [{kind: ins.kind, children}, stopped]; | |
} | |
// Count how many times an instruction was used. Instructions can only be | |
// stackified as nested instructions if they are used exactly once. | |
const uses: number[] = []; | |
for (const ins of block) { | |
uses.push(0); | |
for (const arg of ins.args) { | |
if (arg >= 0) { | |
uses[arg]++; | |
} | |
} | |
} | |
// Stackify the block from the back towards the front. The "index" variable | |
// is modified by "recoverTree" so we will automatically skip over any | |
// instructions that were included as part of the recovered tree. | |
let trees: [number, Tree][] = []; | |
let index = block.length; | |
while (index > 0) { | |
index--; | |
trees.unshift([index, recoverTree()[0]]); | |
} | |
block.forEach((ins, i) => { | |
console.log(`var${i} =`, ins.kind, ins.args.map(a => { | |
return a >= 0 ? `var${a}` : ~a; | |
}).join(', ')); | |
}); | |
console.log('\n-- becomes --\n'); | |
for (const [i, tree] of trees) { | |
console.log(`tree${i} =`, treeToString(tree, '')); | |
} | |
console.log('\n-------------------------------------------------------------\n'); | |
} | |
function treeToString(tree: Tree, indent: string): string { | |
if (tree.children.length < 2) { | |
return tree.kind + '(' + tree.children.map(c => { | |
return typeof c === 'number' || typeof c === 'string' ? c : treeToString(c, indent); | |
}).join('') + ')'; | |
} | |
indent += ' '; | |
return tree.kind + '(' + tree.children.map(c => { | |
return '\n' + indent + (typeof c === 'number' || typeof c === 'string' | |
? c : treeToString(c, indent)); | |
}).join(',') + ')'; | |
} | |
stackify([ | |
{kind: 'LocalGet', args: [~0]}, | |
{kind: 'Add', args: [0, ~1]}, | |
{kind: 'Add', args: [~2, ~3]}, | |
{kind: 'Add', args: [1, 2]}, | |
{kind: 'LocalSet', args: [~0, 3]}, | |
]); | |
stackify([ | |
{kind: 'LocalGet', args: [~0]}, | |
{kind: 'Add', args: [0, ~1]}, | |
{kind: 'Add', args: [0, ~2]}, | |
{kind: 'Add', args: [1, 2]}, | |
{kind: 'LocalSet', args: [~0, 3]}, | |
]); | |
stackify([ | |
{kind: 'LocalGet', args: [~0]}, | |
{kind: 'Add', args: [0, ~1]}, | |
{kind: 'Add', args: [~2, ~3]}, | |
{kind: 'Add', args: [1, 2]}, | |
{kind: 'LocalSet', args: [~0, 3]}, | |
{kind: 'Add', args: [3, ~4]}, | |
{kind: 'LocalSet', args: [~1, 5]}, | |
]); |
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
var0 = LocalGet 0 | |
var1 = Add var0, 1 | |
var2 = Add 2, 3 | |
var3 = Add var1, var2 | |
var4 = LocalSet 0, var3 | |
-- becomes -- | |
tree4 = LocalSet( | |
0, | |
Add( | |
Add( | |
LocalGet(0), | |
1), | |
Add( | |
2, | |
3))) | |
------------------------------------------------------------- | |
var0 = LocalGet 0 | |
var1 = Add var0, 1 | |
var2 = Add var0, 2 | |
var3 = Add var1, var2 | |
var4 = LocalSet 0, var3 | |
-- becomes -- | |
tree0 = LocalGet(0) | |
tree1 = Add( | |
tree0, | |
1) | |
tree4 = LocalSet( | |
0, | |
Add( | |
tree1, | |
Add( | |
tree0, | |
2))) | |
------------------------------------------------------------- | |
var0 = LocalGet 0 | |
var1 = Add var0, 1 | |
var2 = Add 2, 3 | |
var3 = Add var1, var2 | |
var4 = LocalSet 0, var3 | |
var5 = Add var3, 4 | |
var6 = LocalSet 1, var5 | |
-- becomes -- | |
tree3 = Add( | |
Add( | |
LocalGet(0), | |
1), | |
Add( | |
2, | |
3)) | |
tree4 = LocalSet( | |
0, | |
tree3) | |
tree6 = LocalSet( | |
1, | |
Add( | |
tree3, | |
4)) | |
------------------------------------------------------------- | |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment