nthery/basic_block.dl

## basic_block.dl
// Break down linear IR into basic blocks and construct CFG.
// Just a naive program to teach myself datalog and Souffle.

// Address of an instruction in the linear IR; declared as a subtype of number.
.type Address <: number

// A sequential instruction, i.e. one that does not change control flow.
// Don't bother describing operands as we're only interested in control flow here.
// (ALU, load, store)
// `address` is the address of the instruction itself.
.decl seq(address:Address)

// An unconditional jump: the instruction at `address` transfers control to `dest`.
.decl jmp(address:Address, dest:Address)

// A conditional jump: the instruction at `address` transfers control to either
// `ifTrue` or `ifFalse`; both targets are given explicitly.
.decl cjmp(address:Address, ifTrue:Address, ifFalse:Address)

// Sample input program in this IR, listed in address order (0 through 7).
jmp(0, 1).      // 0: jump to 1
seq(1).         // 1: sequential
seq(2).         // 2: sequential
cjmp(3, 1, 7).  // 3: conditional jump, ifTrue = 1, ifFalse = 7
seq(4).         // 4: sequential
jmp(5, 6).      // 5: jump to 6
jmp(6, 1).      // 6: jump to 1
seq(7).         // 7: sequential

// Instructions that end a basic block: every jump, conditional or not.
.decl terminator(address:Address)
terminator(addr) :- jmp(addr, _) ; cjmp(addr, _, _).

// Every instruction of the program: the sequential ones plus the terminators.
.decl insn(address:Address)
insn(addr) :- seq(addr).
insn(addr) :- terminator(addr).

// A basic block [first, last]: a maximal run of consecutive instructions that
// is only entered at `first` and only left at `last`.
//
// Blocks are delimited with the leader rule rather than by terminators alone:
// a branch that lands in the middle of a run of sequential instructions must
// split that run, otherwise a CFG edge would point inside a block.
.decl basic_block(first:Address, last:Address)
basic_block(f, l) :- bb_member(f, l), bb_end(l).

// First instruction of a basic block (a "leader").
.decl bb_leader(address:Address)
// No instruction right before it: program start or a gap in the addresses.
bb_leader(a) :- insn(a), !insn(a-1).
// The instruction right before it ends a block.
bb_leader(a) :- insn(a), terminator(a-1).
// Some branch targets it.
bb_leader(a) :- insn(a), branch_to(_, a).

// Last instruction of a basic block.
.decl bb_end(address:Address)
// A jump always closes its block.
bb_end(a) :- terminator(a).
// Nothing follows: end of program or a gap in the addresses.
bb_end(a) :- insn(a), !insn(a+1).
// The next instruction opens a new block.
bb_end(a) :- insn(a), bb_leader(a+1).

// bb_member(first, address): `address` belongs to the block led by `first`.
.decl bb_member(first:Address, address:Address)
bb_member(f, f) :- bb_leader(f).
// Grow the block one instruction at a time until a block end is reached.
bb_member(f, a) :- bb_member(f, a-1), !bb_end(a-1), insn(a).

// Fall-through edge: a block whose last instruction is not a jump, and that is
// followed by another instruction, simply continues into that instruction.
// This only happens when the block was closed because the next instruction is
// a branch target.
succ(f, l, s) :- basic_block(f, l), !terminator(l), insn(s), s = l + 1.

// Any run first..last of consecutive sequential instructions, i.e. a run that
// contains no jump. Not necessarily maximal: sub-runs are derived as well.
.decl sequence_without_terminator(first:Address, last:Address)
// Base case: a single sequential instruction is a run of length one.
sequence_without_terminator(a, a) :- seq(a).
// Inductive case: prepend a sequential instruction to the run that starts
// at the next address.
sequence_without_terminator(head, last) :- sequence_without_terminator(head+1, last), seq(head).

// A run of sequential instructions that cannot be extended backwards: the
// instruction just before `first` is not a sequential one. `last` is not
// constrained here, so every prefix of the run is derived too; callers pin
// down `last` themselves.
.decl max_sequence_without_terminator(first:Address, last:Address)
max_sequence_without_terminator(lo, hi) :- sequence_without_terminator(lo, hi), !seq(lo-1).

// Control flow graph edges.
// succ(first, last, succ): the basic block [first, last] may transfer control
// to address `succ`, which is a destination of the branch sitting at `last`.
.decl succ(first:Address, last:Address, succ:Address)
succ(head, tail, target) :- branch_to(tail, target), basic_block(head, tail).

// branch_to(a, to): the branch instruction at address `a` can jump to `to`.
.decl branch_to(a:Address, to:Address)
// Unconditional jump: its single destination.
branch_to(src, dst) :- jmp(src, dst).
// Conditional jump: the taken destination...
branch_to(src, dst) :- cjmp(src, dst, _).
// ...and the not-taken destination.
branch_to(src, dst) :- cjmp(src, _, dst).

// Emit the succ relation as the result of the program.
.output succ

// Output is (columns: first, last, succ):
// 0       0       1
// 1       3       1
// 1       3       7
// 4       5       6
// 6       6       1
	// Break down linear IR into basic blocks and construct CFG.
	// Just a naive program to teach myself datalog and Souffle.

	// Address of an instruction in the linear IR; declared as a subtype of number.
	.type Address <: number

	// A sequential instruction, i.e. one that does not change control flow.
	// Don't bother describing operands as we're only interested in control flow here.
	// (ALU, load, store)
	// `address` is the address of the instruction itself.
	.decl seq(address:Address)

	// An unconditional jump: the instruction at `address` transfers control to `dest`.
	.decl jmp(address:Address, dest:Address)

	// A conditional jump: the instruction at `address` transfers control to either
	// `ifTrue` or `ifFalse`; both targets are given explicitly.
	.decl cjmp(address:Address, ifTrue:Address, ifFalse:Address)

	// Sample input program in this IR, listed in address order (0 through 7).
	jmp(0, 1).      // 0: jump to 1
	seq(1).         // 1: sequential
	seq(2).         // 2: sequential
	cjmp(3, 1, 7).  // 3: conditional jump, ifTrue = 1, ifFalse = 7
	seq(4).         // 4: sequential
	jmp(5, 6).      // 5: jump to 6
	jmp(6, 1).      // 6: jump to 1
	seq(7).         // 7: sequential

	// Instructions that end a basic block: every jump, conditional or not.
	.decl terminator(address:Address)
	terminator(addr) :- jmp(addr, _) ; cjmp(addr, _, _).

	// Every instruction of the program: the sequential ones plus the terminators.
	.decl insn(address:Address)
	insn(addr) :- seq(addr).
	insn(addr) :- terminator(addr).

	// A basic block [first, last]: a maximal run of consecutive instructions that
	// is only entered at `first` and only left at `last`.
	//
	// Blocks are delimited with the leader rule rather than by terminators alone:
	// a branch that lands in the middle of a run of sequential instructions must
	// split that run, otherwise a CFG edge would point inside a block.
	.decl basic_block(first:Address, last:Address)
	basic_block(f, l) :- bb_member(f, l), bb_end(l).

	// First instruction of a basic block (a "leader").
	.decl bb_leader(address:Address)
	// No instruction right before it: program start or a gap in the addresses.
	bb_leader(a) :- insn(a), !insn(a-1).
	// The instruction right before it ends a block.
	bb_leader(a) :- insn(a), terminator(a-1).
	// Some branch targets it.
	bb_leader(a) :- insn(a), branch_to(_, a).

	// Last instruction of a basic block.
	.decl bb_end(address:Address)
	// A jump always closes its block.
	bb_end(a) :- terminator(a).
	// Nothing follows: end of program or a gap in the addresses.
	bb_end(a) :- insn(a), !insn(a+1).
	// The next instruction opens a new block.
	bb_end(a) :- insn(a), bb_leader(a+1).

	// bb_member(first, address): `address` belongs to the block led by `first`.
	.decl bb_member(first:Address, address:Address)
	bb_member(f, f) :- bb_leader(f).
	// Grow the block one instruction at a time until a block end is reached.
	bb_member(f, a) :- bb_member(f, a-1), !bb_end(a-1), insn(a).

	// Fall-through edge: a block whose last instruction is not a jump, and that is
	// followed by another instruction, simply continues into that instruction.
	// This only happens when the block was closed because the next instruction is
	// a branch target.
	succ(f, l, s) :- basic_block(f, l), !terminator(l), insn(s), s = l + 1.

	// Any run first..last of consecutive sequential instructions, i.e. a run that
	// contains no jump. Not necessarily maximal: sub-runs are derived as well.
	.decl sequence_without_terminator(first:Address, last:Address)
	// Base case: a single sequential instruction is a run of length one.
	sequence_without_terminator(a, a) :- seq(a).
	// Inductive case: prepend a sequential instruction to the run that starts
	// at the next address.
	sequence_without_terminator(head, last) :- sequence_without_terminator(head+1, last), seq(head).

	// A run of sequential instructions that cannot be extended backwards: the
	// instruction just before `first` is not a sequential one. `last` is not
	// constrained here, so every prefix of the run is derived too; callers pin
	// down `last` themselves.
	.decl max_sequence_without_terminator(first:Address, last:Address)
	max_sequence_without_terminator(lo, hi) :- sequence_without_terminator(lo, hi), !seq(lo-1).

	// Control flow graph edges.
	// succ(first, last, succ): the basic block [first, last] may transfer control
	// to address `succ`, which is a destination of the branch sitting at `last`.
	.decl succ(first:Address, last:Address, succ:Address)
	succ(head, tail, target) :- branch_to(tail, target), basic_block(head, tail).

	// branch_to(a, to): the branch instruction at address `a` can jump to `to`.
	.decl branch_to(a:Address, to:Address)
	// Unconditional jump: its single destination.
	branch_to(src, dst) :- jmp(src, dst).
	// Conditional jump: the taken destination...
	branch_to(src, dst) :- cjmp(src, dst, _).
	// ...and the not-taken destination.
	branch_to(src, dst) :- cjmp(src, _, dst).

	// Emit the succ relation as the result of the program.
	.output succ

	// Output is (columns: first, last, succ):
	// 0 0 1
	// 1 3 1
	// 1 3 7
	// 4 5 6
	// 6 6 1