Skip to content
New issue

Have a question about this project? Sign up for a free GitHub account to open an issue and contact its maintainers and the community.

By clicking “Sign up for GitHub”, you agree to our terms of service and privacy statement. We’ll occasionally send you account related emails.

Already on GitHub? Sign in to your account

feat[venom]: add loop invariant hoisting pass #4175

Open
wants to merge 20 commits into
base: master
Choose a base branch
from
Open
Show file tree
Hide file tree
Changes from 8 commits
Commits
Show all changes
20 commits
Select commit Hold shift + click to select a range
13944eb
feat[venom]: add loop invariant hoisting pass
HodanPlodky Jul 10, 2024
f626b68
feat[venom]: add unit test for loop invariant hoisting
HodanPlodky Jul 12, 2024
942c731
feat[venom]: add unit test for loop invariant hoisting
HodanPlodky Jul 12, 2024
399a0a4
feat[venom]: clean up and comments
HodanPlodky Jul 15, 2024
2a8dd4a
fix[venom]: incorrect loop detection fix
HodanPlodky Jul 15, 2024
302aa21
fix[venom]: removed hoisting just constants
HodanPlodky Jul 17, 2024
013840c
fix[venom]: removed unnecessary hoisting
HodanPlodky Jul 18, 2024
1ee0068
feat[venom]: clean up after changes
HodanPlodky Jul 18, 2024
f703408
fix[venom]: changes from review and better loophoisting structure (sk…
HodanPlodky Jul 19, 2024
c5dbf05
fix[venom]: ignore code offset calculation
HodanPlodky Jul 22, 2024
cd655fc
fix[venom]: changes according to review
HodanPlodky Jul 22, 2024
ecb272a
fix[venom]: changes according to review
HodanPlodky Jul 22, 2024
18c7610
fix[venom]: changes according to review
HodanPlodky Jul 23, 2024
5583cc5
fix[venom]: review changes (_is_store condition negation to reduce ne…
HodanPlodky Jul 23, 2024
bdb2896
clean up loop detection
harkal Jul 29, 2024
788bd0d
Merge pull request #1 from harkal/update_loop_detection
HodanPlodky Aug 10, 2024
715b128
fix[venom]: improved tests to increase coverage
HodanPlodky Aug 12, 2024
8edce11
fix[venom]: error when the store is not constant
HodanPlodky Aug 13, 2024
cf6b25e
Merge branch 'master' into loop_invariant
HodanPlodky Sep 30, 2024
77f97b6
Merge branch 'master' into loop_invariant
HodanPlodky Jan 9, 2025
File filter

Filter by extension

Filter by extension

Conversations
Failed to load comments.
Loading
Jump to
Jump to file
Failed to load files.
Loading
Diff view
Diff view
155 changes: 155 additions & 0 deletions tests/unit/compiler/venom/test_loop_invariant_hoisting.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,155 @@
import pytest

from vyper.venom.analysis.analysis import IRAnalysesCache
from vyper.venom.analysis.loop_detection import LoopDetectionAnalysis
from vyper.venom.basicblock import IRBasicBlock, IRLabel, IRVariable
from vyper.venom.context import IRContext
from vyper.venom.function import IRFunction
from vyper.venom.passes.loop_invariant_hosting import LoopInvariantHoisting


def _create_loops(fn, depth, loop_id, body_fn=lambda _: (), top=True):
bb = fn.get_basic_block()
cond = IRBasicBlock(IRLabel(f"cond{loop_id}{depth}"), fn)
body = IRBasicBlock(IRLabel(f"body{loop_id}{depth}"), fn)
if top:
exit_block = IRBasicBlock(IRLabel(f"exit_top{loop_id}{depth}"), fn)
else:
exit_block = IRBasicBlock(IRLabel(f"exit{loop_id}{depth}"), fn)
fn.append_basic_block(cond)
fn.append_basic_block(body)

bb.append_instruction("jmp", cond.label)

cond_var = IRVariable(f"cond_var{loop_id}{depth}")
cond.append_instruction("iszero", 0, ret=cond_var)
assert isinstance(cond_var, IRVariable)
cond.append_instruction("jnz", cond_var, body.label, exit_block.label)
body_fn(fn, loop_id, depth)
if depth > 1:
_create_loops(fn, depth - 1, loop_id, body_fn, top=False)
bb = fn.get_basic_block()
bb.append_instruction("jmp", cond.label)
fn.append_basic_block(exit_block)


def _simple_body(fn, loop_id, depth):
assert isinstance(fn, IRFunction)
bb = fn.get_basic_block()
add_var = IRVariable(f"add_var{loop_id}{depth}")
bb.append_instruction("add", 1, 2, ret=add_var)


def _hoistable_body(fn, loop_id, depth):
assert isinstance(fn, IRFunction)
bb = fn.get_basic_block()
add_var_a = IRVariable(f"add_var_a{loop_id}{depth}")
bb.append_instruction("add", 1, 2, ret=add_var_a)
add_var_b = IRVariable(f"add_var_b{loop_id}{depth}")
bb.append_instruction("add", add_var_a, 2, ret=add_var_b)


@pytest.mark.parametrize("depth", range(1, 4))
@pytest.mark.parametrize("count", range(1, 4))
def test_loop_detection_analysis(depth, count):
ctx = IRContext()
fn = ctx.create_function("_global")

for c in range(count):
_create_loops(fn, depth, c, _simple_body)

bb = fn.get_basic_block()
bb.append_instruction("ret")

ac = IRAnalysesCache(fn)
analysis = ac.request_analysis(LoopDetectionAnalysis)
assert len(analysis.loops) == depth * count


@pytest.mark.parametrize("depth", range(1, 4))
@pytest.mark.parametrize("count", range(1, 4))
def test_loop_invariant_hoisting_simple(depth, count):
ctx = IRContext()
fn = ctx.create_function("_global")

for c in range(count):
_create_loops(fn, depth, c, _simple_body)

bb = fn.get_basic_block()
bb.append_instruction("ret")

ac = IRAnalysesCache(fn)
LoopInvariantHoisting(ac, fn).run_pass()

entry = fn.entry
assignments = list(map(lambda x: x.value, entry.get_assignments()))
for bb in filter(lambda bb: bb.label.name.startswith("exit_top"), fn.get_basic_blocks()):
assignments.extend(map(lambda x: x.value, bb.get_assignments()))

assert len(assignments) == depth * count * 2
for loop_id in range(count):
for d in range(1, depth + 1):
assert f"%add_var{loop_id}{d}" in assignments, repr(fn)
assert f"%cond_var{loop_id}{d}" in assignments, repr(fn)


@pytest.mark.parametrize("depth", range(1, 4))
@pytest.mark.parametrize("count", range(1, 4))
def test_loop_invariant_hoisting_dependant(depth, count):
ctx = IRContext()
fn = ctx.create_function("_global")

for c in range(count):
_create_loops(fn, depth, c, _hoistable_body)

bb = fn.get_basic_block()
bb.append_instruction("ret")

ac = IRAnalysesCache(fn)
LoopInvariantHoisting(ac, fn).run_pass()

entry = fn.entry
assignments = list(map(lambda x: x.value, entry.get_assignments()))
for bb in filter(lambda bb: bb.label.name.startswith("exit_top"), fn.get_basic_blocks()):
assignments.extend(map(lambda x: x.value, bb.get_assignments()))

assert len(assignments) == depth * count * 3
for loop_id in range(count):
for d in range(1, depth + 1):
assert f"%add_var_a{loop_id}{d}" in assignments, repr(fn)
assert f"%add_var_b{loop_id}{d}" in assignments, repr(fn)
assert f"%cond_var{loop_id}{d}" in assignments, repr(fn)

def _unhoistable_body(fn, loop_id, depth):
assert isinstance(fn, IRFunction)
bb = fn.get_basic_block()
add_var_a = IRVariable(f"add_var_a{loop_id}{depth}")
bb.append_instruction("mload", 64, ret=add_var_a)
add_var_b = IRVariable(f"add_var_b{loop_id}{depth}")
bb.append_instruction("add", add_var_a, 2, ret=add_var_b)

@pytest.mark.parametrize("depth", range(1, 4))
@pytest.mark.parametrize("count", range(1, 4))
def test_loop_invariant_hoisting_unhoistable(depth, count):
ctx = IRContext()
fn = ctx.create_function("_global")

for c in range(count):
_create_loops(fn, depth, c, _unhoistable_body)

bb = fn.get_basic_block()
bb.append_instruction("ret")

ac = IRAnalysesCache(fn)
LoopInvariantHoisting(ac, fn).run_pass()

entry = fn.entry
assignments = list(map(lambda x: x.value, entry.get_assignments()))
for bb in filter(lambda bb: bb.label.name.startswith("exit_top"), fn.get_basic_blocks()):
assignments.extend(map(lambda x: x.value, bb.get_assignments()))

assert len(assignments) == depth * count
for loop_id in range(count):
for d in range(1, depth + 1):
assert f"%cond_var{loop_id}{d}" in assignments, repr(fn)

2 changes: 2 additions & 0 deletions vyper/venom/__init__.py
Original file line number Diff line number Diff line change
Expand Up @@ -13,6 +13,7 @@
from vyper.venom.passes.branch_optimization import BranchOptimizationPass
from vyper.venom.passes.dft import DFTPass
from vyper.venom.passes.extract_literals import ExtractLiteralsPass
from vyper.venom.passes.loop_invariant_hosting import LoopInvariantHoisting
from vyper.venom.passes.make_ssa import MakeSSA
from vyper.venom.passes.mem2var import Mem2Var
from vyper.venom.passes.remove_unused_variables import RemoveUnusedVariablesPass
Expand Down Expand Up @@ -56,6 +57,7 @@ def _run_passes(fn: IRFunction, optimize: OptimizationLevel) -> None:
BranchOptimizationPass(ac, fn).run_pass()
ExtractLiteralsPass(ac, fn).run_pass()
RemoveUnusedVariablesPass(ac, fn).run_pass()
LoopInvariantHoisting(ac, fn).run_pass()
DFTPass(ac, fn).run_pass()


Expand Down
72 changes: 72 additions & 0 deletions vyper/venom/analysis/loop_detection.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,72 @@
from vyper.utils import OrderedSet
from vyper.venom.analysis.analysis import IRAnalysis
from vyper.venom.analysis.cfg import CFGAnalysis
from vyper.venom.basicblock import IRBasicBlock


class LoopDetectionAnalysis(IRAnalysis):
"""
Detects loops and computes basic blocks
and the block which is before the loop
"""

# key = start of the loop (last bb not in the loop)
# value = all the block that loop contains
loops: dict[IRBasicBlock, OrderedSet[IRBasicBlock]]

done: OrderedSet[IRBasicBlock]
visited: OrderedSet[IRBasicBlock]

def analyze(self):
self.analyses_cache.request_analysis(CFGAnalysis)
self.loops: dict[IRBasicBlock, OrderedSet[IRBasicBlock]] = dict()
self.done = OrderedSet()
self.visited = OrderedSet()
entry = self.function.entry
self.dfs(entry)

def invalidate(self):
return super().invalidate()
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

no need for this implementation


def dfs(self, bb: IRBasicBlock, before: IRBasicBlock = None):
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

this function does loop detection, why name it dfs?

Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

style: we use the convention foo_r() for recursive functions, and prefix with underscore (i.e. _foo_r()) for "private" functions (those that are not called externally)

if bb in self.visited:
assert before is not None, "Loop must have one basic block before it"
loop = self.collect_path(before, bb)
in_bb = bb.cfg_in.difference({before})
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

i think this might be clearer as if before in bb.cfg_in: .... does that introduce any bugs?

Copy link
Collaborator Author

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

This is just because it checks for natural loops, so I check if it has only one input into the loop.

assert len(in_bb) == 1, "Loop must have one input basic block"
Copy link
Collaborator

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

  • Since we are looking for natural loops, we should probably rename the analysis to NaturalLoopDetectionAnalysis
  • We should also probably not assert if the loop was not natural, just ignore that loop

input_bb = in_bb.first()
self.loops[input_bb] = loop
self.done.add(bb)
return

self.visited.add(bb)

for neighbour in bb.cfg_out:
if neighbour not in self.done:
self.dfs(neighbour, bb)

self.done.add(bb)
return
Copy link
Collaborator

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

redundant


def collect_path(self, bb_from: IRBasicBlock, bb_to: IRBasicBlock) -> OrderedSet[IRBasicBlock]:
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

style: _collect_path

loop = OrderedSet()
collect_visit = OrderedSet()
self.collect_path_inner(bb_from, bb_to, loop, collect_visit)
return loop

def collect_path_inner(
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

_collect_path_inner()

self,
act_bb: IRBasicBlock,
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

does "act_bb" stand for "active bb"? maybe cur_bb or bb_from or just bb would be better.

bb_to: IRBasicBlock,
loop: OrderedSet[IRBasicBlock],
collect_visit: OrderedSet[IRBasicBlock],
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

maybe just visited

):
if act_bb in collect_visit:
return
collect_visit.add(act_bb)
loop.add(act_bb)
if act_bb == bb_to:
return

for before in act_bb.cfg_in:
self.collect_path_inner(before, bb_to, loop, collect_visit)
127 changes: 127 additions & 0 deletions vyper/venom/passes/loop_invariant_hosting.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,127 @@
from vyper.utils import OrderedSet
from vyper.venom.analysis.cfg import CFGAnalysis
from vyper.venom.analysis.dfg import DFGAnalysis
from vyper.venom.analysis.liveness import LivenessAnalysis
from vyper.venom.analysis.loop_detection import LoopDetectionAnalysis
from vyper.venom.basicblock import IRBasicBlock, IRInstruction, IRLiteral, IRVariable
from vyper.venom.function import IRFunction
from vyper.venom.passes.base_pass import IRPass

def _ignore_instruction(instruction: IRInstruction) -> bool:
return (
instruction.is_volatile
or instruction.is_bb_terminator
or instruction.opcode == "returndatasize"
or instruction.opcode == "phi"
)


def _is_correct_store(instruction: IRInstruction) -> bool:
Copy link
Collaborator

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

This is basically _is_store()

return (
instruction.opcode == "store"
and len(instruction.operands) == 1
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

this condition is always true, no?

and isinstance(instruction.operands[0], IRLiteral)
)


class LoopInvariantHoisting(IRPass):
"""
This pass detects invariants in loops and hoists them above the loop body.
Any VOLATILE_INSTRUCTIONS, BB_TERMINATORS CFG_ALTERING_INSTRUCTIONS are ignored
"""

from typing import Iterator
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

no need for local import, please hoist this to top of file


function: IRFunction
loops: dict[IRBasicBlock, OrderedSet[IRBasicBlock]]
dfg: DFGAnalysis

def run_pass(self):
self.analyses_cache.request_analysis(CFGAnalysis)
self.dfg = self.analyses_cache.request_analysis(DFGAnalysis)
loops = self.analyses_cache.request_analysis(LoopDetectionAnalysis)
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

loops.loops looks weird, maybe just name this t? or loops_analysis

Copy link
Collaborator

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

loops_analysis 👍

self.loops = loops.loops
while True:
change = False
for from_bb, loop in self.loops.items():
hoistable: list[
tuple[IRBasicBlock, IRBasicBlock, IRInstruction]
] = self._get_hoistable_loop(from_bb, loop)
if len(hoistable) == 0:
continue
change |= True
self._hoist(hoistable)
if not change:
break
# I have this inside the loop because I dont need to
# invalidate if you dont hoist anything
self.analyses_cache.invalidate_analysis(LivenessAnalysis)
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

let's bring this outside the loop, and add a flag inside the loop to detect if invalidate_analysis should be called


def _hoist(self, hoistable: list[tuple[IRBasicBlock, IRBasicBlock, IRInstruction]]):
for loop_idx, bb, inst in hoistable:
bb.remove_instruction(inst)
bb_before: IRBasicBlock = loop_idx
bb_before.insert_instruction(inst, index=len(bb_before.instructions) - 1)

def _get_hoistable_loop(
self, from_bb: IRBasicBlock, loop: OrderedSet[IRBasicBlock]
) -> list[tuple[IRBasicBlock, IRBasicBlock, IRInstruction]]:
result: list[tuple[IRBasicBlock, IRBasicBlock, IRInstruction]] = []
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

these type signatures are hard to read -- either make them less specific (e.g. -> list or -> list[tuple]) or make a small dataclass local to this file to carry around the data structure.

for bb in loop:
result.extend(self._get_hoistable_bb(bb, from_bb))
return result

def _get_hoistable_bb(
self, bb: IRBasicBlock, loop_idx: IRBasicBlock
) -> list[tuple[IRBasicBlock, IRBasicBlock, IRInstruction]]:
result: list[tuple[IRBasicBlock, IRBasicBlock, IRInstruction]] = []
for instruction in bb.instructions:
if self._can_hoist_instruction(instruction, self.loops[loop_idx]):
result.append((loop_idx, bb, instruction))

return result

def _can_hoist_instruction(
self, instruction: IRInstruction, loop: OrderedSet[IRBasicBlock]
) -> bool:
if _ignore_instruction(instruction):
return False
for bb in loop:
if self._in_bb(instruction, bb):
return False

if _is_correct_store(instruction):
for used_instruction in self.dfg.get_uses(instruction.output):
if not self._can_hoist_instruction_ignore_stores(used_instruction, loop):
return False

return True

def _in_bb(self, instruction: IRInstruction, bb: IRBasicBlock):
for in_var in instruction.get_input_variables():
assert isinstance(in_var, IRVariable)
source_ins = self.dfg._dfg_outputs[in_var]
if source_ins in bb.instructions:
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

i think we can just check inst.parent for each instruction here

return True
return False

def _can_hoist_instruction_ignore_stores(
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

leave a comment explaining why this is necessary?

Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

maybe just call this _can_hoist_instruction (or just _can_hoist!), as it doesn't need to be contrasted with a function like _can_hoist_instruction_not_ignoring_stores.

self, instruction: IRInstruction, loop: OrderedSet[IRBasicBlock]
) -> bool:
if _ignore_instruction(instruction):
return False
for bb in loop:
if self._in_bb_ignore_store(instruction, bb):
return False
return True

def _in_bb_ignore_store(self, instruction: IRInstruction, bb: IRBasicBlock):
for in_var in instruction.get_input_variables():
assert isinstance(in_var, IRVariable)
source_ins = self.dfg._dfg_outputs[in_var]
Copy link
Member

@charles-cooper charles-cooper Jul 23, 2024

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

prefer instruction to always be abbreviated as inst, and also to use the public interface of the dfg analysis, for example:

prev_inst = self.dfg.get_producing_instruction(in_var)
# can add `assert prev_inst is not None` if desired

if _is_correct_store(source_ins):
Copy link
Member

Choose a reason for hiding this comment

The reason will be displayed to describe this comment to others. Learn more.

how can this condition ever hold true?

continue

if source_ins in bb.instructions:
return True
return False