compiler/noirc_evaluator/src/ssa/opt/basic_conditional.rs

use std::collections::HashSet;

use acvm::AcirField;
use fxhash::FxHashMap as HashMap;
use iter_extended::vecmap;

use crate::ssa::{
    Ssa,
    ir::{
        basic_block::BasicBlockId,
        cfg::ControlFlowGraph,
        dfg::DataFlowGraph,
        function::{Function, FunctionId},
        function_inserter::FunctionInserter,
        instruction::{BinaryOp, Instruction, TerminatorInstruction},
        post_order::PostOrder,
        value::ValueId,
    },
};

use super::flatten_cfg::Context;
#[derive(Debug, Clone)]
struct BasicConditional {
    block_entry: BasicBlockId,
    block_then: Option<BasicBlockId>,
    block_else: Option<BasicBlockId>,
    block_exit: BasicBlockId,
}

impl Ssa {
    #[tracing::instrument(level = "trace", skip(self))]
    /// This pass flatten simple IF-THEN-ELSE statements
    /// This optimization pass identifies simple conditional control flow patterns in unconstrained code
    /// and flattens them to reduce the number of basic blocks and improve performance.
    ///
    /// e.g: if c {a} else {b} would be flattened to c*(a-b)+b
    /// A simple conditional pattern is defined as an IF-THEN (with optional ELSE) statement, with no nested conditional nor loop statements
    /// Performance improvement is based on a simple execution cost metric
    pub(crate) fn flatten_basic_conditionals(mut self) -> Ssa {
        // Retrieve the 'no_predicates' attribute of the functions in a map, to avoid problems with borrowing
        let mut no_predicates = HashMap::default();
        for function in self.functions.values() {
            no_predicates.insert(function.id(), function.is_no_predicates());
        }
        for function in self.functions.values_mut() {
            flatten_function(function, &mut no_predicates);
        }
        self
    }
}

/// Returns the blocks of the simple conditional sub-graph whose input block is the entry.
/// Returns None if the input block is not the entry block of a simple conditional.
fn is_conditional(
    block: BasicBlockId,
    cfg: &ControlFlowGraph,
    function: &Function,
) -> Option<BasicConditional> {
    // jump overhead is the cost for doing the conditional and jump around the blocks
    // We use 10 as a rough estimate, the real cost is less.
    let jump_overhead = 10;
    let mut successors = cfg.successors(block);
    let mut result = None;
    // a conditional must have 2 branches
    if successors.len() != 2 {
        return None;
    }
    let left = successors.next().unwrap();
    let right = successors.next().unwrap();
    let mut left_successors = cfg.successors(left);
    let mut right_successors = cfg.successors(right);
    let left_successors_len = left_successors.len();
    let right_successors_len = right_successors.len();
    let next_left = left_successors.next();
    let next_right = right_successors.next();
    if next_left == Some(block) || next_right == Some(block) {
        // this is a loop, not a conditional
        return None;
    }
    if left_successors_len == 1 && right_successors_len == 1 && next_left == next_right {
        // The branches join on one block so it is a non-nested conditional
        let cost_left = block_cost(left, &function.dfg);
        let cost_right = block_cost(right, &function.dfg);
        // For the flattening to be valuable, we compare the cost of the flattened code with the average cost of the 2 branches,
        // including an overhead to take into account the jumps between the blocks.
        let cost = cost_right.saturating_add(cost_left);
        if cost < cost / 2 + jump_overhead {
            if let Some(TerminatorInstruction::JmpIf {
                condition: _,
                then_destination,
                else_destination,
                call_stack: _,
            }) = function.dfg[block].terminator()
            {
                result = Some(BasicConditional {
                    block_entry: block,
                    block_then: Some(*then_destination),
                    block_else: Some(*else_destination),
                    block_exit: next_left.unwrap(),
                });
            }
        }
    } else if left_successors_len == 1 && next_left == Some(right) {
        // Left branch joins the right branch, e.g if/then statement with no else
        // This case may not happen (i.e not generated), but it is safer to handle it (e.g in case it happens due to some optimizations)
        let cost = block_cost(left, &function.dfg);
        if cost < cost / 2 + jump_overhead {
            if let Some(TerminatorInstruction::JmpIf {
                condition: _,
                then_destination,
                else_destination,
                call_stack: _,
            }) = function.dfg[block].terminator()
            {
                let (block_then, block_else) = if left == *then_destination {
                    (Some(left), None)
                } else if left == *else_destination {
                    (None, Some(left))
                } else {
                    return None;
                };

                result = Some(BasicConditional {
                    block_entry: block,
                    block_then,
                    block_else,
                    block_exit: right,
                });
            }
        }
    } else if right_successors_len == 1 && next_right == Some(left) {
        // Right branch joins the left branch, e.g if/else statement with no then
        // This case may not happen (i.e not generated), but it is safer to handle it (e.g in case it happens due to some optimizations)
        let cost = block_cost(right, &function.dfg);
        if cost < cost / 2 + jump_overhead {
            if let Some(TerminatorInstruction::JmpIf {
                condition: _,
                then_destination,
                else_destination,
                call_stack: _,
            }) = function.dfg[block].terminator()
            {
                let (block_then, block_else) = if right == *then_destination {
                    (Some(right), None)
                } else if right == *else_destination {
                    (None, Some(right))
                } else {
                    return None;
                };
                result = Some(BasicConditional {
                    block_entry: block,
                    block_then,
                    block_else,
                    block_exit: right,
                });
            }
        }
    }
    // A conditional exit would have exactly 2 predecessors
    result.filter(|result| cfg.predecessors(result.block_exit).len() == 2)
}

/// Computes a cost estimate of a basic block
/// returns u32::MAX if the block has side-effect instructions
/// WARNING: these are estimates of the runtime cost of each instruction,
/// 1 being the cost of the simplest instruction. These numbers can be improved.
fn block_cost(block: BasicBlockId, dfg: &DataFlowGraph) -> u32 {
    let mut cost: u32 = 0;
    for instruction in dfg[block].instructions() {
        let instruction_cost = match &dfg[*instruction] {
            Instruction::Binary(binary) => {
                match binary.operator {
                    BinaryOp::Add { unchecked }
                    | BinaryOp::Sub { unchecked }
                    | BinaryOp::Mul { unchecked } => if unchecked { 3 } else { return u32::MAX },
                    BinaryOp::Div
                    | BinaryOp::Mod => return u32::MAX,
                    BinaryOp::Eq => 1,
                    BinaryOp::Lt => 5,
                    BinaryOp::And
                    | BinaryOp::Or
                    | BinaryOp::Xor => 1,
                    BinaryOp::Shl
                    | BinaryOp::Shr => return u32::MAX,
                }
            },
            // A Cast can be either simplified, or lead to a truncate
            Instruction::Cast(_, _) => 3,
            Instruction::Not(_) => 1,
            Instruction::Truncate { .. } => 7,

            Instruction::Constrain(_,_,_)
            | Instruction::ConstrainNotEqual(_,_,_)
            | Instruction::RangeCheck { .. }
            // Calls with no-predicate set to true could be supported, but
            // they are likely to be too costly anyways. Simple calls would
            // have been inlined already.
            | Instruction::Call { .. }
            |      Instruction::Load { .. }
            | Instruction::Store { .. }
            | Instruction::ArraySet { .. } => return u32::MAX,

            Instruction::ArrayGet { array, index  } => {
                // A get can fail because of out-of-bound index
                let mut in_bound = false;
                // check if index is in bound
                if let (Some(index), Some(len)) = (dfg.get_numeric_constant(*index), dfg.try_get_array_length(*array)) {
                    // The index is in-bounds
                    if index.to_u128() < len as u128 {
                        in_bound = true;
                    }
                }
                if !in_bound {
                    return u32::MAX;
                }
                1
            },
            // if less than 10 elements, it is translated into a store for each element
            // if more than 10, it is a loop, so 20 should be a good estimate, worst case being 10 stores and ~10 index increments
            Instruction::MakeArray { .. } => 20,

            Instruction::Allocate
            | Instruction::EnableSideEffectsIf { .. }
            | Instruction::IncrementRc { .. }
            | Instruction::DecrementRc { .. }
            | Instruction::Noop => 0,
            Instruction::IfElse { .. } => 1,
        };
        cost += instruction_cost;
    }
    cost
}

/// Identifies all simple conditionals in the function and flattens them
fn flatten_function(function: &mut Function, no_predicates: &mut HashMap<FunctionId, bool>) {
    // This pass is dedicated to brillig functions
    if !function.runtime().is_brillig() {
        return;
    }
    let cfg = ControlFlowGraph::with_function(function);
    let mut stack = vec![function.entry_block()];
    let mut processed = HashSet::new();
    let mut conditionals = Vec::new();

    // 1. Process all blocks of the cfg, starting from the root and following the successors
    while let Some(block) = stack.pop() {
        // Avoid cycles
        if processed.contains(&block) {
            continue;
        }
        processed.insert(block);

        // Identify the simple conditionals
        if let Some(conditional) = is_conditional(block, &cfg, function) {
            // no need to check the branches, process the join block directly
            stack.push(conditional.block_exit);
            conditionals.push(conditional);
        } else {
            stack.extend(cfg.successors(block));
        }
    }

    // 2. Flatten all simple conditionals
    // process basic conditionals in reverse order so that
    // a conditional does not impact the previous ones
    conditionals.reverse();
    flatten_multiple(&conditionals, function, no_predicates);
}

fn flatten_multiple(
    conditionals: &Vec<BasicConditional>,
    function: &mut Function,
    no_predicates: &mut HashMap<FunctionId, bool>,
) {
    // 1. process each basic conditional, using a new context per conditional
    let post_order = PostOrder::with_function(function);

    let mut mapping = HashMap::default();
    for conditional in conditionals {
        let cfg = ControlFlowGraph::with_function(function);
        let cfg_root = function.entry_block();
        let mut branch_ends = HashMap::default();
        branch_ends.insert(conditional.block_entry, conditional.block_exit);
        let mut context = Context::new(function, cfg, branch_ends, cfg_root);
        context.flatten_single_conditional(conditional, no_predicates);
        // extract the mapping into 'mapping
        context.inserter.extract_mapping(&mut mapping);
    }
    // 2. re-map the full program for values that may been simplified.
    if !mapping.is_empty() {
        for block in post_order.as_slice() {
            Context::map_block_with_mapping(mapping.clone(), function, *block);
        }
    }
}

impl Context<'_> {
    fn flatten_single_conditional(
        &mut self,
        conditional: &BasicConditional,
        no_predicates: &mut HashMap<FunctionId, bool>,
    ) {
        // Manually inline 'then', 'else' and 'exit' into the entry block
        //0. initialize the context for flattening a 'single conditional'
        let old_target = self.target_block;
        let old_no_predicate = self.no_predicate;
        let mut queue = vec![];
        self.target_block = conditional.block_entry;
        self.no_predicate = true;
        //1. process 'then' branch
        self.inline_block(conditional.block_entry, no_predicates);
        let to_process = self.handle_terminator(conditional.block_entry, &queue);
        queue.extend(to_process);
        if let Some(then) = conditional.block_then {
            assert_eq!(queue.pop(), conditional.block_then);
            self.inline_block(then, no_predicates);
            let to_process = self.handle_terminator(then, &queue);

            for incoming_block in to_process {
                if !queue.contains(&incoming_block) {
                    queue.push(incoming_block);
                }
            }
        }

        //2. process 'else' branch, in case there is no 'then'
        let next = queue.pop();
        if next == conditional.block_else {
            let next = next.unwrap();
            self.inline_block(next, no_predicates);
            let _ = self.handle_terminator(next, &queue);
        } else {
            assert_eq!(next, Some(conditional.block_exit));
        }

        //3. process 'exit' block
        self.inline_block(conditional.block_exit, no_predicates);
        // Manually set the terminator of the entry block to the one of the exit block
        let terminator =
            self.inserter.function.dfg[conditional.block_exit].terminator().unwrap().clone();
        let new_terminator = match terminator {
            TerminatorInstruction::JmpIf {
                condition,
                then_destination,
                else_destination,
                call_stack,
            } => {
                let condition = self.inserter.resolve(condition);
                TerminatorInstruction::JmpIf {
                    condition,
                    then_destination,
                    else_destination,
                    call_stack,
                }
            }
            TerminatorInstruction::Jmp { destination, arguments, call_stack } => {
                let arguments = vecmap(arguments, |value| self.inserter.resolve(value));
                TerminatorInstruction::Jmp { destination, arguments, call_stack }
            }
            TerminatorInstruction::Return { return_values, call_stack } => {
                let return_values = vecmap(return_values, |value| self.inserter.resolve(value));
                TerminatorInstruction::Return { return_values, call_stack }
            }
        };
        self.inserter.function.dfg.set_block_terminator(conditional.block_entry, new_terminator);
        self.inserter.map_data_bus_in_place();
        //4. restore the context, in case it is re-used.
        self.target_block = old_target;
        self.no_predicate = old_no_predicate;
    }

    fn map_block_with_mapping(
        mapping: HashMap<ValueId, ValueId>,
        func: &mut Function,
        block: BasicBlockId,
    ) {
        // Map all instructions in the block
        let mut inserter = FunctionInserter::new(func);
        inserter.set_mapping(mapping);
        let instructions = inserter.function.dfg[block].instructions().to_vec();
        for instruction in instructions {
            inserter.map_instruction_in_place(instruction);
        }
        inserter.map_terminator_in_place(block);
    }
}

#[cfg(test)]
mod test {
    use crate::ssa::{Ssa, opt::assert_normalized_ssa_equals};

    #[test]
    fn basic_jmpif() {
        let src = "
              brillig(inline) fn foo f0 {
                b0(v0: u32):
                  v3 = eq v0, u32 0
                  jmpif v3 then: b2, else: b1
                b1():
                  jmp b3(u32 5)
                b2():
                  jmp b3(u32 3)
                b3(v1: u32):
                  return v1
            }
            ";
        let ssa = Ssa::from_str(src).unwrap();
        assert_eq!(ssa.main().reachable_blocks().len(), 4);

        let expected = "
            brillig(inline) fn foo f0 {
              b0(v0: u32):
                v2 = eq v0, u32 0
                v3 = not v2
                v4 = cast v2 as u32
                v5 = cast v3 as u32
                v7 = unchecked_mul v4, u32 3
                v9 = unchecked_mul v5, u32 5
                v10 = unchecked_add v7, v9
                return v10
            }
            ";

        let ssa = ssa.flatten_basic_conditionals();
        assert_normalized_ssa_equals(ssa, expected);
    }

    #[test]
    fn array_jmpif() {
        let src = r#"
              brillig(inline) fn foo f0 {
                b0(v0: u32):
                  v3 = eq v0, u32 5
                  jmpif v3 then: b2, else: b1
                b1():
                  v6 = make_array b"foo"
                  jmp b3(v6)
                b2():
                  v10 = make_array b"bar"
                  jmp b3(v10)
                b3(v1: [u8; 3]):
                  return v1
            }
            "#;
        let ssa = Ssa::from_str(src).unwrap();
        assert_eq!(ssa.main().reachable_blocks().len(), 4);
        let ssa = ssa.flatten_basic_conditionals();
        // make_array is not simplified
        assert_normalized_ssa_equals(ssa, src);
    }

    #[test]
    fn nested_jmpifs() {
        let src = "
            brillig(inline) fn foo f0 {
              b0(v0: u32):
                v5 = eq v0, u32 5
                v6 = not v5
                jmpif v5 then: b5, else: b1
              b1():
                v8 = lt v0, u32 3
                jmpif v8 then: b3, else: b2
              b2():
                v9 = truncate v0 to 2 bits, max_bit_size: 32
                jmp b4(v9)
              b3():
                v10 = truncate v0 to 1 bits, max_bit_size: 32
                jmp b4(v10)
              b4(v1: u32):
                jmp b9(v1)
              b5():
                v12 = lt u32 2, v0
                jmpif v12 then: b7, else: b6
              b6():
                v13 = truncate v0 to 3 bits, max_bit_size: 32
                jmp b8(v13)
              b7():
                v14 = and v0, u32 2
                jmp b8(v14)
              b8(v2: u32):
                jmp b9(v2)
              b9(v3: u32):
                return v3
            }
            ";
        let ssa = Ssa::from_str(src).unwrap();
        assert_eq!(ssa.main().reachable_blocks().len(), 10);

        let expected = "
            brillig(inline) fn foo f0 {
              b0(v0: u32):
                v3 = eq v0, u32 5
                v4 = not v3
                jmpif v3 then: b2, else: b1
              b1():
                v6 = lt v0, u32 3
                v7 = truncate v0 to 1 bits, max_bit_size: 32
                v8 = not v6
                v9 = truncate v0 to 2 bits, max_bit_size: 32
                v10 = cast v6 as u32
                v11 = cast v8 as u32
                v12 = unchecked_mul v10, v7
                v13 = unchecked_mul v11, v9
                v14 = unchecked_add v12, v13
                jmp b3(v14)
              b2():
                v16 = lt u32 2, v0
                v17 = and v0, u32 2
                v18 = not v16
                v19 = truncate v0 to 3 bits, max_bit_size: 32
                v20 = cast v16 as u32
                v21 = cast v18 as u32
                v22 = unchecked_mul v20, v17
                v23 = unchecked_mul v21, v19
                v24 = unchecked_add v22, v23
                jmp b3(v24)
              b3(v1: u32):
                return v1
            }
            ";

        let ssa = ssa.flatten_basic_conditionals();
        assert_eq!(ssa.main().reachable_blocks().len(), 4);
        assert_normalized_ssa_equals(ssa, expected);
    }
}