"""Test file for float subgraph fusing"""
import random
from inspect import signature
import numpy
import pytest
from concrete.common.data_types.integers import Integer
from concrete.common.debugging.custom_assert import assert_not_reached
from concrete.common.optimization.topological import fuse_float_operations
from concrete.common.values import EncryptedScalar, EncryptedTensor
from concrete.numpy import tracing
from concrete.numpy.tracing import trace_numpy_function


def no_fuse(x):
    """No fuse"""
    return x + 2


def no_fuse_unhandled(x, y):
    """No fuse unhandled"""
    x_1 = x + 0.7
    y_1 = y + 1.3
    intermediate = x_1 + y_1
    return intermediate.astype(numpy.int32)


def simple_fuse_not_output(x):
    """Simple fuse not output"""
    intermediate = x.astype(numpy.float64)
    intermediate = intermediate.astype(numpy.int32)
    return intermediate + 2


def simple_fuse_output(x):
    """Simple fuse output"""
    return x.astype(numpy.float64).astype(numpy.int32)


def mix_x_and_y_intricately_and_call_f(function, x, y):
    """Mix x and y in an intricate way that an optimizer cannot simplify, then call function"""
    intermediate = x + y
    intermediate = intermediate + 2
    intermediate = intermediate.astype(numpy.float32)
    intermediate = intermediate.astype(numpy.int32)
    x_p_1 = intermediate + 1.5
    x_p_2 = intermediate + 2.7
    x_p_3 = function(x_p_1 + x_p_2)
    return (
        x_p_3.astype(numpy.int32),
        x_p_2.astype(numpy.int32),
        (x_p_2 + 3).astype(numpy.int32),
        x_p_3.astype(numpy.int32) + 67,
        y,
        (y + 4.7).astype(numpy.int32) + 3,
    )


def mix_x_and_y_and_call_f(function, x, y):
    """Mix x and y and then call function"""
    x_p_1 = x + 0.1
    x_p_2 = x + 0.2
    x_p_3 = function(x_p_1 + x_p_2)
    return (
        x_p_3.astype(numpy.int32),
        x_p_2.astype(numpy.int32),
        (x_p_2 + 3).astype(numpy.int32),
        x_p_3.astype(numpy.int32) + 67,
        y,
        (y + 4.7).astype(numpy.int32) + 3,
    )


def mix_x_and_y_into_integer_and_call_f(function, x, y):
    """Mix x and y but keep the entry to function as an integer"""
    x_p_1 = x + 1
    x_p_2 = x + 2
    x_p_3 = function(x_p_1 + x_p_2)
    return (
        x_p_3.astype(numpy.int32),
        x_p_2.astype(numpy.int32),
        (x_p_2 + 3).astype(numpy.int32),
        x_p_3.astype(numpy.int32) + 67,
        y,
        (y + 4.7).astype(numpy.int32) + 3,
    )


@pytest.mark.parametrize(
    "function_to_trace,fused",
    [
        pytest.param(no_fuse, False, id="no_fuse"),
        pytest.param(no_fuse_unhandled, False, id="no_fuse_unhandled"),
        pytest.param(simple_fuse_not_output, True, id="simple_fuse_not_output"),
        pytest.param(simple_fuse_output, True, id="simple_fuse_output"),
        pytest.param(
            lambda x, y: mix_x_and_y_intricately_and_call_f(numpy.rint, x, y),
            True,
            id="mix_x_and_y_intricately_and_call_f_with_rint",
        ),
        pytest.param(
            lambda x, y: mix_x_and_y_and_call_f(numpy.rint, x, y),
            True,
            id="mix_x_and_y_and_call_f_with_rint",
        ),
    ],
)
@pytest.mark.parametrize("input_", [0, 2, 42, 44])
def test_fuse_float_operations(function_to_trace, fused, input_):
    """Test function for fuse_float_operations"""
    params_names = signature(function_to_trace).parameters.keys()

    op_graph = trace_numpy_function(
        function_to_trace,
        {param_name: EncryptedScalar(Integer(32, True)) for param_name in params_names},
    )
    orig_num_nodes = len(op_graph.graph)
    fuse_float_operations(op_graph)
    fused_num_nodes = len(op_graph.graph)

    if fused:
        assert fused_num_nodes < orig_num_nodes
    else:
        assert fused_num_nodes == orig_num_nodes

    input_ = numpy.int32(input_)
    num_params = len(params_names)
    inputs = (input_,) * num_params
    assert function_to_trace(*inputs) == op_graph(*inputs)
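
# A minimal sketch (not executed as part of the tests) of the trace-and-fuse pattern
# exercised above, assuming a single 32-bit encrypted scalar input:
#
#   op_graph = trace_numpy_function(
#       simple_fuse_not_output,
#       {"x": EncryptedScalar(Integer(32, True))},
#   )
#   before = len(op_graph.graph)
#   fuse_float_operations(op_graph)  # the float astype round-trip collapses into fewer nodes
#   assert len(op_graph.graph) < before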


def subtest_tensor_no_fuse(fun, tensor_shape):
    """Check that no fusing happens when a constant is bigger than the variable tensor input."""
    if tensor_shape == ():
        # We want tensors
        return

    if fun in LIST_OF_UFUNC_WHICH_HAVE_INTEGER_ONLY_SOURCES:
        # We need at least one input of the bivariate function to be float
        return

    # Float fusing currently cannot work if the constant in a bivariate operator is bigger
    # than the variable input.
    # Make a broadcastable shape but with the constant being bigger
    variable_tensor_shape = (1,) + tensor_shape
    constant_bigger_shape = (random.randint(2, 10),) + tensor_shape
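
    # For example, with tensor_shape == (3, 1, 2) the variable input gets shape (1, 3, 1, 2)
    # while the constant gets shape (k, 3, 1, 2) with k >= 2. Broadcasting would then require
    # replicating the encrypted input along the first axis, i.e. a concatenate-like operator
    # that the fusing pass does not have yet, so the graph is expected to stay unchanged.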

    def tensor_no_fuse(x):
        intermediate = x.astype(numpy.float64)
        intermediate = fun(intermediate, numpy.ones(constant_bigger_shape))
        return intermediate.astype(numpy.int32)

    function_to_trace = tensor_no_fuse
    params_names = signature(function_to_trace).parameters.keys()

    op_graph = trace_numpy_function(
        function_to_trace,
        {
            param_name: EncryptedTensor(Integer(32, True), shape=variable_tensor_shape)
            for param_name in params_names
        },
    )
    orig_num_nodes = len(op_graph.graph)
    fuse_float_operations(op_graph)
    fused_num_nodes = len(op_graph.graph)
    assert orig_num_nodes == fused_num_nodes


def check_results_are_equal(function_result, op_graph_result):
    """Check the output of function execution and OPGraph evaluation are equal."""
    if isinstance(function_result, tuple) and isinstance(op_graph_result, tuple):
        assert len(function_result) == len(op_graph_result)
        are_equal = (
            function_output == op_graph_output
            for function_output, op_graph_output in zip(function_result, op_graph_result)
        )
    elif not isinstance(function_result, tuple) and not isinstance(op_graph_result, tuple):
        are_equal = (function_result == op_graph_result,)
    else:
        assert_not_reached(f"Incompatible outputs: {function_result}, {op_graph_result}")

    return all(value.all() if isinstance(value, numpy.ndarray) else value for value in are_equal)
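
# Illustration of the comparison semantics above (not executed): elementwise numpy comparisons
# are reduced with ``.all()``, tuple outputs are compared member by member, e.g.
#
#   check_results_are_equal(numpy.array([1, 2]), numpy.array([1, 2]))           # True
#   check_results_are_equal((numpy.array([1, 2]), 3), (numpy.array([1, 2]), 4))  # False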


def subtest_fuse_float_unary_operations_correctness(fun, tensor_shape):
    """Test a unary function with fuse_float_operations."""
    # Some manipulation to avoid issues with domain of definitions of functions
    if fun == numpy.arccosh:
        input_list = [1, 2, 42, 44]
        super_fun_list = [mix_x_and_y_and_call_f]
    elif fun in [numpy.arctanh, numpy.arccos, numpy.arcsin, numpy.arctan]:
        input_list = [0, 0.1, 0.2]
        super_fun_list = [mix_x_and_y_and_call_f]
    elif fun == numpy.invert:
        input_list = [1, 2, 42, 44]
        super_fun_list = [mix_x_and_y_into_integer_and_call_f]
    else:
        input_list = [0, 2, 42, 44]
        super_fun_list = [mix_x_and_y_and_call_f, mix_x_and_y_intricately_and_call_f]

    for super_fun in super_fun_list:
        for input_ in input_list:

            def get_function_to_trace():
                return lambda x, y: super_fun(fun, x, y)

            function_to_trace = get_function_to_trace()
            params_names = signature(function_to_trace).parameters.keys()

            op_graph = trace_numpy_function(
                function_to_trace,
                {
                    param_name: EncryptedTensor(Integer(32, True), tensor_shape)
                    for param_name in params_names
                },
            )
            orig_num_nodes = len(op_graph.graph)
            fuse_float_operations(op_graph)
            fused_num_nodes = len(op_graph.graph)
            assert fused_num_nodes < orig_num_nodes

            ones_input = (
                numpy.ones(tensor_shape, dtype=numpy.dtype(type(input_)))
                if tensor_shape != ()
                else 1
            )
            input_ = numpy.int32(input_ * ones_input)
            num_params = len(params_names)
            inputs = (input_,) * num_params

            function_result = function_to_trace(*inputs)
            op_graph_result = op_graph(*inputs)
            assert check_results_are_equal(function_result, op_graph_result)


LIST_OF_UFUNC_WHICH_HAVE_INTEGER_ONLY_SOURCES = {
    numpy.bitwise_and,
    numpy.bitwise_or,
    numpy.bitwise_xor,
    numpy.gcd,
    numpy.invert,
    numpy.lcm,
    numpy.ldexp,
    numpy.left_shift,
    numpy.logical_and,
    numpy.logical_not,
    numpy.logical_or,
    numpy.logical_xor,
    numpy.remainder,
    numpy.right_shift,
}
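
# The ufuncs above are treated as having integer-only sources: the binary subtests below only
# feed them integer constants (cases 0 and 2). For instance, standard numpy rejects floats for
# the bitwise family, e.g. numpy.bitwise_and(1.0, 2.0) raises a TypeError, so a float-constant
# case could not even be traced for them.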


def subtest_fuse_float_binary_operations_correctness(fun, tensor_shape):
    """Test a binary function with fuse_float_operations, with a constant as a source."""
    for i in range(4):

        # Check whether the function is restricted to integer inputs
        if fun in LIST_OF_UFUNC_WHICH_HAVE_INTEGER_ONLY_SOURCES:
            if i not in [0, 2]:
                continue

        # The .astype(numpy.float64) in cases 0 and 2 forces a float output even for
        # functions which return an integer (eg, XOR), so that our frontend always tries
        # to fuse them
        # The .astype(numpy.float64) in cases 1 and 3 forces a float output even for
        # functions which return a bool (eg, EQUAL), so that our frontend always tries
        # to fuse them

        # For bivariate functions: fix one of the inputs
        if i == 0:
            # With an integer in first position
            ones_0 = numpy.ones(tensor_shape, dtype=numpy.int64) if tensor_shape != () else 1

            def get_function_to_trace():
                return (
                    lambda x, y: fun(3 * ones_0, x + y).astype(numpy.float64).astype(numpy.int32)
                )

        elif i == 1:
            # With a float in first position
            ones_1 = numpy.ones(tensor_shape, dtype=numpy.float64) if tensor_shape != () else 1

            def get_function_to_trace():
                return (
                    lambda x, y: fun(2.3 * ones_1, x + y).astype(numpy.float64).astype(numpy.int32)
                )

        elif i == 2:
            # With an integer in second position
            ones_2 = numpy.ones(tensor_shape, dtype=numpy.int64) if tensor_shape != () else 1

            def get_function_to_trace():
                return (
                    lambda x, y: fun(x + y, 4 * ones_2).astype(numpy.float64).astype(numpy.int32)
                )

        else:
            # With a float in second position
            ones_else = numpy.ones(tensor_shape, dtype=numpy.float64) if tensor_shape != () else 1

            def get_function_to_trace():
                return (
                    lambda x, y: fun(x + y, 5.7 * ones_else)
                    .astype(numpy.float64)
                    .astype(numpy.int32)
                )

        input_list = [0, 2, 42, 44]

        # Domain of definition
        if fun in [numpy.true_divide, numpy.remainder, numpy.floor_divide, numpy.fmod]:
            input_list = [2, 42, 44]

        for input_ in input_list:
            ones_input = (
                numpy.ones(tensor_shape, dtype=numpy.dtype(type(input_)))
                if tensor_shape != ()
                else 1
            )
            input_ = input_ * ones_input

            function_to_trace = get_function_to_trace()
            params_names = signature(function_to_trace).parameters.keys()

            op_graph = trace_numpy_function(
                function_to_trace,
                {
                    param_name: EncryptedTensor(Integer(32, True), tensor_shape)
                    for param_name in params_names
                },
            )
            orig_num_nodes = len(op_graph.graph)
            fuse_float_operations(op_graph)
            fused_num_nodes = len(op_graph.graph)
            assert fused_num_nodes < orig_num_nodes

            input_ = numpy.int32(input_)
            num_params = len(params_names)
            inputs = (input_,) * num_params

            function_result = function_to_trace(*inputs)
            op_graph_result = op_graph(*inputs)
            assert check_results_are_equal(function_result, op_graph_result)
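
# For instance (illustrative only), case i == 0 with fun == numpy.bitwise_xor and scalar
# inputs ends up tracing something equivalent to:
#
#   lambda x, y: numpy.bitwise_xor(3, x + y).astype(numpy.float64).astype(numpy.int32)
#
# The astype pair forces a float intermediate so that the subgraph between the encrypted
# integer inputs and the final integer output is a candidate for fuse_float_operations.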


def subtest_fuse_float_binary_operations_dont_support_two_variables(fun, tensor_shape):
    """Test a binary function with fuse_float_operations, with no constant as a source."""

    def get_function_to_trace():
        return lambda x, y: fun(x, y).astype(numpy.int32)

    function_to_trace = get_function_to_trace()
    params_names = signature(function_to_trace).parameters.keys()

    with pytest.raises(NotImplementedError, match=r"Can't manage binary operator"):
        trace_numpy_function(
            function_to_trace,
            {
                param_name: EncryptedTensor(Integer(32, True), tensor_shape)
                for param_name in params_names
            },
        )
@pytest.mark.parametrize("fun", tracing.NPTracer.LIST_OF_SUPPORTED_UFUNC)
@pytest.mark.parametrize("tensor_shape", [(), (3, 1, 2)])
def test_ufunc_operations(fun, tensor_shape):
"""Test functions which are in tracing.NPTracer.LIST_OF_SUPPORTED_UFUNC."""
if fun.nin == 1:
subtest_fuse_float_unary_operations_correctness(fun, tensor_shape)
elif fun.nin == 2:
subtest_fuse_float_binary_operations_correctness(fun, tensor_shape)
subtest_fuse_float_binary_operations_dont_support_two_variables(fun, tensor_shape)
subtest_tensor_no_fuse(fun, tensor_shape)
else:
raise NotImplementedError("Only unary and binary functions are tested for now")
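
# Note (illustrative): ``fun.nin`` is the standard numpy ufunc attribute giving the number of
# inputs, e.g. numpy.rint.nin == 1 and numpy.add.nin == 2, which is what routes each supported
# ufunc to the unary or binary subtests above.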