concrete/tests/quantization/test_quantized_array.py

"""Tests for the quantized array/tensors."""
import numpy
import pytest

from concrete.quantization import QuantizedArray


@pytest.mark.parametrize(
    "n_bits",
    [32, 28, 20, 16, 8, 4],
)
@pytest.mark.parametrize("is_signed", [pytest.param(True), pytest.param(False)])
@pytest.mark.parametrize("values", [pytest.param(numpy.random.randn(2000))])
def test_quant_dequant_update(values, n_bits, is_signed, check_array_equality):
    """Test the quant and dequant function."""

    quant_array = QuantizedArray(n_bits, values, is_signed)
    qvalues = quant_array.quant()

    # Quantized values must be contained between 0 and 2**n_bits
    assert numpy.max(qvalues) <= 2 ** (n_bits) - 1 - quant_array.offset
    assert numpy.min(qvalues) >= -quant_array.offset

    # Dequantized values must be close to original values
    dequant_values = quant_array.dequant()

    # Check that all values are close
    tolerance = quant_array.scale / 2
    assert numpy.isclose(dequant_values, values, atol=tolerance).all()

    # Explain the choice of tolerance
    # This test checks the values are quantized and dequantized correctly
    # Each quantization have a maximum error per quantized value an it's `scale / 2`

    # To give an intuition, let's say you have the scale of 0.5
    #     the range `[a + 0.00, a + 0.25]` will be quantized into 0, dequantized into `a + 0.00`
    #     the range `[a + 0.25, a + 0.75]` will be quantized into 1, dequantized into `a + 0.50`
    #     the range `[a + 0.75, a + 1.25]` will be quantized into 2, dequantized into `a + 1.00`
    #     ...

    # So for each quantization-then-dequantization operation,
    # the maximum error is `0.25`, which is `scale / 2`

    # Test update functions
    new_values = numpy.array([0.3, 0.5, -1.2, -3.4])
    new_qvalues_ = quant_array.update_values(new_values)

    # Make sure the shape changed for the qvalues
    assert new_qvalues_.shape != qvalues.shape

    new_qvalues = numpy.array([1, 4, 7, 29])
    new_values_updated = quant_array.update_qvalues(new_qvalues)

    # Make sure that we can see at least one change.
    assert not numpy.array_equal(new_qvalues, new_qvalues_)
    assert not numpy.array_equal(new_values, new_values_updated)

    # Check that the __call__ returns also the qvalues.
    check_array_equality(quant_array(), new_qvalues)