Qonnx binary quant #1292
@@ -14,3 +14,4 @@ docs/autodoc/*
hls4mlprj_*
*~
*.ipynb_checkpoints/
*.bak
@@ -0,0 +1,151 @@
""" | ||
This file includes optimizations related to BipolarQuant nodes. | ||
|
||
As a first step, QuantConstantParameters converts the extra inputs to attributes. | ||
|
||
The next step differs between the case of (1) (positive) power-of-2 scale and zero offset, or (2) other cases. In the first | ||
case no explicit scaling is required, so a Quant node logically becomes a linear activation. (Cases when the scale is a | ||
power of 2 not equal to one are implicitly scaled with fixed precision types.) When the activation is applied to a constant | ||
weight, the activation is immediately merged with the weight, quantizing the weights. In case (2), we need to explicitly | ||
scale and unscale, so the Quant node becomes 3 nodes, an ApplyAlpha node to apply a scale/shift, a Linear node to apply the | ||
quantization, and another ApplyAlpha to unscale/shift. We depend on optimization steps to move the unscaling ApplyAlpha | ||
down as needed so that we can do integer or fixed-point calculations. When the Quant is a applied to a weight, the scaling | ||
and Linear nodes are immediately merged into the Constant. | ||
|
||
""" | ||

import numpy as np

from hls4ml.model.layers import Activation, BipolarQuant, Constant
from hls4ml.model.optimizer import OptimizerPass
from hls4ml.model.quantizers import BinaryQuantizer
from hls4ml.model.types import XnorPrecisionType

_ALSO_MATCH_PO2 = True

class BipolarQuantConstantParameters(OptimizerPass):
    """Remove Constant from the BipolarQuant node parameters (but not input[0])"""

    def match(self, node):
        is_match = (
            isinstance(node, BipolarQuant)
            and len(node.inputs) == 2
            and (node.get_input_node(node.inputs[1]) and isinstance(node.get_input_node(node.inputs[1]), Constant))
        )

        return is_match

    def transform(self, model, node):
        """
        Remove Constant from the Quant node parameters (but not input[0])
        """
        if node.get_input_node(node.inputs[1]):
            scale_node = node.get_input_node(node.inputs[1])
            if isinstance(scale_node, Constant):
                node.set_attr('scale', scale_node.get_attr('value'))
                node.inputs[1] = ''
                model.remove_node(scale_node)

        node.inputs = [inp for inp in node.inputs if inp]
        if len(node.inputs) != 1:
            raise RuntimeError("hls4ml only supports constant scale")

        return True

class BipolarQuantToActivation(OptimizerPass):
    """
    This is for the case when scale is a (positive) power of 2 and zeropt is 0. It is a 1:1 transformation of
    a BipolarQuant to an Activation.

    As an optimization, this is not called when the input is constant.
    """

Review discussion on this pass:

Does this really work if the scale is a power of 2? It's fine if it doesn't, but if it doesn't we should change the matching criteria.

I am not sure. I'll add a test case to check.

It does not work for scale != 1, since BinaryQuantizer does not have a scaling factor. One option would be to lower a BipolarQuant with a scaling factor != 1 to an activation node followed by a mul node. However, I am not sure if there is much sense in this, since these mul nodes are, I presume, not implementable? On the other hand, perhaps they could be absorbed into other nodes.

The multiplier nodes are the ApplyAlpha nodes I mention in another comment. The ApplyAlpha is just a shift and scale layer, and you can use it as just a scale. (The name comes from its original application, and it is not very good. We have talked about changing the name.) Fundamentally it's implemented the same way as a batchnorm (since we don't actually update the scaling in a batchnorm).

I added some tests with non-unit po2 scale factors, and it appears that the transformations work as is. I tried setting the scaling factors below 1 and above 1, and both cases worked. Perhaps some downstream transformation is handling this case?

    def match(self, node):
        # only matches after the other inputs are already folded

        is_match = (
            isinstance(node, BipolarQuant)
            and len(node.inputs) == 1
            and not isinstance(node.get_input_node(node.inputs[0]), Constant)
        )

        # Only match if the scale is power of 2 and the zero-point is 0s
        if is_match:  # to make sure this is a quant node with inputs
            scale = node.get_attr('scale')
            # check if scale is ones-like or a power of two
            scale_unit_or_po2 = (scale == np.ones_like(scale)).all()
            is_match = scale_unit_or_po2

        return is_match

    def transform(self, model, node):
        """
        Change quant node to Activation
        """
        scale = node.get_attr('scale')
        assert np.all(scale == 1.0)  # TODO: Is this required?

        precision = XnorPrecisionType()
        quantizer = BinaryQuantizer(bits=1)

        attributes = {'activation': 'linear', 'quantizer': quantizer}

        # update the configuration
        config = model.config.get_layer_config(node)
        prec_config = config.setdefault('Precision', {})
        prec_config['result'] = str(precision)
        new_name = f'{node.name}_act'
        model.config.set_name_config(new_name, config)
        model.config.parse_name_config(new_name, config)

        new_node = model.make_node(Activation, new_name, attributes, [node.inputs[0]], [x for x in node.outputs])
        model.replace_node(node, new_node)
        return True


class FuseBipolarQuantWithConstant(OptimizerPass):
    """
    This is for the case when scale is a positive power of 2 and zeropt is 0.
    """

    def match(self, node):
        # only matches after the other inputs are already folded
        is_match = (
            isinstance(node, BipolarQuant)
            and len(node.inputs) == 1
            and isinstance(node.get_input_node(node.inputs[0]), Constant)
        )

Review comment on the matching criteria:

Same here, does this really work if scale != 1? If it doesn't, the matching criteria should change.
        # Only match if the scale is power of 2 and the zero-point is 0s
        if is_match:  # to make sure this is a quant node with inputs
            scale = node.get_attr('scale')

            # check if scale is ones-like or a power of two
            scale_unit_or_po2 = (scale == np.ones_like(scale)).all()
            is_match = scale_unit_or_po2

        return is_match

    def transform(self, model, node):
        """
        Fuse Quant with Constant.
        """

        scale = node.get_attr('scale')
        assert np.all(scale == 1.0)  # TODO: Is this required?

        precision = XnorPrecisionType()
        quantizer = BinaryQuantizer(bits=1)

        const_node = node.get_input_node(node.inputs[0])
        const_node.set_attr('quantizer', quantizer)
        const_node.get_output_variable().type.precision = precision

        # Should we update the configuration to reflect the new precision? I don't think it's necessary

        # remove the Quant node
        model.remove_node(node)

        return True
Review discussion on the added ONNX test model:

I am not sure if this is a good place for an ONNX model. I wonder if some of the models from the model zoo will do. If not, we should put this in https://github.com/fastmachinelearning/example-models, where we keep other inputs. (Note that that project is instantiated as a submodule.)

By the way, this is the qonnx model zoo that I am referring to: https://github.com/fastmachinelearning/qonnx_model_zoo. It does have some binary models, though I am not sure if they are suitable for the test.

I agree that it should not be in this repository. However, it is kind of an artificial model, so I am not sure if it should be in the model zoo. I prefer using these kinds of artificial models because they can be generated quickly and they are very simple. That way, if something goes wrong, it's a very small model and it's easier to find the issue.

The example-models repository is a good place for artificial models that are used for testing.
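For reference, here is a hedged sketch of how such an artificial one-layer binarized model could be generated on the fly (so it would not need to live in any model zoo). This is an illustration, not the actual bnn_model_fc_1layer.onnx shipped with this PR; it assumes QONNX's BipolarQuant custom op, which takes (input, scale) and lives in the 'qonnx.custom_op.general' domain, and the tensor names and weights are made up.

import numpy as np
import onnx
from onnx import TensorProto, helper

# single dense (Gemm) layer: 3 inputs, 2 outputs, +/-1 weights
inp = helper.make_tensor_value_info('global_in', TensorProto.FLOAT, [1, 3])
out = helper.make_tensor_value_info('global_out', TensorProto.FLOAT, [1, 2])
weights = helper.make_tensor(
    'W', TensorProto.FLOAT, [3, 2], np.array([[1, -1], [-1, 1], [1, 1]], dtype=np.float32).flatten().tolist()
)
scale = helper.make_tensor('quant_scale', TensorProto.FLOAT, [1], [1.0])

# binarize the input, then apply the dense layer
quant = helper.make_node('BipolarQuant', ['global_in', 'quant_scale'], ['x_bin'], domain='qonnx.custom_op.general')
gemm = helper.make_node('Gemm', ['x_bin', 'W'], ['global_out'])

graph = helper.make_graph([quant, gemm], 'bnn_fc_1layer', [inp], [out], initializer=[weights, scale])
model = helper.make_model(
    graph, opset_imports=[helper.make_opsetid('', 14), helper.make_opsetid('qonnx.custom_op.general', 1)]
)
onnx.save(model, 'bnn_model_fc_1layer.onnx')

A model generated this way could then be loaded with ModelWrapper and cleaned up exactly as in the test below.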
@@ -12,6 +12,7 @@
from qonnx.core.modelwrapper import ModelWrapper
from qonnx.transformation.channels_last import ConvertToChannelsLastAndClean
from qonnx.transformation.gemm_to_matmul import GemmToMatMul
from qonnx.util.cleanup import cleanup_model

import hls4ml

@@ -428,3 +429,45 @@ def test_simple_model(model_name, io_type, backend, request):
    y_hls4ml = hls_model.predict(X)

    np.testing.assert_allclose(y_qonnx.ravel(), y_hls4ml.ravel(), atol=1e-2, rtol=1)


@pytest.mark.parametrize('backend', ['Vitis'])
@pytest.mark.parametrize('io_type', ['io_parallel', 'io_stream'])
def test_bnn(io_type, backend):
    "Checks if a basic binarized model works correctly."
    test_dir = os.path.dirname(os.path.abspath(__file__))
    qonnx_model = ModelWrapper(f'{test_dir}/bnn_model_fc_1layer.onnx')
    qonnx_model = cleanup_model(qonnx_model)
    qonnx_model = qonnx_model.transform(GemmToMatMul())  # ishape = (1, 3)
    qonnx_model = qonnx.util.cleanup.cleanup_model(qonnx_model)
    config = hls4ml.utils.config.config_from_onnx_model(
        qonnx_model, granularity='name', backend=backend, default_precision='fixed<16,6>'
    )
    model_name = 'bnn_model_fc_1layer'
    hls_model = hls4ml.converters.convert_from_onnx_model(
        qonnx_model,
        output_dir=str(test_root_path / f'hls4mlprj_onnx_{model_name}_{io_type}_{backend}'),
        io_type=io_type,
        backend=backend,
        hls_config=config,
    )
    hls_model.compile()

    X = np.array(
        [
            [[+1, +1, +1]],
            [[+1, +1, -1]],
            [[+1, -1, +1]],
            [[-1, -1, -1]],
            [[-1, +1, +1]],
            [[-1, +1, -1]],
            [[-1, -1, +1]],
            [[-1, -1, -1]],
        ],
        dtype=np.float32,
    )
    for x in X:
        idict = {qonnx_model.graph.input[0].name: x}
        y_qonnx = oxe.execute_onnx(qonnx_model, idict)[qonnx_model.graph.output[0].name]
        y_hls4ml = hls_model.predict(X)
        np.array_equal(y_qonnx.ravel(), y_hls4ml.ravel())
Review comment on the final comparison:

This doesn't actually fail the test if there's a failure. The array_equal function returns False, but the return value is ignored. In fact, we have a mismatch for all three tests.
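A possible fix along the lines of this comment (a suggestion, not a change included in this PR) is to actually assert the comparison so pytest fails on a mismatch:

np.testing.assert_array_equal(y_qonnx.ravel(), y_hls4ml.ravel())
# or, keeping np.array_equal:
assert np.array_equal(y_qonnx.ravel(), y_hls4ml.ravel())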
Overall review discussion:

We don't seem to handle the case when scale != 1. Ideally we should be able to extract ApplyAlpha scales in such a case that we propagate up and down. I think basic support can be fairly straightforwardly added, in the style of the Quant support. (If we don't support scale != 1, we should catch those cases and exit gracefully, with an error message.)

I checked the BinaryQuantizer code and it does not define a scaling factor, meaning that this can only work for a scale factor of 1. Furthermore, this whole optimizer pass becomes irrelevant, so I will delete it.
What does ApplyAlpha do? I am not familiar with this.

So a quant layer with a scale and/or zero offset really means scale/shift, then quantize, then unscale/unshift. The ApplyAlpha nodes are scale and shift layers in the hls4ml IR. When a quant node is applied to a weight, the initial scaling/shifting can actually be done to the weights (assuming they are constant and not updatable). Otherwise, the hope is that the scaling and unscaling can be moved around the graph to where the implementation is easiest. There are optimizers that already exist for that.
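To make the decomposition in the last comment concrete, here is a minimal numpy sketch (an illustration with simplified unsigned rounding/clipping, not hls4ml code or the exact QONNX semantics): a quant node with scale s and zero offset z is the composition of an ApplyAlpha-style scale/shift, a pure quantization step, and a second ApplyAlpha that unscales/unshifts.

import numpy as np

def quant_reference(x, s, z, bits=4):
    # one-shot reference: scale/shift, round/clip, then undo the scale/shift
    q = np.clip(np.round(x / s + z), 0, 2**bits - 1)
    return s * (q - z)

def quant_decomposed(x, s, z, bits=4):
    y = x / s + z                             # ApplyAlpha: scale by 1/s, shift by z
    y = np.clip(np.round(y), 0, 2**bits - 1)  # quantization only (the Linear/activation step)
    return s * y - s * z                      # ApplyAlpha: scale by s, shift by -s*z

x = np.linspace(-2.0, 2.0, 9)
assert np.allclose(quant_reference(x, s=0.5, z=3), quant_decomposed(x, s=0.5, z=3))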