Source code for omlt.neuralnet.layers.partition_based

import numpy as np
import pyomo.environ as pyo
from pyomo.contrib.fbbt.fbbt import compute_bounds_on_expr


[docs]def default_partition_split_func(w, n):
    r"""
    Default function for partitioning weights in :math:`w` into :math:`n` partitions.

    Weights in :math:`w` are sorted and partitioned evenly.

    """
    sorted_indexes = np.argsort(w)
    n = min(n, len(sorted_indexes))
    return np.array_split(sorted_indexes, n)


[docs]def partition_based_dense_relu_layer(net_block, net, layer_block, layer, split_func):
    r"""
    Partition-based ReLU activation formulation.

    Generates the constraints for the ReLU activation function:

    .. math::

        \begin{align*}
            y_j = \max\left(0,\sum\limits_{i=0}^{F_{in}-1}w_{ij}x_i+b_j\right), && \forall 0\le j<F_{out}
        \end{align*}

    We additionally introduce the following notations to describe this formulation:

    .. math::

        \begin{align*}
            n       &:= \text{the number of partitions}\\
            S_k     &:=  \text{indexes of the $k$-th partition satisfying:} \\
                    & \quad\quad \bigcup\limits_{k=0}^{n-1} S_k=\{0,1,\dots,F_{in}-1\},~S_{k_1}\cap S_{k_2}=\emptyset, ~\forall k_1\neq k_2\\
            \sigma  &:= \text{if this activation function is activated, i.e.,}\\
                    & \quad\quad y_j=
                    \begin{cases}
                        0, & \sigma=1\\
                        \sum\limits_{i=0}^{F_{in}-1}w_{ij}x_i+b_j, & \sigma=0
                    \end{cases}\\
            p_k     &:=\text{auxiliary variable representing the $k$-th partition, i.e., $\sum\limits_{i\in S_k}w_{ij}x_i$}\\
            l_k     &:=\text{the lower bound of $\sum\limits_{i\in S_k}w_{ij}x_i$}\\
            u_k     &:=\text{the upper bound of $\sum\limits_{i\in S_k}w_{ij}x_i$}
        \end{align*}


    The partition-based formulation for :math:`y_j` is given by:

    .. math::

        \begin{align*}
            & y_j=\sum\limits_{k=0}^{n-1}p_k+(1-\sigma)b_j\\
            & \sum\limits_{k=0}^{n-1}\left(\sum\limits_{i\in S_k}w_{ij}x_i-p_k\right)+\sigma b_j\le 0\\
            & \sum\limits_{k=0}^{n-1}p_k+(1-\sigma)b_j\ge 0\\
            & \sigma l_k\le \sum\limits_{i\in S_k}w_{ij}x_i-p_k\le \sigma u_k,~0\le k<n\\
            & (1-\sigma)l_k\le p_k\le (1-\sigma)u_k,~0\le k<n
        \end{align*}

    """
    # not an input layer, process the expressions
    prev_layers = list(net.predecessors(layer))
    if len(prev_layers) == 0:
        raise ValueError(
            f"Layer {layer} is not an input layer, but has no predecessors."
        )
    elif len(prev_layers) > 1:
        raise ValueError(f"Layer {layer} has multiple predecessors.")
    prev_layer = prev_layers[0]
    prev_layer_block = net_block.layer[id(prev_layer)]

    @layer_block.Block(layer.output_indexes)
    def output_node_block(b, *output_index):
        # dense layers multiply only the last dimension of
        # their inputs
        weights = layer.weights[:, output_index[-1]]
        bias = layer.biases[output_index[-1]]

        splits = split_func(weights)
        num_splits = len(splits)

        b.sig = pyo.Var(domain=pyo.Binary)
        b.z2 = pyo.Var(range(num_splits))

        mapper = layer.input_index_mapper

        b.eq_16_lb = pyo.ConstraintList()
        b.eq_16_ub = pyo.ConstraintList()

        b.eq_17_lb = pyo.ConstraintList()
        b.eq_17_ub = pyo.ConstraintList()

        input_layer_indexes = list(layer.input_indexes_with_input_layer_indexes)

        # Add Equation 16 and 17
        for split_index in range(num_splits):
            expr = 0.0
            for split_local_index in splits[split_index]:
                _, local_index = input_layer_indexes[split_local_index]

                if mapper:
                    input_index = mapper(local_index)
                else:
                    input_index = local_index

                w = weights[local_index[-1]]
                expr += prev_layer_block.z[input_index] * w

            lb, ub = compute_bounds_on_expr(expr)
            if lb is None:
                raise ValueError("Expression is unbounded below.")
            if ub is None:
                raise ValueError("Expression is unbounded above.")

            z2 = b.z2[split_index]
            z2.setlb(min(0, lb))
            z2.setub(max(0, ub))

            b.eq_16_lb.add(expr - z2 >= b.sig * lb)
            b.eq_16_ub.add(expr - z2 <= b.sig * ub)
            b.eq_17_lb.add(z2 >= (1 - b.sig) * lb)
            b.eq_17_ub.add(z2 <= (1 - b.sig) * ub)

        # compute dense layer expression to compute bounds
        expr = 0.0
        for local_index, input_index in layer.input_indexes_with_input_layer_indexes:
            w = layer.weights[local_index[-1], output_index[-1]]
            expr += prev_layer_block.z[input_index] * w
        # move this at the end to avoid numpy/pyomo var bug
        expr += bias

        lb, ub = compute_bounds_on_expr(expr)
        if lb is None:
            raise ValueError("Expression is unbounded below.")
        if ub is None:
            raise ValueError("Expression is unbounded above.")

        layer_block.z[output_index].setlb(0)
        layer_block.z[output_index].setub(max(0, ub))

        eq_13_expr = 0.0
        for split_index in range(num_splits):
            for split_local_index in splits[split_index]:
                _, local_index = input_layer_indexes[split_local_index]
                if mapper:
                    input_index = mapper(local_index)
                else:
                    input_index = local_index

                w = weights[local_index[-1]]
                eq_13_expr += prev_layer_block.z[input_index] * w
            eq_13_expr -= b.z2[split_index]
        eq_13_expr += bias * b.sig

        b.eq_13 = pyo.Constraint(expr=eq_13_expr <= 0)
        b.eq_14 = pyo.Constraint(
            expr=sum(b.z2[s] for s in range(num_splits)) + bias * (1 - b.sig) >= 0
        )
        b.eq_15 = pyo.Constraint(
            expr=layer_block.z[output_index]
            == sum(b.z2[s] for s in range(num_splits)) + bias * (1 - b.sig)
        )