Module furiosa.quantizer.frontend.onnx.transformer.deprecated.fuse_softmax

Source code
import onnx
import numpy as np

from onnx.helper import make_node, make_tensor_value_info

from furiosa_sdk_quantizer.interfaces.transformer import Transformer
from furiosa_sdk_quantizer.frontend.onnx.transformer import utils
from furiosa_sdk_quantizer.frontend.onnx.utils.check_model import check_model


class FuseSoftmax(Transformer):
    """
    https://github.com/onnx/onnx/blob/master/docs/Operators.md#softmax
    from: Exp -> ReduceSum -> Div
    to: Transpose -> Softmax -> Transpose
    
    Assume NCHW Input
    """

    def transform(self, model: onnx.ModelProto) -> onnx.ModelProto:
        nodes_by_output_name = {node.output[0]: node for node in model.graph.node}
        initializer = {init.name: init for init in model.graph.initializer}
        value_info = {vi.name: vi for vi in
                      list(model.graph.value_info) + list(model.graph.input) + list(model.graph.output)}

        post_fix = '_transposed'
        optimized_nodes = []
        removed_nodes = []
        for node in model.graph.node:
            if node.op_type != 'Div':
                optimized_nodes.append(node)
                continue

            # The ONNX spec imposes no input order on Div, so find which input
            # comes from Exp and which from ReduceSum.
            def _is_input_op_type(node_input, op_type):
                if node_input in initializer:
                    return False
                # Graph inputs have no producer node; treat them as non-matches.
                producer = nodes_by_output_name.get(node_input)
                return producer is not None and producer.op_type == op_type

            idx_exp = list(filter(lambda enum: _is_input_op_type(enum[1], 'Exp'), enumerate(node.input)))
            idx_rsum = list(filter(lambda enum: _is_input_op_type(enum[1], 'ReduceSum'), enumerate(node.input)))

            # Expect exactly one input from Exp and one from ReduceSum;
            # otherwise this Div is not part of a softmax pattern.
            if len(idx_exp) != 1 or len(idx_rsum) != 1:
                optimized_nodes.append(node)
                continue

            idx_exp = idx_exp[0][0]
            idx_rsum = idx_rsum[0][0]

            exp_node = nodes_by_output_name[node.input[idx_exp]]
            rsum_node = nodes_by_output_name[node.input[idx_rsum]]
            removed_nodes.extend([node, exp_node, rsum_node])

            exp_shape = [dim.dim_value for dim in value_info[exp_node.output[0]].type.tensor_type.shape.dim]
            length = len(exp_shape)

            # ReduceSum (opset < 13) carries its axes as an attribute; look it
            # up by name rather than assuming it is the first attribute.
            axes = next(attr.ints for attr in rsum_node.attribute if attr.name == 'axes')

            # The fusion only applies when ReduceSum reduces a single axis.
            assert len(axes) == 1
            axis = axes[0]
            # Normalize a negative axis (e.g. -1) to its positive form.
            if axis < 0:
                axis += length

            # Build the permutation that swaps the reduction axis with the last
            # axis. A transposition is its own inverse, so the same perm also
            # undoes the swap in the second Transpose below.
            perm = list(range(length))
            perm[axis], perm[-1] = perm[-1], perm[axis]

            new_vi = []
            if axis != length - 1:
                # The reduction axis is not last: move it to the last position,
                # apply Softmax over the last axis, then move it back.
                trans_node_1 = make_node('Transpose', inputs=[exp_node.input[0]],
                                         outputs=[exp_node.output[0] + post_fix], perm=perm)

                softmax_node = make_node('Softmax', inputs=[exp_node.output[0] + post_fix],
                                         outputs=[exp_node.output[0] + '_softmax'], axis=length - 1)

                trans_node_2 = make_node('Transpose', inputs=[exp_node.output[0] + '_softmax'],
                                         outputs=[node.output[0]], perm=perm)
                optimized_nodes.extend([trans_node_1, softmax_node, trans_node_2])
                perm1_shape = np.array(exp_shape)[perm].tolist()
                new_vi.append(make_tensor_value_info(name=softmax_node.output[0],
                                                     elem_type=onnx.TensorProto.FLOAT,
                                                     shape=perm1_shape))
                new_vi.append(make_tensor_value_info(name=trans_node_1.output[0],
                                                     elem_type=onnx.TensorProto.FLOAT,
                                                     shape=perm1_shape))
            else:
                # The reduction axis is already last; a bare Softmax suffices.
                softmax_node = make_node('Softmax', inputs=[exp_node.input[0]],
                                         outputs=[node.output[0]], axis=length - 1)
                optimized_nodes.append(softmax_node)

            model.graph.value_info.extend(new_vi)

        # drop duplicate nodes from optimized_nodes, preserving order
        seen = []
        for op_node in optimized_nodes:
            if op_node not in seen:
                seen.append(op_node)
        optimized_nodes = seen

        new_nodes = list(filter(lambda node: node not in removed_nodes, optimized_nodes))
        model = utils.rebuild_model(model, new_nodes)
        check_model(model)

        return model
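
Why the rewrite is sound: Exp -> ReduceSum -> Div computes exactly exp(x) / sum(exp(x)), i.e. a softmax along the reduced axis, and the axis-swap permutation built above is its own inverse. A minimal numpy sketch of both facts (illustrative only, not part of the module):

import numpy as np

def softmax(x, axis):
    # Reference softmax: exponentiate, then normalize along `axis`.
    e = np.exp(x)
    return e / e.sum(axis=axis, keepdims=True)

x = np.random.rand(1, 3, 8, 8)

# Exp -> ReduceSum -> Div over axis 1 is exactly softmax over axis 1.
manual = np.exp(x) / np.exp(x).sum(axis=1, keepdims=True)
assert np.allclose(manual, softmax(x, axis=1))

# Swap axis 1 with the last axis, softmax over the last axis, then apply the
# same swap again: a transposition is its own inverse, so this reproduces
# softmax over axis 1 of the original tensor.
perm = [0, 3, 2, 1]
wrapped = softmax(x.transpose(perm), axis=-1).transpose(perm)
assert np.allclose(wrapped, softmax(x, axis=1))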

Classes

class FuseSoftmax (*args, **kwds)

https://github.com/onnx/onnx/blob/master/docs/Operators.md#softmax
Fuses the pattern Exp -> ReduceSum -> Div into a single Softmax node, wrapped in a Transpose pair (Transpose -> Softmax -> Transpose) when the reduction axis is not the last axis.

Assumes NCHW input.
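
A minimal usage sketch, assuming the import path in the module title and an opset in which ReduceSum still takes its axes as an attribute (opset < 13), since the transformer reads the axes from the node's attributes. The graph hand-builds the Exp -> ReduceSum -> Div pattern over the channel axis; value_info for the Exp output is required because the transformer reads the shape from there:

import onnx
from onnx import TensorProto
from onnx.helper import (make_graph, make_model, make_node, make_opsetid,
                         make_tensor_value_info)

from furiosa.quantizer.frontend.onnx.transformer.deprecated.fuse_softmax import FuseSoftmax

shape = [1, 3, 8, 8]
x = make_tensor_value_info('x', TensorProto.FLOAT, shape)
y = make_tensor_value_info('y', TensorProto.FLOAT, shape)

exp = make_node('Exp', inputs=['x'], outputs=['exp_out'])
# keepdims=1 keeps the reduced axis so the Div below broadcasts cleanly.
rsum = make_node('ReduceSum', inputs=['exp_out'], outputs=['sum_out'],
                 axes=[1], keepdims=1)
div = make_node('Div', inputs=['exp_out', 'sum_out'], outputs=['y'])

graph = make_graph(
    [exp, rsum, div], 'softmax_pattern', [x], [y],
    # FuseSoftmax looks up the shape of the Exp output in value_info.
    value_info=[make_tensor_value_info('exp_out', TensorProto.FLOAT, shape)],
)
model = make_model(graph, opset_imports=[make_opsetid('', 12)])

model = FuseSoftmax().transform(model)
# Axis 1 is not the last axis, so the result is Transpose -> Softmax -> Transpose.
print([n.op_type for n in model.graph.node])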


Ancestors

  • furiosa_sdk_quantizer.interfaces.transformer.Transformer
  • typing.Generic

Methods

def transform(self, model: onnx.onnx_ml_pb2.ModelProto) -> onnx.onnx_ml_pb2.ModelProto
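
Applies the Exp -> ReduceSum -> Div fusion described above and returns the rewritten model; the result is validated with check_model before it is returned.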