# Copyright (c) Microsoft Corporation. All rights reserved.
# Licensed under the MIT license.

| 4 | +""" |
| 5 | +tfl_math |
| 6 | +""" |

import logging
import numpy as np
from tf2onnx.handler import tfl_op
from tf2onnx import utils

logger = logging.getLogger(__name__)


# pylint: disable=unused-argument,missing-docstring,unused-variable,pointless-string-statement,invalid-name


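# TFLite ops carry an optional activation fused into the op itself via the
# 'fused_activation_function' attribute. TF/ONNX have no such concept, so the
# helper below strips the attribute and appends the activation as a separate
# node on the op's output.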
def separate_fused_activation_function(ctx, node):
    activation_fn = node.attr['fused_activation_function'].s
    del node.attr['fused_activation_function']
    if activation_fn == b'RELU':
        ctx.insert_new_node_on_output("Relu", node.output[0])
    elif activation_fn == b'RELU6':
        new_node = ctx.insert_new_node_on_output("Relu6", node.output[0])
        new_node.skip_conversion = False
    elif activation_fn == b'TANH':
        ctx.insert_new_node_on_output("Tanh", node.output[0])
    else:
        # TODO: SIGN_BIT and RELU_N1_TO_1 not supported yet
        utils.make_sure(activation_fn == b'NONE', "Unsupported fused activation function %s on node %s",
                        activation_fn, node.name)

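# The elementwise arithmetic ops map 1:1 to their TF counterparts (named via the
# decorator's tf_op argument); the only TFLite-specific work is splitting out
# the fused activation function.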
@tfl_op(["TFL_ADD"], tf_op="Add")
class TflAdd:
    @classmethod
    def to_tf(cls, ctx, node, **kwargs):
        separate_fused_activation_function(ctx, node)

@tfl_op(["TFL_SUB"], tf_op="Sub")
class TflSub:
    @classmethod
    def to_tf(cls, ctx, node, **kwargs):
        separate_fused_activation_function(ctx, node)

@tfl_op(["TFL_MUL"], tf_op="Mul")
class TflMul:
    @classmethod
    def to_tf(cls, ctx, node, **kwargs):
        separate_fused_activation_function(ctx, node)

@tfl_op(["TFL_DIV"], tf_op="Div")
class TflDiv:
    @classmethod
    def to_tf(cls, ctx, node, **kwargs):
        separate_fused_activation_function(ctx, node)

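# TFL_LOGISTIC and the reduce ops below also map directly to the TF ops named in
# the decorator and need no attribute rewriting.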
@tfl_op(["TFL_LOGISTIC"], tf_op="Sigmoid")
class TflLogistic:
    @classmethod
    def to_tf(cls, ctx, node, **kwargs):
        pass

@tfl_op(["TFL_REDUCE_MAX"], tf_op="Max")
@tfl_op(["TFL_REDUCE_ANY"], tf_op="Any")
@tfl_op(["TFL_REDUCE_PROD"], tf_op="Prod")
class TflReduceOp:
    @classmethod
    def to_tf(cls, ctx, node, **kwargs):
        pass

@tfl_op(["TFL_LOCAL_RESPONSE_NORMALIZATION"], tf_op="LRN")
class TFlLocalResponseNormalizationOp:
    @classmethod
    def to_tf(cls, ctx, node, **kwargs):
        node.attr["depth_radius"] = node.attr["radius"]
        del node.attr["radius"]

@tfl_op(["TFL_RANGE"], tf_op="Range")
class TflRangeOp:
    @classmethod
    def to_tf(cls, ctx, node, **kwargs):
        node.set_attr("Tidx", ctx.get_dtype(node.output[0]))

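# TFLite stores quantization parameters (scale, zero_point, quantized_dimension)
# as op attributes, while ONNX QuantizeLinear/DequantizeLinear take scale and
# zero point as inputs. The handlers below turn the attributes into const inputs,
# e.g. TFL_QUANTIZE(x) {scale=[s], zero_point=[z]} -> QuantizeLinear(x, s, z).
# Per-axis parameters additionally need the 'axis' attribute, which ONNX only
# supports from opset 13 on.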
@tfl_op(["TFL_QUANTIZE"], onnx_op="QuantizeLinear")
class TflQuantizeOp:
    @classmethod
    def version_10(cls, ctx, node, **kwargs):
        scale = node.get_attr_value('scale')
        zero_point = node.get_attr_value('zero_point')
        axis = node.get_attr_value('quantized_dimension')
        np_q_type = utils.map_onnx_to_numpy_type(ctx.get_dtype(node.output[0]))
        if len(scale) > 1 or len(zero_point) > 1:
            utils.make_sure(ctx.opset >= 13, "Opset 13 is required for per-axis quantization")
            node.set_attr("axis", axis)
            scale_node = ctx.make_const(utils.make_name("scale"), np.array(scale, dtype=np.float32))
            zero_point_node = ctx.make_const(utils.make_name("zero_point"), np.array(zero_point, dtype=np_q_type))
        else:
            scale_node = ctx.make_const(utils.make_name("scale"), np.array(scale[0], dtype=np.float32))
            zero_point_node = ctx.make_const(utils.make_name("zero_point"), np.array(zero_point[0], dtype=np_q_type))
        ctx.replace_inputs(node, [node.input[0], scale_node.output[0], zero_point_node.output[0]])
        del node.attr["scale"]
        del node.attr["zero_point"]
        del node.attr["quantized_dimension"]

@tfl_op(["TFL_DEQUANTIZE"], onnx_op="DequantizeLinear")
class TflDequantizeOp:
    @classmethod
    def version_10(cls, ctx, node, **kwargs):
        scale = node.get_attr_value('scale')
        zero_point = node.get_attr_value('zero_point')
        axis = node.get_attr_value('quantized_dimension')
        np_q_type = utils.map_onnx_to_numpy_type(ctx.get_dtype(node.input[0]))
        if len(scale) > 1 or len(zero_point) > 1:
            utils.make_sure(ctx.opset >= 13, "Opset 13 is required for per-axis quantization")
            node.set_attr("axis", axis)
            scale_node = ctx.make_const(utils.make_name("scale"), np.array(scale, dtype=np.float32))
            zero_point_node = ctx.make_const(utils.make_name("zero_point"), np.array(zero_point, dtype=np_q_type))
        else:
            scale_node = ctx.make_const(utils.make_name("scale"), np.array(scale[0], dtype=np.float32))
            zero_point_node = ctx.make_const(utils.make_name("zero_point"), np.array(zero_point[0], dtype=np_q_type))
        ctx.replace_inputs(node, [node.input[0], scale_node.output[0], zero_point_node.output[0]])
        del node.attr["scale"]
        del node.attr["zero_point"]
        del node.attr["quantized_dimension"]

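# TFLite's 'asymmetric_quantize_inputs' flag corresponds to dynamic-range
# quantization: float inputs are quantized on the fly at inference time. This is
# emulated by wrapping each not-yet-quantized input in a DynamicQuantizeLinear/
# DequantizeLinear pair (DynamicQuantizeLinear requires opset 11).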
def dynamic_quantize_inputs(ctx, node):
    if ctx.opset < 11:
        logger.warning("Opset 11 is required for asymmetric_quantize_inputs of node %s", node.name)
        return
    for i in range(len(node.input)):
        # Don't quantize inputs that are already quantized
        if node.inputs[i].type in ["DequantizeLinear", "TFL_DEQUANTIZE"]:
            continue
        dyn_quant = ctx.make_node("DynamicQuantizeLinear", [node.input[i]], output_count=3, op_name_scope=node.name)
        dyn_quant.skip_conversion = True
        dequant = ctx.make_node("DequantizeLinear", dyn_quant.output, op_name_scope=node.name)
        dequant.skip_conversion = True
        ctx.replace_input(node, node.input[i], dequant.output[0], input_index=i)

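# TFL_FULLY_CONNECTED becomes MatMul(x, Transpose(weights)), since TFLite stores
# the weights as [out_dim, in_dim] while MatMul expects [in_dim, out_dim]. An
# optional third input is the bias, which is split out into a trailing Add.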
@tfl_op(["TFL_FULLY_CONNECTED"])
class TflFullyConnectedOp:
    @classmethod
    def to_tf(cls, ctx, node, **kwargs):
        separate_fused_activation_function(ctx, node)
        utils.make_sure(node.attr['weights_format'].s == b'DEFAULT',
                        "Only default weights format supported for fully connected op")
        utils.make_sure(node.attr['keep_num_dims'].i == 0,
                        "Only keep_num_dims=False supported for fully connected op")
        if node.attr['asymmetric_quantize_inputs'].i == 1:
            dynamic_quantize_inputs(ctx, node)

        transpose_node = ctx.insert_new_node_on_input(node, "Transpose", node.input[1],
                                                      name=None, input_index=1, perm=[1, 0])
        transpose_node.skip_conversion = True
        node.set_attr("transpose_a", 0)
        node.set_attr("transpose_b", 0)
        node.type = "MatMul"

        if len(node.input) == 3:
            # FIXME: Add a test for this
            bias_inp = node.input[2]
            ctx.replace_inputs(node, node.input[:2])
            add_node = ctx.insert_new_node_on_output("Add", node.output[0], inputs=[node.output[0], bias_inp])
            add_node.skip_conversion = True

        del node.attr["weights_format"]
        del node.attr["keep_num_dims"]
        del node.attr["asymmetric_quantize_inputs"]

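# TFLite's softmax takes a scaling factor and computes softmax(beta * logits),
# so beta is applied to the input of the Softmax node.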
@tfl_op(["TFL_SOFTMAX"], tf_op="Softmax")
class TFlSoftmaxOp:
    @classmethod
    def to_tf(cls, ctx, node, **kwargs):
        beta = node.get_attr_value("beta")
        beta_node = ctx.make_const(utils.make_name("beta"), np.array(beta, dtype=np.float32))
        mul_node = ctx.insert_new_node_on_input(node, "Mul", node.input[0], name=utils.make_name(node.name))
        ctx.replace_inputs(mul_node, [mul_node.input[0], beta_node.output[0]])