@@ -1812,11 +1812,20 @@ def version_9(cls, ctx, node, **kwargs):
1812
1812
onehot_indice = ctx .make_node ("Cast" , [label_name ], attr = {"to" : TensorProto .INT64 }).output [0 ]
1813
1813
else :
1814
1814
onehot_indice = label_name
1815
- label_node = ctx .make_node (op_type = "OneHot" ,
1816
- inputs = [onehot_indice , depth_node , values_node ])
1815
+ if ctx .opset < 11 :
1816
+ label_node = ctx .make_node (op_type = "OneHot" ,
1817
+ inputs = [onehot_indice , depth_node , values_node ])
1818
+ else :
1819
+ # OneHot is very slow; this faster Range/Equal workaround requires opset 11
1820
+ index_unsq = GraphBuilder (ctx ).make_unsqueeze ({'data' : onehot_indice , 'axes' : [- 1 ]})
1821
+ depth_sq = GraphBuilder (ctx ).make_squeeze ({'data' : depth_node , 'axes' : [0 ]})
1822
+ zero_const = ctx .make_const (utils .make_name ("const_zero" ), np .array (0 , np .int64 )).output [0 ]
1823
+ one_const = ctx .make_const (utils .make_name ("const_one" ), np .array (1 , np .int64 )).output [0 ]
1824
+ dp_range = ctx .make_node ("Range" , [zero_const , depth_sq , one_const ]).output [0 ]
1825
+ label_node = ctx .make_node ("Equal" , [index_unsq , dp_range ])
1817
1826
# the above logic leaves label_node as int64 (OneHot path) or bool (Equal path)
1818
1827
# make sure label has same dtype as logit
1819
- if logit_dtype != TensorProto . INT64 :
1828
+ if logit_dtype != ctx . get_dtype ( label_node . output [ 0 ]) :
1820
1829
label_node = ctx .make_node ("Cast" , label_node .output , attr = {"to" : logit_dtype }, dtypes = [logit_dtype ])
1821
1830
1822
1831
_make_sparse_softmax_cross_entropy_with_logits (ctx , label_node , logit_node , node )
0 commit comments