Fix xgboost converter, check value of best_ntree_limit (#429)

xadupre · wenbingl · web-flow · commit b04d05bda625 · 2021-01-08T00:32:26.000+01:00
Co-authored-by: Wenbing Li <10278425+wenbingl@users.noreply.github.com>
diff --git a/onnxmltools/convert/xgboost/operator_converters/XGBoost.py b/onnxmltools/convert/xgboost/operator_converters/XGBoost.py
@@ -188,6 +188,12 @@ def convert(scope, operator, container):
 
         attr_pairs = XGBRegressorConverter._get_default_tree_attribute_pairs()
         attr_pairs['base_values'] = [base_score]
+
+        bst = xgb_node.get_booster()
+        best_ntree_limit = getattr(bst, 'best_ntree_limit', len(js_trees))
+        if best_ntree_limit < len(js_trees):
+            js_trees = js_trees[:best_ntree_limit]
+
         XGBConverter.fill_tree_attributes(js_trees, attr_pairs, [1 for _ in js_trees], False)
 
         # add nodes
@@ -222,13 +228,19 @@ def convert(scope, operator, container):
         objective, base_score, js_trees = XGBConverter.common_members(xgb_node, inputs)
 
         params = XGBConverter.get_xgb_params(xgb_node)
-
         attr_pairs = XGBClassifierConverter._get_default_tree_attribute_pairs()
         XGBConverter.fill_tree_attributes(js_trees, attr_pairs, [1 for _ in js_trees], True)
+        ncl = (max(attr_pairs['class_treeids']) + 1) // params['n_estimators']
+
+        bst = xgb_node.get_booster()
+        best_ntree_limit = getattr(bst, 'best_ntree_limit', len(js_trees)) * ncl
+        if best_ntree_limit < len(js_trees):
+            js_trees = js_trees[:best_ntree_limit]
+            attr_pairs = XGBClassifierConverter._get_default_tree_attribute_pairs()
+            XGBConverter.fill_tree_attributes(js_trees, attr_pairs, [1 for _ in js_trees], True)
 
         if len(attr_pairs['class_treeids']) == 0:
             raise RuntimeError("XGBoost model is empty.")
-        ncl = (max(attr_pairs['class_treeids']) + 1) // params['n_estimators']
         if ncl <= 1:
             ncl = 2
             # See https://github.com/dmlc/xgboost/blob/master/src/common/math.h#L23.
diff --git a/tests/xgboost/test_xgboost_converters.py b/tests/xgboost/test_xgboost_converters.py
@@ -14,6 +14,7 @@
 from onnxmltools.convert import convert_xgboost
 from onnxmltools.convert.common.data_types import FloatTensorType
 from onnxmltools.utils import dump_data_and_model
+from onnxruntime import InferenceSession
 
 
 def _fit_classification_model(model, n_classes, is_str=False, dtype=None):
@@ -31,8 +32,6 @@ def _fit_classification_model(model, n_classes, is_str=False, dtype=None):
 
 class TestXGBoostModels(unittest.TestCase):
 
-    @unittest.skipIf(sys.version_info[0] == 2,
-                     reason="xgboost converter not tested on python 2")
     def test_xgb_regressor(self):
         iris = load_diabetes()
         x = iris.data
@@ -42,7 +41,7 @@ def test_xgb_regressor(self):
         xgb = XGBRegressor()
         xgb.fit(x_train, y_train)
         conv_model = convert_xgboost(
-            xgb, initial_types=[('input', FloatTensorType(shape=['None', 'None']))])
+            xgb, initial_types=[('input', FloatTensorType(shape=[None, None]))])
         self.assertTrue(conv_model is not None)
         dump_data_and_model(
             x_test.astype("float32"),
@@ -54,12 +53,10 @@ def test_xgb_regressor(self):
             "< StrictVersion('1.3.0')",
         )
 
-    @unittest.skipIf(sys.version_info[0] == 2,
-                     reason="xgboost converter not tested on python 2")
     def test_xgb_classifier(self):
         xgb, x_test = _fit_classification_model(XGBClassifier(), 2)
         conv_model = convert_xgboost(
-            xgb, initial_types=[('input', FloatTensorType(shape=['None', 'None']))])
+            xgb, initial_types=[('input', FloatTensorType(shape=[None, None]))])
         self.assertTrue(conv_model is not None)
         dump_data_and_model(
             x_test,
@@ -71,8 +68,6 @@ def test_xgb_classifier(self):
             "< StrictVersion('1.3.0')",
         )
 
-    @unittest.skipIf(sys.version_info[0] == 2,
-                     reason="xgboost converter not tested on python 2")
     def test_xgb_classifier_uint8(self):
         xgb, x_test = _fit_classification_model(
             XGBClassifier(), 2, dtype=np.uint8)
@@ -89,12 +84,10 @@ def test_xgb_classifier_uint8(self):
             "< StrictVersion('1.3.0')",
         )
 
-    @unittest.skipIf(sys.version_info[0] == 2,
-                     reason="xgboost converter not tested on python 2")
     def test_xgb_classifier_multi(self):
         xgb, x_test = _fit_classification_model(XGBClassifier(), 3)
         conv_model = convert_xgboost(
-            xgb, initial_types=[('input', FloatTensorType(shape=['None', 'None']))])
+            xgb, initial_types=[('input', FloatTensorType(shape=[None, None]))])
         self.assertTrue(conv_model is not None)
         dump_data_and_model(
             x_test,
@@ -106,13 +99,11 @@ def test_xgb_classifier_multi(self):
             "< StrictVersion('1.3.0')",
         )
 
-    @unittest.skipIf(sys.version_info[0] == 2,
-                     reason="xgboost converter not tested on python 2")
     def test_xgb_classifier_multi_reglog(self):
         xgb, x_test = _fit_classification_model(
             XGBClassifier(objective='reg:logistic'), 4)
         conv_model = convert_xgboost(
-            xgb, initial_types=[('input', FloatTensorType(shape=['None', 'None']))])
+            xgb, initial_types=[('input', FloatTensorType(shape=[None, None]))])
         self.assertTrue(conv_model is not None)
         dump_data_and_model(
             x_test,
@@ -124,13 +115,11 @@ def test_xgb_classifier_multi_reglog(self):
             "< StrictVersion('1.3.0')",
         )
 
-    @unittest.skipIf(sys.version_info[0] == 2,
-                     reason="xgboost converter not tested on python 2")
     def test_xgb_classifier_reglog(self):
         xgb, x_test = _fit_classification_model(
             XGBClassifier(objective='reg:logistic'), 2)
         conv_model = convert_xgboost(
-            xgb, initial_types=[('input', FloatTensorType(shape=['None', 'None']))])
+            xgb, initial_types=[('input', FloatTensorType(shape=[None, None]))])
         self.assertTrue(conv_model is not None)
         dump_data_and_model(
             x_test,
@@ -142,13 +131,11 @@ def test_xgb_classifier_reglog(self):
             "< StrictVersion('1.3.0')",
         )
 
-    @unittest.skipIf(sys.version_info[0] == 2,
-                     reason="xgboost converter not tested on python 2")
     def test_xgb_classifier_multi_str_labels(self):
         xgb, x_test = _fit_classification_model(
             XGBClassifier(n_estimators=4), 5, is_str=True)
         conv_model = convert_xgboost(
-            xgb, initial_types=[('input', FloatTensorType(shape=['None', 'None']))])
+            xgb, initial_types=[('input', FloatTensorType(shape=[None, None]))])
         self.assertTrue(conv_model is not None)
         dump_data_and_model(
             x_test,
@@ -160,8 +147,6 @@ def test_xgb_classifier_multi_str_labels(self):
             "< StrictVersion('1.3.0')",
         )
 
-    @unittest.skipIf(sys.version_info[0] == 2,
-                     reason="xgboost converter not tested on python 2")
     def test_xgb_classifier_multi_discrete_int_labels(self):
         iris = load_iris()
         x = iris.data[:, :2]
@@ -176,7 +161,7 @@ def test_xgb_classifier_multi_discrete_int_labels(self):
         xgb = XGBClassifier(n_estimators=3)
         xgb.fit(x_train, y_train)
         conv_model = convert_xgboost(
-            xgb, initial_types=[('input', FloatTensorType(shape=['None', 'None']))])
+            xgb, initial_types=[('input', FloatTensorType(shape=[None, None]))])
         self.assertTrue(conv_model is not None)
         dump_data_and_model(
             x_test.astype("float32"),
@@ -188,8 +173,6 @@ def test_xgb_classifier_multi_discrete_int_labels(self):
             "< StrictVersion('1.3.0')",
         )
 
-    @unittest.skipIf(sys.version_info[0] == 2,
-                     reason="xgboost converter not tested on python 2")
     def test_xgboost_booster_classifier_bin(self):
         x, y = make_classification(n_classes=2, n_features=5,
                                    n_samples=100,
@@ -207,8 +190,6 @@ def test_xgboost_booster_classifier_bin(self):
                             allow_failure="StrictVersion(onnx.__version__) < StrictVersion('1.3.0')",
                             basename="XGBBoosterMCl")
 
-    @unittest.skipIf(sys.version_info[0] == 2,
-                     reason="xgboost converter not tested on python 2")
     def test_xgboost_booster_classifier_multiclass(self):
         x, y = make_classification(n_classes=3, n_features=5,
                                    n_samples=100,
@@ -227,8 +208,6 @@ def test_xgboost_booster_classifier_multiclass(self):
                             allow_failure="StrictVersion(onnx.__version__) < StrictVersion('1.3.0')",
                             basename="XGBBoosterMCl")
 
-    @unittest.skipIf(sys.version_info[0] == 2,
-                     reason="xgboost converter not tested on python 2")
     def test_xgboost_booster_classifier_reg(self):
         x, y = make_classification(n_classes=2, n_features=5,
                                    n_samples=100,
@@ -247,8 +226,6 @@ def test_xgboost_booster_classifier_reg(self):
                             allow_failure="StrictVersion(onnx.__version__) < StrictVersion('1.3.0')",
                             basename="XGBBoosterReg")
 
-    @unittest.skipIf(sys.version_info[0] == 2,
-                     reason="xgboost converter not tested on python 2")
     def test_xgboost_10(self):
         this = os.path.abspath(os.path.dirname(__file__))
         train = os.path.join(this, "input_fail_train.csv")
@@ -282,6 +259,29 @@ def test_xgboost_10(self):
             allow_failure="StrictVersion(onnx.__version__) < StrictVersion('1.3.0')",
             basename="XGBBoosterRegBug")
 
+    def test_xgboost_classifier_i5450(self):
+        """Convert and run a multi:softmax classifier fitted with eval_set and early_stopping_rounds."""
+        iris = load_iris()
+        X, y = iris.data, iris.target
+        X_train, X_test, y_train, y_test = train_test_split(X, y, random_state=10)
+        clr = XGBClassifier(objective="multi:softmax", max_depth=1, n_estimators=2)
+        clr.fit(X_train, y_train, eval_set=[(X_test, y_test)], early_stopping_rounds=40)
+        initial_type = [('float_input', FloatTensorType([None, 4]))]
+        onx = convert_xgboost(clr, initial_types=initial_type)
+        sess = InferenceSession(onx.SerializeToString())
+        input_name = sess.get_inputs()[0].name
+        label_name = sess.get_outputs()[1].name
+        predict_array = np.array([[1., 20., 466., 0.]], dtype=np.float32)
+        # NOTE(review): both predictions are computed but never compared; only the calls are exercised.
+        pred_onx = sess.run([label_name], {input_name: predict_array})[0]
+        pred_xgboost = clr.predict_proba(predict_array)
+        clr.get_booster().dump_model('dump.raw.txt')
+        dump_data_and_model(
+            X_test.astype(np.float32) + 1e-5,
+            clr, onx,
+            allow_failure="StrictVersion(onnx.__version__) < StrictVersion('1.3.0')",
+            basename="XGBClassifierIris")
+
     def test_xgboost_example_mnist(self):
         """
         Train a simple xgboost model and store associated artefacts.