From 182ad8f24c75eb3d459949ad3fd060e039fd4299 Mon Sep 17 00:00:00 2001
From: fis
Date: Sun, 12 Apr 2020 20:26:37 +0800
Subject: [PATCH 01/16] Allow slicing tree models.

* Implement `save_best`.
---
 doc/python/callbacks.rst           |   8 +-
 doc/python/index.rst               |   1 +
 doc/python/model.rst               |  27 +++++++
 include/xgboost/c_api.h            |  15 ++++
 include/xgboost/gbm.h              |  10 +++
 include/xgboost/learner.h          |  10 +++
 python-package/xgboost/callback.py |  22 ++++--
 python-package/xgboost/core.py     |  31 +++++++-
 python-package/xgboost/training.py |   4 +-
 src/c_api/c_api.cc                 |  12 +++
 src/gbm/gbtree.cc                  |  42 ++++++++++
 src/gbm/gbtree.h                   |  57 +++++++++++--
 src/gbm/gbtree_model.cc            |   2 +-
 src/gbm/gbtree_model.h             |   3 +-
 src/learner.cc                     |  22 ++++++
 tests/cpp/gbm/test_gbtree.cc       | 123 ++++++++++++++++++++++++++++-
 tests/cpp/test_learner.cc          |   7 +-
 tests/python/test_basic_models.py  |  54 +++++++++++++
 18 files changed, 419 insertions(+), 31 deletions(-)
 create mode 100644 doc/python/model.rst

diff --git a/doc/python/callbacks.rst b/doc/python/callbacks.rst
index 009b4d742fe5..943df4d511b8 100644
--- a/doc/python/callbacks.rst
+++ b/doc/python/callbacks.rst
@@ -7,9 +7,9 @@ package. In XGBoost 1.3, a new callback interface is designed for Python packag
 provides the flexibility of designing various extensions for training.  Also, XGBoost has a
 number of pre-defined callbacks for supporting early stopping, checkpoints, etc.
 
-#######################
+
 Using builtin callbacks
-#######################
+-----------------------
 
 By default, training methods in XGBoost have parameters like ``early_stopping_rounds``
 and ``verbose``/``verbose_eval``; when specified, the training procedure will define the
@@ -50,9 +50,9 @@ this callback function directly into XGBoost:
     dump = booster.get_dump(dump_format='json')
     assert len(early_stop.stopping_history['Valid']['CustomErr']) == len(dump)
 
-##########################
+
 Defining your own callback
-##########################
+--------------------------
 
 XGBoost provides a callback interface class: ``xgboost.callback.TrainingCallback``.
 User-defined callbacks should inherit this class and override corresponding methods.  There's a
diff --git a/doc/python/index.rst b/doc/python/index.rst
index 7596be247f9b..d46b6cb45df3 100644
--- a/doc/python/index.rst
+++ b/doc/python/index.rst
@@ -12,4 +12,5 @@ Contents
   python_intro
   python_api
   callbacks
+  model
   Python examples
diff --git a/doc/python/model.rst b/doc/python/model.rst
new file mode 100644
index 000000000000..176f9012e544
--- /dev/null
+++ b/doc/python/model.rst
@@ -0,0 +1,27 @@
+#####
+Model
+#####
+
+Slice tree model
+----------------
+
+When ``booster`` is set to ``gbtree`` or ``dart``, XGBoost builds a tree model, which is a
+list of trees and can be sliced into multiple sub-models.
+
+.. code-block:: python
+    from sklearn.datasets import make_classification
+    num_classes = 3
+    X, y = make_classification(n_samples=1000, n_informative=5,
+                               n_classes=num_classes)
+    dtrain = xgb.DMatrix(data=X, label=y)
+    num_parallel_tree = 4
+    num_boost_round = 16
+    total_trees = num_parallel_tree * num_classes * num_boost_round
+
+    # We build a boosted random forest for classification here.
+ booster = xgb.train({ + 'num_parallel_tree': 4, 'subsample': 0.5, 'num_class': 3}, + num_boost_round=num_boost_round, dtrain=dtrain) + + # This is the sliced model, containing [3, 7) forests + sliced: xgb.Booster = booster[3:7] diff --git a/include/xgboost/c_api.h b/include/xgboost/c_api.h index 4db461d11b1c..3988dddac892 100644 --- a/include/xgboost/c_api.h +++ b/include/xgboost/c_api.h @@ -580,6 +580,21 @@ XGB_DLL int XGBoosterCreate(const DMatrixHandle dmats[], */ XGB_DLL int XGBoosterFree(BoosterHandle handle); +/*! + * \brief Slice a model according to layers. + * + * \param handle Booster to be sliced. + * \param begin_layer + * \param end_layer + * \param step + * \param out Sliced booster. + * + * \return 0 when success, -1 when failure happens + */ +XGB_DLL int XGBoosterSlice(BoosterHandle handle, int begin_layer, + int end_layer, int step, + BoosterHandle *out); + /*! * \brief set parameters * \param handle handle diff --git a/include/xgboost/gbm.h b/include/xgboost/gbm.h index 8081e15d0922..e4a5683f153a 100644 --- a/include/xgboost/gbm.h +++ b/include/xgboost/gbm.h @@ -60,6 +60,16 @@ class GradientBooster : public Model, public Configurable { * \param fo output stream */ virtual void Save(dmlc::Stream* fo) const = 0; + /*! + * \brief Slice the model. + * \param layer_begin Begining of boosted tree layer used for prediction. + * \param layer_end End of booster layer. 0 means do not limit trees. + * \param out Output gradient booster + */ + virtual void Slice(int32_t layer_begin, int32_t layer_end, int32_t step, + GradientBooster *out) const { + LOG(FATAL) << "Slice is not supported by current booster."; + } /*! * \brief whether the model allow lazy checkpoint * return true if model is only updated in DoBoost diff --git a/include/xgboost/learner.h b/include/xgboost/learner.h index 50b20de677f1..865e7fec8b01 100644 --- a/include/xgboost/learner.h +++ b/include/xgboost/learner.h @@ -195,6 +195,16 @@ class Learner : public Model, public Configurable, public dmlc::Serializable { * \return whether the model allow lazy checkpoint in rabit. */ bool AllowLazyCheckPoint() const; + /*! + * \brief Slice the model. + * + * See InplacePredict for layer parameters. + * + * \param step step size between slice. + * + * \return a sliced model. + */ + virtual Learner *Slice(int32_t begin_layer, int32_t end_layer, int32_t step) = 0; /*! * \brief dump the model in the requested format * \param fmap feature map that may help give interpretations of feature diff --git a/python-package/xgboost/callback.py b/python-package/xgboost/callback.py index 32cc957cb5c9..d30f5a07499f 100644 --- a/python-package/xgboost/callback.py +++ b/python-package/xgboost/callback.py @@ -10,7 +10,7 @@ import numpy from . import rabit -from .core import EarlyStopException, CallbackEnv +from .core import EarlyStopException, CallbackEnv, Booster from .compat import STRING_TYPES @@ -279,9 +279,11 @@ def __init__(self): def before_training(self, model): '''Run before training starts.''' + return model def after_training(self, model): '''Run after training is finished.''' + return model def before_iteration(self, model, epoch, evals_log): '''Run before each iteration. 
Return True when training should stop.''' @@ -362,12 +364,16 @@ def __init__(self, callbacks: List[TrainingCallback], def before_training(self, model): '''Function called before training.''' for c in self.callbacks: - c.before_training(model=model) + model = c.before_training(model=model) + assert isinstance(model, Booster), 'before_training should return the Booster' + return model def after_training(self, model): '''Function called after training.''' for c in self.callbacks: - c.after_training(model) + model = c.after_training(model=model) + assert isinstance(model, Booster), 'after_training should return the Booster' + return model def before_iteration(self, model, epoch, dtrain, evals): '''Function called before training iteration.''' @@ -461,7 +467,7 @@ class EarlyStopping(TrainingCallback): maximize : bool Whether to maximize evaluation metric. None means auto (discouraged). save_best : bool - Placeholder, the feature is not yet supported. + Whether training should return the best model or the last model. ''' def __init__(self, rounds, @@ -473,9 +479,6 @@ def __init__(self, self.metric_name = metric_name self.rounds = rounds self.save_best = save_best - # https://github.com/dmlc/xgboost/issues/5531 - assert self.save_best is False, 'save best is not yet supported.' - self.maximize = maximize self.stopping_history = {} @@ -551,6 +554,11 @@ def after_iteration(self, model, epoch, evals_log): score = data_log[metric_name][-1] return self._update_rounds(score, data_name, metric_name, model, epoch) + def after_training(self, model): + if self.save_best: + model = model[: model.best_iteration] + return model + class EvaluationMonitor(TrainingCallback): '''Print the evaluation result at each iteration. diff --git a/python-package/xgboost/core.py b/python-package/xgboost/core.py index e834f409b6f2..78d841933a2d 100644 --- a/python-package/xgboost/core.py +++ b/python-package/xgboost/core.py @@ -947,8 +947,8 @@ def __init__(self, params=None, cache=(), model_file=None): Parameters for boosters. cache : list List of cache items. - model_file : string or os.PathLike - Path to the model file. + model_file : string/os.PathLike/Booster/bytearray + Path to the model file if it's string or PathLike. """ for d in cache: if not isinstance(d, DMatrix): @@ -1024,6 +1024,33 @@ def __setstate__(self, state): state['handle'] = handle self.__dict__.update(state) + def __getitem__(self, val: slice): + if isinstance(val.start, type(Ellipsis)) or val.start is None: + start = 0 + else: + start = val.start + + if isinstance(val.stop, type(Ellipsis)) or val.stop is None: + stop = 0 + else: + stop = val.stop + if stop < start: + raise ValueError('Invalid slice', val) + + step = val.step if val.step else 1 + + start = ctypes.c_uint(start) + stop = ctypes.c_uint(stop) + step = c_bst_ulong(step) + + sliced_handle = ctypes.c_void_p() + _check_call(_LIB.XGBoosterSlice(self.handle, start, stop, step, + ctypes.byref(sliced_handle))) + sliced = Booster() + _check_call(_LIB.XGBoosterFree(sliced.handle)) + sliced.handle = sliced_handle + return sliced + def save_config(self): '''Output internal parameter configuration of Booster as a JSON string. 
diff --git a/python-package/xgboost/training.py b/python-package/xgboost/training.py
index 6b333e246d4a..ef280dba4786 100644
--- a/python-package/xgboost/training.py
+++ b/python-package/xgboost/training.py
@@ -101,7 +101,7 @@ def _train_internal(params, dtrain,
                                        num_boost_round,
                                        feval, evals_result, callbacks,
                                        show_stdv=False, cvfolds=None)
 
-    callbacks.before_training(bst)
+    bst = callbacks.before_training(bst)
     for i in range(start_iteration, num_boost_round):
         if callbacks.before_iteration(bst, i, dtrain, evals):
             break
@@ -123,7 +123,7 @@ def _train_internal(params, dtrain,
             bst.save_rabit_checkpoint()
         version += 1
 
-    callbacks.after_training(bst)
+    bst = callbacks.after_training(bst)
 
     if evals_result is not None and is_new_callback:
         evals_result.update(callbacks.history)
diff --git a/src/c_api/c_api.cc b/src/c_api/c_api.cc
index d91b179f0a5c..3fb60f72b2cb 100644
--- a/src/c_api/c_api.cc
+++ b/src/c_api/c_api.cc
@@ -730,6 +730,18 @@ XGB_DLL int XGBoosterSaveRabitCheckpoint(BoosterHandle handle) {
   API_END();
 }
 
+XGB_DLL int XGBoosterSlice(BoosterHandle handle, int begin_layer,
+                           int end_layer, int step,
+                           BoosterHandle *out) {
+  API_BEGIN();
+  CHECK_HANDLE();
+  auto* learner = static_cast<Learner*>(handle);
+  auto p_out = learner->Slice(begin_layer, end_layer, step);
+  CHECK(p_out);
+  *out = p_out;
+  API_END();
+}
+
 inline void XGBoostDumpModelImpl(BoosterHandle handle, const FeatureMap &fmap,
                                  int with_stats, const char *format,
                                  xgboost::bst_ulong *len,
diff --git a/src/gbm/gbtree.cc b/src/gbm/gbtree.cc
index 5d88b4d34ac2..6d84ce7e9dc4 100644
--- a/src/gbm/gbtree.cc
+++ b/src/gbm/gbtree.cc
@@ -398,6 +398,36 @@ void GBTree::SaveModel(Json* p_out) const {
   model_.SaveModel(&model);
 }
 
+void GBTree::Slice(int32_t layer_begin, int32_t layer_end, int32_t step,
+                   GradientBooster *out) const {
+  CHECK(configured_);
+  CHECK(out);
+
+  auto p_gbtree = dynamic_cast<GBTree *>(out);
+  CHECK(p_gbtree);
+  GBTreeModel &out_model = p_gbtree->model_;
+  auto layer_trees = this->LayerTrees();
+
+  layer_end = layer_end == 0 ?
+      model_.trees.size() / layer_trees : layer_end;
+  CHECK_GE(layer_end, layer_begin);
+  int32_t n_layers = (layer_end - layer_begin) / step;
+  std::vector<std::unique_ptr<RegTree>> &out_trees = out_model.trees;
+  out_trees.resize(layer_trees * n_layers);
+  std::vector<int> &out_trees_info = out_model.tree_info;
+  out_trees_info.resize(layer_trees * n_layers);
+  out_model.param.num_trees = out_model.trees.size();
+  CHECK(this->model_.trees_to_update.empty());
+
+  detail::SliceTrees(layer_begin, layer_end, step, this->model_, tparam_,
+                     layer_trees, [&](auto const &in_it, auto const &out_it) {
+                       auto new_tree = std::make_unique<RegTree>(
+                           *this->model_.trees.at(in_it));
+                       bst_group_t group = this->model_.tree_info[in_it];
+                       out_trees.at(out_it) = std::move(new_tree);
+                       out_trees_info.at(out_it) = group;
+                     });
+}
+
 void GBTree::PredictBatch(DMatrix* p_fmat,
                           PredictionCacheEntry* out_preds,
                           bool,
@@ -494,6 +524,18 @@ class Dart : public GBTree {
     dparam_.UpdateAllowUnknown(cfg);
   }
 
+  void Slice(int32_t layer_begin, int32_t layer_end, int32_t step,
+             GradientBooster *out) const final {
+    GBTree::Slice(layer_begin, layer_end, step, out);
+    auto p_dart = dynamic_cast<Dart *>(out);
+    CHECK(p_dart);
+    detail::SliceTrees(
+        layer_begin, layer_end, step, model_, tparam_, this->LayerTrees(),
+        [&](auto const& in_it, auto const& out_it) {
+          p_dart->weight_drop_.push_back(this->weight_drop_.at(in_it));
+        });
+  }
+
   void SaveModel(Json *p_out) const override {
     auto &out = *p_out;
     out["name"] = String("dart");
diff --git a/src/gbm/gbtree.h b/src/gbm/gbtree.h
index f96a895aef9e..854224c84297 100644
--- a/src/gbm/gbtree.h
+++ b/src/gbm/gbtree.h
@@ -152,6 +152,46 @@ struct DartTrainParam : public XGBoostParameter<DartTrainParam> {
   }
 };
 
+namespace detail {
+// From here on, layer becomes concrete trees.
+inline std::pair<uint32_t, uint32_t> LayerToTree(gbm::GBTreeModel const &model,
+                                                 GBTreeTrainParam const &tparam,
+                                                 size_t layer_begin,
+                                                 size_t layer_end) {
+  bst_group_t groups = model.learner_model_param->num_output_group;
+  uint32_t tree_begin = layer_begin * groups * tparam.num_parallel_tree;
+  uint32_t tree_end = layer_end * groups * tparam.num_parallel_tree;
+  if (tree_end == 0 || tree_end > model.trees.size()) {
+    tree_end = static_cast<uint32_t>(model.trees.size());
+  }
+  CHECK_LE(tree_end, model.trees.size());
+  CHECK_LT(tree_begin, tree_end);
+  return {tree_begin, tree_end};
+}
+
+// Call fn for each pair of input/output trees.
+template <typename Func>
+inline void SliceTrees(int32_t layer_begin, int32_t layer_end, int32_t step,
+                       GBTreeModel const &model, GBTreeTrainParam const &tparam,
+                       size_t layer_trees, Func fn) {
+  uint32_t tree_begin, tree_end;
+  std::tie(tree_begin, tree_end) = detail::LayerToTree(model, tparam, layer_begin, layer_end);
+  layer_end = layer_end == 0 ?
model.trees.size() / layer_trees : layer_end; + uint32_t n_layers = (layer_end - layer_begin) / step; + int32_t in_it = tree_begin; + int32_t out_it = 0; + for (uint32_t l = 0; l < n_layers; ++l) { + for (uint32_t i = 0; i < layer_trees; ++i) { + CHECK_LT(in_it, tree_end); + fn(in_it, out_it); + out_it++; + in_it++; + } + in_it += (step - 1) * layer_trees; + } +} +} // namespace detail + // gradient boosted trees class GBTree : public GradientBooster { public: @@ -200,6 +240,14 @@ class GBTree : public GradientBooster { return model_.learner_model_param->num_output_group == 1; } + auto LayerTrees() const { + auto n_trees = model_.learner_model_param->num_output_group * tparam_.num_parallel_tree; + return n_trees; + } + // slice the trees, out must be already allocated + void Slice(int32_t layer_begin, int32_t layer_end, int32_t step, + GradientBooster *out) const override; + void PredictBatch(DMatrix* p_fmat, PredictionCacheEntry* out_preds, bool training, @@ -210,13 +258,8 @@ class GBTree : public GradientBooster { uint32_t layer_begin, unsigned layer_end) const override { CHECK(configured_); - // From here on, layer becomes concrete trees. - bst_group_t groups = model_.learner_model_param->num_output_group; - uint32_t tree_begin = layer_begin * groups * tparam_.num_parallel_tree; - uint32_t tree_end = layer_end * groups * tparam_.num_parallel_tree; - if (tree_end == 0 || tree_end > model_.trees.size()) { - tree_end = static_cast(model_.trees.size()); - } + uint32_t tree_begin, tree_end; + std::tie(tree_begin, tree_end) = detail::LayerToTree(model_, tparam_, layer_begin, layer_end); this->GetPredictor()->InplacePredict(x, model_, missing, out_preds, tree_begin, tree_end); } diff --git a/src/gbm/gbtree_model.cc b/src/gbm/gbtree_model.cc index 4a20b48f7d1d..e56dc0ad3a59 100644 --- a/src/gbm/gbtree_model.cc +++ b/src/gbm/gbtree_model.cc @@ -6,10 +6,10 @@ #include "xgboost/json.h" #include "xgboost/logging.h" #include "gbtree_model.h" +#include "gbtree.h" namespace xgboost { namespace gbm { - void GBTreeModel::Save(dmlc::Stream* fo) const { CHECK_EQ(param.num_trees, static_cast(trees.size())); diff --git a/src/gbm/gbtree_model.h b/src/gbm/gbtree_model.h index 5a89878d3816..2d07ec198a79 100644 --- a/src/gbm/gbtree_model.h +++ b/src/gbm/gbtree_model.h @@ -1,5 +1,5 @@ /*! - * Copyright 2017-2019 by Contributors + * Copyright 2017-2020 by Contributors * \file gbtree_model.h */ #ifndef XGBOOST_GBM_GBTREE_MODEL_H_ @@ -22,6 +22,7 @@ namespace xgboost { class Json; namespace gbm { + /*! 
\brief model parameters */ struct GBTreeModelParam : public dmlc::Parameter { public: diff --git a/src/learner.cc b/src/learner.cc index 85ca3a503260..0b9aa0f4aa88 100644 --- a/src/learner.cc +++ b/src/learner.cc @@ -971,6 +971,28 @@ class LearnerImpl : public LearnerIO { return gbm_->DumpModel(fmap, with_stats, format); } + Learner* Slice(int32_t begin_layer, int32_t end_layer, int32_t step) override { + this->Configure(); + CHECK_GE(begin_layer, 0); + if(end_layer != 0) { + CHECK_GE(end_layer, begin_layer); + } + + auto *out_impl = new LearnerImpl({}); + auto gbm = std::unique_ptr(GradientBooster::Create( + this->tparam_.booster, &this->generic_parameters_, + &this->learner_model_param_)); + this->gbm_->Slice(begin_layer, end_layer, step, gbm.get()); + out_impl->gbm_ = std::move(gbm); + Json config { Object() }; + this->SaveConfig(&config); + out_impl->mparam_ = this->mparam_; + out_impl->learner_model_param_ = this->learner_model_param_; + out_impl->LoadConfig(config); + out_impl->Configure(); + return out_impl; + } + void UpdateOneIter(int iter, std::shared_ptr train) override { monitor_.Start("UpdateOneIter"); TrainingObserver::Instance().Update(iter); diff --git a/tests/cpp/gbm/test_gbtree.cc b/tests/cpp/gbm/test_gbtree.cc index 463253aea019..7dade61f89ec 100644 --- a/tests/cpp/gbm/test_gbtree.cc +++ b/tests/cpp/gbm/test_gbtree.cc @@ -154,9 +154,9 @@ TEST(GBTree, JsonIO) { ASSERT_EQ(get(model["model"]["name"]), "gbtree"); auto const& gbtree_model = model["model"]["model"]; - ASSERT_EQ(get(gbtree_model["trees"]).size(), 1); + ASSERT_EQ(get(gbtree_model["trees"]).size(), 1ul); ASSERT_EQ(get(get(get(gbtree_model["trees"]).front()).at("id")), 0); - ASSERT_EQ(get(gbtree_model["tree_info"]).size(), 1); + ASSERT_EQ(get(gbtree_model["tree_info"]).size(), 1ul); auto j_train_param = model["config"]["gbtree_train_param"]; ASSERT_EQ(get(j_train_param["num_parallel_tree"]), "1"); @@ -194,7 +194,7 @@ TEST(Dart, JsonIO) { ASSERT_EQ(get(model["model"]["name"]), "dart") << model; ASSERT_EQ(get(model["config"]["name"]), "dart"); ASSERT_TRUE(IsA(model["model"]["gbtree"])); - ASSERT_NE(get(model["model"]["weight_drop"]).size(), 0); + ASSERT_NE(get(model["model"]["weight_drop"]).size(), 0ul); } TEST(Dart, Prediction) { @@ -230,4 +230,121 @@ TEST(Dart, Prediction) { ASSERT_GT(std::abs(h_predts_training[i] - h_predts_inference[i]), kRtEps); } } + +std::pair TestModelSlice(std::string booster) { + size_t constexpr kRows = 1000, kCols = 100, kForest = 2, kClasses = 3; + auto m = RandomDataGenerator{kRows, kCols, 0}.GenerateDMatrix(true, false, kClasses); + + int32_t kIters = 10; + std::unique_ptr learner { + Learner::Create({m}) + }; + learner->SetParams(Args{{"booster", booster}, + {"tree_method", "hist"}, + {"num_parallel_tree", std::to_string(kForest)}, + {"num_class", std::to_string(kClasses)}, + {"subsample", "0.5"}, + {"max_depth", "2"}}); + + for (auto i = 0; i < kIters; ++i) { + learner->UpdateOneIter(i, m); + } + + Json model{Object()}; + Json config{Object()}; + learner->SaveModel(&model); + learner->SaveConfig(&config); + + size_t constexpr kSliceStart = 2, kSliceEnd = 8, kStep = 3; + std::unique_ptr sliced {learner->Slice(kSliceStart, kSliceEnd, kStep)}; + Json sliced_model{Object()}; + sliced->SaveModel(&sliced_model); + + auto get_shape = [&](Json const& model) { + if (booster == "gbtree") { + return get(model["learner"]["gradient_booster"]["model"]["gbtree_model_param"]); + } else { + return get(model["learner"]["gradient_booster"]["gbtree"]["model"]["gbtree_model_param"]); + } + }; + + auto 
const& model_shape = get_shape(sliced_model); + CHECK_EQ(get(model_shape.at("num_trees")), std::to_string(2 * kClasses * kForest)); + + Json sliced_config {Object()}; + sliced->SaveConfig(&sliced_config); + CHECK_EQ(sliced_config, config); + + auto get_trees = [&](Json const& model) { + if (booster == "gbtree") { + return get(model["learner"]["gradient_booster"]["model"]["trees"]); + } else { + return get(model["learner"]["gradient_booster"]["gbtree"]["model"]["trees"]); + } + }; + + auto get_info = [&](Json const& model) { + if (booster == "gbtree") { + return get(model["learner"]["gradient_booster"]["model"]["tree_info"]); + } else { + return get(model["learner"]["gradient_booster"]["gbtree"]["model"]["tree_info"]); + } + }; + + auto const &sliced_trees = get_trees(sliced_model); + CHECK_EQ(sliced_trees.size(), 2 * kClasses * kForest); + + auto constexpr kLayerSize = kClasses * kForest; + auto const &sliced_info = get_info(sliced_model); + + for (size_t layer = 0; layer < 2; ++layer) { + for (size_t j = 0; j < kClasses; ++j) { + for (size_t k = 0; k < kForest; ++k) { + auto idx = layer * kLayerSize + j * kForest + k; + auto const &group = get(sliced_info.at(idx)); + CHECK_EQ(static_cast(group), j); + } + } + } + + auto const& trees = get_trees(model); + + // Sliced layers are [2, 5] + auto begin = kLayerSize * kSliceStart; + auto end = begin + kLayerSize; + auto j = 0; + for (size_t i = begin; i < end; ++i) { + Json tree = trees[i]; + tree["id"] = Integer(0); // id is different, we set it to 0 to allow comparison. + auto sliced_tree = sliced_trees[j]; + sliced_tree["id"] = Integer(0); + CHECK_EQ(tree, sliced_tree); + j++; + } + + begin = kLayerSize * (kSliceStart + kStep); + end = begin + kLayerSize; + for (size_t i = begin; i < end; ++i) { + Json tree = trees[i]; + tree["id"] = Integer(0); + auto sliced_tree = sliced_trees[j]; + sliced_tree["id"] = Integer(0); + CHECK_EQ(tree, sliced_tree); + j++; + } + + return std::make_pair(model, sliced_model); +} + +TEST(GBTree, Slice) { + TestModelSlice("gbtree"); +} + +TEST(Dart, Slice) { + Json model, sliced_model; + std::tie(model, sliced_model) = TestModelSlice("dart"); + auto const& weights = get(model["learner"]["gradient_booster"]["weight_drop"]); + auto const& trees = get(model["learner"]["gradient_booster"]["gbtree"]["model"]["trees"]); + ASSERT_EQ(weights.size(), trees.size()); +} } // namespace xgboost diff --git a/tests/cpp/test_learner.cc b/tests/cpp/test_learner.cc index 56e4a95ece42..ff1a7c7cd79d 100644 --- a/tests/cpp/test_learner.cc +++ b/tests/cpp/test_learner.cc @@ -118,7 +118,7 @@ TEST(Learner, Configuration) { // eval_metric is not part of configuration auto attr_names = learner->GetConfigurationArguments(); - ASSERT_EQ(attr_names.size(), 1); + ASSERT_EQ(attr_names.size(), 1ul); ASSERT_EQ(attr_names.find(emetric), attr_names.cend()); ASSERT_EQ(attr_names.at("foo"), "bar"); } @@ -127,7 +127,7 @@ TEST(Learner, Configuration) { std::unique_ptr learner { Learner::Create({nullptr}) }; learner->SetParams({{"foo", "bar"}, {emetric, "auc"}, {emetric, "entropy"}, {emetric, "KL"}}); auto attr_names = learner->GetConfigurationArguments(); - ASSERT_EQ(attr_names.size(), 1); + ASSERT_EQ(attr_names.size(), 1ul); ASSERT_EQ(attr_names.at("foo"), "bar"); } } @@ -181,7 +181,7 @@ TEST(Learner, JsonModelIO) { learner->SaveModel(&new_in); ASSERT_TRUE(IsA(out["learner"]["attributes"])); - ASSERT_EQ(get(out["learner"]["attributes"]).size(), 1); + ASSERT_EQ(get(out["learner"]["attributes"]).size(), 1ul); ASSERT_EQ(out, new_in); } } @@ -333,5 +333,4 
@@ TEST(Learner, Seed) { ASSERT_EQ(std::to_string(seed), get(config["learner"]["generic_param"]["seed"])); } - } // namespace xgboost diff --git a/tests/python/test_basic_models.py b/tests/python/test_basic_models.py index dc3a2778af02..1e5e21b0d5f1 100644 --- a/tests/python/test_basic_models.py +++ b/tests/python/test_basic_models.py @@ -325,3 +325,57 @@ def validate_model(parameters): parameters = {'tree_method': 'hist', 'booster': 'dart', 'objective': 'multi:softmax'} validate_model(parameters) + + def run_slice(self, booster): + from sklearn.datasets import make_classification + num_classes = 3 + X, y = make_classification(n_samples=1000, n_informative=5, + n_classes=num_classes) + dtrain = xgb.DMatrix(data=X, label=y) + num_parallel_tree = 4 + num_boost_round = 16 + total_trees = num_parallel_tree * num_classes * num_boost_round + booster = xgb.train({ + 'num_parallel_tree': 4, 'subsample': 0.5, 'num_class': 3, 'booster': booster}, + num_boost_round=num_boost_round, dtrain=dtrain) + assert len(booster.get_dump()) == total_trees + beg = 3 + end = 7 + sliced: xgb.Booster = booster[beg: end] + + sliced_trees = (end - beg) * num_parallel_tree * num_classes + assert sliced_trees == len(sliced.get_dump()) + + sliced_trees = sliced_trees // 2 + sliced: xgb.Booster = booster[beg: end: 2] + assert sliced_trees == len(sliced.get_dump()) + + sliced: xgb.Booster = booster[beg: ...] + sliced_trees = (num_boost_round - beg) * num_parallel_tree * num_classes + assert sliced_trees == len(sliced.get_dump()) + + sliced: xgb.Booster = booster[beg:] + sliced_trees = (num_boost_round - beg) * num_parallel_tree * num_classes + assert sliced_trees == len(sliced.get_dump()) + + sliced: xgb.Booster = booster[:end] + sliced_trees = end * num_parallel_tree * num_classes + assert sliced_trees == len(sliced.get_dump()) + + sliced: xgb.Booster = booster[...:end] + sliced_trees = end * num_parallel_tree * num_classes + assert sliced_trees == len(sliced.get_dump()) + + self.assertRaises(ValueError, lambda: booster[-1: 0]) + # we do not accept empty slice. + self.assertRaises(ValueError, lambda: booster[1:1]) + self.assertRaises(ValueError, lambda: booster[3:0]) + self.assertRaises(ValueError, lambda: booster[3:-1]) + + def assign(): + booster[...:end] = booster + self.assertRaises(TypeError, assign) + + def test_slice(self): + self.run_slice('gbtree') + self.run_slice('dart') From e173173cac62477e7ac03945029c4959dff1a5c0 Mon Sep 17 00:00:00 2001 From: fis Date: Wed, 28 Oct 2020 14:27:03 +0800 Subject: [PATCH 02/16] Add test for save model. --- python-package/xgboost/callback.py | 6 +++--- src/learner.cc | 1 + tests/python/test_callback.py | 13 +++++++++++++ 3 files changed, 17 insertions(+), 3 deletions(-) diff --git a/python-package/xgboost/callback.py b/python-package/xgboost/callback.py index d30f5a07499f..712b4c4d737b 100644 --- a/python-package/xgboost/callback.py +++ b/python-package/xgboost/callback.py @@ -528,7 +528,7 @@ def _update_rounds(self, score, name, metric, model, epoch): return True return False - def after_iteration(self, model, epoch, evals_log): + def after_iteration(self, model: Booster, epoch, evals_log): msg = 'Must have at least 1 validation dataset for early stopping.' 
        assert len(evals_log.keys()) >= 1, msg
         data_name = ''
@@ -554,9 +554,9 @@ def after_iteration(self, model, epoch, evals_log):
             score = data_log[metric_name][-1]
         return self._update_rounds(score, data_name, metric_name, model, epoch)
 
-    def after_training(self, model):
+    def after_training(self, model: Booster):
         if self.save_best:
-            model = model[: model.best_iteration]
+            model = model[: int(model.attr('best_iteration'))]
         return model
 
diff --git a/src/learner.cc b/src/learner.cc
index 0b9aa0f4aa88..7125ab9b3460 100644
--- a/src/learner.cc
+++ b/src/learner.cc
@@ -987,6 +987,7 @@ class LearnerImpl : public LearnerIO {
     Json config { Object() };
     this->SaveConfig(&config);
     out_impl->mparam_ = this->mparam_;
+    out_impl->attributes_ = this->attributes_;
     out_impl->learner_model_param_ = this->learner_model_param_;
     out_impl->LoadConfig(config);
     out_impl->Configure();
diff --git a/tests/python/test_callback.py b/tests/python/test_callback.py
index 2b482bb99c5e..79ce53fb9629 100644
--- a/tests/python/test_callback.py
+++ b/tests/python/test_callback.py
@@ -113,6 +113,19 @@ def test_early_stopping_custom_eval_skl(self):
         dump = booster.get_dump(dump_format='json')
         assert len(dump) - booster.best_iteration == early_stopping_rounds + 1
 
+    def test_early_stopping_save_best_model(self):
+        from sklearn.datasets import load_breast_cancer
+        X, y = load_breast_cancer(return_X_y=True)
+        cls = xgb.XGBClassifier()
+        early_stopping_rounds = 5
+        early_stop = xgb.callback.EarlyStopping(rounds=early_stopping_rounds,
+                                                save_best=True)
+        cls.fit(X, y, eval_set=[(X, y)],
+                eval_metric=tm.eval_error_metric, callbacks=[early_stop])
+        booster = cls.get_booster()
+        dump = booster.get_dump(dump_format='json')
+        assert len(dump) == booster.best_iteration
+
     def run_eta_decay(self, tree_method, deprecated_callback):
         if deprecated_callback:
             scheduler = xgb.callback.reset_learning_rate

From 8723f80a2d77c078acd67daf229bba076373968b Mon Sep 17 00:00:00 2001
From: fis
Date: Wed, 28 Oct 2020 14:54:10 +0800
Subject: [PATCH 03/16] Consistent type.

---
 doc/python/model.rst              | 6 ++++++
 python-package/xgboost/core.py    | 8 ++++----
 src/gbm/gbtree.cc                 | 1 +
 src/gbm/gbtree.h                  | 3 ++-
 src/learner.cc                    | 4 ----
 tests/python/test_basic_models.py | 5 +++++
 6 files changed, 18 insertions(+), 9 deletions(-)

diff --git a/doc/python/model.rst b/doc/python/model.rst
index 176f9012e544..b0361a17e646 100644
--- a/doc/python/model.rst
+++ b/doc/python/model.rst
@@ -24,4 +24,10 @@ list of trees and can be sliced into multiple sub-models.
                         num_boost_round=num_boost_round, dtrain=dtrain)
 
     # This is the sliced model, containing [3, 7) forests
+    # Slicing with a step is also supported, with some limitations: a negative step is invalid.
     sliced: xgb.Booster = booster[3:7]
+
+
+The sliced model is a copy of the selected trees, which means the model itself is
+immutable during slicing.  This feature is the basis of the `save_best` option in the
+early stopping callback.
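For illustration, ``save_best`` above is ordinary model slicing applied at the end of
training: the callback simply returns ``model[: int(model.attr('best_iteration'))]``.
A minimal sketch of the equivalent manual flow, assuming the Python API introduced by
this series (the dataset, objective, and round counts are placeholders, not part of the
patch):

.. code-block:: python

    import xgboost as xgb
    from sklearn.datasets import load_breast_cancer

    X, y = load_breast_cancer(return_X_y=True)
    dtrain = xgb.DMatrix(X, label=y)

    # Early stopping records best_iteration as a booster attribute.
    booster = xgb.train({'objective': 'binary:logistic'}, dtrain,
                        num_boost_round=100, evals=[(dtrain, 'Train')],
                        early_stopping_rounds=5)
    # What save_best=True automates: keep only the boosting rounds up to
    # the recorded best iteration, dropping everything added after it.
    best = booster[: int(booster.attr('best_iteration'))]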
diff --git a/python-package/xgboost/core.py b/python-package/xgboost/core.py index 78d841933a2d..5b69649b8b39 100644 --- a/python-package/xgboost/core.py +++ b/python-package/xgboost/core.py @@ -1037,11 +1037,11 @@ def __getitem__(self, val: slice): if stop < start: raise ValueError('Invalid slice', val) - step = val.step if val.step else 1 + step = val.step if val.step is not None else 1 - start = ctypes.c_uint(start) - stop = ctypes.c_uint(stop) - step = c_bst_ulong(step) + start = ctypes.c_int(start) + stop = ctypes.c_int(stop) + step = ctypes.c_int(step) sliced_handle = ctypes.c_void_p() _check_call(_LIB.XGBoosterSlice(self.handle, start, stop, step, diff --git a/src/gbm/gbtree.cc b/src/gbm/gbtree.cc index 6d84ce7e9dc4..397652527685 100644 --- a/src/gbm/gbtree.cc +++ b/src/gbm/gbtree.cc @@ -410,6 +410,7 @@ void GBTree::Slice(int32_t layer_begin, int32_t layer_end, int32_t step, layer_end = layer_end == 0 ? model_.trees.size() / layer_trees : layer_end; CHECK_GE(layer_end, layer_begin); + CHECK_GE(step, 1); int32_t n_layers = (layer_end - layer_begin) / step; std::vector> &out_trees = out_model.trees; out_trees.resize(layer_trees * n_layers); diff --git a/src/gbm/gbtree.h b/src/gbm/gbtree.h index 854224c84297..45bfca22362d 100644 --- a/src/gbm/gbtree.h +++ b/src/gbm/gbtree.h @@ -173,7 +173,7 @@ inline std::pair LayerToTree(gbm::GBTreeModel const &model, template inline void SliceTrees(int32_t layer_begin, int32_t layer_end, int32_t step, GBTreeModel const &model, GBTreeTrainParam const &tparam, - size_t layer_trees, Func fn) { + uint32_t layer_trees, Func fn) { uint32_t tree_begin, tree_end; std::tie(tree_begin, tree_end) = detail::LayerToTree(model, tparam, layer_begin, layer_end); layer_end = layer_end == 0 ? model.trees.size() / layer_trees : layer_end; @@ -240,6 +240,7 @@ class GBTree : public GradientBooster { return model_.learner_model_param->num_output_group == 1; } + // Number of trees per layer. auto LayerTrees() const { auto n_trees = model_.learner_model_param->num_output_group * tparam_.num_parallel_tree; return n_trees; diff --git a/src/learner.cc b/src/learner.cc index 7125ab9b3460..23724d5ef9a0 100644 --- a/src/learner.cc +++ b/src/learner.cc @@ -974,10 +974,6 @@ class LearnerImpl : public LearnerIO { Learner* Slice(int32_t begin_layer, int32_t end_layer, int32_t step) override { this->Configure(); CHECK_GE(begin_layer, 0); - if(end_layer != 0) { - CHECK_GE(end_layer, begin_layer); - } - auto *out_impl = new LearnerImpl({}); auto gbm = std::unique_ptr(GradientBooster::Create( this->tparam_.booster, &this->generic_parameters_, diff --git a/tests/python/test_basic_models.py b/tests/python/test_basic_models.py index 1e5e21b0d5f1..1779f0be524d 100644 --- a/tests/python/test_basic_models.py +++ b/tests/python/test_basic_models.py @@ -369,8 +369,13 @@ def run_slice(self, booster): self.assertRaises(ValueError, lambda: booster[-1: 0]) # we do not accept empty slice. self.assertRaises(ValueError, lambda: booster[1:1]) + # stop can not be smaller than begin self.assertRaises(ValueError, lambda: booster[3:0]) self.assertRaises(ValueError, lambda: booster[3:-1]) + # negative step is not supported. + self.assertRaises(ValueError, lambda: booster[0:2:-1]) + # step can not be 0. + self.assertRaises(ValueError, lambda: booster[0:2:0]) def assign(): booster[...:end] = booster From a33657aff6bf3936822c26859b05f50f3317eca9 Mon Sep 17 00:00:00 2001 From: fis Date: Wed, 28 Oct 2020 14:59:15 +0800 Subject: [PATCH 04/16] Checks. 
---
 include/xgboost/c_api.h | 6 +++---
 src/gbm/gbtree.cc       | 3 ++-
 2 files changed, 5 insertions(+), 4 deletions(-)

diff --git a/include/xgboost/c_api.h b/include/xgboost/c_api.h
index 3988dddac892..3ed1679bf8de 100644
--- a/include/xgboost/c_api.h
+++ b/include/xgboost/c_api.h
@@ -584,9 +584,9 @@ XGB_DLL int XGBoosterFree(BoosterHandle handle);
  * \brief Slice a model according to layers.
  *
  * \param handle Booster to be sliced.
- * \param begin_layer
- * \param end_layer
- * \param step
+ * \param begin_layer start of the slice
+ * \param end_layer end of the slice
+ * \param step step size of the slice
  * \param out Sliced booster.
  *
  * \return 0 when success, -1 when failure happens
diff --git a/src/gbm/gbtree.cc b/src/gbm/gbtree.cc
index 397652527685..1f29d6141e61 100644
--- a/src/gbm/gbtree.cc
+++ b/src/gbm/gbtree.cc
@@ -530,9 +530,10 @@ class Dart : public GBTree {
     GBTree::Slice(layer_begin, layer_end, step, out);
     auto p_dart = dynamic_cast<Dart *>(out);
     CHECK(p_dart);
+    CHECK(p_dart->weight_drop_.empty());
     detail::SliceTrees(
         layer_begin, layer_end, step, model_, tparam_, this->LayerTrees(),
-        [&](auto const& in_it, auto const& out_it) {
+        [&](auto const& in_it, auto const&) {
           p_dart->weight_drop_.push_back(this->weight_drop_.at(in_it));
         });
   }

From c9ddda0d0a385ae30c6ecb676b6208bd5a8a0e9e Mon Sep 17 00:00:00 2001
From: fis
Date: Wed, 28 Oct 2020 16:15:04 +0800
Subject: [PATCH 05/16] Generate out-of-bound error.

---
 doc/python/model.rst              |  4 ++++
 include/xgboost/c_api.h           |  2 +-
 include/xgboost/gbm.h             |  2 +-
 include/xgboost/learner.h         |  4 +++-
 python-package/xgboost/core.py    | 16 ++++++++++++----
 src/c_api/c_api.cc                |  6 +++++-
 src/gbm/gbtree.cc                 | 26 +++++++++++++++-----------
 src/gbm/gbtree.h                  | 14 +++++++++-----
 src/learner.cc                    |  5 +++--
 tests/cpp/gbm/test_gbtree.cc      |  3 ++-
 tests/python/test_basic_models.py |  6 ++++++
 11 files changed, 61 insertions(+), 27 deletions(-)

diff --git a/doc/python/model.rst b/doc/python/model.rst
index b0361a17e646..38fc5f49d0ee 100644
--- a/doc/python/model.rst
+++ b/doc/python/model.rst
@@ -27,6 +27,10 @@ list of trees and can be sliced into multiple sub-models.
     # Slicing with a step is also supported, with some limitations: a negative step is invalid.
     sliced: xgb.Booster = booster[3:7]
+
+    # Access individual tree layers
+    trees = [_ for _ in booster]
+    assert len(trees) == num_boost_round
 
 The sliced model is a copy of the selected trees, which means the model itself is
 immutable during slicing.  This feature is the basis of the `save_best` option in the
 early stopping callback.
diff --git a/include/xgboost/c_api.h b/include/xgboost/c_api.h
index 3ed1679bf8de..199702fd1abd 100644
--- a/include/xgboost/c_api.h
+++ b/include/xgboost/c_api.h
@@ -589,7 +589,7 @@ XGB_DLL int XGBoosterFree(BoosterHandle handle);
  * \param step step size of the slice
  * \param out Sliced booster.
  *
- * \return 0 when success, -1 when failure happens
+ * \return 0 when success, -1 when failure happens, -2 when index is out of bound.
  */
 XGB_DLL int XGBoosterSlice(BoosterHandle handle, int begin_layer,
                            int end_layer, int step,
                            BoosterHandle *out);
diff --git a/include/xgboost/gbm.h b/include/xgboost/gbm.h
index e4a5683f153a..2836cc72a132 100644
--- a/include/xgboost/gbm.h
+++ b/include/xgboost/gbm.h
@@ -67,7 +67,7 @@ class GradientBooster : public Model, public Configurable {
   * \param out Output gradient booster
   */
  virtual void Slice(int32_t layer_begin, int32_t layer_end, int32_t step,
-                     GradientBooster *out) const {
+                     GradientBooster *out, bool* out_of_bound) const {
    LOG(FATAL) << "Slice is not supported by current booster.";
  }
  /*!
diff --git a/include/xgboost/learner.h b/include/xgboost/learner.h index 865e7fec8b01..a3c46085bf35 100644 --- a/include/xgboost/learner.h +++ b/include/xgboost/learner.h @@ -201,10 +201,12 @@ class Learner : public Model, public Configurable, public dmlc::Serializable { * See InplacePredict for layer parameters. * * \param step step size between slice. + * \param out_of_bound Return true if end layer is out of bound. * * \return a sliced model. */ - virtual Learner *Slice(int32_t begin_layer, int32_t end_layer, int32_t step) = 0; + virtual Learner *Slice(int32_t begin_layer, int32_t end_layer, int32_t step, + bool *out_of_bound) = 0; /*! * \brief dump the model in the requested format * \param fmap feature map that may help give interpretations of feature diff --git a/python-package/xgboost/core.py b/python-package/xgboost/core.py index 5b69649b8b39..421ce32056a8 100644 --- a/python-package/xgboost/core.py +++ b/python-package/xgboost/core.py @@ -1024,12 +1024,16 @@ def __setstate__(self, state): state['handle'] = handle self.__dict__.update(state) - def __getitem__(self, val: slice): + def __getitem__(self, val): + if isinstance(val, int): + val = slice(val, val+1) + if not isinstance(val, slice): + msg = _expect((int, slice), type(val)) + raise TypeError(msg) if isinstance(val.start, type(Ellipsis)) or val.start is None: start = 0 else: start = val.start - if isinstance(val.stop, type(Ellipsis)) or val.stop is None: stop = 0 else: @@ -1044,8 +1048,12 @@ def __getitem__(self, val: slice): step = ctypes.c_int(step) sliced_handle = ctypes.c_void_p() - _check_call(_LIB.XGBoosterSlice(self.handle, start, stop, step, - ctypes.byref(sliced_handle))) + status = _LIB.XGBoosterSlice(self.handle, start, stop, step, + ctypes.byref(sliced_handle)) + if status == -2: + raise IndexError('Layer index out of range') + _check_call(status) + sliced = Booster() _check_call(_LIB.XGBoosterFree(sliced.handle)) sliced.handle = sliced_handle diff --git a/src/c_api/c_api.cc b/src/c_api/c_api.cc index 3fb60f72b2cb..cf0bbebdeaa7 100644 --- a/src/c_api/c_api.cc +++ b/src/c_api/c_api.cc @@ -736,7 +736,11 @@ XGB_DLL int XGBoosterSlice(BoosterHandle handle, int begin_layer, API_BEGIN(); CHECK_HANDLE(); auto* learner = static_cast(handle); - auto p_out = learner->Slice(begin_layer, end_layer, step); + bool out_of_bound = false; + auto p_out = learner->Slice(begin_layer, end_layer, step, &out_of_bound); + if (out_of_bound) { + return -2; + } CHECK(p_out); *out = p_out; API_END(); diff --git a/src/gbm/gbtree.cc b/src/gbm/gbtree.cc index 1f29d6141e61..6142cb010dde 100644 --- a/src/gbm/gbtree.cc +++ b/src/gbm/gbtree.cc @@ -399,7 +399,7 @@ void GBTree::SaveModel(Json* p_out) const { } void GBTree::Slice(int32_t layer_begin, int32_t layer_end, int32_t step, - GradientBooster *out) const { + GradientBooster *out, bool* out_of_bound) const { CHECK(configured_); CHECK(out); @@ -419,14 +419,15 @@ void GBTree::Slice(int32_t layer_begin, int32_t layer_end, int32_t step, out_model.param.num_trees = out_model.trees.size(); CHECK(this->model_.trees_to_update.empty()); - detail::SliceTrees(layer_begin, layer_end, step, this->model_, tparam_, - layer_trees, [&](auto const &in_it, auto const &out_it) { - auto new_tree = std::make_unique( - *this->model_.trees.at(in_it)); - bst_group_t group = this->model_.tree_info[in_it]; - out_trees.at(out_it) = std::move(new_tree); - out_trees_info.at(out_it) = group; - }); + *out_of_bound = detail::SliceTrees( + layer_begin, layer_end, step, this->model_, tparam_, layer_trees, + [&](auto const 
&in_it, auto const &out_it) { + auto new_tree = + std::make_unique(*this->model_.trees.at(in_it)); + bst_group_t group = this->model_.tree_info[in_it]; + out_trees.at(out_it) = std::move(new_tree); + out_trees_info.at(out_it) = group; + }); } void GBTree::PredictBatch(DMatrix* p_fmat, @@ -526,8 +527,11 @@ class Dart : public GBTree { } void Slice(int32_t layer_begin, int32_t layer_end, int32_t step, - GradientBooster *out) const final { - GBTree::Slice(layer_begin, layer_end, step, out); + GradientBooster *out, bool* out_of_bound) const final { + GBTree::Slice(layer_begin, layer_end, step, out, out_of_bound); + if (*out_of_bound) { + return; + } auto p_dart = dynamic_cast(out); CHECK(p_dart); CHECK(p_dart->weight_drop_.empty()); diff --git a/src/gbm/gbtree.h b/src/gbm/gbtree.h index 45bfca22362d..b2a990dbe304 100644 --- a/src/gbm/gbtree.h +++ b/src/gbm/gbtree.h @@ -161,21 +161,24 @@ inline std::pair LayerToTree(gbm::GBTreeModel const &model, bst_group_t groups = model.learner_model_param->num_output_group; uint32_t tree_begin = layer_begin * groups * tparam.num_parallel_tree; uint32_t tree_end = layer_end * groups * tparam.num_parallel_tree; - if (tree_end == 0 || tree_end > model.trees.size()) { + if (tree_end == 0) { tree_end = static_cast(model.trees.size()); } - CHECK_LE(tree_end, model.trees.size()); CHECK_LT(tree_begin, tree_end); return {tree_begin, tree_end}; } -// Call fn for each pair of input output tree. +// Call fn for each pair of input output tree. Return true if index is out of bound. template -inline void SliceTrees(int32_t layer_begin, int32_t layer_end, int32_t step, +inline bool SliceTrees(int32_t layer_begin, int32_t layer_end, int32_t step, GBTreeModel const &model, GBTreeTrainParam const &tparam, uint32_t layer_trees, Func fn) { uint32_t tree_begin, tree_end; std::tie(tree_begin, tree_end) = detail::LayerToTree(model, tparam, layer_begin, layer_end); + if (tree_end > model.trees.size()) { + return true; + } + layer_end = layer_end == 0 ? 
model.trees.size() / layer_trees : layer_end; uint32_t n_layers = (layer_end - layer_begin) / step; int32_t in_it = tree_begin; @@ -189,6 +192,7 @@ inline void SliceTrees(int32_t layer_begin, int32_t layer_end, int32_t step, } in_it += (step - 1) * layer_trees; } + return false; } } // namespace detail @@ -247,7 +251,7 @@ class GBTree : public GradientBooster { } // slice the trees, out must be already allocated void Slice(int32_t layer_begin, int32_t layer_end, int32_t step, - GradientBooster *out) const override; + GradientBooster *out, bool* out_of_bound) const override; void PredictBatch(DMatrix* p_fmat, PredictionCacheEntry* out_preds, diff --git a/src/learner.cc b/src/learner.cc index 23724d5ef9a0..ce652a420e78 100644 --- a/src/learner.cc +++ b/src/learner.cc @@ -971,14 +971,15 @@ class LearnerImpl : public LearnerIO { return gbm_->DumpModel(fmap, with_stats, format); } - Learner* Slice(int32_t begin_layer, int32_t end_layer, int32_t step) override { + Learner *Slice(int32_t begin_layer, int32_t end_layer, int32_t step, + bool *out_of_bound) override { this->Configure(); CHECK_GE(begin_layer, 0); auto *out_impl = new LearnerImpl({}); auto gbm = std::unique_ptr(GradientBooster::Create( this->tparam_.booster, &this->generic_parameters_, &this->learner_model_param_)); - this->gbm_->Slice(begin_layer, end_layer, step, gbm.get()); + this->gbm_->Slice(begin_layer, end_layer, step, gbm.get(), out_of_bound); out_impl->gbm_ = std::move(gbm); Json config { Object() }; this->SaveConfig(&config); diff --git a/tests/cpp/gbm/test_gbtree.cc b/tests/cpp/gbm/test_gbtree.cc index 7dade61f89ec..64a94e736800 100644 --- a/tests/cpp/gbm/test_gbtree.cc +++ b/tests/cpp/gbm/test_gbtree.cc @@ -254,9 +254,10 @@ std::pair TestModelSlice(std::string booster) { Json config{Object()}; learner->SaveModel(&model); learner->SaveConfig(&config); + bool out_of_bound = false; size_t constexpr kSliceStart = 2, kSliceEnd = 8, kStep = 3; - std::unique_ptr sliced {learner->Slice(kSliceStart, kSliceEnd, kStep)}; + std::unique_ptr sliced {learner->Slice(kSliceStart, kSliceEnd, kStep, &out_of_bound)}; Json sliced_model{Object()}; sliced->SaveModel(&sliced_model); diff --git a/tests/python/test_basic_models.py b/tests/python/test_basic_models.py index 1779f0be524d..c9f06a7cc9f2 100644 --- a/tests/python/test_basic_models.py +++ b/tests/python/test_basic_models.py @@ -377,6 +377,12 @@ def run_slice(self, booster): # step can not be 0. self.assertRaises(ValueError, lambda: booster[0:2:0]) + trees = [_ for _ in booster] + assert len(trees) == num_boost_round + + self.assertRaises(TypeError, lambda: booster["wrong type"]) + self.assertRaises(IndexError, lambda: booster[:num_boost_round+1]) + def assign(): booster[...:end] = booster self.assertRaises(TypeError, assign) From 40b556201d8346d8e5af22f4141aa72a42ac1496 Mon Sep 17 00:00:00 2001 From: fis Date: Wed, 28 Oct 2020 16:43:02 +0800 Subject: [PATCH 06/16] Fix legacy callback. 
--- python-package/xgboost/callback.py | 2 ++ 1 file changed, 2 insertions(+) diff --git a/python-package/xgboost/callback.py b/python-package/xgboost/callback.py index 712b4c4d737b..3588d62dc368 100644 --- a/python-package/xgboost/callback.py +++ b/python-package/xgboost/callback.py @@ -692,9 +692,11 @@ def __init__(self, callbacks, start_iteration, end_iteration, def before_training(self, model): '''Nothing to do for legacy callbacks''' + return model def after_training(self, model): '''Nothing to do for legacy callbacks''' + return model def before_iteration(self, model, epoch, dtrain, evals): '''Called before each iteration.''' From 5cb2d5e9c9bdbc0bd1231043f4497250efb86f4a Mon Sep 17 00:00:00 2001 From: fis Date: Wed, 28 Oct 2020 18:04:41 +0800 Subject: [PATCH 07/16] Fix CV. --- python-package/xgboost/callback.py | 12 ++++++++++-- python-package/xgboost/training.py | 6 ++++-- 2 files changed, 14 insertions(+), 4 deletions(-) diff --git a/python-package/xgboost/callback.py b/python-package/xgboost/callback.py index 3588d62dc368..ddd9710ea9be 100644 --- a/python-package/xgboost/callback.py +++ b/python-package/xgboost/callback.py @@ -365,14 +365,22 @@ def before_training(self, model): '''Function called before training.''' for c in self.callbacks: model = c.before_training(model=model) - assert isinstance(model, Booster), 'before_training should return the Booster' + msg = 'before_training should return the model' + if self.is_cv: + assert isinstance(model.cvfolds, list), msg + else: + assert isinstance(model, Booster), msg return model def after_training(self, model): '''Function called after training.''' for c in self.callbacks: model = c.after_training(model=model) - assert isinstance(model, Booster), 'after_training should return the Booster' + msg = 'after_training should return the model' + if self.is_cv: + assert isinstance(model.cvfolds, list), msg + else: + assert isinstance(model, Booster), msg return model def before_iteration(self, model, epoch, dtrain, evals): diff --git a/python-package/xgboost/training.py b/python-package/xgboost/training.py index ef280dba4786..7ca5922905dd 100644 --- a/python-package/xgboost/training.py +++ b/python-package/xgboost/training.py @@ -493,9 +493,8 @@ def cv(params, dtrain, num_boost_round=10, nfold=3, stratified=False, folds=None verbose_eval, early_stopping_rounds, maximize, 0, num_boost_round, feval, None, callbacks, show_stdv=show_stdv, cvfolds=cvfolds) - callbacks.before_training(cvfolds) - booster = _PackedBooster(cvfolds) + callbacks.before_training(booster) for i in range(num_boost_round): if callbacks.before_iteration(booster, i, dtrain, None): @@ -522,4 +521,7 @@ def cv(params, dtrain, num_boost_round=10, nfold=3, stratified=False, folds=None results = pd.DataFrame.from_dict(results) except ImportError: pass + + callbacks.after_training(booster) + return results From 60368c83374befe641d426c11db07505cd6ff164 Mon Sep 17 00:00:00 2001 From: fis Date: Fri, 30 Oct 2020 10:13:48 +0800 Subject: [PATCH 08/16] Add tests for gblinear. --- python-package/xgboost/callback.py | 9 ++++++--- tests/python/test_callback.py | 17 ++++++++++++++++- 2 files changed, 22 insertions(+), 4 deletions(-) diff --git a/python-package/xgboost/callback.py b/python-package/xgboost/callback.py index ddd9710ea9be..7c8bdaff3c60 100644 --- a/python-package/xgboost/callback.py +++ b/python-package/xgboost/callback.py @@ -10,7 +10,7 @@ import numpy from . 
import rabit -from .core import EarlyStopException, CallbackEnv, Booster +from .core import EarlyStopException, CallbackEnv, Booster, XGBoostError from .compat import STRING_TYPES @@ -563,8 +563,11 @@ def after_iteration(self, model: Booster, epoch, evals_log): return self._update_rounds(score, data_name, metric_name, model, epoch) def after_training(self, model: Booster): - if self.save_best: - model = model[: int(model.attr('best_iteration'))] + try: + if self.save_best: + model = model[: int(model.attr('best_iteration'))] + except XGBoostError as e: + raise XGBoostError('`save_best` is not applicable to current booster') from e return model diff --git a/tests/python/test_callback.py b/tests/python/test_callback.py index 79ce53fb9629..fccbba636997 100644 --- a/tests/python/test_callback.py +++ b/tests/python/test_callback.py @@ -116,7 +116,7 @@ def test_early_stopping_custom_eval_skl(self): def test_early_stopping_save_best_model(self): from sklearn.datasets import load_breast_cancer X, y = load_breast_cancer(return_X_y=True) - cls = xgb.XGBClassifier() + cls = xgb.XGBClassifier(n_estimators=10) early_stopping_rounds = 5 early_stop = xgb.callback.EarlyStopping(rounds=early_stopping_rounds, save_best=True) @@ -126,6 +126,21 @@ def test_early_stopping_save_best_model(self): dump = booster.get_dump(dump_format='json') assert len(dump) == booster.best_iteration + early_stop = xgb.callback.EarlyStopping(rounds=early_stopping_rounds, + save_best=True) + cls = xgb.XGBClassifier(booster='gblinear', n_estimators=10) + self.assertRaises(ValueError, lambda: cls.fit(X, y, eval_set=[(X, y)], + eval_metric=tm.eval_error_metric, + callbacks=[early_stop])) + + # No error + early_stop = xgb.callback.EarlyStopping(rounds=early_stopping_rounds, + save_best=False) + xgb.XGBClassifier(booster='gblinear', n_estimators=10).fit( + X, y, eval_set=[(X, y)], + eval_metric=tm.eval_error_metric, + callbacks=[early_stop]) + def run_eta_decay(self, tree_method, deprecated_callback): if deprecated_callback: scheduler = xgb.callback.reset_learning_rate From ef48197da0ac9bf1cf400c1f9d1f9434b3188795 Mon Sep 17 00:00:00 2001 From: fis Date: Mon, 2 Nov 2020 19:36:31 -0500 Subject: [PATCH 09/16] Stronger tests. 
--- python-package/xgboost/core.py | 2 ++ tests/python/test_basic_models.py | 1 + tests/python/test_callback.py | 3 ++- 3 files changed, 5 insertions(+), 1 deletion(-) diff --git a/python-package/xgboost/core.py b/python-package/xgboost/core.py index 421ce32056a8..9dd708be3f53 100644 --- a/python-package/xgboost/core.py +++ b/python-package/xgboost/core.py @@ -1027,6 +1027,8 @@ def __setstate__(self, state): def __getitem__(self, val): if isinstance(val, int): val = slice(val, val+1) + if isinstance(val, tuple): + raise ValueError('Only supports slicing through 1 dimension.') if not isinstance(val, slice): msg = _expect((int, slice), type(val)) raise TypeError(msg) diff --git a/tests/python/test_basic_models.py b/tests/python/test_basic_models.py index c9f06a7cc9f2..8fb54bf36f84 100644 --- a/tests/python/test_basic_models.py +++ b/tests/python/test_basic_models.py @@ -382,6 +382,7 @@ def run_slice(self, booster): self.assertRaises(TypeError, lambda: booster["wrong type"]) self.assertRaises(IndexError, lambda: booster[:num_boost_round+1]) + self.assertRaises(ValueError, lambda: booster[1, 2]) # too many dims def assign(): booster[...:end] = booster diff --git a/tests/python/test_callback.py b/tests/python/test_callback.py index fccbba636997..9f444e60c668 100644 --- a/tests/python/test_callback.py +++ b/tests/python/test_callback.py @@ -116,7 +116,8 @@ def test_early_stopping_custom_eval_skl(self): def test_early_stopping_save_best_model(self): from sklearn.datasets import load_breast_cancer X, y = load_breast_cancer(return_X_y=True) - cls = xgb.XGBClassifier(n_estimators=10) + n_estimators = 100 + cls = xgb.XGBClassifier(n_estimators=n_estimators) early_stopping_rounds = 5 early_stop = xgb.callback.EarlyStopping(rounds=early_stopping_rounds, save_best=True) From 52948c682c2474b15356a85f9bcac76c47682edb Mon Sep 17 00:00:00 2001 From: Philip Hyunsu Cho Date: Mon, 2 Nov 2020 17:52:03 -0800 Subject: [PATCH 10/16] Fix formatting in model.rst --- doc/python/model.rst | 1 + 1 file changed, 1 insertion(+) diff --git a/doc/python/model.rst b/doc/python/model.rst index 38fc5f49d0ee..e93c9b42e3bc 100644 --- a/doc/python/model.rst +++ b/doc/python/model.rst @@ -9,6 +9,7 @@ When ``booster`` is set to ``gbtree`` or ``dart``, XGBoost builds a tree model, list of trees and can be sliced into multiple sub-models. .. 
code-block:: python + from sklearn.datasets import make_classification num_classes = 3 X, y = make_classification(n_samples=1000, n_informative=5, From 7e30509770ca260fdd05c1e8e97b7397c4982cb4 Mon Sep 17 00:00:00 2001 From: fis Date: Mon, 2 Nov 2020 22:44:34 -0500 Subject: [PATCH 11/16] Parametrize --- tests/python/test_basic_models.py | 7 ++----- 1 file changed, 2 insertions(+), 5 deletions(-) diff --git a/tests/python/test_basic_models.py b/tests/python/test_basic_models.py index 8fb54bf36f84..00b479d57852 100644 --- a/tests/python/test_basic_models.py +++ b/tests/python/test_basic_models.py @@ -326,7 +326,8 @@ def validate_model(parameters): 'objective': 'multi:softmax'} validate_model(parameters) - def run_slice(self, booster): + @pytest.mark.parametrize('booster', ['gbtree', 'dart']) + def test_slice(self, booster): from sklearn.datasets import make_classification num_classes = 3 X, y = make_classification(n_samples=1000, n_informative=5, @@ -387,7 +388,3 @@ def run_slice(self, booster): def assign(): booster[...:end] = booster self.assertRaises(TypeError, assign) - - def test_slice(self): - self.run_slice('gbtree') - self.run_slice('dart') From a087793557b798bf939e2ed0ec9da8a917526196 Mon Sep 17 00:00:00 2001 From: fis Date: Mon, 2 Nov 2020 22:48:18 -0500 Subject: [PATCH 12/16] Doc and comment. --- doc/python/model.rst | 2 +- include/xgboost/c_api.h | 8 +++++--- include/xgboost/gbm.h | 3 ++- 3 files changed, 8 insertions(+), 5 deletions(-) diff --git a/doc/python/model.rst b/doc/python/model.rst index 38fc5f49d0ee..e1fb90f41d41 100644 --- a/doc/python/model.rst +++ b/doc/python/model.rst @@ -16,7 +16,7 @@ list of trees and can be sliced into multiple sub-models. dtrain = xgb.DMatrix(data=X, label=y) num_parallel_tree = 4 num_boost_round = 16 - total_trees = num_parallel_tree * num_classes * num_boost_round + # total number of built trees is num_parallel_tree * num_classes * num_boost_round # We build a boosted random forest for classification here. booster = xgb.train({ diff --git a/include/xgboost/c_api.h b/include/xgboost/c_api.h index 199702fd1abd..12f395c66e45 100644 --- a/include/xgboost/c_api.h +++ b/include/xgboost/c_api.h @@ -581,12 +581,14 @@ XGB_DLL int XGBoosterCreate(const DMatrixHandle dmats[], XGB_DLL int XGBoosterFree(BoosterHandle handle); /*! - * \brief Slice a model according to layers. + * \brief Slice a model using boosting index. The slice m:n indicates taking all trees + * that were fit during the boosting rounds m, (m+1), (m+2), ..., (n-1). * * \param handle Booster to be sliced. * \param begin_layer start of the slice - * \param end_layer end of the slice - * \param step step size of the slice + * \param end_layer end of the slice; end_layer=0 is equivalent to + * end_layer=num_boost_round + * \param step step size of the slice * \param out Sliced booster. * * \return 0 when success, -1 when failure happens, -2 when index is out of bound. diff --git a/include/xgboost/gbm.h b/include/xgboost/gbm.h index 2836cc72a132..20b2fbf11218 100644 --- a/include/xgboost/gbm.h +++ b/include/xgboost/gbm.h @@ -61,7 +61,8 @@ class GradientBooster : public Model, public Configurable { */ virtual void Save(dmlc::Stream* fo) const = 0; /*! - * \brief Slice the model. + * \brief Slice a model using boosting index. The slice m:n indicates taking all trees + * that were fit during the boosting rounds m, (m+1), (m+2), ..., (n-1). * \param layer_begin Begining of boosted tree layer used for prediction. * \param layer_end End of booster layer. 0 means do not limit trees. 
From 4dc4dd3866271dc6663a4449dc3a2ae5ca123479 Mon Sep 17 00:00:00 2001
From: fis
Date: Mon, 2 Nov 2020 23:10:35 -0500
Subject: [PATCH 13/16] Add prediction test.

---
 tests/python/test_basic_models.py | 20 ++++++++++++++++++++
 1 file changed, 20 insertions(+)

diff --git a/tests/python/test_basic_models.py b/tests/python/test_basic_models.py
index 00b479d57852..ecc7795ec3d9 100644
--- a/tests/python/test_basic_models.py
+++ b/tests/python/test_basic_models.py
@@ -388,3 +388,23 @@ def test_slice(self, booster):
         def assign():
             booster[...:end] = booster
         self.assertRaises(TypeError, assign)
+
+        sliced_0 = booster[1:3]
+        sliced_1 = booster[3:7]
+
+        predt_0 = sliced_0.predict(dtrain)
+        predt_1 = sliced_1.predict(dtrain)
+
+        merged = predt_0 + predt_1 - 0.5
+        single = booster[1:7].predict(dtrain)
+        np.testing.assert_allclose(merged, single)
+
+        sliced_0 = booster[1:7:2]  # 1,3,5
+        sliced_1 = booster[2:8:2]  # 2,4,6
+
+        predt_0 = sliced_0.predict(dtrain)
+        predt_1 = sliced_1.predict(dtrain)
+
+        merged = predt_0 + predt_1 - 0.5
+        single = booster[1:7].predict(dtrain)
+        np.testing.assert_allclose(merged, single)

From ae9ee40c066f711a1965a071ccbfd11a353ee496 Mon Sep 17 00:00:00 2001
From: fis
Date: Mon, 2 Nov 2020 23:11:33 -0500
Subject: [PATCH 14/16] Revert parametrize.

---
 tests/python/test_basic_models.py | 7 +++++--
 1 file changed, 5 insertions(+), 2 deletions(-)

diff --git a/tests/python/test_basic_models.py b/tests/python/test_basic_models.py
index ecc7795ec3d9..96d6aed57bc4 100644
--- a/tests/python/test_basic_models.py
+++ b/tests/python/test_basic_models.py
@@ -326,8 +326,7 @@ def validate_model(parameters):
                       'objective': 'multi:softmax'}
         validate_model(parameters)
 
-    @pytest.mark.parametrize('booster', ['gbtree', 'dart'])
-    def test_slice(self, booster):
+    def run_slice(self, booster):
         from sklearn.datasets import make_classification
         num_classes = 3
         X, y = make_classification(n_samples=1000, n_informative=5,
@@ -408,3 +407,7 @@ def assign():
         merged = predt_0 + predt_1 - 0.5
         single = booster[1:7].predict(dtrain)
         np.testing.assert_allclose(merged, single)
+
+    def test_slice(self):
+        self.run_slice('gbtree')
+        self.run_slice('dart')
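The prediction test above relies on tree models being additive: the raw output of ``booster[1:7]`` is the sum of the per-layer contributions of layers 1 through 6, while every ``predict`` call adds the base score once. Splitting the range into ``[1:3)`` and ``[3:7)`` therefore counts the base score twice, hence the ``- 0.5`` (the default ``base_score``). A sketch of the bookkeeping, reusing the names from the test; the equality is only exact for untransformed outputs, which the next patch addresses:

.. code-block:: python

  # predict(booster[1:3]) = sum(layers 1..2) + 0.5
  # predict(booster[3:7]) = sum(layers 3..6) + 0.5
  # so one copy of the base score is subtracted when merging:
  merged = booster[1:3].predict(dtrain) + booster[3:7].predict(dtrain) - 0.5
  # equals booster[1:7].predict(dtrain) when no link function is applied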
From e83b6b4b972052713f5f4ea306d8a058be0084d5 Mon Sep 17 00:00:00 2001
From: fis
Date: Mon, 2 Nov 2020 23:21:29 -0500
Subject: [PATCH 15/16] Use margin for the prediction tests.

---
 tests/python/test_basic_models.py | 21 +++++++++++----------
 1 file changed, 11 insertions(+), 10 deletions(-)

diff --git a/tests/python/test_basic_models.py b/tests/python/test_basic_models.py
index 96d6aed57bc4..7d04ef477b3e 100644
--- a/tests/python/test_basic_models.py
+++ b/tests/python/test_basic_models.py
@@ -336,7 +336,8 @@ def run_slice(self, booster):
         num_boost_round = 16
         total_trees = num_parallel_tree * num_classes * num_boost_round
         booster = xgb.train({
-            'num_parallel_tree': 4, 'subsample': 0.5, 'num_class': 3, 'booster': booster},
+            'num_parallel_tree': 4, 'subsample': 0.5, 'num_class': 3, 'booster': booster,
+            'objective': 'multi:softprob'},
             num_boost_round=num_boost_round, dtrain=dtrain)
         assert len(booster.get_dump()) == total_trees
         beg = 3
@@ -391,22 +392,22 @@ def assign():
         sliced_0 = booster[1:3]
         sliced_1 = booster[3:7]
 
-        predt_0 = sliced_0.predict(dtrain)
-        predt_1 = sliced_1.predict(dtrain)
+        predt_0 = sliced_0.predict(dtrain, output_margin=True)
+        predt_1 = sliced_1.predict(dtrain, output_margin=True)
 
-        merged = predt_0 + predt_1 - 0.5
-        single = booster[1:7].predict(dtrain)
-        np.testing.assert_allclose(merged, single)
+        merged = predt_0 + predt_1 - 0.5  # base score.
+        single = booster[1:7].predict(dtrain, output_margin=True)
+        np.testing.assert_allclose(merged, single, atol=1e-6)
 
         sliced_0 = booster[1:7:2]  # 1,3,5
         sliced_1 = booster[2:8:2]  # 2,4,6
 
-        predt_0 = sliced_0.predict(dtrain)
-        predt_1 = sliced_1.predict(dtrain)
+        predt_0 = sliced_0.predict(dtrain, output_margin=True)
+        predt_1 = sliced_1.predict(dtrain, output_margin=True)
 
-        merged = predt_0 + predt_1 - 0.5
-        single = booster[1:7].predict(dtrain)
-        np.testing.assert_allclose(merged, single)
+        merged = predt_0 + predt_1 - 0.5
+        single = booster[1:7].predict(dtrain, output_margin=True)
+        np.testing.assert_allclose(merged, single, atol=1e-6)
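A side note on the ``- 0.5`` retained above: hard-coding it works because 0.5 is XGBoost's default ``base_score``. For a model trained with a different base score, the value can be read back from the booster instead of being hard-coded; a hedged sketch (``save_config`` is part of the Python API, but treat the exact JSON key path as an assumption):

.. code-block:: python

  import json

  conf = json.loads(booster.save_config())
  # the global bias is stored as a string in the model parameters
  base_score = float(conf['learner']['learner_model_param']['base_score'])
  merged = predt_0 + predt_1 - base_score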
From accc0f10dd4bd13a127cde7e43d2abe49b57c3dd Mon Sep 17 00:00:00 2001
From: fis
Date: Tue, 3 Nov 2020 01:28:07 -0500
Subject: [PATCH 16/16] Use pytest raises and parametrize.

---
 tests/python/test_basic_models.py | 48 ++++++++++++++++++-------------
 1 file changed, 28 insertions(+), 20 deletions(-)

diff --git a/tests/python/test_basic_models.py b/tests/python/test_basic_models.py
index 7d04ef477b3e..9744eec34d40 100644
--- a/tests/python/test_basic_models.py
+++ b/tests/python/test_basic_models.py
@@ -29,7 +29,7 @@ def json_model(model_path, parameters):
     return model
 
 
-class TestModels(unittest.TestCase):
+class TestModels:
     def test_glm(self):
         param = {'verbosity': 0, 'objective': 'binary:logistic',
                  'booster': 'gblinear', 'alpha': 0.0001, 'lambda': 1,
@@ -209,12 +209,14 @@ def test_feature_names_validation(self):
 
         bst = xgb.train([], dm1)
         bst.predict(dm1)  # success
-        self.assertRaises(ValueError, bst.predict, dm2)
+        with pytest.raises(ValueError):
+            bst.predict(dm2)
         bst.predict(dm1)  # success
 
         bst = xgb.train([], dm2)
         bst.predict(dm2)  # success
-        self.assertRaises(ValueError, bst.predict, dm1)
+        with pytest.raises(ValueError):
+            bst.predict(dm1)
         bst.predict(dm2)  # success
 
     def test_model_binary_io(self):
@@ -326,7 +328,8 @@ def validate_model(parameters):
                       'objective': 'multi:softmax'}
         validate_model(parameters)
 
-    def run_slice(self, booster):
+    @pytest.mark.parametrize('booster', ['gbtree', 'dart'])
+    def test_slice(self, booster):
         from sklearn.datasets import make_classification
         num_classes = 3
         X, y = make_classification(n_samples=1000, n_informative=5,
@@ -367,27 +370,36 @@ def test_slice(self, booster):
             sliced_trees = end * num_parallel_tree * num_classes
             assert sliced_trees == len(sliced.get_dump())
 
-        self.assertRaises(ValueError, lambda: booster[-1: 0])
+        with pytest.raises(ValueError, match=r'>= 0'):
+            booster[-1: 0]
+
         # we do not accept empty slice.
-        self.assertRaises(ValueError, lambda: booster[1:1])
+        with pytest.raises(ValueError):
+            booster[1:1]
         # stop can not be smaller than begin
-        self.assertRaises(ValueError, lambda: booster[3:0])
-        self.assertRaises(ValueError, lambda: booster[3:-1])
+        with pytest.raises(ValueError, match=r'Invalid.*'):
+            booster[3:0]
+        with pytest.raises(ValueError, match=r'Invalid.*'):
+            booster[3:-1]
         # negative step is not supported.
-        self.assertRaises(ValueError, lambda: booster[0:2:-1])
+        with pytest.raises(ValueError, match=r'.*>= 1.*'):
+            booster[0:2:-1]
         # step can not be 0.
-        self.assertRaises(ValueError, lambda: booster[0:2:0])
+        with pytest.raises(ValueError, match=r'.*>= 1.*'):
+            booster[0:2:0]
 
         trees = [_ for _ in booster]
         assert len(trees) == num_boost_round
 
-        self.assertRaises(TypeError, lambda: booster["wrong type"])
-        self.assertRaises(IndexError, lambda: booster[:num_boost_round+1])
-        self.assertRaises(ValueError, lambda: booster[1, 2])  # too many dims
-
-        def assign():
+        with pytest.raises(TypeError):
+            booster["wrong type"]
+        with pytest.raises(IndexError):
+            booster[:num_boost_round+1]
+        with pytest.raises(ValueError):
+            booster[1, 2]  # too many dims
+        # setitem is not implemented as the model is immutable during slicing.
+        with pytest.raises(TypeError):
             booster[...:end] = booster
-        self.assertRaises(TypeError, assign)
 
         sliced_0 = booster[1:3]
         sliced_1 = booster[3:7]
@@ -408,7 +420,3 @@ def assign():
         merged = predt_0 + predt_1 - 0.5
         single = booster[1:7].predict(dtrain, output_margin=True)
         np.testing.assert_allclose(merged, single, atol=1e-6)
-
-    def test_slice(self):
-        self.run_slice('gbtree')
-        self.run_slice('dart')
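A closing note on the conversion above: ``pytest.raises`` used as a context manager can also assert on the error text via ``match``, which takes a regular expression applied with ``re.search``, and ``pytest.mark.parametrize`` runs ``test_slice`` once per booster type without the manual ``run_slice`` wrapper. A self-contained sketch of the pattern (toy function, not from the series):

.. code-block:: python

  import pytest

  def set_step(step):
      if step < 1:
          raise ValueError('step must be >= 1')
      return step

  @pytest.mark.parametrize('step', [0, -1])
  def test_step_validation(step):
      with pytest.raises(ValueError, match=r'>= 1'):
          set_step(step)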