
Commit 85e17db

Pass pointer to model parameters.
This PR de-duplicates most of the model parameters, except the one in `tree_model.h`. One difficulty is that `base_score` is a model property but can be changed at runtime by the objective function. Hence, when performing model IO, we need to save the value provided by the user instead of the one transformed by the objective. Here we introduce an immutable `LearnerModelParam` that represents the model parameters' values after configuration.
1 parent 979f74d commit 85e17db

34 files changed: +628 −405 lines
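The overall direction of the change — boosters and other components receive pointers to learner-owned parameter objects rather than copies of individual fields such as `base_margin` — can be illustrated with a small, self-contained sketch (all names below are placeholders, not xgboost code):

// Self-contained illustration with placeholder names (not xgboost code):
// the component keeps a non-owning pointer to configuration owned by its
// creator, so there is a single source of truth instead of copied fields.
#include <iostream>

struct ModelParamSketch {
  float base_score {0.5f};
  unsigned num_output_group {1};
};

class BoosterSketch {
 public:
  explicit BoosterSketch(ModelParamSketch const* param) : param_{param} {}
  float InitPrediction() const { return param_->base_score; }

 private:
  ModelParamSketch const* param_;  // non-owning; lifetime managed by the creator
};

int main() {
  ModelParamSketch param;         // owned by the "learner"
  BoosterSketch booster{&param};  // the booster only stores a pointer
  std::cout << booster.InitPrediction() << "\n";
  return 0;
}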

cmake/Version.cmake

Lines changed: 1 addition & 1 deletion
@@ -5,5 +5,5 @@ function (write_version)
     ${xgboost_SOURCE_DIR}/include/xgboost/version_config.h @ONLY)
   configure_file(
     ${xgboost_SOURCE_DIR}/cmake/Python_version.in
-    ${xgboost_SOURCE_DIR}/python-package/xgboost/VERSION)
+    ${xgboost_SOURCE_DIR}/python-package/xgboost/VERSION @ONLY)
 endfunction (write_version)

include/xgboost/base.h

Lines changed: 1 addition & 1 deletion
@@ -112,7 +112,7 @@ using bst_float = float; // NOLINT
 
 /*! \brief Type for data column (feature) index. */
 using bst_feature_t = uint32_t;  // NOLINT
-/*! \breif Type for data row index.
+/*! \brief Type for data row index.
  *
  * Be careful `std::size_t' is implementation-defined. Meaning that the binary
  * representation of DMatrix might not be portable across platform. Booster model should

include/xgboost/data.h

Lines changed: 0 additions & 2 deletions
@@ -22,8 +22,6 @@
 #include <vector>
 
 namespace xgboost {
-// forward declare learner.
-class LearnerImpl;
 // forward declare dmatrix.
 class DMatrix;
 

include/xgboost/gbm.h

Lines changed: 22 additions & 14 deletions
@@ -11,10 +11,8 @@
 #include <dmlc/registry.h>
 #include <xgboost/base.h>
 #include <xgboost/data.h>
-#include <xgboost/objective.h>
-#include <xgboost/feature_map.h>
-#include <xgboost/generic_parameters.h>
 #include <xgboost/host_device_vector.h>
+#include <xgboost/model.h>
 
 #include <vector>
 #include <utility>
@@ -23,6 +21,14 @@
 #include <memory>
 
 namespace xgboost {
+
+class Json;
+class FeatureMap;
+class ObjFunction;
+
+struct GenericParameter;
+struct LearnerModelParam;
+
 /*!
  * \brief interface of gradient boosting model.
  */
@@ -117,13 +123,14 @@ class GradientBooster {
   * \param condition_feature feature to condition on (i.e. fix) during calculations
   */
  virtual void PredictContribution(DMatrix* dmat,
-                                  std::vector<bst_float>* out_contribs,
-                                  unsigned ntree_limit = 0, bool approximate = false,
-                                  int condition = 0, unsigned condition_feature = 0) = 0;
+                                  std::vector<bst_float>* out_contribs,
+                                  unsigned ntree_limit = 0,
+                                  bool approximate = false, int condition = 0,
+                                  unsigned condition_feature = 0) = 0;
 
  virtual void PredictInteractionContributions(DMatrix* dmat,
-                                              std::vector<bst_float>* out_contribs,
-                                              unsigned ntree_limit, bool approximate) = 0;
+                                              std::vector<bst_float>* out_contribs,
+                                              unsigned ntree_limit, bool approximate) = 0;
 
  /*!
  * \brief dump the model in the requested format
@@ -136,21 +143,22 @@ class GradientBooster {
                         bool with_stats,
                         std::string format) const = 0;
  /*!
- * \brief Whether the current booster use GPU.
+ * \brief Whether the current booster uses GPU.
  */
  virtual bool UseGPU() const = 0;
  /*!
  * \brief create a gradient booster from given name
  * \param name name of gradient booster
+ * \param generic_param Pointer to runtime parameters
+ * \param learner_model_param pointer to global model parameters
  * \param cache_mats The cache data matrix of the Booster.
- * \param base_margin The base margin of prediction.
  * \return The created booster.
  */
  static GradientBooster* Create(
      const std::string& name,
-     GenericParameter const* gparam,
-     const std::vector<std::shared_ptr<DMatrix> >& cache_mats,
-     bst_float base_margin);
+     GenericParameter const* generic_param,
+     LearnerModelParam const* learner_model_param,
+     const std::vector<std::shared_ptr<DMatrix> >& cache_mats);
 
  static void AssertGPUSupport() {
 #ifndef XGBOOST_USE_CUDA
@@ -166,7 +174,7 @@ struct GradientBoosterReg
     : public dmlc::FunctionRegEntryBase<
         GradientBoosterReg,
         std::function<GradientBooster* (const std::vector<std::shared_ptr<DMatrix> > &cached_mats,
-                                        bst_float base_margin)> > {
+                                        LearnerModelParam const* learner_model_param)> > {
 };
 
 /*!
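The forward declarations added above (`Json`, `FeatureMap`, `ObjFunction`, `GenericParameter`, `LearnerModelParam`) are sufficient because this header only refers to those types through pointers and references. A minimal self-contained sketch of the pattern, with placeholder names:

// Placeholder names, not xgboost code: a declaration that only uses a type
// through a pointer compiles against an incomplete (forward-declared) type.
class ObjFunctionSketch;  // forward declaration, no #include needed here

class GradientBoosterSketch {
 public:
  // Pointer parameters are fine with an incomplete type.
  void Configure(ObjFunctionSketch const* obj);
};

// Only the implementation file needs the full definition; a trivial one is
// provided here so the sketch is a complete program.
class ObjFunctionSketch {};

void GradientBoosterSketch::Configure(ObjFunctionSketch const* /*obj*/) {}

int main() {
  GradientBoosterSketch gbm;
  ObjFunctionSketch obj;
  gbm.Configure(&obj);
  return 0;
}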

include/xgboost/generic_parameters.h

Lines changed: 13 additions & 3 deletions
@@ -13,8 +13,9 @@
 namespace xgboost {
 struct GenericParameter : public XGBoostParameter<GenericParameter> {
   // Constant representing the device ID of CPU.
-  static int constexpr kCpuId = -1;
+  static int32_t constexpr kCpuId = -1;
 
+ public:
   // stored random seed
   int seed;
   // whether seed the PRNG each iteration
@@ -26,8 +27,7 @@ struct GenericParameter : public XGBoostParameter<GenericParameter> {
   int gpu_id;
   // gpu page size in external memory mode, 0 means using the default.
   size_t gpu_page_size;
-
-  void ConfigureGpuId(bool require_gpu);
+  bool enable_experimental_json_serialization {false};
 
   void CheckDeprecated() {
     if (this->n_gpus != 0) {
@@ -36,6 +36,12 @@ struct GenericParameter : public XGBoostParameter<GenericParameter> {
           << this->__MANAGER__()->Find("n_gpus")->GetFieldInfo().description;
     }
   }
+  /*!
+   * \brief Configure the parameter `gpu_id'.
+   *
+   * \param require_gpu Whether GPU is explicitly required from user.
+   */
+  void ConfigureGpuId(bool require_gpu);
 
   // declare parameters
   DMLC_DECLARE_PARAMETER(GenericParameter) {
@@ -60,6 +66,10 @@ struct GenericParameter : public XGBoostParameter<GenericParameter> {
         .set_default(0)
         .set_lower_bound(0)
         .describe("GPU page size when running in external memory mode.");
+    DMLC_DECLARE_FIELD(enable_experimental_json_serialization)
+        .set_default(false)
+        .describe("Enable using JSON for memory serialization (Python Pickle, "
+                  "rabit checkpoints etc.).");
     DMLC_DECLARE_FIELD(n_gpus)
         .set_default(0)
         .set_range(0, 1)
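If the new flag is exposed through the regular booster parameter interface (an assumption, not confirmed by this diff), it could be toggled from the public C API along these lines:

// Hedged usage sketch: assumes a libxgboost build containing this commit and
// that the flag is settable like any other booster parameter.
#include <xgboost/c_api.h>
#include <cstdio>

int main() {
  BoosterHandle booster = nullptr;
  if (XGBoosterCreate(nullptr, 0, &booster) != 0) {
    std::fprintf(stderr, "%s\n", XGBGetLastError());
    return 1;
  }
  // Opt in to JSON-based in-memory serialization (Python pickling, rabit
  // checkpoints), as described by the parameter's help string above.
  XGBoosterSetParam(booster, "enable_experimental_json_serialization", "true");
  XGBoosterFree(booster);
  return 0;
}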

include/xgboost/learner.h

Lines changed: 28 additions & 8 deletions
@@ -9,13 +9,10 @@
 #define XGBOOST_LEARNER_H_
 
 #include <rabit/rabit.h>
-
 #include <xgboost/base.h>
-#include <xgboost/gbm.h>
-#include <xgboost/metric.h>
-#include <xgboost/objective.h>
 #include <xgboost/feature_map.h>
 #include <xgboost/generic_parameters.h>
+#include <xgboost/host_device_vector.h>
 #include <xgboost/model.h>
 
 #include <utility>
@@ -26,6 +23,12 @@
 
 namespace xgboost {
 
+class Metric;
+class GradientBooster;
+class ObjFunction;
+class DMatrix;
+class Json;
+
 /*!
  * \brief Learner class that does training and prediction.
  * This is the user facing module of xgboost training.
@@ -45,7 +48,7 @@ namespace xgboost {
 class Learner : public Model, public rabit::Serializable {
  public:
  /*! \brief virtual destructor */
- ~Learner() override = default;
+ ~Learner() override;
  /*!
  * \brief Configure Learner based on set parameters.
  */
@@ -180,16 +183,33 @@ class Learner : public Model, public rabit::Serializable {
  virtual const std::map<std::string, std::string>& GetConfigurationArguments() const = 0;
 
  protected:
- /*! \brief internal base score of the model */
- bst_float base_score_;
  /*! \brief objective function */
  std::unique_ptr<ObjFunction> obj_;
  /*! \brief The gradient booster used by the model*/
  std::unique_ptr<GradientBooster> gbm_;
  /*! \brief The evaluation metrics used to evaluate the model. */
  std::vector<std::unique_ptr<Metric> > metrics_;
  /*! \brief Training parameter. */
- GenericParameter generic_param_;
+ GenericParameter generic_parameters_;
+};
+
+struct LearnerModelParamLegacy;
+
+/*
+ * \brief Basic Model Parameters, used to describe the booster.
+ */
+struct LearnerModelParam {
+  /* \brief global bias */
+  bst_float base_score;
+  /* \brief number of features */
+  uint32_t num_feature;
+  /* \brief number of classes, if it is multi-class classification */
+  uint32_t num_output_group;
+
+  LearnerModelParam() : base_score {0.5}, num_feature{0}, num_output_group{0} {}
+  // As the old `LearnerModelParamLegacy` is still used by binary IO, we keep
+  // this one as an immutable copy.
+  LearnerModelParam(LearnerModelParamLegacy const& user_param, float base_margin);
 };
 
 } // namespace xgboost
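A minimal sketch of the split introduced above (field names loosely follow the diff; the bodies are assumptions, not the actual implementation): the legacy parameter keeps the user-supplied `base_score` for binary IO, while the immutable copy carries the objective-transformed value used during boosting.

// Illustrative only -- not the code from this commit.
#include <cstdint>

namespace sketch {

struct LearnerModelParamLegacy {  // mutable, user-configured, serialized as-is
  float base_score {0.5f};
  uint32_t num_feature {0};
  uint32_t num_class {0};
};

struct LearnerModelParam {        // immutable snapshot built after configuration
  float base_score;
  uint32_t num_feature;
  uint32_t num_output_group;

  LearnerModelParam(LearnerModelParamLegacy const& user, float transformed_base)
      : base_score{transformed_base},
        num_feature{user.num_feature},
        num_output_group{user.num_class == 0 ? 1u : user.num_class} {}
};

}  // namespace sketch

int main() {
  sketch::LearnerModelParamLegacy user;
  // Pretend the objective mapped base_score through its link function.
  sketch::LearnerModelParam runtime{user, /*transformed_base=*/0.0f};
  return runtime.num_output_group == 1u ? 0 : 1;
}

Relatedly, `~Learner()` is now only declared in this header: with `GradientBooster`, `Metric`, and friends forward-declared and held through `std::unique_ptr`, a defaulted destructor in the header would require complete types, so the definition presumably moves to the implementation file.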

include/xgboost/objective.h

Lines changed: 1 addition & 1 deletion
@@ -1,5 +1,5 @@
 /*!
- * Copyright 2014 by Contributors
+ * Copyright 2014-2019 by Contributors
  * \file objective.h
  * \brief interface of objective function used by xgboost.
  * \author Tianqi Chen, Kailong Chen

include/xgboost/tree_model.h

Lines changed: 5 additions & 2 deletions
@@ -27,6 +27,9 @@ namespace xgboost {
 
 struct PathElement; // forward declaration
 
+class Json;
+// FIXME(trivialfis): Once binary IO is gone, make this parameter internal as it should
+// not be configured by users.
 /*! \brief meta parameters of the tree */
 struct TreeParam : public dmlc::Parameter<TreeParam> {
   /*! \brief (Deprecated) number of start root */
@@ -36,7 +39,7 @@ struct TreeParam : public dmlc::Parameter<TreeParam> {
   /*!\brief number of deleted nodes */
   int num_deleted;
   /*! \brief maximum depth, this is a statistics of the tree */
-  int max_depth;
+  int deprecated_max_depth;
   /*! \brief number of features used for tree construction */
   int num_feature;
   /*!
@@ -67,7 +70,7 @@ struct TreeParam : public dmlc::Parameter<TreeParam> {
 
   bool operator==(const TreeParam& b) const {
     return num_nodes == b.num_nodes &&
-           num_deleted == b.num_deleted && max_depth == b.max_depth &&
+           num_deleted == b.num_deleted &&
            num_feature == b.num_feature &&
            size_leaf_vector == b.size_leaf_vector;
   }

include/xgboost/tree_updater.h

Lines changed: 3 additions & 0 deletions
@@ -22,6 +22,9 @@
 #include <string>
 
 namespace xgboost {
+
+class Json;
+
 /*!
  * \brief interface of tree update module, that performs update of a tree.
  */

src/common/hist_util.cc

Lines changed: 6 additions & 2 deletions
@@ -44,11 +44,15 @@ void HistogramCuts::Build(DMatrix* dmat, uint32_t const max_num_bins) {
   float constexpr kSparsityThreshold = 0.0005;
   // FIXME(trivialfis): Distributed environment is not supported.
   if (sparsity < kSparsityThreshold && (!rabit::IsDistributed())) {
-    LOG(INFO) << "Building quantile cut on a sparse dataset.";
     SparseCuts cuts(this);
     cuts.Build(dmat, max_num_bins);
   } else {
-    LOG(INFO) << "Building quantile cut on a dense dataset or distributed environment.";
+    if (rabit::IsDistributed() && sparsity < kSparsityThreshold) {
+      LOG(WARNING) << "Building quantile cuts with a sparse dataset on distributed "
+                   << "environment, which may incur higher memory usage and longer "
+                   << "build time.";
+    }
+
     DenseCuts cuts(this);
     cuts.Build(dmat, max_num_bins);
   }
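Restated as a predicate (the threshold value is taken from the diff; the helper name is a hypothetical placeholder, not xgboost code): sparse-column cuts are used only for very sparse data and never in the distributed setting, which now merely logs a warning.

// Hypothetical helper summarizing the branch above.
bool UseSparseCuts(float sparsity, bool distributed) {
  constexpr float kSparsityThreshold = 0.0005f;  // value from the diff
  return sparsity < kSparsityThreshold && !distributed;
}

int main() {
  return UseSparseCuts(0.0001f, /*distributed=*/false) ? 0 : 1;
}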

src/common/io.cc

Lines changed: 1 addition & 1 deletion
@@ -136,9 +136,9 @@ std::string LoadSequentialFile(std::string fname) {
 
   buffer.resize(fsize + 1);
   fread(&buffer[0], 1, fsize, f);
-  buffer.back() = '\0';
   fclose(f);
 #endif // defined(__unix__)
+  buffer.back() = '\0';
   return buffer;
 }
 
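The moved assignment makes the trailing '\0' unconditional rather than part of a single platform branch; a self-contained sketch of the resulting contract (placeholder code, not the xgboost implementation):

// Illustrative sketch: read a whole file into a string and always append a
// terminating '\0', independent of how the platform-specific branch read it.
#include <cstddef>
#include <cstdio>
#include <string>

std::string LoadWholeFile(const char* fname) {
  std::string buffer;
  std::FILE* f = std::fopen(fname, "rb");
  if (f == nullptr) { return buffer; }
  std::fseek(f, 0, SEEK_END);
  long fsize = std::ftell(f);
  std::fseek(f, 0, SEEK_SET);
  if (fsize < 0) { std::fclose(f); return buffer; }
  buffer.resize(static_cast<std::size_t>(fsize) + 1);
  std::fread(&buffer[0], 1, static_cast<std::size_t>(fsize), f);
  std::fclose(f);
  buffer.back() = '\0';  // platform-independent, hence written outside any #ifdef
  return buffer;
}

int main() {
  std::string content = LoadWholeFile(__FILE__);
  return content.empty() ? 1 : 0;
}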
