From 0e8c3a821a8a1a7d609b6bd78b51bf90a24dbcce Mon Sep 17 00:00:00 2001 From: Jiaming Yuan Date: Wed, 5 Mar 2025 03:35:42 +0800 Subject: [PATCH 1/6] [WIP] Drop the deprecated binary format. --- include/xgboost/learner.h | 5 +- include/xgboost/model.h | 13 +- include/xgboost/tree_model.h | 11 -- src/c_api/c_api.cc | 73 ++++++----- src/gbm/gblinear.cc | 7 - src/gbm/gblinear_model.cc | 5 +- src/gbm/gblinear_model.h | 11 -- src/gbm/gbtree.h | 5 - src/gbm/gbtree_model.cc | 56 -------- src/gbm/gbtree_model.h | 3 - src/learner.cc | 245 +++++------------------------------ src/tree/tree_model.cc | 70 ---------- 12 files changed, 87 insertions(+), 417 deletions(-) diff --git a/include/xgboost/learner.h b/include/xgboost/learner.h index 1499804c8592..43e97babf2a8 100644 --- a/include/xgboost/learner.h +++ b/include/xgboost/learner.h @@ -1,5 +1,5 @@ /** - * Copyright 2015-2023 by XGBoost Contributors + * Copyright 2015-2025, XGBoost Contributors * \file learner.h * \brief Learner interface that integrates objective, gbm and evaluation together. * This is the user facing XGBoost training module. @@ -151,9 +151,6 @@ class Learner : public Model, public Configurable, public dmlc::Serializable { void LoadModel(Json const& in) override = 0; void SaveModel(Json* out) const override = 0; - virtual void LoadModel(dmlc::Stream* fi) = 0; - virtual void SaveModel(dmlc::Stream* fo) const = 0; - /*! * \brief Set multiple parameters at once. * diff --git a/include/xgboost/model.h b/include/xgboost/model.h index 610c7a0f5c48..c9c045234501 100644 --- a/include/xgboost/model.h +++ b/include/xgboost/model.h @@ -1,15 +1,12 @@ -/*! - * Copyright (c) 2019 by Contributors - * \file model.h - * \brief Defines the abstract interface for different components in XGBoost. +/** + * Copyright 2019-2025, XGBoost Contributors + * + * @file model.h + * @brief Defines the abstract interface for different components in XGBoost. */ #ifndef XGBOOST_MODEL_H_ #define XGBOOST_MODEL_H_ -namespace dmlc { -class Stream; -} // namespace dmlc - namespace xgboost { class Json; diff --git a/include/xgboost/tree_model.h b/include/xgboost/tree_model.h index 921fc5a1ebc8..7deb5f7d2f78 100644 --- a/include/xgboost/tree_model.h +++ b/include/xgboost/tree_model.h @@ -365,17 +365,6 @@ class RegTree : public Model { return stats_[nid]; } - /*! - * \brief load model from stream - * \param fi input stream - */ - void Load(dmlc::Stream* fi); - /*! - * \brief save model to stream - * \param fo output stream - */ - void Save(dmlc::Stream* fo) const; - void LoadModel(Json const& in) override; void SaveModel(Json* out) const override; diff --git a/src/c_api/c_api.cc b/src/c_api/c_api.cc index f64bd3324406..e762519f0adc 100644 --- a/src/c_api/c_api.cc +++ b/src/c_api/c_api.cc @@ -1420,7 +1420,38 @@ XGB_DLL int XGBoosterPredictFromCUDAColumnar(BoosterHandle handle, char const *, } #endif // !defined(XGBOOST_USE_CUDA) -XGB_DLL int XGBoosterLoadModel(BoosterHandle handle, const char* fname) { +namespace { +template +Json DispatchModelType(Buffer const &buffer, StringView ext, bool warn) { + auto first_non_space = [&](Iter beg, Iter end) { + for (auto i = beg; i != end; ++i) { + if (!std::isspace(*i)) { + return i; + } + } + return end; + }; + + Json model; + auto it = first_non_space(buffer.cbegin() + 1, buffer.cend()); + if (it != buffer.cend() && *it == '"') { + if (warn) { + LOG(WARNING) << "Unknown file format: `" << ext << "`. 
Using JSON as a guess."; + } + model = Json::Load(StringView{buffer.data(), buffer.size()}); + } else if (it != buffer.cend() && std::isalpha(*it)) { + if (warn) { + LOG(WARNING) << "Unknown file format: `" << ext << "`. Using UBJ as a guess."; + } + model = Json::Load(StringView{buffer.data(), buffer.size()}, std::ios::binary); + } else { + LOG(FATAL) << "Invalid model format"; + } + return model; +} +} // namespace + +XGB_DLL int XGBoosterLoadModel(BoosterHandle handle, const char *fname) { API_BEGIN(); CHECK_HANDLE(); xgboost_CHECK_C_ARG_PTR(fname); @@ -1430,28 +1461,23 @@ XGB_DLL int XGBoosterLoadModel(BoosterHandle handle, const char* fname) { CHECK_EQ(str[0], '{'); return str; }; - if (common::FileExtension(fname) == "json") { + auto ext = common::FileExtension(fname); + if (ext == "json") { auto buffer = read_file(); Json in{Json::Load(StringView{buffer.data(), buffer.size()})}; - static_cast(handle)->LoadModel(in); - } else if (common::FileExtension(fname) == "ubj") { + static_cast(handle)->LoadModel(in); + } else if (ext == "ubj") { auto buffer = read_file(); Json in = Json::Load(StringView{buffer.data(), buffer.size()}, std::ios::binary); static_cast(handle)->LoadModel(in); } else { - std::unique_ptr fi(dmlc::Stream::Create(fname, "r")); - static_cast(handle)->LoadModel(fi.get()); + auto buffer = read_file(); + auto in = DispatchModelType(buffer, ext, true); + static_cast(handle)->LoadModel(in); } API_END(); } -namespace { -void WarnOldModel() { - LOG(WARNING) << "Saving into deprecated binary model format, please consider using `json` or " - "`ubj`. Model format is default to UBJSON in XGBoost 2.1 if not specified."; -} -} // anonymous namespace - XGB_DLL int XGBoosterSaveModel(BoosterHandle handle, const char *fname) { API_BEGIN(); CHECK_HANDLE(); @@ -1471,13 +1497,9 @@ XGB_DLL int XGBoosterSaveModel(BoosterHandle handle, const char *fname) { save_json(std::ios::out); } else if (common::FileExtension(fname) == "ubj") { save_json(std::ios::binary); - } else if (common::FileExtension(fname) == "deprecated") { - WarnOldModel(); - auto *bst = static_cast(handle); - bst->SaveModel(fo.get()); } else { LOG(WARNING) << "Saving model in the UBJSON format as default. You can use file extension:" - " `json`, `ubj` or `deprecated` to choose between formats."; + " `json` or `ubj` to choose between formats."; save_json(std::ios::binary); } API_END(); @@ -1488,9 +1510,11 @@ XGB_DLL int XGBoosterLoadModelFromBuffer(BoosterHandle handle, const void *buf, API_BEGIN(); CHECK_HANDLE(); xgboost_CHECK_C_ARG_PTR(buf); - + auto buffer = common::Span{static_cast(buf), len}; + // Don't warn, we have to guess the format with buffer input. 
+ auto in = DispatchModelType(buffer, "", false); common::MemoryFixSizeBuffer fs((void *)buf, len); // NOLINT(*) - static_cast(handle)->LoadModel(&fs); + static_cast(handle)->LoadModel(in); API_END(); } @@ -1523,15 +1547,6 @@ XGB_DLL int XGBoosterSaveModelToBuffer(BoosterHandle handle, char const *json_co save_json(std::ios::out); } else if (format == "ubj") { save_json(std::ios::binary); - } else if (format == "deprecated") { - WarnOldModel(); - auto &raw_str = learner->GetThreadLocal().ret_str; - raw_str.clear(); - common::MemoryBufferStream fo(&raw_str); - learner->SaveModel(&fo); - - *out_dptr = dmlc::BeginPtr(raw_str); - *out_len = static_cast(raw_str.size()); } else { LOG(FATAL) << "Unknown format: `" << format << "`"; } diff --git a/src/gbm/gblinear.cc b/src/gbm/gblinear.cc index 2cacfe078b4b..5c9208f39a75 100644 --- a/src/gbm/gblinear.cc +++ b/src/gbm/gblinear.cc @@ -101,13 +101,6 @@ class GBLinear : public GradientBooster { bool ModelFitted() const override { return BoostedRounds() != 0; } - void Load(dmlc::Stream* fi) override { - model_.Load(fi); - } - void Save(dmlc::Stream* fo) const override { - model_.Save(fo); - } - void SaveModel(Json* p_out) const override { auto& out = *p_out; out["name"] = String{"gblinear"}; diff --git a/src/gbm/gblinear_model.cc b/src/gbm/gblinear_model.cc index 5e6f5dda9a1f..0be4b5a2914f 100644 --- a/src/gbm/gblinear_model.cc +++ b/src/gbm/gblinear_model.cc @@ -1,9 +1,8 @@ -/*! - * Copyright 2019-2022 by Contributors +/** + * Copyright 2019-2025, XGBoost Contributors */ #include #include -#include #include "xgboost/json.h" #include "gblinear_model.h" diff --git a/src/gbm/gblinear_model.h b/src/gbm/gblinear_model.h index 91760346ca47..c82627067b2c 100644 --- a/src/gbm/gblinear_model.h +++ b/src/gbm/gblinear_model.h @@ -71,17 +71,6 @@ class GBLinearModel : public Model { void SaveModel(Json *p_out) const override; void LoadModel(Json const &in) override; - // save the model to file - void Save(dmlc::Stream *fo) const { - fo->Write(¶m_, sizeof(param_)); - fo->Write(weight); - } - // load model from file - void Load(dmlc::Stream *fi) { - CHECK_EQ(fi->Read(¶m_, sizeof(param_)), sizeof(param_)); - fi->Read(&weight); - } - // model bias inline bst_float *Bias() { return &weight[learner_model_param->num_feature * diff --git a/src/gbm/gbtree.h b/src/gbm/gbtree.h index 1fbf0ebdaf7f..2df185e6db92 100644 --- a/src/gbm/gbtree.h +++ b/src/gbm/gbtree.h @@ -188,11 +188,6 @@ class GBTree : public GradientBooster { [[nodiscard]] GBTreeTrainParam const& GetTrainParam() const { return tparam_; } - void Load(dmlc::Stream* fi) override { model_.Load(fi); } - void Save(dmlc::Stream* fo) const override { - model_.Save(fo); - } - void LoadConfig(Json const& in) override; void SaveConfig(Json* p_out) const override; diff --git a/src/gbm/gbtree_model.cc b/src/gbm/gbtree_model.cc index c94c6525fea2..6400f4980d9c 100644 --- a/src/gbm/gbtree_model.cc +++ b/src/gbm/gbtree_model.cc @@ -50,62 +50,6 @@ void Validate(GBTreeModel const& model) { } } // namespace -void GBTreeModel::Save(dmlc::Stream* fo) const { - CHECK_EQ(param.num_trees, static_cast(trees.size())); - - if (DMLC_IO_NO_ENDIAN_SWAP) { - fo->Write(¶m, sizeof(param)); - } else { - auto x = param.ByteSwap(); - fo->Write(&x, sizeof(x)); - } - for (const auto & tree : trees) { - tree->Save(fo); - } - if (tree_info.size() != 0) { - if (DMLC_IO_NO_ENDIAN_SWAP) { - fo->Write(dmlc::BeginPtr(tree_info), sizeof(int32_t) * tree_info.size()); - } else { - for (const auto& e : tree_info) { - auto x = e; - dmlc::ByteSwap(&x, sizeof(x), 
1); - fo->Write(&x, sizeof(x)); - } - } - } -} - -void GBTreeModel::Load(dmlc::Stream* fi) { - CHECK_EQ(fi->Read(¶m, sizeof(param)), sizeof(param)) - << "GBTree: invalid model file"; - if (!DMLC_IO_NO_ENDIAN_SWAP) { - param = param.ByteSwap(); - } - trees.clear(); - trees_to_update.clear(); - for (int32_t i = 0; i < param.num_trees; ++i) { - std::unique_ptr ptr(new RegTree()); - ptr->Load(fi); - trees.push_back(std::move(ptr)); - } - tree_info.resize(param.num_trees); - if (param.num_trees != 0) { - if (DMLC_IO_NO_ENDIAN_SWAP) { - CHECK_EQ( - fi->Read(dmlc::BeginPtr(tree_info), sizeof(int32_t) * param.num_trees), - sizeof(int32_t) * param.num_trees); - } else { - for (auto& info : tree_info) { - CHECK_EQ(fi->Read(&info, sizeof(int32_t)), sizeof(int32_t)); - dmlc::ByteSwap(&info, sizeof(info), 1); - } - } - } - - MakeIndptr(this); - Validate(*this); -} - void GBTreeModel::SaveModel(Json* p_out) const { auto& out = *p_out; CHECK_EQ(param.num_trees, static_cast(trees.size())); diff --git a/src/gbm/gbtree_model.h b/src/gbm/gbtree_model.h index 7d7893fb3391..05182f3a0ce0 100644 --- a/src/gbm/gbtree_model.h +++ b/src/gbm/gbtree_model.h @@ -108,9 +108,6 @@ struct GBTreeModel : public Model { } } - void Load(dmlc::Stream* fi); - void Save(dmlc::Stream* fo) const; - void SaveModel(Json* p_out) const override; void LoadModel(Json const& p_out) override; diff --git a/src/learner.cc b/src/learner.cc index d45b533396db..c4976449c36e 100644 --- a/src/learner.cc +++ b/src/learner.cc @@ -853,11 +853,6 @@ class LearnerConfiguration : public Learner { std::string const LearnerConfiguration::kEvalMetric {"eval_metric"}; // NOLINT class LearnerIO : public LearnerConfiguration { - private: - // Used to identify the offset of JSON string when - // Will be removed once JSON takes over. Right now we still loads some RDS files from R. - std::string const serialisation_header_ { u8"CONFIG-offset:" }; - protected: void ClearCaches() { this->prediction_container_ = PredictionContainer{}; } @@ -956,186 +951,34 @@ class LearnerIO : public LearnerConfiguration { void LoadModel(dmlc::Stream* fi) override { ctx_.UpdateAllowUnknown(Args{}); tparam_.Init(std::vector>{}); + // TODO(tqchen) mark deprecation of old format. common::PeekableInStream fp(fi); // backward compatible header check. std::string header; header.resize(4); + StringView msg = "Only `json` and `ubj` is supported starting from 3.1."; if (fp.PeekRead(&header[0], 4) == 4) { - CHECK_NE(header, "bs64") - << "Base64 format is no longer supported in brick."; - if (header == "binf") { - CHECK_EQ(fp.Read(&header[0], 4), 4U); - } + CHECK_NE(header, "bs64") << msg; + CHECK_NE(header, "binf") << msg; } + CHECK_EQ(header[0], '{') << msg; // FIXME(jiamingy): Move this out of learner after the old binary model is remove. - auto first_non_space = [&](std::string::const_iterator beg, std::string::const_iterator end) { - for (auto i = beg; i != end; ++i) { - if (!std::isspace(*i)) { - return i; - } - } - return end; - }; - if (header[0] == '{') { // Dispatch to JSON - auto buffer = common::ReadAll(fi, &fp); - Json model; - auto it = first_non_space(buffer.cbegin() + 1, buffer.cend()); - if (it != buffer.cend() && *it == '"') { - model = Json::Load(StringView{buffer}); - } else if (it != buffer.cend() && std::isalpha(*it)) { - model = Json::Load(StringView{buffer}, std::ios::binary); - } else { - LOG(FATAL) << "Invalid model format"; - } - this->LoadModel(model); - return; - } - - // use the peekable reader. 
- fi = &fp; - // read parameter - CHECK_EQ(fi->Read(&mparam_, sizeof(mparam_)), sizeof(mparam_)) - << "BoostLearner: wrong model format"; - if (!DMLC_IO_NO_ENDIAN_SWAP) { - mparam_ = mparam_.ByteSwap(); - } - CHECK(fi->Read(&tparam_.objective)) << "BoostLearner: wrong model format"; - CHECK(fi->Read(&tparam_.booster)) << "BoostLearner: wrong model format"; - - obj_.reset(ObjFunction::Create(tparam_.objective, &ctx_)); - gbm_.reset(GradientBooster::Create(tparam_.booster, &ctx_, &learner_model_param_)); - gbm_->Load(fi); - if (mparam_.contain_extra_attrs != 0) { - std::vector > attr; - fi->Read(&attr); - attributes_ = std::map(attr.begin(), attr.end()); - } - bool warn_old_model { false }; - if (attributes_.find("count_poisson_max_delta_step") != attributes_.cend()) { - // Loading model from < 1.0.0, objective is not saved. - cfg_["max_delta_step"] = attributes_.at("count_poisson_max_delta_step"); - attributes_.erase("count_poisson_max_delta_step"); - warn_old_model = true; + // Dispatch to JSON + auto buffer = common::ReadAll(fi, &fp); + Json model; + auto it = first_non_space(buffer.cbegin() + 1, buffer.cend()); + if (it != buffer.cend() && *it == '"') { + model = Json::Load(StringView{buffer}); + } else if (it != buffer.cend() && std::isalpha(*it)) { + model = Json::Load(StringView{buffer}, std::ios::binary); } else { - warn_old_model = false; - } - - if (mparam_.major_version < 1) { - // Before 1.0.0, base_score is saved as a transformed value, and there's no version - // attribute (saved a 0) in the saved model. - std::string multi{"multi:"}; - if (!std::equal(multi.cbegin(), multi.cend(), tparam_.objective.cbegin())) { - HostDeviceVector t; - t.HostVector().resize(1); - t.HostVector().at(0) = mparam_.base_score; - this->obj_->PredTransform(&t); - auto base_score = t.HostVector().at(0); - mparam_.base_score = base_score; - } - warn_old_model = true; - } - - learner_model_param_ = - LearnerModelParam(&ctx_, mparam_, - linalg::Tensor{{std::isnan(mparam_.base_score) - ? std::numeric_limits::quiet_NaN() - : obj_->ProbToMargin(mparam_.base_score)}, - {1}, - DeviceOrd::CPU()}, - obj_->Task(), tparam_.multi_strategy); - - if (attributes_.find("objective") != attributes_.cend()) { - auto obj_str = attributes_.at("objective"); - auto j_obj = Json::Load({obj_str.c_str(), obj_str.size()}); - obj_->LoadConfig(j_obj); - attributes_.erase("objective"); - } else { - warn_old_model = true; - } - if (attributes_.find("metrics") != attributes_.cend()) { - auto metrics_str = attributes_.at("metrics"); - std::vector names { common::Split(metrics_str, ';') }; - attributes_.erase("metrics"); - for (auto const& n : names) { - this->SetParam(kEvalMetric, n); - } - } - - if (warn_old_model) { - LOG(WARNING) << "Loading model from XGBoost < 1.0.0, consider saving it " - "again for improved compatibility"; - } - - // Renew the version. - mparam_.major_version = std::get<0>(Version::Self()); - mparam_.minor_version = std::get<1>(Version::Self()); - - cfg_["num_feature"] = std::to_string(mparam_.num_feature); - - auto n = tparam_.__DICT__(); - cfg_.insert(n.cbegin(), n.cend()); - - this->need_configuration_ = true; - this->ClearCaches(); - } - - // Save model into binary format. The code is about to be deprecated by more robust - // JSON serialization format. 
- void SaveModel(dmlc::Stream* fo) const override { - this->CheckModelInitialized(); - CHECK(!this->learner_model_param_.IsVectorLeaf()) - << "Please use JSON/UBJ format for model serialization with multi-output models."; - - LearnerModelParamLegacy mparam = mparam_; // make a copy to potentially modify - std::vector > extra_attr; - mparam.contain_extra_attrs = 1; - - if (!this->feature_names_.empty() || !this->feature_types_.empty()) { - LOG(WARNING) << "feature names and feature types are being disregarded, use JSON/UBJSON " - "format instead."; - } - - { - // Similar to JSON model IO, we save the objective. - Json j_obj { Object() }; - obj_->SaveConfig(&j_obj); - std::string obj_doc; - Json::Dump(j_obj, &obj_doc); - extra_attr.emplace_back("objective", obj_doc); - } - // As of 1.0.0, JVM Package and R Package uses Save/Load model for serialization. - // Remove this part once they are ported to use actual serialization methods. - if (mparam.contain_eval_metrics != 0) { - std::stringstream os; - for (auto& ev : metrics_) { - os << ev->Name() << ";"; - } - extra_attr.emplace_back("metrics", os.str()); - } - - std::string header {"binf"}; - fo->Write(header.data(), 4); - if (DMLC_IO_NO_ENDIAN_SWAP) { - fo->Write(&mparam, sizeof(LearnerModelParamLegacy)); - } else { - LearnerModelParamLegacy x = mparam.ByteSwap(); - fo->Write(&x, sizeof(LearnerModelParamLegacy)); - } - fo->Write(tparam_.objective); - fo->Write(tparam_.booster); - gbm_->Save(fo); - if (mparam.contain_extra_attrs != 0) { - std::map attr(attributes_); - for (const auto& kv : extra_attr) { - attr[kv.first] = kv.second; - } - fo->Write(std::vector>( - attr.begin(), attr.end())); + LOG(FATAL) << "Invalid model format"; } + this->LoadModel(model); } void Save(dmlc::Stream* fo) const override { @@ -1158,46 +1001,28 @@ class LearnerIO : public LearnerConfiguration { common::PeekableInStream fp(fi); char header[2]; fp.PeekRead(header, 2); - if (header[0] == '{') { - auto buffer = common::ReadAll(fi, &fp); - Json memory_snapshot; - if (header[1] == '"') { - memory_snapshot = Json::Load(StringView{buffer}); - error::WarnOldSerialization(); - } else if (std::isalpha(header[1])) { - memory_snapshot = Json::Load(StringView{buffer}, std::ios::binary); - } else { - LOG(FATAL) << "Invalid serialization file."; - } - if (IsA(memory_snapshot["Model"])) { - // R has xgb.load that doesn't distinguish whether configuration is saved. - // We should migrate to use `xgb.load.raw` instead. - this->LoadModel(memory_snapshot); - } else { - this->LoadModel(memory_snapshot["Model"]); - this->LoadConfig(memory_snapshot["Config"]); - } + StringView msg = "Invalid serialization file."; + CHECK_EQ(header[0], '{') << msg; + + auto buffer = common::ReadAll(fi, &fp); + Json memory_snapshot; + CHECK(std::isalpha(header[1])) << msg; + if (header[1] == '"') { + memory_snapshot = Json::Load(StringView{buffer}); + error::WarnOldSerialization(); + } else if (std::isalpha(header[1])) { + memory_snapshot = Json::Load(StringView{buffer}, std::ios::binary); } else { - std::string header; - header.resize(serialisation_header_.size()); - CHECK_EQ(fp.Read(&header[0], header.size()), serialisation_header_.size()); - // Avoid printing the content in loaded header, which might be random binary code. 
- CHECK(header == serialisation_header_) << error::OldSerialization(); - int64_t sz {-1}; - CHECK_EQ(fp.Read(&sz, sizeof(sz)), sizeof(sz)); - if (!DMLC_IO_NO_ENDIAN_SWAP) { - dmlc::ByteSwap(&sz, sizeof(sz), 1); - } - CHECK_GT(sz, 0); - size_t json_offset = static_cast(sz); - std::string buffer; - common::FixedSizeStream{&fp}.Take(&buffer); - - common::MemoryFixSizeBuffer binary_buf(&buffer[0], json_offset); - this->LoadModel(&binary_buf); + LOG(FATAL) << "Invalid serialization file."; + } - auto config = Json::Load({buffer.c_str() + json_offset, buffer.size() - json_offset}); - this->LoadConfig(config); + if (IsA(memory_snapshot["Model"])) { + // R has xgb.load that doesn't distinguish whether configuration is saved. + // We should migrate to use `xgb.load.raw` instead. + this->LoadModel(memory_snapshot); + } else { + this->LoadModel(memory_snapshot["Model"]); + this->LoadConfig(memory_snapshot["Config"]); } } }; diff --git a/src/tree/tree_model.cc b/src/tree/tree_model.cc index 0639233510f7..a35df0424b49 100644 --- a/src/tree/tree_model.cc +++ b/src/tree/tree_model.cc @@ -911,76 +911,6 @@ void RegTree::ExpandCategorical(bst_node_t nid, bst_feature_t split_index, this->split_categories_segments_.at(nid).size = split_cat.size(); } -void RegTree::Load(dmlc::Stream* fi) { - CHECK_EQ(fi->Read(¶m_, sizeof(TreeParam)), sizeof(TreeParam)); - if (!DMLC_IO_NO_ENDIAN_SWAP) { - param_ = param_.ByteSwap(); - } - nodes_.resize(param_.num_nodes); - stats_.resize(param_.num_nodes); - CHECK_NE(param_.num_nodes, 0); - CHECK_EQ(fi->Read(dmlc::BeginPtr(nodes_), sizeof(Node) * nodes_.size()), - sizeof(Node) * nodes_.size()); - if (!DMLC_IO_NO_ENDIAN_SWAP) { - for (Node& node : nodes_) { - node = node.ByteSwap(); - } - } - CHECK_EQ(fi->Read(dmlc::BeginPtr(stats_), sizeof(RTreeNodeStat) * stats_.size()), - sizeof(RTreeNodeStat) * stats_.size()); - if (!DMLC_IO_NO_ENDIAN_SWAP) { - for (RTreeNodeStat& stat : stats_) { - stat = stat.ByteSwap(); - } - } - // chg deleted nodes - deleted_nodes_.resize(0); - for (int i = 1; i < param_.num_nodes; ++i) { - if (nodes_[i].IsDeleted()) { - deleted_nodes_.push_back(i); - } - } - CHECK_EQ(static_cast(deleted_nodes_.size()), param_.num_deleted); - - split_types_.resize(param_.num_nodes, FeatureType::kNumerical); - split_categories_segments_.resize(param_.num_nodes); -} - -void RegTree::Save(dmlc::Stream* fo) const { - CHECK_EQ(param_.num_nodes, static_cast(nodes_.size())); - CHECK_EQ(param_.num_nodes, static_cast(stats_.size())); - CHECK_EQ(param_.deprecated_num_roots, 1); - CHECK_NE(param_.num_nodes, 0); - CHECK(!IsMultiTarget()) - << "Please use JSON/UBJSON for saving models with multi-target trees."; - CHECK(!HasCategoricalSplit()) - << "Please use JSON/UBJSON for saving models with categorical splits."; - - if (DMLC_IO_NO_ENDIAN_SWAP) { - fo->Write(¶m_, sizeof(TreeParam)); - } else { - TreeParam x = param_.ByteSwap(); - fo->Write(&x, sizeof(x)); - } - - if (DMLC_IO_NO_ENDIAN_SWAP) { - fo->Write(dmlc::BeginPtr(nodes_), sizeof(Node) * nodes_.size()); - } else { - for (const Node& node : nodes_) { - Node x = node.ByteSwap(); - fo->Write(&x, sizeof(x)); - } - } - if (DMLC_IO_NO_ENDIAN_SWAP) { - fo->Write(dmlc::BeginPtr(stats_), sizeof(RTreeNodeStat) * nodes_.size()); - } else { - for (const RTreeNodeStat& stat : stats_) { - RTreeNodeStat x = stat.ByteSwap(); - fo->Write(&x, sizeof(x)); - } - } -} - template void RegTree::LoadCategoricalSplit(Json const& in) { auto const& categories_segments = get>(in["categories_segments"]); From 87e282c98143f65429117ea5e58e5feef5f17d70 Mon 
Sep 17 00:00:00 2001 From: Jiaming Yuan Date: Tue, 8 Apr 2025 18:59:56 +0800 Subject: [PATCH 2/6] Remove. --- include/xgboost/gbm.h | 11 +--- src/gbm/gbtree.cc | 14 ----- src/learner.cc | 34 ----------- src/tree/updater_sync.cc | 27 ++++----- tests/cpp/test_learner.cc | 34 +---------- tests/cpp/tree/test_tree_model.cc | 96 ------------------------------- 6 files changed, 16 insertions(+), 200 deletions(-) diff --git a/include/xgboost/gbm.h b/include/xgboost/gbm.h index 3f4e8540efa5..c65ed71b8e53 100644 --- a/include/xgboost/gbm.h +++ b/include/xgboost/gbm.h @@ -47,16 +47,7 @@ class GradientBooster : public Model, public Configurable { * @param cfg configurations on both training and model parameters. */ virtual void Configure(Args const& cfg) = 0; - /*! - * \brief load model from stream - * \param fi input stream. - */ - virtual void Load(dmlc::Stream* fi) = 0; - /*! - * \brief save model to stream. - * \param fo output stream - */ - virtual void Save(dmlc::Stream* fo) const = 0; + /** * \brief Slice a model using boosting index. The slice m:n indicates taking all trees * that were fit during the boosting rounds m, (m+1), (m+2), ..., (n-1). diff --git a/src/gbm/gbtree.cc b/src/gbm/gbtree.cc index ae0b5b5020f1..8d14846a5c29 100644 --- a/src/gbm/gbtree.cc +++ b/src/gbm/gbtree.cc @@ -717,20 +717,6 @@ class Dart : public GBTree { } } - void Load(dmlc::Stream* fi) override { - GBTree::Load(fi); - weight_drop_.resize(model_.param.num_trees); - if (model_.param.num_trees != 0) { - fi->Read(&weight_drop_); - } - } - void Save(dmlc::Stream* fo) const override { - GBTree::Save(fo); - if (weight_drop_.size() != 0) { - fo->Write(weight_drop_); - } - } - void LoadConfig(Json const& in) override { CHECK_EQ(get(in["name"]), "dart"); auto const& gbtree = in["gbtree"]; diff --git a/src/learner.cc b/src/learner.cc index c4976449c36e..0747934a19b7 100644 --- a/src/learner.cc +++ b/src/learner.cc @@ -947,40 +947,6 @@ class LearnerIO : public LearnerConfiguration { } } - // About to be deprecated by JSON format - void LoadModel(dmlc::Stream* fi) override { - ctx_.UpdateAllowUnknown(Args{}); - tparam_.Init(std::vector>{}); - - // TODO(tqchen) mark deprecation of old format. - common::PeekableInStream fp(fi); - - // backward compatible header check. - std::string header; - header.resize(4); - StringView msg = "Only `json` and `ubj` is supported starting from 3.1."; - if (fp.PeekRead(&header[0], 4) == 4) { - CHECK_NE(header, "bs64") << msg; - CHECK_NE(header, "binf") << msg; - } - CHECK_EQ(header[0], '{') << msg; - - // FIXME(jiamingy): Move this out of learner after the old binary model is remove. 
- - // Dispatch to JSON - auto buffer = common::ReadAll(fi, &fp); - Json model; - auto it = first_non_space(buffer.cbegin() + 1, buffer.cend()); - if (it != buffer.cend() && *it == '"') { - model = Json::Load(StringView{buffer}); - } else if (it != buffer.cend() && std::isalpha(*it)) { - model = Json::Load(StringView{buffer}, std::ios::binary); - } else { - LOG(FATAL) << "Invalid model format"; - } - this->LoadModel(model); - } - void Save(dmlc::Stream* fo) const override { this->CheckModelInitialized(); diff --git a/src/tree/updater_sync.cc b/src/tree/updater_sync.cc index 6526e519c9d5..033f1e42f23f 100644 --- a/src/tree/updater_sync.cc +++ b/src/tree/updater_sync.cc @@ -1,17 +1,17 @@ /** - * Copyright 2014-2024, XBGoost Contributors + * Copyright 2014-2025, XBGoost Contributors * \file updater_sync.cc * \brief synchronize the tree in all distributed nodes */ -#include - #include #include #include "../collective/broadcast.h" -#include "../collective/communicator-inl.h" -#include "../common/io.h" -#include "xgboost/json.h" +#include "../collective/communicator-inl.h" // for GetRank, GetWorldSize +#include "xgboost/context.h" // for Context +#include "xgboost/json.h" // for Json, Object +#include "xgboost/linalg.h" // for Matrix +#include "xgboost/tree_updater.h" // for TreeUpdater namespace xgboost::tree { @@ -29,25 +29,26 @@ class TreeSyncher : public TreeUpdater { void LoadConfig(Json const&) override {} void SaveConfig(Json*) const override {} - [[nodiscard]] char const* Name() const override { return "prune"; } + [[nodiscard]] char const* Name() const override { return "sync"; } void Update(TrainParam const*, linalg::Matrix*, DMatrix*, common::Span> /*out_position*/, const std::vector& trees) override { - if (collective::GetWorldSize() == 1) return; - std::string s_model; - common::MemoryBufferStream fs(&s_model); + if (collective::GetWorldSize() == 1) { + return; + } + Json model{Object{}}; int rank = collective::GetRank(); if (rank == 0) { for (auto tree : trees) { - tree->Save(&fs); + tree->SaveModel(&model); } } - fs.Seek(0); + auto s_model = Json::Dump(model); auto rc = collective::Broadcast(ctx_, linalg::MakeVec(s_model.data(), s_model.size()), 0); SafeColl(rc); for (auto tree : trees) { - tree->Load(&fs); + tree->LoadModel(model); } } }; diff --git a/tests/cpp/test_learner.cc b/tests/cpp/test_learner.cc index a8551aa23ce9..eaa9406d1c1e 100644 --- a/tests/cpp/test_learner.cc +++ b/tests/cpp/test_learner.cc @@ -1,5 +1,5 @@ /** - * Copyright 2017-2024, XGBoost contributors + * Copyright 2017-2025, XGBoost contributors */ #include #include @@ -283,38 +283,6 @@ TEST(Learner, MultiThreadedPredict) { } } -TEST(Learner, BinaryModelIO) { - size_t constexpr kRows = 8; - int32_t constexpr kIters = 4; - auto p_dmat = RandomDataGenerator{kRows, 10, 0}.GenerateDMatrix(); - p_dmat->Info().labels.Reshape(kRows); - - std::unique_ptr learner{Learner::Create({p_dmat})}; - learner->SetParam("eval_metric", "rmsle"); - learner->Configure(); - for (int32_t iter = 0; iter < kIters; ++iter) { - learner->UpdateOneIter(iter, p_dmat); - } - dmlc::TemporaryDirectory tempdir; - std::string const fname = tempdir.path + "binary_model_io.bin"; - { - // Make sure the write is complete before loading. 
- std::unique_ptr fo(dmlc::Stream::Create(fname.c_str(), "w")); - learner->SaveModel(fo.get()); - } - - learner.reset(Learner::Create({p_dmat})); - std::unique_ptr fi(dmlc::Stream::Create(fname.c_str(), "r")); - learner->LoadModel(fi.get()); - learner->Configure(); - Json config { Object() }; - learner->SaveConfig(&config); - std::string config_str; - Json::Dump(config, &config_str); - ASSERT_NE(config_str.find("rmsle"), std::string::npos); - ASSERT_EQ(config_str.find("WARNING"), std::string::npos); -} - #if defined(XGBOOST_USE_CUDA) // Tests for automatic GPU configuration. TEST(Learner, GPUConfiguration) { diff --git a/tests/cpp/tree/test_tree_model.cc b/tests/cpp/tree/test_tree_model.cc index 2491f3973f9a..73544d89985e 100644 --- a/tests/cpp/tree/test_tree_model.cc +++ b/tests/cpp/tree/test_tree_model.cc @@ -15,20 +15,6 @@ TEST(Tree, ModelShape) { RegTree tree{1u, n_features}; ASSERT_EQ(tree.NumFeatures(), n_features); - dmlc::TemporaryDirectory tempdir; - const std::string tmp_file = tempdir.path + "/tree.model"; - { - // binary dump - std::unique_ptr fo(dmlc::Stream::Create(tmp_file.c_str(), "w")); - tree.Save(fo.get()); - } - { - // binary load - RegTree new_tree; - std::unique_ptr fi(dmlc::Stream::Create(tmp_file.c_str(), "r")); - new_tree.Load(fi.get()); - ASSERT_EQ(new_tree.NumFeatures(), n_features); - } { // json Json j_tree{Object{}}; @@ -55,88 +41,6 @@ TEST(Tree, ModelShape) { } } -#if DMLC_IO_NO_ENDIAN_SWAP // skip on big-endian machines -// Manually construct tree in binary format -// Do not use structs in case they change -// We want to preserve backwards compatibility -TEST(Tree, Load) { - dmlc::TemporaryDirectory tempdir; - const std::string tmp_file = tempdir.path + "/tree.model"; - std::unique_ptr fo(dmlc::Stream::Create(tmp_file.c_str(), "w")); - - // Write params - EXPECT_EQ(sizeof(TreeParam), (31 + 6) * sizeof(int)); - int num_roots = 1; - int num_nodes = 2; - int num_deleted = 0; - int max_depth = 1; - int num_feature = 0; - int size_leaf_vector = 0; - int reserved[31]; - fo->Write(&num_roots, sizeof(int)); - fo->Write(&num_nodes, sizeof(int)); - fo->Write(&num_deleted, sizeof(int)); - fo->Write(&max_depth, sizeof(int)); - fo->Write(&num_feature, sizeof(int)); - fo->Write(&size_leaf_vector, sizeof(int)); - fo->Write(reserved, sizeof(int) * 31); - - // Write 2 nodes - EXPECT_EQ(sizeof(RegTree::Node), - 3 * sizeof(int) + 1 * sizeof(unsigned) + sizeof(float)); - int parent = -1; - int cleft = 1; - int cright = -1; - unsigned sindex = 5; - float split_or_weight = 0.5; - fo->Write(&parent, sizeof(int)); - fo->Write(&cleft, sizeof(int)); - fo->Write(&cright, sizeof(int)); - fo->Write(&sindex, sizeof(unsigned)); - fo->Write(&split_or_weight, sizeof(float)); - parent = 0; - cleft = -1; - cright = -1; - sindex = 2; - split_or_weight = 0.1; - fo->Write(&parent, sizeof(int)); - fo->Write(&cleft, sizeof(int)); - fo->Write(&cright, sizeof(int)); - fo->Write(&sindex, sizeof(unsigned)); - fo->Write(&split_or_weight, sizeof(float)); - - // Write 2x node stats - EXPECT_EQ(sizeof(RTreeNodeStat), 3 * sizeof(float) + sizeof(int)); - bst_float loss_chg = 5.0; - bst_float sum_hess = 1.0; - bst_float base_weight = 3.0; - int leaf_child_cnt = 0; - fo->Write(&loss_chg, sizeof(float)); - fo->Write(&sum_hess, sizeof(float)); - fo->Write(&base_weight, sizeof(float)); - fo->Write(&leaf_child_cnt, sizeof(int)); - - loss_chg = 50.0; - sum_hess = 10.0; - base_weight = 30.0; - leaf_child_cnt = 0; - fo->Write(&loss_chg, sizeof(float)); - fo->Write(&sum_hess, sizeof(float)); - fo->Write(&base_weight, 
sizeof(float)); - fo->Write(&leaf_child_cnt, sizeof(int)); - fo.reset(); - std::unique_ptr fi(dmlc::Stream::Create(tmp_file.c_str(), "r")); - - xgboost::RegTree tree; - tree.Load(fi.get()); - EXPECT_EQ(tree.GetDepth(1), 1); - EXPECT_EQ(tree[0].SplitCond(), 0.5f); - EXPECT_EQ(tree[0].SplitIndex(), 5ul); - EXPECT_EQ(tree[1].LeafValue(), 0.1f); - EXPECT_TRUE(tree[1].IsLeaf()); -} -#endif // DMLC_IO_NO_ENDIAN_SWAP - TEST(Tree, AllocateNode) { RegTree tree; tree.ExpandNode(0, 0, 0.0f, false, 0.0f, 0.0f, 0.0f, 0.0f, 0.0f, From e6873becbd605ac2e90ffca110f772bab5229c4d Mon Sep 17 00:00:00 2001 From: Jiaming Yuan Date: Tue, 8 Apr 2025 19:07:33 +0800 Subject: [PATCH 3/6] Basic model test. --- tests/python/test_basic_models.py | 6 ------ 1 file changed, 6 deletions(-) diff --git a/tests/python/test_basic_models.py b/tests/python/test_basic_models.py index b24152e5dc9a..b0fb673fb2f7 100644 --- a/tests/python/test_basic_models.py +++ b/tests/python/test_basic_models.py @@ -516,12 +516,6 @@ def test_slice(self, booster_name: str) -> None: booster, dtrain, num_parallel_tree, num_classes, num_boost_round, False ) - bytesarray = booster.save_raw(raw_format="deprecated") - booster = xgb.Booster(model_file=bytesarray) - self.run_slice( - booster, dtrain, num_parallel_tree, num_classes, num_boost_round, True - ) - def test_slice_multi(self) -> None: from sklearn.datasets import make_classification From 68d4017c8619c2c4d44b2e4f081c29f9a23062db Mon Sep 17 00:00:00 2001 From: Jiaming Yuan Date: Tue, 8 Apr 2025 19:13:31 +0800 Subject: [PATCH 4/6] Cleanup. --- include/xgboost/c_api.h | 22 ++++++++++++---------- src/c_api/c_api.cc | 5 +++-- 2 files changed, 15 insertions(+), 12 deletions(-) diff --git a/include/xgboost/c_api.h b/include/xgboost/c_api.h index b268e84f4ab4..5796389e8787 100644 --- a/include/xgboost/c_api.h +++ b/include/xgboost/c_api.h @@ -1333,21 +1333,23 @@ XGB_DLL int XGBoosterPredictFromCudaColumnar(BoosterHandle handle, char const *d * @{ */ -/*! - * \brief Load model from existing file +/** + * @brief Load the model from an existing file * - * \param handle handle - * \param fname File URI or file name. The string must be UTF-8 encoded. - * \return 0 when success, -1 when failure happens + * @param handle handle + * @param fname File name. The string must be UTF-8 encoded. + * + * @return 0 when success, -1 when failure happens */ XGB_DLL int XGBoosterLoadModel(BoosterHandle handle, const char *fname); -/*! - * \brief Save model into existing file +/** + * @brief Save the model into an existing file * - * \param handle handle - * \param fname File URI or file name. The string must be UTF-8 encoded. - * \return 0 when success, -1 when failure happens + * @param handle handle + * @param fname File name. The string must be UTF-8 encoded. + * + * @return 0 when success, -1 when failure happens */ XGB_DLL int XGBoosterSaveModel(BoosterHandle handle, const char *fname); diff --git a/src/c_api/c_api.cc b/src/c_api/c_api.cc index e762519f0adc..16c973bd90e0 100644 --- a/src/c_api/c_api.cc +++ b/src/c_api/c_api.cc @@ -1493,9 +1493,10 @@ XGB_DLL int XGBoosterSaveModel(BoosterHandle handle, const char *fname) { Json::Dump(out, &str, mode); fo->Write(str.data(), str.size()); }; - if (common::FileExtension(fname) == "json") { + auto ext = common::FileExtension(fname); + if (ext == "json") { save_json(std::ios::out); - } else if (common::FileExtension(fname) == "ubj") { + } else if (ext == "ubj") { save_json(std::ios::binary); } else { LOG(WARNING) << "Saving model in the UBJSON format as default. 
You can use file extension:" From 5b3da6ceb6c29d6ccae1384e65b57db80c4dad12 Mon Sep 17 00:00:00 2001 From: Jiaming Yuan Date: Tue, 8 Apr 2025 19:22:10 +0800 Subject: [PATCH 5/6] cli. --- src/cli_main.cc | 40 ++++++++++++++++++++++++++++------------ 1 file changed, 28 insertions(+), 12 deletions(-) diff --git a/src/cli_main.cc b/src/cli_main.cc index 1c388cf845c2..13731fa67528 100644 --- a/src/cli_main.cc +++ b/src/cli_main.cc @@ -329,29 +329,45 @@ class CLI { } void LoadModel(std::string const& path, Learner* learner) const { - if (common::FileExtension(path) == "json") { - auto buffer = common::LoadSequentialFile(path); - CHECK_GT(buffer.size(), 2); - CHECK_EQ(buffer[0], '{'); - Json in{Json::Load({buffer.data(), buffer.size()})}; + auto ext = common::FileExtension(path); + auto read_file = [&]() { + auto str = common::LoadSequentialFile(path); + CHECK_GE(str.size(), 3); // "{}\0" + CHECK_EQ(str[0], '{'); + return str; + }; + + if (ext == "json") { + auto buffer = read_file(); + Json in{Json::Load(StringView{buffer.data(), buffer.size()})}; + learner->LoadModel(in); + } else if (ext == "ubj") { + auto buffer = read_file(); + Json in = Json::Load(StringView{buffer.data(), buffer.size()}, std::ios::binary); learner->LoadModel(in); } else { - std::unique_ptr fi(dmlc::Stream::Create(path.c_str(), "r")); - learner->LoadModel(fi.get()); + LOG(FATAL) << "Unknown model format:" << path << ", expecting either json or ubj."; } } void SaveModel(std::string const& path, Learner* learner) const { learner->Configure(); std::unique_ptr fo(dmlc::Stream::Create(path.c_str(), "w")); - if (common::FileExtension(path) == "json") { + auto ext = common::FileExtension(path); + auto save_json = [&](std::ios::openmode mode) { Json out{Object()}; learner->SaveModel(&out); - std::string str; - Json::Dump(out, &str); - fo->Write(str.c_str(), str.size()); + std::vector str; + Json::Dump(out, &str, mode); + fo->Write(str.data(), str.size()); + }; + + if (ext == "json") { + save_json(std::ios::out); + } else if (ext == "ubj") { + save_json(std::ios::binary); } else { - learner->SaveModel(fo.get()); + LOG(FATAL) << "Unknown model format:" << path << ", expecting either json or ubj."; } } From 3127c66a036b63ffc62c61102d1ce7a91d6eb907 Mon Sep 17 00:00:00 2001 From: Jiaming Yuan Date: Tue, 8 Apr 2025 19:59:33 +0800 Subject: [PATCH 6/6] adaptive test. --- tests/python/test_updaters.py | 6 ------ 1 file changed, 6 deletions(-) diff --git a/tests/python/test_updaters.py b/tests/python/test_updaters.py index 3f2eb8aed52f..7f7175d149c8 100644 --- a/tests/python/test_updaters.py +++ b/tests/python/test_updaters.py @@ -411,12 +411,6 @@ def get_score(config: Dict) -> float: assert get_score(config_0) == get_score(config_1) - with pytest.warns(Warning, match="Model format is default to UBJSON"): - raw_booster = booster_1.save_raw(raw_format="deprecated") - booster_2 = xgb.Booster(model_file=raw_booster) - config_2 = json.loads(booster_2.save_config()) - assert get_score(config_1) == get_score(config_2) - raw_booster = booster_1.save_raw(raw_format="ubj") booster_2 = xgb.Booster(model_file=raw_booster) config_2 = json.loads(booster_2.save_config())
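
Usage sketch (not part of the patch series): after these changes only the JSON and UBJSON formats remain, selected by file extension or by `raw_format`. The snippet below is a minimal illustration based on the APIs exercised in the updated tests (`save_model`, `save_raw(raw_format="ubj")`, `xgb.Booster(model_file=...)`); the file names and the toy dataset are illustrative only.

    import xgboost as xgb
    from sklearn.datasets import make_regression

    # Train a small toy model (illustrative data, not from the patch).
    X, y = make_regression(n_samples=128, n_features=8, random_state=0)
    booster = xgb.train(
        {"objective": "reg:squarederror"},
        xgb.DMatrix(X, label=y),
        num_boost_round=4,
    )

    # The file extension picks the format; unknown extensions now default to UBJSON.
    booster.save_model("model.json")  # JSON text
    booster.save_model("model.ubj")   # UBJSON binary

    # Reload from file.
    reloaded = xgb.Booster(model_file="model.ubj")

    # In-memory round trip, mirroring the updated tests; "deprecated" is no longer accepted.
    raw = booster.save_raw(raw_format="ubj")
    reloaded_from_raw = xgb.Booster(model_file=raw)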