stable/dev/gbm_8h_source.html

 #ifndef XGBOOST_GBM_H_

 #define XGBOOST_GBM_H_


 #include <dmlc/registry.h>

 #include <xgboost/base.h>

 #include <xgboost/data.h>

 #include <xgboost/host_device_vector.h>

 #include <xgboost/model.h>


 #include <vector>

 #include <string>

 #include <functional>

 #include <memory>


 namespace xgboost {


 class Json;

 class FeatureMap;

 class ObjFunction;

 class CatContainer;


 struct Context;

 struct LearnerModelParam;

 struct PredictionCacheEntry;


 /*!
  * \brief Interface of a gradient boosting model.
  *
  * Abstract base class: most members are pure virtual and must be provided by a concrete
  * booster. Optional capabilities (Slice, InplacePredict, Cats) have default bodies that
  * report a fatal error through LOG(FATAL).
  */
 class GradientBooster : public Model, public Configurable {
  protected:
   /*! \brief Runtime context passed to the constructor. Stored as a raw pointer; the
    *  defaulted destructor does not free it. */
   Context const* ctx_;

   /*!
    * \brief Store the context pointer. Protected, so only derived classes can construct.
    * \param ctx Runtime context to remember in ctx_.
    */
   explicit GradientBooster(Context const* ctx) : ctx_{ctx} {}

  public:
   /*! \brief Virtual destructor. */
   ~GradientBooster() override = default;

   /*!
    * \brief Set the configuration of gradient boosting.
    * \param cfg Configuration entries (Args).
    */
   virtual void Configure(Args const& cfg) = 0;

   /*!
    * \brief Slice the model using boosting index.
    *
    * The default implementation ignores all arguments and reports a fatal error; boosters
    * that support slicing override it. The parameters are unnamed here; their commented
    * names are begin, end, step, out and out_of_bound.
    */
   virtual void Slice(bst_layer_t /*begin*/, bst_layer_t /*end*/, bst_layer_t /*step*/,
                      GradientBooster* /*out*/, bool* /*out_of_bound*/) const {
     LOG(FATAL) << "当前增强器不支持切片操作。";
   }

   /*! \brief Return the number of boosted rounds. */
   [[nodiscard]] virtual std::int32_t BoostedRounds() const = 0;

   /*! \brief Whether the model has already been trained. */
   [[nodiscard]] virtual bool ModelFitted() const = 0;

   /*!
    * \brief Perform an update (boosting) step on the model.
    * \param p_fmat   Feature matrix.
    * \param in_gpair Matrix of gradient pairs.
    * \param obj      Objective function; may not be modified through this pointer.
    *
    * The third parameter (PredictionCacheEntry*) is unnamed in this declaration.
    */
   virtual void DoBoost(DMatrix* p_fmat, linalg::Matrix<GradientPair>* in_gpair,
                        PredictionCacheEntry*, ObjFunction const* obj) = 0;

   /*!
    * \brief Generate predictions for the given feature matrix.
    * \param dmat      Feature matrix.
    * \param out_preds Output prediction entry.
    * \param training  Training flag forwarded to the implementation.
    * \param begin     First boosting layer of the range.
    * \param end       End boosting layer of the range.
    */
   virtual void PredictBatch(DMatrix* dmat, PredictionCacheEntry* out_preds, bool training,
                             bst_layer_t begin, bst_layer_t end) = 0;

   /*!
    * \brief Inplace prediction.
    *
    * The default implementation ignores all arguments and reports a fatal error; boosters
    * that support inplace prediction override it.
    */
   virtual void InplacePredict(std::shared_ptr<DMatrix>, float, PredictionCacheEntry*, bst_layer_t,
                               bst_layer_t) const {
     LOG(FATAL) << "当前增强器不支持原地预测。";
   }

   /*!
    * \brief Predict the leaf index of each tree; the output is an nsample * ntree vector.
    * \param dmat        Feature matrix.
    * \param out_preds   Output vector.
    * \param layer_begin First boosting layer of the range.
    * \param layer_end   End boosting layer of the range.
    *
    * NOTE(review): the layer bounds are `unsigned` here, whereas the sibling prediction
    * methods use bst_layer_t (std::int32_t). Changing it would break overriders.
    */
   virtual void PredictLeaf(DMatrix* dmat, HostDeviceVector<bst_float>* out_preds,
                            unsigned layer_begin, unsigned layer_end) = 0;

   /*!
    * \brief Feature contributions to individual predictions.
    * \param dmat         Feature matrix.
    * \param out_contribs Output vector of contributions.
    * \param layer_begin  First boosting layer of the range.
    * \param layer_end    End boosting layer of the range.
    * \param approximate  Defaults to false.
    */
   virtual void PredictContribution(DMatrix* dmat, HostDeviceVector<float>* out_contribs,
                                    bst_layer_t layer_begin, bst_layer_t layer_end,
                                    bool approximate = false) = 0;

   /*!
    * \brief Interaction contributions; presumably the pairwise counterpart of
    *        PredictContribution (TODO confirm against implementations).
    *
    * Takes the same parameters as PredictContribution, except that `approximate` has no
    * default value here.
    */
   virtual void PredictInteractionContributions(DMatrix* dmat,
                                                HostDeviceVector<float>* out_contribs,
                                                bst_layer_t layer_begin, bst_layer_t layer_end,
                                                bool approximate) = 0;

   /*!
    * \brief Dump the model in the requested format.
    * \param fmap       Feature map used to assist the text dump.
    * \param with_stats Flag forwarded to the implementation.
    * \param format     Name of the requested format.
    * \return One string per dumped unit, as produced by the implementation.
    */
   [[nodiscard]] virtual std::vector<std::string> DumpModel(const FeatureMap& fmap,
                                                            bool with_stats,
                                                            std::string format) const = 0;

   /*!
    * \brief Feature score query; results are written through the two output pointers.
    * \param importance_type Name of the importance type.
    * \param trees           Span of tree indices.
    * \param features        Output: feature indices.
    * \param scores          Output: scores.
    */
   virtual void FeatureScore(std::string const& importance_type,
                             common::Span<int32_t const> trees,
                             std::vector<bst_feature_t>* features,
                             std::vector<float>* scores) const = 0;

   /*!
    * \brief Getter for categories.
    *
    * The default implementation reports a fatal error. The trailing `return nullptr`
    * gives the function a return value on every path.
    */
   [[nodiscard]] virtual CatContainer const* Cats() const {
     LOG(FATAL) << "当前增强器不支持获取类别。";
     return nullptr;
   }

   /*!
    * \brief Create a gradient booster from the given name.
    * \param name                Name of the gradient booster.
    * \param ctx                 Runtime context.
    * \param learner_model_param Learner model parameter.
    * \return Raw pointer to the created booster.
    */
   static GradientBooster* Create(const std::string& name, Context const* ctx,
                                  LearnerModelParam const* learner_model_param);
 };


 /*!
  * \brief Registry entry for gradient boosters.
  *
  * The stored callable takes (learner_model_param, ctx), in that order, and returns a raw
  * GradientBooster pointer. Note that this order differs from GradientBooster::Create,
  * which takes the context before the learner model parameter.
  */
 struct GradientBoosterReg
     : dmlc::FunctionRegEntryBase<
           GradientBoosterReg,
           std::function<GradientBooster*(LearnerModelParam const*, Context const*)>> {};


 /*!
  * \brief Register a gradient booster under the string \p Name.
  *
  * Declares a static reference named from \p UniqueId and binds it to the entry returned by
  * the GradientBoosterReg registry's __REGISTER__(Name). The expansion ends without a
  * semicolon; the use site supplies it, and may append member calls on the returned entry
  * before it.
  *
  * Every continuation line must directly follow the previous backslash: a blank line after
  * a backslash ends the macro definition early.
  *
  * \param UniqueId Token pasted into the variable name; must be unique per translation unit.
  * \param Name     Name under which the booster is registered.
  */
 #define XGBOOST_REGISTER_GBM(UniqueId, Name)                          \
   static DMLC_ATTRIBUTE_UNUSED ::xgboost::GradientBoosterReg &        \
   __make_ ## GradientBoosterReg ## _ ## UniqueId ## __ =              \
   ::dmlc::Registry< ::xgboost::GradientBoosterReg>::Get()->__REGISTER__(Name)


 } // namespace xgboost

 #endif // XGBOOST_GBM_H_

base.h
为 xgboost 定义配置宏和基本类型。

xgboost::DMatrix
内部数据结构，由XGBoost用于保存所有外部数据。
定义： data.h:573

xgboost::FeatureMap
特征映射数据结构，用于辅助文本模型转储。TODO(tqchen) 考虑使其更轻量级...
定义： feature_map.h:22

xgboost::GradientBooster
梯度提升模型的接口。
定义： gbm.h:36

xgboost::GradientBooster::~GradientBooster
~GradientBooster() override=default
虚析构函数

xgboost::GradientBooster::GradientBooster
GradientBooster(Context const *ctx)
定义： gbm.h:39

xgboost::GradientBooster::BoostedRounds
virtual std::int32_t BoostedRounds() const =0
返回已提升的轮数。

xgboost::GradientBooster::PredictLeaf
virtual void PredictLeaf(DMatrix *dmat, HostDeviceVector< bst_float > *out_preds, unsigned layer_begin, unsigned layer_end)=0
预测每棵树的叶子索引，输出将是 nsample * ntree 向量，这仅在...时有效。

xgboost::GradientBooster::DumpModel
virtual std::vector< std::string > DumpModel(const FeatureMap &fmap, bool with_stats, std::string format) const =0
以请求的格式转储模型

xgboost::GradientBooster::PredictInteractionContributions
virtual void PredictInteractionContributions(DMatrix *dmat, HostDeviceVector< float > *out_contribs, bst_layer_t layer_begin, bst_layer_t layer_end, bool approximate)=0

xgboost::GradientBooster::Configure
virtual void Configure(Args const &cfg)=0
设置梯度提升的配置。用户必须在 InitModel 和 Traini... 之前调用一次 configure。

xgboost::GradientBooster::InplacePredict
virtual void InplacePredict(std::shared_ptr< DMatrix >, float, PredictionCacheEntry *, bst_layer_t, bst_layer_t) const
原地预测。
定义： gbm.h:106

xgboost::GradientBooster::Create
static GradientBooster * Create(const std::string &name, Context const *ctx, LearnerModelParam const *learner_model_param)
从给定名称创建一个梯度提升器

xgboost::GradientBooster::FeatureScore
virtual void FeatureScore(std::string const &importance_type, common::Span< int32_t const > trees, std::vector< bst_feature_t > *features, std::vector< float > *scores) const =0

xgboost::GradientBooster::ModelFitted
virtual bool ModelFitted() const =0
模型是否已经训练。当选择树增强器时，当...时返回 true。

xgboost::GradientBooster::PredictContribution
virtual void PredictContribution(DMatrix *dmat, HostDeviceVector< float > *out_contribs, bst_layer_t layer_begin, bst_layer_t layer_end, bool approximate=false)=0
特征对个体预测的贡献；输出将是一个长度为 (nfeats + 1) *... 的向量。

xgboost::GradientBooster::DoBoost
virtual void DoBoost(DMatrix *p_fmat, linalg::Matrix< GradientPair > *in_gpair, PredictionCacheEntry *, ObjFunction const *obj)=0
对模型进行更新（提升）

xgboost::GradientBooster::ctx_
Context const * ctx_
定义： gbm.h:38

xgboost::GradientBooster::Cats
virtual CatContainer const * Cats() const
类别的 Getter。
定义： gbm.h:156

xgboost::GradientBooster::PredictBatch
virtual void PredictBatch(DMatrix *dmat, PredictionCacheEntry *out_preds, bool training, bst_layer_t begin, bst_layer_t end)=0
为给定的特征矩阵生成预测。

xgboost::GradientBooster::Slice
virtual void Slice(bst_layer_t, bst_layer_t, bst_layer_t, GradientBooster *, bool *) const
使用 boosting 索引对模型进行切片。切片 m:n 表示获取在...期间拟合的所有树。
定义： gbm.h:59

xgboost::HostDeviceVector< bst_float >

xgboost::ObjFunction
目标函数的接口。
定义： objective.h:28

xgboost::common::Span
span 类实现，基于 ISO C++20 的 span<T>。接口应保持一致。
定义： span.h:431

xgboost::linalg::Tensor
一个张量存储。要将其用于切片等其他功能，首先需要获取一个视图...
定义： linalg.h:745

data.h
xgboost 的输入数据结构。

host_device_vector.h
设备与主机向量抽象层。

model.h
定义 XGBoost 中不同组件的抽象接口。

xgboost
集成目标函数、gbm 和评估的学习器接口。这是面向用户的 XGB...
定义： base.h:97

xgboost::Args
std::vector< std::pair< std::string, std::string > > Args
定义： base.h:324

xgboost::bst_layer_t
std::int32_t bst_layer_t
用于索引提升层的类型。
定义： base.h:131

xgboost::Configurable
定义： model.h:28

xgboost::Context
XGBoost的运行时上下文。包含线程和设备等信息。
定义： context.h:133

xgboost::GradientBoosterReg
梯度提升器的注册表项。
定义： gbm.h:178

xgboost::LearnerModelParam
基本的模型参数，用于描述提升器。
定义： learner.h:297

xgboost::Model
定义： model.h:14

xgboost::PredictionCacheEntry
包含指向输入矩阵和相关缓存预测的指针。
定义： predictor.h:30