xgboost
predictor.h
Go to the documentation of this file.
1 
7 #pragma once
8 #include <dmlc/registry.h> // for FunctionRegEntryBase
9 #include <xgboost/base.h> // for bst_tree_t
10 #include <xgboost/cache.h> // for DMatrixCache
11 #include <xgboost/context.h> // for Context
12 #include <xgboost/context.h>
13 #include <xgboost/data.h>
15 
16 #include <functional> // for function
17 #include <memory> // for shared_ptr
18 #include <string>
19 #include <vector>
20 
// Forward declaration: this header only refers to GBTreeModel by reference in
// the Predictor interface, so the complete type is not required here.
namespace xgboost::gbm {
struct GBTreeModel;
}  // namespace xgboost::gbm
25 
26 namespace xgboost {
31  // A storage for caching prediction values
33  // The version of current cache, corresponding number of layers of trees
34  std::uint32_t version{0};
35 
36  PredictionCacheEntry() = default;
42  void Update(std::uint32_t v) { version += v; }
43  void Reset() { version = 0; }
44 };
45 
49 class PredictionContainer : public DMatrixCache<PredictionCacheEntry> {
50  // We cache up to 64 DMatrix for all threads
51  std::size_t static constexpr DefaultSize() { return 64; }
52 
53  public:
55  std::shared_ptr<PredictionCacheEntry> Cache(std::shared_ptr<DMatrix> m, DeviceOrd device) {
56  auto p_cache = this->CacheItem(m);
57  if (!device.IsCPU()) {
58  p_cache->predictions.SetDevice(device);
59  }
60  return p_cache;
61  }
62 };
63 
72 class Predictor {
73  protected:
74  Context const* ctx_;
75 
76  public:
77  explicit Predictor(Context const* ctx) : ctx_{ctx} {}
78 
79  virtual ~Predictor() = default;
80 
86  virtual void Configure(Args const&);
87 
95  virtual void InitOutPredictions(const MetaInfo& info, HostDeviceVector<float>* out_predt,
96  const gbm::GBTreeModel& model) const;
97 
108  virtual void PredictBatch(DMatrix* dmat, PredictionCacheEntry* out_preds,
109  gbm::GBTreeModel const& model, bst_tree_t tree_begin,
110  bst_tree_t tree_end = 0,
111  std::vector<float> const* tree_weights = nullptr) const = 0;
112 
126  virtual bool InplacePredict(std::shared_ptr<DMatrix> p_fmat, const gbm::GBTreeModel& model,
127  float missing, PredictionCacheEntry* out_preds,
128  bst_tree_t tree_begin = 0, bst_tree_t tree_end = 0,
129  std::vector<float> const* tree_weights = nullptr) const = 0;
130 
141  virtual void PredictLeaf(DMatrix* dmat, HostDeviceVector<float>* out_preds,
142  gbm::GBTreeModel const& model, bst_tree_t tree_end = 0) const = 0;
143 
159  virtual void PredictContribution(DMatrix* dmat, HostDeviceVector<float>* out_contribs,
160  gbm::GBTreeModel const& model, bst_tree_t tree_end = 0,
161  std::vector<float> const* tree_weights = nullptr,
162  bool approximate = false, int condition = 0,
163  unsigned condition_feature = 0) const = 0;
164 
166  gbm::GBTreeModel const& model,
167  bst_tree_t tree_end = 0,
168  std::vector<float> const* tree_weights = nullptr,
169  bool approximate = false) const = 0;
170 
177  static Predictor* Create(std::string const& name, Context const* ctx);
178 };
179 
184  : public dmlc::FunctionRegEntryBase<PredictorReg, std::function<Predictor*(Context const*)>> {};
185 
/**
 * @brief Register a predictor under `Name` in the dmlc registry.
 *
 * Expands to a file-static reference, named after `UniqueId`, bound to the
 * PredictorReg entry returned by `__REGISTER__(Name)`. The expansion has no
 * trailing semicolon, so the call site can continue the expression on the
 * returned entry and must terminate the statement itself.
 */
#define XGBOOST_REGISTER_PREDICTOR(UniqueId, Name) \
  static DMLC_ATTRIBUTE_UNUSED ::xgboost::PredictorReg& __make_##PredictorReg##_##UniqueId##__ = \
      ::dmlc::Registry<::xgboost::PredictorReg>::Get()->__REGISTER__(Name)
189 } // namespace xgboost
Defines configuration macros and basic types for xgboost.
Thread-aware FIFO cache for DMatrix related data.
Definition: cache.h:26
std::shared_ptr< PredictionCacheEntry > CacheItem(std::shared_ptr< DMatrix > m, Args const &... args)
Cache a new DMatrix if it's not in the cache already.
Definition: cache.h:145
Internal data structure used by XGBoost to hold all external data.
Definition: data.h:577
Meta information about the dataset; always resides in memory.
Definition: data.h:67
A container for managed prediction caches.
Definition: predictor.h:49
std::shared_ptr< PredictionCacheEntry > Cache(std::shared_ptr< DMatrix > m, DeviceOrd device)
Definition: predictor.h:55
PredictionContainer()
Definition: predictor.h:54
Performs prediction on individual training instances or batches of instances for GBTree....
Definition: predictor.h:72
virtual void InitOutPredictions(const MetaInfo &info, HostDeviceVector< float > *out_predt, const gbm::GBTreeModel &model) const
Initialize output prediction.
virtual void Configure(Args const &)
Configure and register input matrices in prediction cache.
Predictor(Context const *ctx)
Definition: predictor.h:77
virtual void PredictContribution(DMatrix *dmat, HostDeviceVector< float > *out_contribs, gbm::GBTreeModel const &model, bst_tree_t tree_end=0, std::vector< float > const *tree_weights=nullptr, bool approximate=false, int condition=0, unsigned condition_feature=0) const =0
feature contributions to individual predictions; the output will be a vector of length (nfeats + 1) *...
Context const * ctx_
Definition: predictor.h:74
virtual void PredictBatch(DMatrix *dmat, PredictionCacheEntry *out_preds, gbm::GBTreeModel const &model, bst_tree_t tree_begin, bst_tree_t tree_end=0, std::vector< float > const *tree_weights=nullptr) const =0
Generate batch predictions for a given feature matrix. May use cached predictions if available instea...
static Predictor * Create(std::string const &name, Context const *ctx)
Creates a new Predictor*.
virtual ~Predictor()=default
virtual void PredictLeaf(DMatrix *dmat, HostDeviceVector< float > *out_preds, gbm::GBTreeModel const &model, bst_tree_t tree_end=0) const =0
Predict the leaf index of each tree; the output will be an nsample * ntree vector. This is only valid in ...
virtual void PredictInteractionContributions(DMatrix *dmat, HostDeviceVector< float > *out_contribs, gbm::GBTreeModel const &model, bst_tree_t tree_end=0, std::vector< float > const *tree_weights=nullptr, bool approximate=false) const =0
virtual bool InplacePredict(std::shared_ptr< DMatrix > p_fmat, const gbm::GBTreeModel &model, float missing, PredictionCacheEntry *out_preds, bst_tree_t tree_begin=0, bst_tree_t tree_end=0, std::vector< float > const *tree_weights=nullptr) const =0
Inplace prediction.
The input data structure of xgboost.
A device-and-host vector abstraction layer.
Definition: linear_updater.h:23
Learner interface that integrates objective, gbm and evaluation together. This is the user facing XGB...
Definition: base.h:89
std::vector< std::pair< std::string, std::string > > Args
Definition: base.h:306
std::int32_t bst_tree_t
Type for indexing trees.
Definition: base.h:127
Runtime context for XGBoost. Contains information like threads and device.
Definition: context.h:142
A type for device ordinal. The type is packed into 32-bit for efficient use in viewing types like lin...
Definition: context.h:40
bool IsCPU() const
Definition: context.h:56
Contains pointer to input matrix and associated cached predictions.
Definition: predictor.h:30
std::uint32_t version
Definition: predictor.h:34
HostDeviceVector< float > predictions
Definition: predictor.h:32
void Reset()
Definition: predictor.h:43
void Update(std::uint32_t v)
Update the cache entry by number of versions.
Definition: predictor.h:42
Registry entry for predictor.
Definition: predictor.h:184