cpp/8.8.1/cb__explore__adf__common_8h_source.html

 /*
 Copyright (c) by respective owners including Yahoo!, Microsoft, and
 individual contributors. All rights reserved.  Released under a BSD
 license as described in the file LICENSE.
 */
 #pragma once
 #include <stdint.h>
 #include <algorithm>

 // Most of these includes are required because templated functions are using the objects defined in them
 // A few options to get rid of them:
 // - Use virtual function calls in predict/learn to get rid of the templates entirely (con: virtual function calls)
 // - Cut out the portions of code that actually use the objects and put them into new functions
 //   defined in the cc file (con: can't inline those functions)
 // - templatize all input parameters (con: no type safety)
 #include "v_array.h"         // required by action_score.h
 #include "action_score.h"    // used in sort_action_probs
 #include "cb.h"              // required for CB::label
 #include "cb_adf.h"          // used for function call in predict/learn
 #include "example.h"         // used in predict
 #include "gen_cs_example.h"  // required for GEN_CS::cb_to_cs_adf
 #include "reductions_fwd.h"

 namespace VW
 {
 namespace cb_explore_adf
 {
 // Free functions
 inline void sort_action_probs(v_array<ACTION_SCORE::action_score>& probs, const std::vector<float>& scores)
 {
   // We want to preserve the score order in the returned action_probs if possible.  To do this,
   // sort top_actions and action_probs by the order induced in scores.
   std::sort(probs.begin(), probs.end(),
       [&scores](const ACTION_SCORE::action_score& as1, const ACTION_SCORE::action_score& as2) {
         if (as1.score > as2.score)
           return true;
         else if (as1.score < as2.score)
           return false;
         // equal probabilities
         if (scores[as1.action] < scores[as2.action])
           return true;
         else if (scores[as1.action] > scores[as2.action])
           return false;
         // equal probabilities and equal cost estimates
         return as1.action < as2.action;
       });
 }
 inline size_t fill_tied(v_array<ACTION_SCORE::action_score>& preds)
 {
   if (preds.size() == 0)
     return 0;
   size_t ret = 1;
   for (size_t i = 1; i < preds.size(); ++i)
     if (preds[i].score == preds[0].score)
       ++ret;
     else
       return ret;
   return ret;
 }

 // Object
 template <typename ExploreType>
 // data common to all cb_explore_adf reductions
 struct cb_explore_adf_base
 {
  private:
   CB::cb_class _known_cost;
   // used in output_example
   CB::label _action_label;
   CB::label _empty_label;
   ExploreType explore;

  public:
   template <typename... Args>
   cb_explore_adf_base(Args&&... args) : explore(std::forward<Args>(args)...)
   {
   }
   static void finish_multiline_example(vw& all, cb_explore_adf_base<ExploreType>& data, multi_ex& ec_seq);
   static void predict(cb_explore_adf_base<ExploreType>& data, LEARNER::multi_learner& base, multi_ex& examples);
   static void learn(cb_explore_adf_base<ExploreType>& data, LEARNER::multi_learner& base, multi_ex& examples);

  private:
   void output_example_seq(vw& all, multi_ex& ec_seq);
   void output_example(vw& all, multi_ex& ec_seq);
 };

 template <typename ExploreType>
 inline void cb_explore_adf_base<ExploreType>::predict(
     cb_explore_adf_base<ExploreType>& data, LEARNER::multi_learner& base, multi_ex& examples)
 {
   example* label_example = CB_ADF::test_adf_sequence(examples);
   data._known_cost = CB_ADF::get_observed_cost(examples);

   if (label_example != nullptr)
   {
     // predict path, replace the label example with an empty one
     data._action_label = label_example->l.cb;
     label_example->l.cb = data._empty_label;
   }

   data.explore.predict(base, examples);

   if (label_example != nullptr)
   {
     // predict path, restore label
     label_example->l.cb = data._action_label;
   }
 }

 template <typename ExploreType>
 inline void cb_explore_adf_base<ExploreType>::learn(
     cb_explore_adf_base<ExploreType>& data, LEARNER::multi_learner& base, multi_ex& examples)
 {
   example* label_example = CB_ADF::test_adf_sequence(examples);
   if (label_example != nullptr)
   {
     data._known_cost = CB_ADF::get_observed_cost(examples);
     // learn iff label_example != nullptr
     data.explore.learn(base, examples);
   }
   else
   {
     predict(data, base, examples);
   }
 }

 template <typename ExploreType>
 void cb_explore_adf_base<ExploreType>::output_example(vw& all, multi_ex& ec_seq)
 {
   if (ec_seq.size() <= 0)
     return;

   size_t num_features = 0;

   float loss = 0.;

   auto& ec = *ec_seq[0];
   ACTION_SCORE::action_scores preds = ec.pred.a_s;

   for (const auto& example : ec_seq)
   {
     num_features += example->num_features;
   }

   bool labeled_example = true;
   if (_known_cost.probability > 0)
   {
     for (uint32_t i = 0; i < preds.size(); i++)
     {
       float l = CB_ALGS::get_cost_estimate(&_known_cost, preds[i].action);
       loss += l * preds[i].score;
     }
   }
   else
     labeled_example = false;

   bool holdout_example = labeled_example;
   for (size_t i = 0; i < ec_seq.size(); i++) holdout_example &= ec_seq[i]->test_only;

   all.sd->update(holdout_example, labeled_example, loss, ec.weight, num_features);

   for (auto sink : all.final_prediction_sink) ACTION_SCORE::print_action_score(sink, ec.pred.a_s, ec.tag);

   if (all.raw_prediction > 0)
   {
     std::string outputString;
     std::stringstream outputStringStream(outputString);
     v_array<CB::cb_class> costs = ec.l.cb.costs;

     for (size_t i = 0; i < costs.size(); i++)
     {
       if (i > 0)
         outputStringStream << ' ';
       outputStringStream << costs[i].action << ':' << costs[i].partial_prediction;
     }
     all.print_text(all.raw_prediction, outputStringStream.str(), ec.tag);
   }

   CB::print_update(all, !labeled_example, ec, &ec_seq, true);
 }

 template <typename ExploreType>
 void cb_explore_adf_base<ExploreType>::output_example_seq(vw& all, multi_ex& ec_seq)
 {
   if (ec_seq.size() > 0)
   {
     output_example(all, ec_seq);
     if (all.raw_prediction > 0)
       all.print_text(all.raw_prediction, "", ec_seq[0]->tag);
   }
 }

 template <typename ExploreType>
 void cb_explore_adf_base<ExploreType>::finish_multiline_example(
     vw& all, cb_explore_adf_base<ExploreType>& data, multi_ex& ec_seq)
 {
   if (ec_seq.size() > 0)
   {
     data.output_example_seq(all, ec_seq);
     CB_ADF::global_print_newline(all.final_prediction_sink);
   }

   VW::finish_example(all, ec_seq);
 }
 }  // namespace cb_explore_adf
 }  // namespace VW
vw::raw_prediction
int raw_prediction
Definition: global_data.h:519

example.h

VW::cb_explore_adf::cb_explore_adf_base::learn
static void learn(cb_explore_adf_base< ExploreType > &data, LEARNER::multi_learner &base, multi_ex &examples)
Definition: cb_explore_adf_common.h:111

ACTION_SCORE::action_score::action
uint32_t action
Definition: action_score.h:6

polylabel::cb
CB::label cb
Definition: example.h:31

action_score.h

ACTION_SCORE::action_score::score
float score
Definition: action_score.h:7

vw::final_prediction_sink
v_array< int > final_prediction_sink
Definition: global_data.h:518

CB_ADF::test_adf_sequence
example * test_adf_sequence(multi_ex &ec_seq)
Definition: cb_adf.cc:268

action
uint32_t action
Definition: search.h:19

std
Definition: options_boost_po.h:17

loss
float loss(cbify &data, uint32_t label, uint32_t final_prediction)
Definition: cbify.cc:60

VW::cb_explore_adf::cb_explore_adf_base::explore
ExploreType explore
Definition: cb_explore_adf_common.h:71

CB_ALGS::get_cost_estimate
float get_cost_estimate(CB::cb_class *observation, uint32_t action, float offset=0.)
Definition: cb_algs.h:58

LEARNER::learner
Definition: cb_explore.h:11

v_array::begin
T *& begin()
Definition: v_array.h:42

v_array::size
size_t size() const
Definition: v_array.h:68

vw
Definition: global_data.h:369

v_array.h

CB_ADF::get_observed_cost
CB::cb_class get_observed_cost(multi_ex &examples)
Definition: cb_adf.cc:99

VW::cb_explore_adf::fill_tied
size_t fill_tied(v_array< ACTION_SCORE::action_score > &preds)
Definition: cb_explore_adf_common.h:48

CB::cb_class
Definition: cb.h:15

CB::print_update
void print_update(vw &all, bool is_test, example &ec, multi_ex *ec_seq, bool action_scores)
Definition: cb.cc:180

vw::sd
shared_data * sd
Definition: global_data.h:375

CB::cb_class::probability
float probability
Definition: cb.h:19

VW::cb_explore_adf::cb_explore_adf_base::_empty_label
CB::label _empty_label
Definition: cb_explore_adf_common.h:70

ACTION_SCORE::action_score
Definition: action_score.h:4

example::num_features
size_t num_features
Definition: example.h:67

CB_ADF::global_print_newline
void global_print_newline(const v_array< int > &final_prediction_sink)
Definition: cb_adf.cc:342

VW::cb_explore_adf::cb_explore_adf_base::_action_label
CB::label _action_label
Definition: cb_explore_adf_common.h:69

example
Definition: example.h:54

VW::cb_explore_adf::cb_explore_adf_base::output_example
void output_example(vw &all, multi_ex &ec_seq)
Definition: cb_explore_adf_common.h:128

vw::print_text
void(* print_text)(int, std::string, v_array< char >)
Definition: global_data.h:522

VW::finish_example
void finish_example(vw &, example &)
Definition: parser.cc:881

v_array::end
T *& end()
Definition: v_array.h:43

reductions_fwd.h

VW::cb_explore_adf::cb_explore_adf_base::_known_cost
CB::cb_class _known_cost
Definition: cb_explore_adf_common.h:67

shared_data::update
void update(bool test_example, bool labeled_example, float loss, float weight, size_t num_features)
Definition: global_data.h:190

cb_adf.h

multi_ex
std::vector< example * > multi_ex
Definition: example.h:122

example::l
polylabel l
Definition: example.h:57

CB::label
Definition: cb.h:25

VW::cb_explore_adf::cb_explore_adf_base
Definition: cb_explore_adf_common.h:64

VW
Definition: autolink.cc:11

VW::cb_explore_adf::cb_explore_adf_base::cb_explore_adf_base
cb_explore_adf_base(Args &&... args)
Definition: cb_explore_adf_common.h:75

VW::cb_explore_adf::cb_explore_adf_base::finish_multiline_example
static void finish_multiline_example(vw &all, cb_explore_adf_base< ExploreType > &data, multi_ex &ec_seq)
Definition: cb_explore_adf_common.h:194

cb.h

VW::cb_explore_adf::cb_explore_adf_base::predict
static void predict(cb_explore_adf_base< ExploreType > &data, LEARNER::multi_learner &base, multi_ex &examples)
Definition: cb_explore_adf_common.h:88

VW::cb_explore_adf::sort_action_probs
void sort_action_probs(v_array< ACTION_SCORE::action_score > &probs, const std::vector< float > &scores)
Definition: cb_explore_adf_common.h:29

ACTION_SCORE::print_action_score
void print_action_score(int f, v_array< action_score > &a_s, v_array< char > &tag)
Definition: action_score.cc:8

v_array< ACTION_SCORE::action_score >

gen_cs_example.h

VW::cb_explore_adf::cb_explore_adf_base::output_example_seq
void output_example_seq(vw &all, multi_ex &ec_seq)
Definition: cb_explore_adf_common.h:183