cpp/8.8.1/cb__algs_8cc_source.html

 /*
 Copyright (c) by respective owners including Yahoo!, Microsoft, and
 individual contributors. All rights reserved.  Released under a BSD (revised)
 license as described in the file LICENSE.
  */
 #include <float.h>

 #include "vw.h"
 #include "reductions.h"
 #include "cb_algs.h"
 #include "vw_exception.h"
 #include "gen_cs_example.h"

 using namespace LEARNER;
 using namespace VW::config;

 using namespace CB;
 using namespace GEN_CS;
 namespace CB_ALGS
 {
 struct cb
 {
   cb_to_cs cbcs;
   COST_SENSITIVE::label cb_cs_ld;

   ~cb()
   {
     cb_cs_ld.costs.delete_v();
     COST_SENSITIVE::cs_label.delete_label(&cbcs.pred_scores);
   }
 };

 // Tells whether a CB label carries a cost for every action it lists.
 //
 // Returns false when the label has at most one entry: that form means all actions are possible but only the
 // observed action's cost was given. Otherwise (a restricted action set, or all actions listed) returns true only
 // if no listed entry has its cost left at FLT_MAX, i.e. every listed action has a specified cost.
 bool know_all_cost_example(CB::label& ld)
 {
   const size_t num_entries = ld.costs.size();
   if (num_entries < 2)
     return false;

   // More than one action was listed, so check that each of them has a specified cost.
   for (size_t idx = 0; idx < num_entries; ++idx)
   {
     if (ld.costs[idx].cost == FLT_MAX)
       return false;
   }

   return true;
 }

 // Learn/predict entry point of the cb reduction.
 //
 // Looks up the observed cost in the example's CB label, builds a cost-sensitive label from it with gen_cs_example
 // and, unless the method is CB_TYPE_DM, runs the base learner on that cost-sensitive label and copies the
 // resulting partial predictions back into the CB label.
 //
 //   is_learn - true: call base.learn; false: call base.predict.
 //   data     - reduction state (conversion context and cost-sensitive label buffer).
 //   base     - the learner this reduction delegates to.
 //   ec       - example whose label slot is temporarily switched from ec.l.cb to ec.l.cs and then restored.
 template <bool is_learn>
 void predict_or_learn(cb& data, single_learner& base, example& ec)
 {
   cb_to_cs& ctx = data.cbcs;
   // Keep a copy of the CB label: ec.l is overwritten with the cost-sensitive label further down
   // (presumably ec.l.cb and ec.l.cs share storage - confirm against example.h).
   CB::label saved_label = ec.l.cb;

   ctx.known_cost = get_observed_cost(saved_label);
   if (ctx.known_cost != nullptr)
   {
     const auto observed_action = ctx.known_cost->action;
     // Out-of-range actions are only reported; processing continues regardless.
     if (observed_action < 1 || observed_action > ctx.num_actions)
       std::cerr << "invalid action: " << observed_action << std::endl;
   }

   // generate a cost-sensitive example to update classifiers
   gen_cs_example<is_learn>(ctx, ec, saved_label, data.cb_cs_ld);

   // For the direct method nothing more is done here.
   if (ctx.cb_type == CB_TYPE_DM)
     return;

   ec.l.cs = data.cb_cs_ld;

   if (is_learn)
     base.learn(ec);
   else
     base.predict(ec);

   // Copy the per-entry partial predictions into the CB label, then put the CB label back on the example.
   const size_t num_entries = saved_label.costs.size();
   for (size_t idx = 0; idx < num_entries; ++idx)
     saved_label.costs[idx].partial_prediction = data.cb_cs_ld.costs[idx].partial_prediction;
   ec.l.cb = saved_label;
 }

 // Predict hook registered in evaluation mode; it always throws because evaluation cannot work from a test label.
 void predict_eval(cb&, single_learner&, example&)
 {
   THROW("can not use a test label for evaluation");
 }

 // Learn hook registered in evaluation mode.
 //
 // Builds the cost-sensitive label from the logged event of the example's cb_eval label, copies the resulting
 // partial predictions into the event's cost entries, and reports the action stored in the cb_eval label as the
 // prediction. The base learner is not invoked.
 void learn_eval(cb& data, single_learner&, example& ec)
 {
   cb_to_cs& ctx = data.cbcs;
   CB_EVAL::label eval_label = ec.l.cb_eval;
   CB::label& logged_event = eval_label.event;

   ctx.known_cost = get_observed_cost(logged_event);
   gen_cs_example<true>(ctx, ec, logged_event, data.cb_cs_ld);

   const size_t num_entries = logged_event.costs.size();
   for (size_t idx = 0; idx < num_entries; ++idx)
     logged_event.costs[idx].partial_prediction = data.cb_cs_ld.costs[idx].partial_prediction;

   // The policy being evaluated supplies the action; it becomes the example's prediction.
   ec.pred.multiclass = ec.l.cb_eval.action;
 }

 // Reports one processed example: updates the shared statistics, writes the predicted action to every final
 // prediction sink, optionally writes the raw per-action partial predictions, and prints the progress line.
 //
 //   all  - global state providing the statistics (sd), the prediction sinks and the print callbacks.
 //   data - reduction state; its conversion context supplies the observed cost and predicted scores.
 //   ec   - the example that was just processed.
 //   ld   - the CB label to report on (the caller chooses between ec.l.cb and ec.l.cb_eval.event).
 void output_example(vw& all, cb& data, example& ec, CB::label& ld)
 {
   cb_to_cs& ctx = data.cbcs;

   // The loss stays at zero for test labels; otherwise it is the cost estimate of the predicted action.
   float example_loss = 0.;
   if (!CB::cb_label.test_label(&ld))
     example_loss = get_cost_estimate(ctx.known_cost, ctx.pred_scores, ec.pred.multiclass);

   all.sd->update(ec.test_only, !CB::cb_label.test_label(&ld), example_loss, 1.f, ec.num_features);

   const float predicted_action = static_cast<float>(ec.pred.multiclass);
   for (int sink : all.final_prediction_sink)
   {
     all.print(sink, predicted_action, 0, ec.tag);
   }

   if (all.raw_prediction > 0)
   {
     // Raw output format: space-separated "action:partial_prediction" pairs, one per cost entry.
     std::stringstream raw_line;
     const size_t num_entries = ld.costs.size();
     for (size_t idx = 0; idx < num_entries; ++idx)
     {
       const cb_class& entry = ld.costs[idx];
       if (idx != 0)
         raw_line << ' ';
       raw_line << entry.action << ':' << entry.partial_prediction;
     }
     all.print_text(all.raw_prediction, raw_line.str(), ec.tag);
   }

   print_update(all, CB::cb_label.test_label(&ld), ec, nullptr, false);
 }

 // Finish hook for the regular (non-eval) mode: reports the example using its CB label, then hands the example
 // back through VW::finish_example.
 void finish_example(vw& all, cb& c, example& ec)
 {
   CB::label& reported = ec.l.cb;
   output_example(all, c, ec, reported);
   VW::finish_example(all, ec);
 }

 // Finish hook for evaluation mode: reports the example using the logged event inside its cb_eval label, then
 // hands the example back through VW::finish_example.
 void eval_finish_example(vw& all, cb& c, example& ec)
 {
   CB::label& reported = ec.l.cb_eval.event;
   output_example(all, c, ec, reported);
   VW::finish_example(all, ec);
 }
 }  // namespace CB_ALGS
 using namespace CB_ALGS;
 // Sets up the contextual bandit reduction.
 //
 // Registers and parses the "cb", "cb_type" and "eval" options. Returns nullptr when "cb" was not supplied.
 // Otherwise it selects the estimation method, makes sure a "csoaa" option exists for the base setup, installs
 // the matching label parser / label type on `all`, and returns the newly created learner.
 //
 // Throws (via THROW) when "eval" is combined with cb_type "dm".
 base_learner* cb_algs_setup(options_i& options, vw& all)
 {
   auto data = scoped_calloc_or_throw<cb>();
   bool eval_mode = false;
   std::string method_name = "dr";

   option_group_definition cb_options("Contextual Bandit Options");
   cb_options.add(
       make_option("cb", data->cbcs.num_actions).keep().help("Use contextual bandit learning with <k> costs"));
   cb_options.add(
       make_option("cb_type", method_name).keep().help("contextual bandit method to use in {ips,dm,dr}"));
   cb_options.add(make_option("eval", eval_mode).help("Evaluate a policy rather than optimizing."));
   options.add_and_parse(cb_options);

   // This reduction is only active when "cb" was requested.
   if (!options.was_supplied("cb"))
     return nullptr;

   // Ensure serialization of this option in all cases.
   if (!options.was_supplied("cb_type"))
   {
     options.insert("cb_type", method_name);
     options.add_and_parse(cb_options);
   }

   cb_to_cs& ctx = data->cbcs;

   // Value forwarded to init_learner as its `ws` argument: 2 for dr (and the fallback), 1 for dm and ips.
   size_t problem_multiplier;
   if (method_name == "dr")
   {
     ctx.cb_type = CB_TYPE_DR;
     problem_multiplier = 2;
   }
   else if (method_name == "dm")
   {
     if (eval_mode)
       THROW("direct method can not be used for evaluation --- it is biased.");
     ctx.cb_type = CB_TYPE_DM;
     problem_multiplier = 1;
   }
   else if (method_name == "ips")
   {
     ctx.cb_type = CB_TYPE_IPS;
     problem_multiplier = 1;
   }
   else
   {
     // Unknown method names are not fatal: warn and fall back to dr.
     std::cerr << "warning: cb_type must be in {'ips','dm','dr'}; resetting to dr." << std::endl;
     ctx.cb_type = CB_TYPE_DR;
     problem_multiplier = 2;
   }

   // Supply "csoaa" with the number of actions unless the user already provided it.
   if (!options.was_supplied("csoaa"))
   {
     std::stringstream num_actions_text;
     num_actions_text << ctx.num_actions;
     options.insert("csoaa", num_actions_text.str());
   }

   auto base = as_singleline(setup_base(options, all));

   // Install the label parser / label type and create the learner with the hooks for the selected mode.
   learner<cb, example>* created = nullptr;
   if (eval_mode)
   {
     all.p->lp = CB_EVAL::cb_eval;
     all.label_type = label_type::cb_eval;

     created = &init_learner(data, base, learn_eval, predict_eval, problem_multiplier, prediction_type::multiclass);
     created->set_finish_example(eval_finish_example);
   }
   else
   {
     all.p->lp = CB::cb_label;
     all.label_type = label_type::cb;

     created = &init_learner(
         data, base, predict_or_learn<true>, predict_or_learn<false>, problem_multiplier, prediction_type::multiclass);
     created->set_finish_example(finish_example);
   }
   ctx.scorer = all.scorer;

   return make_base(*created);
 }
CB_EVAL::cb_eval
label_parser cb_eval
Definition: cb.cc:292

example::tag
v_array< char > tag
Definition: example.h:63

vw::raw_prediction
int raw_prediction
Definition: global_data.h:519

polyprediction::multiclass
uint32_t multiclass
Definition: example.h:49

GEN_CS::cb_to_cs::pred_scores
COST_SENSITIVE::label pred_scores
Definition: gen_cs_example.h:20

LEARNER::learner::predict
void predict(E &ec, size_t i=0)
Definition: learner.h:169

CB_TYPE_IPS
#define CB_TYPE_IPS
Definition: cb_algs.h:15

CB_ALGS::finish_example
void finish_example(vw &all, cb &c, example &ec)
Definition: cb_algs.cc:119

COST_SENSITIVE::cs_label
label_parser cs_label
Definition: cost_sensitive.cc:187

label_parser::delete_label
void(* delete_label)(void *)
Definition: label_parser.h:16

CB_ALGS::know_all_cost_example
bool know_all_cost_example(CB::label &ld)
Definition: cb_algs.cc:33

polylabel::cb
CB::label cb
Definition: example.h:31

vw::label_type
label_type::label_type_t label_type
Definition: global_data.h:550

GEN_CS
Definition: gen_cs_example.cc:13

CB_ALGS::cb::cb_cs_ld
COST_SENSITIVE::label cb_cs_ld
Definition: cb_algs.cc:24

label_parser::test_label
bool(* test_label)(void *)
Definition: label_parser.h:22

vw::final_prediction_sink
v_array< int > final_prediction_sink
Definition: global_data.h:518

CB::label::costs
v_array< cb_class > costs
Definition: cb.h:27

LEARNER::make_base
base_learner * make_base(learner< T, E > &base)
Definition: learner.h:462

VW::config::option_group_definition
Definition: options.h:85

polylabel::cb_eval
CB_EVAL::label cb_eval
Definition: example.h:33

CB_TYPE_DM
#define CB_TYPE_DM
Definition: cb_algs.h:14

VW::config::options_i::add_and_parse
virtual void add_and_parse(const option_group_definition &group)=0

loss
float loss(cbify &data, uint32_t label, uint32_t final_prediction)
Definition: cbify.cc:60

CB_ALGS::learn_eval
void learn_eval(cb &data, single_learner &, example &ec)
Definition: cb_algs.cc:77

CB_ALGS::get_cost_estimate
float get_cost_estimate(CB::cb_class *observation, uint32_t action, float offset=0.)
Definition: cb_algs.h:58

COST_SENSITIVE::label
Definition: cost_sensitive.h:29

LEARNER::learner
Definition: cb_explore.h:11

prediction_type::multiclass
Definition: learner.h:24

CB_TYPE_DR
#define CB_TYPE_DR
Definition: cb_algs.h:13

CB_EVAL::label::event
CB::label event
Definition: cb.h:42

vw_exception.h

vw
Definition: global_data.h:369

CB_ADF::get_observed_cost
CB::cb_class get_observed_cost(multi_ex &examples)
Definition: cb_adf.cc:99

vw::p
parser * p
Definition: global_data.h:377

CB::cb_class
Definition: cb.h:15

LEARNER::as_singleline
single_learner * as_singleline(learner< T, E > *l)
Definition: learner.h:476

CB::print_update
void print_update(vw &all, bool is_test, example &ec, multi_ex *ec_seq, bool action_scores)
Definition: cb.cc:180

GEN_CS::cb_to_cs::known_cost
CB::cb_class * known_cost
Definition: gen_cs_example.h:27

CB
Definition: cb.cc:15

LEARNER::learner::set_finish_example
void set_finish_example(void(*f)(vw &all, T &, E &))
Definition: learner.h:307

CB::cb_class::action
uint32_t action
Definition: cb.h:18

CB::cb_class::partial_prediction
float partial_prediction
Definition: cb.h:21

LEARNER::init_learner
learner< T, E > & init_learner(free_ptr< T > &dat, L *base, void(*learn)(T &, L &, E &), void(*predict)(T &, L &, E &), size_t ws, prediction_type::prediction_type_t pred_type)
Definition: learner.h:369

cb_algs_setup
base_learner * cb_algs_setup(options_i &options, vw &all)
Definition: cb_algs.cc:132

vw::sd
shared_data * sd
Definition: global_data.h:375

example::num_features
size_t num_features
Definition: example.h:67

VW::config::options_i::was_supplied
virtual bool was_supplied(const std::string &key)=0

CB_ALGS
Definition: cb_algs.cc:19

label_type::cb_eval
Definition: global_data.h:347

CB_ALGS::cb::~cb
~cb()
Definition: cb_algs.cc:26

GEN_CS::cb_to_cs::num_actions
uint32_t num_actions
Definition: gen_cs_example.h:19

CB_ALGS::predict_eval
void predict_eval(cb &, single_learner &, example &)
Definition: cb_algs.cc:75

VW::config::options_i
Definition: options.h:107

GEN_CS::cb_to_cs
Definition: gen_cs_example.h:16

example
Definition: example.h:54

vw::print_text
void(* print_text)(int, std::string, v_array< char >)
Definition: global_data.h:522

CB_ALGS::predict_or_learn
void predict_or_learn(cb &data, single_learner &base, example &ec)
Definition: cb_algs.cc:49

GEN_CS::cb_to_cs::scorer
LEARNER::single_learner * scorer
Definition: gen_cs_example.h:21

VW::finish_example
void finish_example(vw &, example &)
Definition: parser.cc:881

reductions.h

vw::scorer
LEARNER::single_learner * scorer
Definition: global_data.h:384

VW::config::options_i::insert
virtual void insert(const std::string &key, const std::string &value)=0

shared_data::update
void update(bool test_example, bool labeled_example, float loss, float weight, size_t num_features)
Definition: global_data.h:190

VW::config::option_group_definition::add
option_group_definition & add(T &&op)
Definition: options.h:90

add
int add(svm_params &params, svm_example *fec)
Definition: kernel_svm.cc:546

CB::cb_label
label_parser cb_label
Definition: cb.cc:167

VW::config
Definition: options.h:11

example::l
polylabel l
Definition: example.h:57

VW::config::make_option
typed_option< T > make_option(std::string name, T &location)
Definition: options.h:80

CB_ALGS::cb
Definition: cb_algs.cc:21

CB::label
Definition: cb.h:25

CB_ALGS::eval_finish_example
void eval_finish_example(vw &all, cb &c, example &ec)
Definition: cb_algs.cc:125

CB_ALGS::output_example
void output_example(vw &all, cb &data, example &ec, CB::label &ld)
Definition: cb_algs.cc:91

vw.h

test_label
bool test_label(void *v)
Definition: simple_label.cc:70

setup_base
LEARNER::base_learner * setup_base(options_i &options, vw &all)
Definition: parse_args.cc:1222

label_type::cb
Definition: global_data.h:346

CB_EVAL::label
Definition: cb.h:39

example::pred
polyprediction pred
Definition: example.h:60

LEARNER
Definition: cb_explore.h:8

cb_algs.h

LEARNER::learner::learn
void learn(E &ec, size_t i=0)
Definition: learner.h:160

CB_ALGS::cb::cbcs
cb_to_cs cbcs
Definition: cb_algs.cc:23

COST_SENSITIVE::label::costs
v_array< wclass > costs
Definition: cost_sensitive.h:31

gen_cs_example.h

THROW
#define THROW(args)
Definition: vw_exception.h:181

c
constexpr uint64_t c
Definition: rand48.cc:12

vw::print
void(* print)(int, float, float, v_array< char >)
Definition: global_data.h:521

parser::lp
label_parser lp
Definition: parser.h:102

GEN_CS::cb_to_cs::cb_type
size_t cb_type
Definition: gen_cs_example.h:18

example::test_only
bool test_only
Definition: example.h:76