cpp/8.8.1/gen__cs__example_8h_source.html

 /*
   Copyright (c) by respective owners including Yahoo!, Microsoft, and
   individual contributors. All rights reserved.  Released under a BSD (revised)
   license as described in the file LICENSE.
 */
 #pragma once
 #include <float.h>

 #include "vw.h"
 #include "reductions.h"
 #include "cb_algs.h"
 #include "vw_exception.h"

 namespace GEN_CS
 {
 // State shared by the single-example contextual-bandit -> cost-sensitive
 // conversion routines in this header (gen_cs_example_dm, gen_cs_label,
 // gen_cs_example_dr, gen_cs_example).
 struct cb_to_cs
 {
   // Selects the estimator in gen_cs_example(); compared against CB_TYPE_IPS / CB_TYPE_DM / CB_TYPE_DR.
   size_t cb_type;
   // Upper bound of the 1-based action loop used when every action is allowed.
   uint32_t num_actions;
   // Per-action predicted costs; cleared and refilled by the DM / DR generators.
   COST_SENSITIVE::label pred_scores;
   // Learner handed to CB_ALGS::get_cost_pred to obtain a cost prediction.
   LEARNER::single_learner* scorer;
   // Running average of (known cost - predicted cost)^2 over the observed actions.
   float avg_loss_regressors;
   // Number of samples folded into avg_loss_regressors.
   size_t nb_ex_regressors;
   // Prediction and observed cost recorded at the most recent update of the running average.
   float last_pred_reg;
   float last_correct_cost;

   // Observed (action, cost, probability) for the current example; the generators treat
   // nullptr as "nothing observed".
   CB::cb_class* known_cost;
 };

 // State shared by the multi-example (multi_ex) contextual-bandit -> cost-sensitive
 // conversion routines in this header.
 struct cb_to_cs_adf
 {
   // Selects the estimator in gen_cs_example(); compared against CB_TYPE_IPS / CB_TYPE_DR / CB_TYPE_MTR.
   size_t cb_type;

   // for MTR
   // NOTE(review): these four fields are not touched by any code in this header;
   // presumably maintained by gen_cs_example_mtr - confirm against its definition.
   uint64_t action_sum;
   uint64_t event_sum;
   uint32_t mtr_example;
   multi_ex mtr_ec_seq;  // shared + the one example.

   // for DR
   // Per-action predicted costs; cleared and refilled by gen_cs_example_dr.
   COST_SENSITIVE::label pred_scores;
   // Observed (action, cost, probability), held by value. gen_cs_example_dr compares
   // `action` against the example index and skips the correction when probability == -1.
   CB::cb_class known_cost;
   // Learner handed to CB_ALGS::get_cost_pred to obtain a cost prediction.
   LEARNER::single_learner* scorer;
 };

 // Declaration only; the definition is not in this header.
 // NOTE(review): presumably returns the entry of `ld` that carries an observed cost,
 // or nullptr when there is none - confirm against the definition.
 CB::cb_class* get_observed_cost(CB::label& ld);

 // Declaration only.
 // NOTE(review): presumably guards against a zero / invalid probability - confirm.
 float safe_probability(float prob);

 // Single-example IPS generator; dispatched from gen_cs_example() for CB_TYPE_IPS.
 // Fills `cs_ld` from `ld`; `clip_p` defaults to 0.
 // NOTE(review): presumably `clip_p` is a lower bound on the probability used as divisor - confirm.
 void gen_cs_example_ips(cb_to_cs& c, CB::label& ld, COST_SENSITIVE::label& cs_ld, float clip_p = 0.f);

 /**
  * Direct-method (DM) conversion of a contextual-bandit example into a
  * cost-sensitive label: every emitted cost is the regressor's prediction.
  *
  * @tparam is_learn forwarded to CB_ALGS::get_cost_pred.
  * @param c     conversion state; pred_scores is rebuilt and the regressor
  *              loss statistics are updated for the observed action.
  * @param ec    example to score; ec.pred.multiclass receives the action with
  *              the lowest predicted cost (ties go to the smaller action id).
  * @param cs_ld output cost-sensitive label; cleared, then one entry per
  *              considered action is appended.
  */
 template <bool is_learn>
 void gen_cs_example_dm(cb_to_cs& c, example& ec, COST_SENSITIVE::label& cs_ld)
 {
   // By-value copy of the CB label, exactly as before.
   CB::label ld = ec.l.cb;

   float lowest_cost = FLT_MAX;
   uint32_t best_action = 1;

   // Both outputs start out empty.
   cs_ld.costs.clear();
   c.pred_scores.costs.clear();

   // Scores one action, tracks the running minimum, updates the regressor
   // statistics when this is the observed action, and appends the result to
   // both output labels.
   auto emit_action = [&](uint32_t action) {
     COST_SENSITIVE::wclass wc = {0., action, 0., 0.};
     wc.x = CB_ALGS::get_cost_pred<is_learn>(c.scorer, c.known_cost, ec, action, 0);

     // When actions arrive in ascending order the tie clause can never fire,
     // so this single test serves both enumeration orders.
     if (wc.x < lowest_cost || (wc.x == lowest_cost && action < best_action))
     {
       lowest_cost = wc.x;
       best_action = action;
     }
     c.pred_scores.costs.push_back(wc);

     if (c.known_cost != nullptr && c.known_cost->action == action)
     {
       const float residual = c.known_cost->cost - wc.x;
       c.nb_ex_regressors++;
       c.avg_loss_regressors += (1.0f / c.nb_ex_regressors) * (residual * residual - c.avg_loss_regressors);
       c.last_pred_reg = wc.x;
       c.last_correct_cost = c.known_cost->cost;
     }

     cs_ld.costs.push_back(wc);
   };

   // An empty label, or a single entry whose cost is not FLT_MAX, means all
   // actions 1..num_actions are available.
   const bool all_actions_allowed =
       ld.costs.size() == 0 || (ld.costs.size() == 1 && ld.costs[0].cost != FLT_MAX);

   if (all_actions_allowed)
   {
     for (uint32_t action = 1; action <= c.num_actions; action++) emit_action(action);
   }
   else
   {
     // Only the actions listed in the label may be taken.
     for (auto& allowed : ld.costs) emit_action(allowed.action);
   }

   ec.pred.multiclass = best_action;
 }

 /**
  * Appends the doubly-robust cost estimate for a single action.
  *
  * The regressor's prediction is recorded in c.pred_scores. If `action` is the
  * observed one, the regressor loss statistics are updated and the prediction
  * is corrected by (observed cost - prediction) / max(probability, clip_p)
  * before the entry is appended to `cs_ld`.
  *
  * @tparam is_learn forwarded to CB_ALGS::get_cost_pred.
  * @param c      conversion state (scorer, known cost, statistics).
  * @param ec     example to score.
  * @param cs_ld  output cost-sensitive label; one entry is appended.
  * @param action action id to score.
  * @param clip_p lower bound applied to the probability used as divisor.
  */
 template <bool is_learn>
 void gen_cs_label(cb_to_cs& c, example& ec, COST_SENSITIVE::label& cs_ld, uint32_t action, float clip_p = 0.f)
 {
   COST_SENSITIVE::wclass wc = {0., action, 0., 0.};

   // Raw regressor prediction for this action.
   wc.x = CB_ALGS::get_cost_pred<is_learn>(c.scorer, c.known_cost, ec, action, c.num_actions);

   // pred_scores keeps the uncorrected prediction.
   c.pred_scores.costs.push_back(wc);

   CB::cb_class* observed = c.known_cost;
   if (observed != nullptr && observed->action == action)
   {
     const float residual = observed->cost - wc.x;

     // Running mean of the squared residual.
     c.nb_ex_regressors++;
     c.avg_loss_regressors += (1.0f / c.nb_ex_regressors) * (residual * residual - c.avg_loss_regressors);
     c.last_pred_reg = wc.x;
     c.last_correct_cost = observed->cost;

     // Importance-weighted correction of the prediction.
     wc.x += residual / std::max(observed->probability, clip_p);
   }

   cs_ld.costs.push_back(wc);
 }

 /**
  * Doubly-robust (DR) conversion of a single contextual-bandit example into a
  * cost-sensitive label.
  *
  *  - empty `ld` (test example): every action 1..num_actions gets cost FLT_MAX;
  *  - exactly one entry whose cost is not FLT_MAX: all actions 1..num_actions
  *    are scored through gen_cs_label;
  *  - otherwise: only the actions listed in `ld` are scored.
  *
  * @tparam is_learn forwarded to gen_cs_label.
  * @param c      conversion state; pred_scores is cleared and rebuilt.
  * @param ec     example to score.
  * @param ld     contextual-bandit label of `ec`.
  * @param cs_ld  output cost-sensitive label; cleared and rebuilt.
  * @param clip_p lower bound on the probability used by gen_cs_label's
  *               correction. Previously accepted but silently dropped; it is
  *               now forwarded. The default of 0 matches gen_cs_label's own
  *               default, so callers that omit it see no change.
  */
 template <bool is_learn>
 void gen_cs_example_dr(cb_to_cs& c, example& ec, CB::label& ld, COST_SENSITIVE::label& cs_ld, float clip_p = 0.f)
 {
   cs_ld.costs.clear();
   c.pred_scores.costs.clear();

   if (ld.costs.size() == 0)
   {  // a test example
     for (uint32_t i = 1; i <= c.num_actions; i++)
     {  // Explicit declaration for a weak compiler.
       COST_SENSITIVE::wclass temp = {FLT_MAX, i, 0., 0.};
       cs_ld.costs.push_back(temp);
     }
   }
   else if (ld.costs.size() == 1 && ld.costs[0].cost != FLT_MAX)
   {  // this is a typical example where we can perform all actions
      // in this case generate cost-sensitive example with all actions
     for (uint32_t i = 1; i <= c.num_actions; i++) gen_cs_label<is_learn>(c, ec, cs_ld, i, clip_p);
   }
   else
   {  // this is an example where we can only perform a subset of the actions
      // in this case generate cost-sensitive example with only allowed actions
     for (auto& cl : ld.costs) gen_cs_label<is_learn>(c, ec, cs_ld, cl.action, clip_p);
   }
 }

 /**
  * Builds the cost-sensitive label for a single example using the estimator
  * selected by c.cb_type (IPS, DM or DR).
  *
  * @tparam is_learn forwarded to the DM / DR generators.
  * @param c     conversion state; cb_type picks the estimator.
  * @param ec    example to convert.
  * @param ld    contextual-bandit label of `ec`.
  * @param cs_ld output cost-sensitive label.
  * Raises via THROW when cb_type is none of the three handled values.
  */
 template <bool is_learn>
 void gen_cs_example(cb_to_cs& c, example& ec, CB::label& ld, COST_SENSITIVE::label& cs_ld)
 {
   if (c.cb_type == CB_TYPE_IPS)
   {
     gen_cs_example_ips(c, ld, cs_ld);
     return;
   }

   if (c.cb_type == CB_TYPE_DM)
   {
     gen_cs_example_dm<is_learn>(c, ec, cs_ld);
     return;
   }

   if (c.cb_type == CB_TYPE_DR)
   {
     gen_cs_example_dr<is_learn>(c, ec, ld, cs_ld);
     return;
   }

   // No estimator matched.
   THROW("Unknown cb_type specified for contextual bandit learning: " << c.cb_type);
 }

 // Multi-example (multi_ex) generators. Declarations only; the definitions are not in this header.

 // NOTE(review): presumably builds the label used at prediction time, when no cost was observed - confirm.
 void gen_cs_test_example(multi_ex& examples, COST_SENSITIVE::label& cs_labels);

 // IPS generator; dispatched from gen_cs_example(cb_to_cs_adf&, ...) for CB_TYPE_IPS. `clip_p` defaults to 0.
 void gen_cs_example_ips(multi_ex& examples, COST_SENSITIVE::label& cs_labels, float clip_p = 0.f);

 // Direct-method generator. Not dispatched from gen_cs_example(cb_to_cs_adf&, ...) in this header.
 void gen_cs_example_dm(multi_ex& examples, COST_SENSITIVE::label& cs_labels);

 // MTR generator; dispatched from gen_cs_example(cb_to_cs_adf&, ...) for CB_TYPE_MTR.
 void gen_cs_example_mtr(cb_to_cs_adf& c, multi_ex& ec_seq, COST_SENSITIVE::label& cs_labels);

 // Not referenced by any code in this header.
 // NOTE(review): `action_vals` is taken by value here - confirm whether that copy is intended.
 void gen_cs_example_sm(multi_ex& examples, uint32_t chosen_action, float sign_offset,
     ACTION_SCORE::action_scores action_vals, COST_SENSITIVE::label& cs_labels);

 /**
  * Doubly-robust (DR) conversion for a multi-example sequence.
  *
  * Every example for which CB_ALGS::example_is_newline_not_header is false
  * gets one cost entry whose class index is its position in `examples`. The
  * regressor prediction is stored in c.pred_scores. For the example whose
  * index equals c.known_cost.action, and provided known_cost.probability is
  * not -1, the prediction is corrected by
  * (cost - prediction) / max(probability, clip_p) before being appended to
  * `cs_labels`.
  *
  * @tparam is_learn forwarded to CB_ALGS::get_cost_pred.
  * @param c         conversion state; pred_scores is cleared and rebuilt.
  * @param examples  the example sequence.
  * @param cs_labels output cost-sensitive label; cleared and rebuilt.
  * @param clip_p    lower bound applied to the probability used as divisor.
  */
 template <bool is_learn>
 void gen_cs_example_dr(cb_to_cs_adf& c, multi_ex& examples, COST_SENSITIVE::label& cs_labels, float clip_p = 0.f)
 {
   c.pred_scores.costs.clear();
   cs_labels.costs.clear();

   for (size_t i = 0; i < examples.size(); i++)
   {
     if (CB_ALGS::example_is_newline_not_header(*examples[i]))
       continue;

     COST_SENSITIVE::wclass wc = {0., static_cast<uint32_t>(i), 0., 0.};

     // Evaluated once: known_cost.action is restored before it is read again.
     const bool is_logged_action = (c.known_cost.action == i);

     if (is_logged_action)
     {
       // Temporarily set the known action to 0 so that it matches the index 0
       // passed to get_cost_pred, then restore it. Kept as uint32_t so the
       // value never round-trips through a signed int.
       // num_actions should be 1 effectively.
       // get_cost_pred will use 1 for 'index-1+base'.
       const uint32_t saved_action = c.known_cost.action;
       c.known_cost.action = 0;
       wc.x = CB_ALGS::get_cost_pred<is_learn>(c.scorer, &(c.known_cost), *(examples[i]), 0, 2);
       c.known_cost.action = saved_action;
     }
     else
       wc.x = CB_ALGS::get_cost_pred<is_learn>(c.scorer, nullptr, *(examples[i]), 0, 2);

     // pred_scores keeps the uncorrected prediction.
     c.pred_scores.costs.push_back(wc);

     // add correction if we observed cost for this action and regressor is wrong
     if (is_logged_action && c.known_cost.probability != -1)
       wc.x += (c.known_cost.cost - wc.x) / std::max(c.known_cost.probability, clip_p);
     cs_labels.costs.push_back(wc);
   }
 }

 /**
  * Builds the cost-sensitive label for a multi-example sequence using the
  * estimator selected by c.cb_type (IPS, DR or MTR).
  *
  * @tparam is_learn forwarded to the DR generator.
  * @param c         conversion state; cb_type picks the estimator.
  * @param ec_seq    the example sequence.
  * @param cs_labels output cost-sensitive label.
  * Raises via THROW when cb_type is none of the three handled values.
  */
 template <bool is_learn>
 void gen_cs_example(cb_to_cs_adf& c, multi_ex& ec_seq, COST_SENSITIVE::label& cs_labels)
 {
   if (c.cb_type == CB_TYPE_IPS)
   {
     gen_cs_example_ips(ec_seq, cs_labels);
     return;
   }

   if (c.cb_type == CB_TYPE_DR)
   {
     gen_cs_example_dr<is_learn>(c, ec_seq, cs_labels);
     return;
   }

   if (c.cb_type == CB_TYPE_MTR)
   {
     gen_cs_example_mtr(c, ec_seq, cs_labels);
     return;
   }

   // No estimator matched.
   THROW("Unknown cb_type specified for contextual bandit learning: " << c.cb_type);
 }

 // Runs the cost-sensitive base learner over `examples`, temporarily replacing each
 // example's contextual-bandit label with a one-entry cost-sensitive label.
 //
 //   base              - learner invoked once on the whole sequence (learn or predict, per is_learn)
 //   examples          - the sequence; each label and ft_offset is swapped out and then restored
 //   cb_labels         - scratch buffer; cleared, then receives the original CB label of every example
 //   cs_labels         - source of costs; entry `index` is given to example `index`
 //   prepped_cs_labels - scratch buffer of per-example labels; grown to cs_labels.costs.size() + 1 if smaller
 //   offset            - ft_offset installed on every example for the duration of the base call
 //   id                - forwarded to base.learn / base.predict as int32_t
 template <bool is_learn>
 void call_cs_ldf(LEARNER::multi_learner& base, multi_ex& examples, v_array<CB::label>& cb_labels,
     COST_SENSITIVE::label& cs_labels, v_array<COST_SENSITIVE::label>& prepped_cs_labels, uint64_t offset, size_t id = 0)
 {
   cb_labels.clear();
   if (prepped_cs_labels.size() < cs_labels.costs.size() + 1)
   {
     prepped_cs_labels.resize(cs_labels.costs.size() + 1);
     // Move the end pointer to the end of the allocation.
     // NOTE(review): presumably so that size() covers every slot just allocated - confirm against v_array.
     prepped_cs_labels.end() = prepped_cs_labels.end_array;
   }

   // 1st: save cb_label (into cb_labels) and store cs_label for each example, which will be passed into base.learn.
   // also save offsets
   // NOTE(review): only the first example's offset is saved, and examples[0] is read without an
   // emptiness check - callers must pass a non-empty sequence.
   uint64_t saved_offset = examples[0]->ft_offset;
   size_t index = 0;
   for (auto ec : examples)
   {
     cb_labels.push_back(ec->l.cb);
     prepped_cs_labels[index].costs.clear();
     // NOTE(review): indexes cs_labels.costs and prepped_cs_labels by example position; this assumes
     // cs_labels.costs has at least examples.size() entries - confirm against the generators.
     prepped_cs_labels[index].costs.push_back(cs_labels.costs[index]);
     ec->l.cs = prepped_cs_labels[index++];
     ec->ft_offset = offset;
   }

   // 2nd: call base.learn or base.predict once on the whole sequence
   if (is_learn)
     base.learn(examples, (int32_t)id);
   else
     base.predict(examples, (int32_t)id);

   // 3rd: restore cb_label for each example from cb_labels
   // and restore offsets (every example receives the offset saved from examples[0])
   for (size_t i = 0; i < examples.size(); ++i)
   {
     examples[i]->l.cb = cb_labels[i];
     examples[i]->ft_offset = saved_offset;
   }
 }
 }  // namespace GEN_CS
GEN_CS::gen_cs_example_sm
void gen_cs_example_sm(multi_ex &, uint32_t chosen_action, float sign_offset, ACTION_SCORE::action_scores action_vals, COST_SENSITIVE::label &cs_labels)
Definition: gen_cs_example.cc:163

GEN_CS::cb_to_cs_adf::known_cost
CB::cb_class known_cost
Definition: gen_cs_example.h:42

v_array::resize
void resize(size_t length)
Definition: v_array.h:69

GEN_CS::call_cs_ldf
void call_cs_ldf(LEARNER::multi_learner &base, multi_ex &examples, v_array< CB::label > &cb_labels, COST_SENSITIVE::label &cs_labels, v_array< COST_SENSITIVE::label > &prepped_cs_labels, uint64_t offset, size_t id=0)
Definition: gen_cs_example.h:251

GEN_CS::cb_to_cs_adf
Definition: gen_cs_example.h:30

CB_ALGS::example_is_newline_not_header
bool example_is_newline_not_header(example const &ec)
Definition: cb_algs.h:80

polyprediction::multiclass
uint32_t multiclass
Definition: example.h:49

GEN_CS::cb_to_cs::pred_scores
COST_SENSITIVE::label pred_scores
Definition: gen_cs_example.h:20

GEN_CS::gen_cs_label
void gen_cs_label(cb_to_cs &c, example &ec, COST_SENSITIVE::label &cs_ld, uint32_t action, float clip_p=0.f)
Definition: gen_cs_example.h:124

LEARNER::learner::predict
void predict(E &ec, size_t i=0)
Definition: learner.h:169

CB_TYPE_IPS
#define CB_TYPE_IPS
Definition: cb_algs.h:15

polylabel::cb
CB::label cb
Definition: example.h:31

COST_SENSITIVE::wclass
Definition: cost_sensitive.h:15

GEN_CS::get_observed_cost
cb_class * get_observed_cost(CB::label &ld)
Definition: gen_cs_example.cc:25

GEN_CS
Definition: gen_cs_example.cc:13

CB::label::costs
v_array< cb_class > costs
Definition: cb.h:27

GEN_CS::cb_to_cs_adf::event_sum
uint64_t event_sum
Definition: gen_cs_example.h:36

action
uint32_t action
Definition: search.h:19

CB_TYPE_DM
#define CB_TYPE_DM
Definition: cb_algs.h:14

prediction_type::prob
Definition: learner.h:26

COST_SENSITIVE::label
Definition: cost_sensitive.h:29

LEARNER::learner
Definition: cb_explore.h:11

GEN_CS::gen_cs_example_dm
void gen_cs_example_dm(multi_ex &examples, COST_SENSITIVE::label &cs_labels)
Definition: gen_cs_example.cc:60

CB_TYPE_DR
#define CB_TYPE_DR
Definition: cb_algs.h:13

v_array::size
size_t size() const
Definition: v_array.h:68

GEN_CS::cb_to_cs::last_pred_reg
float last_pred_reg
Definition: gen_cs_example.h:24

vw_exception.h

GEN_CS::gen_cs_example_dr
void gen_cs_example_dr(cb_to_cs &c, example &ec, CB::label &ld, COST_SENSITIVE::label &cs_ld, float=0.f)
Definition: gen_cs_example.h:147

CB::cb_class
Definition: cb.h:15

GEN_CS::cb_to_cs_adf::action_sum
uint64_t action_sum
Definition: gen_cs_example.h:35

GEN_CS::cb_to_cs::known_cost
CB::cb_class * known_cost
Definition: gen_cs_example.h:27

CB::cb_class::action
uint32_t action
Definition: cb.h:18

v_array::push_back
void push_back(const T &new_ele)
Definition: v_array.h:107

GEN_CS::cb_to_cs::nb_ex_regressors
size_t nb_ex_regressors
Definition: gen_cs_example.h:23

CB::cb_class::probability
float probability
Definition: cb.h:19

v_array::clear
void clear()
Definition: v_array.h:88

GEN_CS::cb_to_cs_adf::mtr_example
uint32_t mtr_example
Definition: gen_cs_example.h:37

GEN_CS::cb_to_cs::num_actions
uint32_t num_actions
Definition: gen_cs_example.h:19

GEN_CS::cb_to_cs
Definition: gen_cs_example.h:16

GEN_CS::cb_to_cs::avg_loss_regressors
float avg_loss_regressors
Definition: gen_cs_example.h:22

example
Definition: example.h:54

GEN_CS::cb_to_cs::scorer
LEARNER::single_learner * scorer
Definition: gen_cs_example.h:21

GEN_CS::gen_cs_example_ips
void gen_cs_example_ips(multi_ex &examples, COST_SENSITIVE::label &cs_labels, float clip_p)
Definition: gen_cs_example.cc:45

reductions.h

v_array::end
T *& end()
Definition: v_array.h:43

GEN_CS::gen_cs_example
void gen_cs_example(cb_to_cs &c, example &ec, CB::label &ld, COST_SENSITIVE::label &cs_ld)
Definition: gen_cs_example.h:167

multi_ex
std::vector< example * > multi_ex
Definition: example.h:122

example::l
polylabel l
Definition: example.h:57

GEN_CS::safe_probability
float safe_probability(float prob)
Definition: gen_cs_example.cc:33

GEN_CS::cb_to_cs::last_correct_cost
float last_correct_cost
Definition: gen_cs_example.h:25

CB::label
Definition: cb.h:25

CB::cb_class::cost
float cost
Definition: cb.h:17

GEN_CS::gen_cs_example_mtr
void gen_cs_example_mtr(cb_to_cs_adf &c, multi_ex &ec_seq, COST_SENSITIVE::label &cs_labels)
Definition: gen_cs_example.cc:140

vw.h

GEN_CS::cb_to_cs_adf::scorer
LEARNER::single_learner * scorer
Definition: gen_cs_example.h:43

GEN_CS::cb_to_cs_adf::mtr_ec_seq
multi_ex mtr_ec_seq
Definition: gen_cs_example.h:38

COST_SENSITIVE::wclass::x
float x
Definition: cost_sensitive.h:17

example::pred
polyprediction pred
Definition: example.h:60

cb_algs.h

LEARNER::learner::learn
void learn(E &ec, size_t i=0)
Definition: learner.h:160

COST_SENSITIVE::label::costs
v_array< wclass > costs
Definition: cost_sensitive.h:31

GEN_CS::cb_to_cs_adf::cb_type
size_t cb_type
Definition: gen_cs_example.h:32

v_array< action_score >

THROW
#define THROW(args)
Definition: vw_exception.h:181

c
constexpr uint64_t c
Definition: rand48.cc:12

GEN_CS::gen_cs_test_example
void gen_cs_test_example(multi_ex &examples, COST_SENSITIVE::label &cs_labels)
Definition: gen_cs_example.cc:75

f
float f
Definition: cache.cc:40

GEN_CS::cb_to_cs_adf::pred_scores
COST_SENSITIVE::label pred_scores
Definition: gen_cs_example.h:41

v_array::end_array
T * end_array
Definition: v_array.h:38

GEN_CS::cb_to_cs::cb_type
size_t cb_type
Definition: gen_cs_example.h:18

CB_TYPE_MTR
#define CB_TYPE_MTR
Definition: cb_algs.h:16