cpp/8.8.1/gen__cs__example_8cc_source.html

 /*
   Copyright (c) by respective owners including Yahoo!, Microsoft, and
   individual contributors. All rights reserved.  Released under a BSD (revised)
   license as described in the file LICENSE.
 */
 #include <float.h>

 #include "vw.h"
 #include "reductions.h"
 #include "vw_exception.h"
 #include "gen_cs_example.h"

 namespace GEN_CS
 {
 using namespace LEARNER;
 using namespace CB_ALGS;
 using namespace CB;

 constexpr inline bool observed_cost(cb_class* cl)
 {
   // cost observed for this action if it has non zero probability and cost != FLT_MAX
   return (cl != nullptr && cl->cost != FLT_MAX && cl->probability > .0);
 }

 cb_class* get_observed_cost(CB::label& ld)
 {
   for (auto& cl : ld.costs)
     if (observed_cost(&cl))
       return &cl;
   return nullptr;
 }

 float safe_probability(float prob)
 {
   if (prob <= 0.)
   {
     std::cout << "Probability " << prob << " is not possible, replacing with 1e-3.  Fix your dataset. " << std::endl;
     return 1e-3f;
   }
   else
     return prob;
 }

 // Multiline version
 void gen_cs_example_ips(multi_ex& examples, COST_SENSITIVE::label& cs_labels, float clip_p)
 {
   cs_labels.costs.clear();
   for (uint32_t i = 0; i < examples.size(); i++)
   {
     CB::label ld = examples[i]->l.cb;

     COST_SENSITIVE::wclass wc = {0., i, 0., 0.};
     if (ld.costs.size() == 1 && ld.costs[0].cost != FLT_MAX)
       wc.x = ld.costs[0].cost / safe_probability(std::max(ld.costs[0].probability, clip_p));
     cs_labels.costs.push_back(wc);
   }
 }

 // Multiline version
 void gen_cs_example_dm(multi_ex& examples, COST_SENSITIVE::label& cs_labels)
 {
   cs_labels.costs.clear();
   for (uint32_t i = 0; i < examples.size(); i++)
   {
     CB::label ld = examples[i]->l.cb;

     COST_SENSITIVE::wclass wc = {0., i, 0., 0.};
     if (ld.costs.size() == 1 && ld.costs[0].cost != FLT_MAX)
       wc.x = ld.costs[0].cost;
     cs_labels.costs.push_back(wc);
   }
 }

 // Multiline version
 void gen_cs_test_example(multi_ex& examples, COST_SENSITIVE::label& cs_labels)
 {
   cs_labels.costs.clear();
   for (uint32_t i = 0; i < examples.size(); i++)
   {
     COST_SENSITIVE::wclass wc = {FLT_MAX, i, 0., 0.};
     cs_labels.costs.push_back(wc);
   }
 }

 // single line version
 void gen_cs_example_ips(cb_to_cs& c, CB::label& ld, COST_SENSITIVE::label& cs_ld, float clip_p)
 {
   // this implements the inverse propensity score method, where cost are importance weighted by the probability of the
   // chosen action generate cost-sensitive example
   cs_ld.costs.clear();
   if (ld.costs.size() == 0 || (ld.costs.size() == 1 && ld.costs[0].cost != FLT_MAX))
   // this is a typical example where we can perform all actions
   {
     // in this case generate cost-sensitive example with all actions
     for (uint32_t i = 1; i <= c.num_actions; i++)
     {
       COST_SENSITIVE::wclass wc = {0., i, 0., 0.};
       if (c.known_cost != nullptr && i == c.known_cost->action)
       {
         // use importance weighted cost for observed action, 0 otherwise
         wc.x = c.known_cost->cost / safe_probability(std::max(c.known_cost->probability, clip_p));

         // ips can be thought as the doubly robust method with a fixed regressor that predicts 0 costs for everything
         // update the loss of this regressor
         c.nb_ex_regressors++;
         c.avg_loss_regressors +=
             (1.0f / c.nb_ex_regressors) * ((c.known_cost->cost) * (c.known_cost->cost) - c.avg_loss_regressors);
         c.last_pred_reg = 0;
         c.last_correct_cost = c.known_cost->cost;
       }

       cs_ld.costs.push_back(wc);
     }
   }
   else  // this is an example where we can only perform a subset of the actions
   {
     // in this case generate cost-sensitive example with only allowed actions
     for (auto& cl : ld.costs)
     {
       COST_SENSITIVE::wclass wc = {0., cl.action, 0., 0.};
       if (c.known_cost != nullptr && cl.action == c.known_cost->action)
       {
         // use importance weighted cost for observed action, 0 otherwise
         wc.x = c.known_cost->cost / safe_probability(std::max(c.known_cost->probability, clip_p));

         // ips can be thought as the doubly robust method with a fixed regressor that predicts 0 costs for everything
         // update the loss of this regressor
         c.nb_ex_regressors++;
         c.avg_loss_regressors +=
             (1.0f / c.nb_ex_regressors) * ((c.known_cost->cost) * (c.known_cost->cost) - c.avg_loss_regressors);
         c.last_pred_reg = 0;
         c.last_correct_cost = c.known_cost->cost;
       }

       cs_ld.costs.push_back(wc);
     }
   }
 }

 void gen_cs_example_mtr(cb_to_cs_adf& c, multi_ex& ec_seq, COST_SENSITIVE::label& cs_labels)
 {
   c.action_sum += ec_seq.size();
   c.event_sum++;

   c.mtr_ec_seq.clear();
   cs_labels.costs.clear();
   for (size_t i = 0; i < ec_seq.size(); i++)
   {
     CB::label ld = ec_seq[i]->l.cb;

     COST_SENSITIVE::wclass wc = {0, 0, 0, 0};

     if (ld.costs.size() == 1 && ld.costs[0].cost != FLT_MAX)
     {
       wc.x = ld.costs[0].cost;
       c.mtr_example = (uint32_t)i;
       c.mtr_ec_seq.push_back(ec_seq[i]);
       cs_labels.costs.push_back(wc);
     }
   }
 }

 void gen_cs_example_sm(multi_ex&, uint32_t chosen_action, float sign_offset, ACTION_SCORE::action_scores action_vals,
     COST_SENSITIVE::label& cs_labels)
 {
   cs_labels.costs.clear();
   for (uint32_t i = 0; i < action_vals.size(); i++)
   {
     uint32_t current_action = action_vals[i].action;
     COST_SENSITIVE::wclass wc = {0., current_action, 0., 0.};

     if (current_action == chosen_action)
       wc.x = action_vals[i].score + sign_offset;
     else
       wc.x = action_vals[i].score - sign_offset;

     // TODO: This clipping is conceptually unnecessary because the example weight for this instance should be close to
     // 0.
     if (wc.x > 100.)
       wc.x = 100.0;
     if (wc.x < -100.)
       wc.x = -100.0;

     cs_labels.costs.push_back(wc);
   }
 }
 }  // namespace GEN_CS
GEN_CS::gen_cs_example_sm
void gen_cs_example_sm(multi_ex &, uint32_t chosen_action, float sign_offset, ACTION_SCORE::action_scores action_vals, COST_SENSITIVE::label &cs_labels)
Definition: gen_cs_example.cc:163

GEN_CS::cb_to_cs_adf
Definition: gen_cs_example.h:30

COST_SENSITIVE::wclass
Definition: cost_sensitive.h:15

GEN_CS::get_observed_cost
cb_class * get_observed_cost(CB::label &ld)
Definition: gen_cs_example.cc:25

GEN_CS
Definition: gen_cs_example.cc:13

CB::label::costs
v_array< cb_class > costs
Definition: cb.h:27

GEN_CS::cb_to_cs_adf::event_sum
uint64_t event_sum
Definition: gen_cs_example.h:36

prediction_type::prob
Definition: learner.h:26

COST_SENSITIVE::label
Definition: cost_sensitive.h:29

GEN_CS::gen_cs_example_dm
void gen_cs_example_dm(multi_ex &examples, COST_SENSITIVE::label &cs_labels)
Definition: gen_cs_example.cc:60

v_array::size
size_t size() const
Definition: v_array.h:68

GEN_CS::cb_to_cs::last_pred_reg
float last_pred_reg
Definition: gen_cs_example.h:24

vw_exception.h

CB::cb_class
Definition: cb.h:15

GEN_CS::cb_to_cs_adf::action_sum
uint64_t action_sum
Definition: gen_cs_example.h:35

GEN_CS::cb_to_cs::known_cost
CB::cb_class * known_cost
Definition: gen_cs_example.h:27

CB
Definition: cb.cc:15

CB::cb_class::action
uint32_t action
Definition: cb.h:18

GEN_CS::cb_to_cs::nb_ex_regressors
size_t nb_ex_regressors
Definition: gen_cs_example.h:23

CB::cb_class::probability
float probability
Definition: cb.h:19

GEN_CS::cb_to_cs_adf::mtr_example
uint32_t mtr_example
Definition: gen_cs_example.h:37

CB_ALGS
Definition: cb_algs.cc:19

GEN_CS::cb_to_cs::num_actions
uint32_t num_actions
Definition: gen_cs_example.h:19

GEN_CS::cb_to_cs
Definition: gen_cs_example.h:16

GEN_CS::cb_to_cs::avg_loss_regressors
float avg_loss_regressors
Definition: gen_cs_example.h:22

GEN_CS::observed_cost
constexpr bool observed_cost(cb_class *cl)
Definition: gen_cs_example.cc:19

GEN_CS::gen_cs_example_ips
void gen_cs_example_ips(multi_ex &examples, COST_SENSITIVE::label &cs_labels, float clip_p)
Definition: gen_cs_example.cc:45

reductions.h

multi_ex
std::vector< example * > multi_ex
Definition: example.h:122

GEN_CS::safe_probability
float safe_probability(float prob)
Definition: gen_cs_example.cc:33

GEN_CS::cb_to_cs::last_correct_cost
float last_correct_cost
Definition: gen_cs_example.h:25

CB::label
Definition: cb.h:25

CB::cb_class::cost
float cost
Definition: cb.h:17

GEN_CS::gen_cs_example_mtr
void gen_cs_example_mtr(cb_to_cs_adf &c, multi_ex &ec_seq, COST_SENSITIVE::label &cs_labels)
Definition: gen_cs_example.cc:140

vw.h

GEN_CS::cb_to_cs_adf::mtr_ec_seq
multi_ex mtr_ec_seq
Definition: gen_cs_example.h:38

COST_SENSITIVE::wclass::x
float x
Definition: cost_sensitive.h:17

LEARNER
Definition: cb_explore.h:8

COST_SENSITIVE::label::costs
v_array< wclass > costs
Definition: cost_sensitive.h:31

v_array< action_score >

gen_cs_example.h

c
constexpr uint64_t c
Definition: rand48.cc:12

GEN_CS::gen_cs_test_example
void gen_cs_test_example(multi_ex &examples, COST_SENSITIVE::label &cs_labels)
Definition: gen_cs_example.cc:75

f
float f
Definition: cache.cc:40