Vowpal Wabbit slim predictor. Supports: regression, multi-class classification and contextual bandits. More...

#include <vw_slim_predict.h>

Public Member Functions
	vw_predict ()

int	load (const char *model, size_t length)
	Reads the Vowpal Wabbit model from the supplied buffer (produced using vw -f <modelname>) More...

bool	is_cb_explore_adf ()
	True if the model describes a contextual bandit (cb) model using action dependent features (adf) More...

bool	is_csoaa_ldf ()
	True if the model describes a cost sensitive one-against-all (csoaa). This is also true for cb_explore_adf models, as they are reduced to csoaa. More...

int	predict (example_predict &ex, float &score)
	Predicts a score (as in regression) for the provided example. More...

int	predict (example_predict &shared, example_predict *actions, size_t num_actions, std::vector< float > &out_scores)

int	predict (const char *event_id, example_predict &shared, example_predict *actions, size_t num_actions, std::vector< float > &pdf, std::vector< int > &ranking)

uint32_t	feature_index_num_bits ()

Static Public Member Functions
template<typename PdfIt , typename InputScoreIt , typename OutputIt >
static int	sort_by_scores (PdfIt pdf_first, PdfIt pdf_last, InputScoreIt scores_first, InputScoreIt scores_last, OutputIt ranking_begin, OutputIt ranking_last)

Private Attributes
std::unique_ptr< W >	_weights

std::string	_id

std::string	_version

std::string	_command_line_arguments

std::vector< std::string >	_interactions

std::array< bool, NUM_NAMESPACES >	_ignore_linear

bool	_no_constant

vw_predict_exploration	_exploration

float	_minimum_epsilon

float	_epsilon

float	_lambda

int	_bag_size

uint32_t	_num_bits

uint32_t	_stride_shift

bool	_model_loaded

Detailed Description

template<typename W>
class vw_slim::vw_predict< W >

Vowpal Wabbit slim predictor. Supports: regression, multi-class classification and contextual bandits.

Definition at line 218 of file vw_slim_predict.h.

Constructor & Destructor Documentation

◆ vw_predict()

template<typename W>

vw_slim::vw_predict< W >::vw_predict ( )

inline

Definition at line 239 of file vw_slim_predict.h.

239 : _model_loaded(false) {}

vw_slim::vw_predict::_model_loaded

bool _model_loaded

Definition: vw_slim_predict.h:236

Member Function Documentation

◆ feature_index_num_bits()

template<typename W>

uint32_t vw_slim::vw_predict< W >::feature_index_num_bits ( )

inline

Definition at line 587 of file vw_slim_predict.h.

Referenced by TEST().

587 { return _num_bits; }

vw_slim::vw_predict::_num_bits

uint32_t _num_bits

Definition: vw_slim_predict.h:233

◆ is_cb_explore_adf()

template<typename W>

bool vw_slim::vw_predict< W >::is_cb_explore_adf ( )

inline

True if the model describes a contextual bandit (cb) model using action dependent features (adf)

Returns: true if the contextual bandit predict method can be used; false otherwise.

Definition at line 385 of file vw_slim_predict.h.

Referenced by run_predict_in_memory(), and TEST_P().

385 { return _command_line_arguments.find("--cb_explore_adf") != std::string::npos; }

vw_slim::vw_predict::_command_line_arguments

std::string _command_line_arguments

Definition: vw_slim_predict.h:223

◆ is_csoaa_ldf()

template<typename W>

bool vw_slim::vw_predict< W >::is_csoaa_ldf ( )

inline

True if the model describes a cost sensitive one-against-all (csoaa). This is also true for cb_explore_adf models, as they are reduced to csoaa.

Returns: true if the csoaa predict method can be used; false otherwise.

Definition at line 394 of file vw_slim_predict.h.

394 { return _command_line_arguments.find("--csoaa_ldf") != std::string::npos; }

vw_slim::vw_predict::_command_line_arguments

std::string _command_line_arguments

Definition: vw_slim_predict.h:223

◆ load()

template<typename W>

int vw_slim::vw_predict< W >::load	(	const char *	model,
		size_t	length
	)

inline

Reads the Vowpal Wabbit model from the supplied buffer (produced using vw -f <modelname>)

Parameters

model	The binary model.
length	The length of the binary model.

Returns: int Returns 0 (S_VW_PREDICT_OK) if successful, otherwise one of the error codes (see E_VW_PREDICT_ERR_*).

Definition at line 248 of file vw_slim_predict.h.

References vw_slim::bag, vw_slim::ceil_log_2(), vw_slim::model_parser::checksum(), E_VW_PREDICT_ERR_CB_EXPLORATION_MISSING, E_VW_PREDICT_ERR_GD_RESUME_NOT_SUPPORTED, E_VW_PREDICT_ERR_HASH_SEED_NOT_SUPPORTED, E_VW_PREDICT_ERR_INVALID_MODEL, E_VW_PREDICT_ERR_INVALID_MODEL_CHECK_SUM, vw_slim::epsilon_greedy, vw_slim::find_opt(), vw_slim::find_opt_float(), vw_slim::find_opt_int(), VW::num_weights(), vw_slim::model_parser::read(), vw_slim::model_parser::read_string(), vw_slim::model_parser::read_weights(), RETURN_ON_FAIL, S_VW_PREDICT_OK, vw_slim::model_parser::skip(), and vw_slim::softmax.

Referenced by cb_data_epsilon_0_skype_jb_test_runner(), run_predict_in_memory(), TEST(), TEST_P(), and TYPED_TEST_P().

   {
     if (!model || length == 0)
       return E_VW_PREDICT_ERR_INVALID_MODEL;
 
     _model_loaded = false;
 
     // required for inline_predict
     _ignore_linear.fill(false);
 
     model_parser mp(model, length);
 
     // parser_regressor.cc: save_load_header
     RETURN_ON_FAIL(mp.read_string<false>("version", _version));
 
     // read model id
     RETURN_ON_FAIL(mp.read_string<true>("model_id", _id));
 
     RETURN_ON_FAIL(mp.skip(sizeof(char)));   // "model character"
     RETURN_ON_FAIL(mp.skip(sizeof(float)));  // "min_label"
     RETURN_ON_FAIL(mp.skip(sizeof(float)));  // "max_label"
 
     RETURN_ON_FAIL(mp.read("num_bits", _num_bits));
 
     RETURN_ON_FAIL(mp.skip(sizeof(uint32_t)));  // "lda"
 
     uint32_t ngram_len;
     RETURN_ON_FAIL(mp.read("ngram_len", ngram_len));
     mp.skip(3 * ngram_len);
 
     uint32_t skips_len;
     RETURN_ON_FAIL(mp.read("skips_len", skips_len));
     mp.skip(3 * skips_len);
 
     RETURN_ON_FAIL(mp.read_string<true>("file_options", _command_line_arguments));
 
     // command line arg parsing
     _no_constant = _command_line_arguments.find("--noconstant") != std::string::npos;
 
     // only 0-valued hash_seed supported
     int hash_seed;
     if (find_opt_int(_command_line_arguments, "--hash_seed", hash_seed) && hash_seed)
       return E_VW_PREDICT_ERR_HASH_SEED_NOT_SUPPORTED;
 
     _interactions.clear();
     find_opt(_command_line_arguments, "-q", _interactions);
     find_opt(_command_line_arguments, "--quadratic", _interactions);
     find_opt(_command_line_arguments, "--cubic", _interactions);
     find_opt(_command_line_arguments, "--interactions", _interactions);
 
     // VW performs the following transformation as a side-effect of looking for duplicates.
     // This affects how interaction hashes are generated.
     std::vector<std::string> vec_sorted;
     for (const std::string& interaction : _interactions)
     {
       std::string sorted_i(interaction);
       std::sort(std::begin(sorted_i), std::end(sorted_i));
       vec_sorted.push_back(sorted_i);
     }
     _interactions = vec_sorted;
 
     // TODO: take --cb_type dr into account
     uint64_t num_weights = 0;
 
     if (_command_line_arguments.find("--cb_explore_adf") != std::string::npos)
     {
       // parse exploration options
       if (find_opt_int(_command_line_arguments, "--bag", _bag_size))
       {
         _exploration = vw_predict_exploration::bag;
         num_weights = _bag_size;
 
         // check for additional minimum epsilon greedy
         _minimum_epsilon = 0.f;
         find_opt_float(_command_line_arguments, "--epsilon", _minimum_epsilon);
       }
       else if (_command_line_arguments.find("--softmax") != std::string::npos)
       {
         if (find_opt_float(_command_line_arguments, "--lambda", _lambda))
         {
           if (_lambda > 0)  // Lambda should always be negative because we are using a cost basis.
             _lambda = -_lambda;
           _exploration = vw_predict_exploration::softmax;
         }
       }
       else if (find_opt_float(_command_line_arguments, "--epsilon", _epsilon))
         _exploration = vw_predict_exploration::epsilon_greedy;
       else
         return E_VW_PREDICT_ERR_CB_EXPLORATION_MISSING;
     }
 
     // VW style check_sum validation
     uint32_t check_sum_computed = mp.checksum();
 
     // perform check sum check
     uint32_t check_sum_len;
     RETURN_ON_FAIL((mp.read<uint32_t, false>("check_sum_len", check_sum_len)));
     if (check_sum_len != sizeof(uint32_t))
       return E_VW_PREDICT_ERR_INVALID_MODEL;
 
     uint32_t check_sum;
     RETURN_ON_FAIL((mp.read<uint32_t, false>("check_sum", check_sum)));
 
     if (check_sum_computed != check_sum)
       return E_VW_PREDICT_ERR_INVALID_MODEL_CHECK_SUM;
 
     if (_command_line_arguments.find("--cb_adf") != std::string::npos)
     {
       RETURN_ON_FAIL(mp.skip(sizeof(uint64_t)));  // cb_adf.cc: event_sum
       RETURN_ON_FAIL(mp.skip(sizeof(uint64_t)));  // cb_adf.cc: action_sum
     }
 
     // gd.cc: save_load
     bool gd_resume;
     RETURN_ON_FAIL(mp.read("resume", gd_resume));
     if (gd_resume)
       return E_VW_PREDICT_ERR_GD_RESUME_NOT_SUPPORTED;
 
     // read sparse weights into dense
     uint64_t weight_length = (uint64_t)1 << _num_bits;
     _stride_shift = (uint32_t)ceil_log_2(num_weights);
 
     RETURN_ON_FAIL(mp.read_weights<W>(_weights, _num_bits, _stride_shift));
 
     // TODO: check that permutations is not enabled (or parse it)
 
     _model_loaded = true;
 
     return S_VW_PREDICT_OK;
   }

◆ predict() [1/3]

template<typename W>

int vw_slim::vw_predict< W >::predict	(	example_predict &	ex,
		float &	score
	)

inline

Predicts a score (as in regression) for the provided example.

Regular regression with support for constant feature (bias term) and interactions

Parameters

ex	The example to get the prediction for.
score	The output score produced by the model.

Returns: int Returns 0 (S_VW_PREDICT_OK) if successful, otherwise one of the error codes (see E_VW_PREDICT_ERR_*).

Definition at line 405 of file vw_slim_predict.h.

References constant, constant_namespace, E_VW_PREDICT_ERR_NO_MODEL_LOADED, f, example_predict::ft_offset, and S_VW_PREDICT_OK.

Referenced by cb_data_epsilon_0_skype_jb_test_runner(), run_predict_in_memory(), TEST(), TEST_P(), and TYPED_TEST_P().

   {
     if (!_model_loaded)
       return E_VW_PREDICT_ERR_NO_MODEL_LOADED;
 
     std::unique_ptr<namespace_copy_guard> ns_copy_guard;
 
     if (!_no_constant)
     {
       // add constant feature
       ns_copy_guard = std::unique_ptr<namespace_copy_guard>(new namespace_copy_guard(ex, constant_namespace));
       ns_copy_guard->feature_push_back(1.f, (constant << _stride_shift) + ex.ft_offset);
     }
 
     score = GD::inline_predict<W>(*_weights, false, _ignore_linear, _interactions, /* permutations */ false, ex);
 
     return S_VW_PREDICT_OK;
   }

◆ predict() [2/3]

template<typename W>

int vw_slim::vw_predict< W >::predict	(	example_predict &	shared,
		example_predict *	actions,
		size_t	num_actions,
		std::vector< float > &	out_scores
	)

inline

Definition at line 425 of file vw_slim_predict.h.

References E_VW_PREDICT_ERR_NO_A_CSOAA_MODEL, E_VW_PREDICT_ERR_NO_MODEL_LOADED, example_predict::feature_space, example_predict::indices, predict(), RETURN_ON_FAIL, and S_VW_PREDICT_OK.

   {
     if (!_model_loaded)
       return E_VW_PREDICT_ERR_NO_MODEL_LOADED;
 
     if (!is_csoaa_ldf())
       return E_VW_PREDICT_ERR_NO_A_CSOAA_MODEL;
 
     out_scores.resize(num_actions);
 
     example_predict* action = actions;
     for (size_t i = 0; i < num_actions; i++, action++)
     {
       std::vector<std::unique_ptr<namespace_copy_guard>> ns_copy_guards;
 
       // shared feature copying
       for (auto ns : shared.indices)
       {
         // insert namespace
         auto ns_copy_guard = std::unique_ptr<namespace_copy_guard>(new namespace_copy_guard(*action, ns));
 
         // copy features
         for (auto fs : shared.feature_space[ns]) ns_copy_guard->feature_push_back(fs.value(), fs.index());
 
         // keep guard around
         ns_copy_guards.push_back(std::move(ns_copy_guard));
       }
 
       RETURN_ON_FAIL(predict(*action, out_scores[i]));
     }
 
     return S_VW_PREDICT_OK;
   }

◆ predict() [3/3]

template<typename W>

int vw_slim::vw_predict< W >::predict	(	const char *	event_id,
		example_predict &	shared,
		example_predict *	actions,
		size_t	num_actions,
		std::vector< float > &	pdf,
		std::vector< int > &	ranking
	)

inline

Definition at line 459 of file vw_slim_predict.h.

References vw_slim::bag, E_VW_PREDICT_ERR_NO_MODEL_LOADED, E_VW_PREDICT_ERR_NOT_A_CB_MODEL, exploration::enforce_minimum_probability(), vw_slim::epsilon_greedy, exploration::generate_bag(), exploration::generate_epsilon_greedy(), exploration::generate_softmax(), predict(), RETURN_EXPLORATION_ON_FAIL, RETURN_ON_FAIL, S_VW_PREDICT_OK, exploration::sample_after_normalizing(), and vw_slim::softmax.

   {
     if (!_model_loaded)
       return E_VW_PREDICT_ERR_NO_MODEL_LOADED;
 
     if (!is_cb_explore_adf())
       return E_VW_PREDICT_ERR_NOT_A_CB_MODEL;
 
     std::vector<float> scores;
 
     // add exploration
     pdf.resize(num_actions);
     ranking.resize(num_actions);
 
     switch (_exploration)
     {
       case vw_predict_exploration::epsilon_greedy:
       {
         // get the prediction
         RETURN_ON_FAIL(predict(shared, actions, num_actions, scores));
 
         // generate exploration distribution
         // model is trained against cost -> minimum is better
         auto top_action_iterator = std::min_element(std::begin(scores), std::end(scores));
         uint32_t top_action = (uint32_t)(top_action_iterator - std::begin(scores));
 
         RETURN_EXPLORATION_ON_FAIL(
             exploration::generate_epsilon_greedy(_epsilon, top_action, std::begin(pdf), std::end(pdf)));
         break;
       }
       case vw_predict_exploration::softmax:
       {
         // get the prediction
         RETURN_ON_FAIL(predict(shared, actions, num_actions, scores));
 
         // generate exploration distribution
         RETURN_EXPLORATION_ON_FAIL(exploration::generate_softmax(
             _lambda, std::begin(scores), std::end(scores), std::begin(pdf), std::end(pdf)));
         break;
       }
       case vw_predict_exploration::bag:
       {
         std::vector<uint32_t> top_actions(num_actions);
 
         // apply stride shifts
         std::vector<std::unique_ptr<stride_shift_guard>> stride_shift_guards;
         stride_shift_guards.push_back(
             std::unique_ptr<stride_shift_guard>(new stride_shift_guard(shared, _stride_shift)));
         example_predict* actions_end = actions + num_actions;
         for (example_predict* action = actions; action != actions_end; ++action)
           stride_shift_guards.push_back(
               std::unique_ptr<stride_shift_guard>(new stride_shift_guard(*action, _stride_shift)));
 
         for (size_t i = 0; i < _bag_size; i++)
         {
           std::vector<std::unique_ptr<feature_offset_guard>> feature_offset_guards;
           for (example_predict* action = actions; action != actions_end; ++action)
             feature_offset_guards.push_back(
                 std::unique_ptr<feature_offset_guard>(new feature_offset_guard(*action, i)));
 
           RETURN_ON_FAIL(predict(shared, actions, num_actions, scores));
 
           auto top_action_iterator = std::min_element(std::begin(scores), std::end(scores));
           uint32_t top_action = (uint32_t)(top_action_iterator - std::begin(scores));
 
           top_actions[top_action]++;
         }
 
         // generate exploration distribution
         RETURN_EXPLORATION_ON_FAIL(
             exploration::generate_bag(std::begin(top_actions), std::end(top_actions), std::begin(pdf), std::end(pdf)));
 
         if (_minimum_epsilon > 0)
           RETURN_EXPLORATION_ON_FAIL(
               exploration::enforce_minimum_probability(_minimum_epsilon, true, std::begin(pdf), std::end(pdf)));
 
         break;
       }
       default:
         return E_VW_PREDICT_ERR_NOT_A_CB_MODEL;
     }
 
     RETURN_EXPLORATION_ON_FAIL(sort_by_scores(
         std::begin(pdf), std::end(pdf), std::begin(scores), std::end(scores), std::begin(ranking), std::end(ranking)));
 
     // Sample from the pdf
     uint32_t chosen_action_idx;
     RETURN_EXPLORATION_ON_FAIL(
         exploration::sample_after_normalizing(event_id, std::begin(pdf), std::end(pdf), chosen_action_idx));
 
     // Swap top element with chosen one (unless chosen is the top)
     if (chosen_action_idx != 0)
     {
       std::iter_swap(std::begin(ranking), std::begin(ranking) + chosen_action_idx);
       std::iter_swap(std::begin(pdf), std::begin(pdf) + chosen_action_idx);
     }
 
     return S_VW_PREDICT_OK;
   }

◆ sort_by_scores()

template<typename W>

template<typename PdfIt , typename InputScoreIt , typename OutputIt >

static int vw_slim::vw_predict< W >::sort_by_scores	(	PdfIt	pdf_first,
		PdfIt	pdf_last,
		InputScoreIt	scores_first,
		InputScoreIt	scores_last,
		OutputIt	ranking_begin,
		OutputIt	ranking_last
	)

inline static

Definition at line 561 of file vw_slim_predict.h.

References E_EXPLORATION_PDF_RANKING_SIZE_MISMATCH, and S_EXPLORATION_OK.

   {
     const size_t pdf_size = pdf_last - pdf_first;
     const size_t ranking_size = ranking_last - ranking_begin;
 
     if (pdf_size != ranking_size)
       return E_EXPLORATION_PDF_RANKING_SIZE_MISMATCH;
 
     // Initialize ranking with actions 0,1,2,3 ...
     std::iota(ranking_begin, ranking_last, 0);
 
     // Pdf starts out in the same order as ranking.  Ranking and pdf should been sorted
     // in the order specified by scores.
     using CP = internal::collection_pair_iterator<OutputIt, PdfIt>;
     using Iter = typename CP::Iter;
     using Loc = typename CP::Loc;
     const Iter begin_coll(ranking_begin, pdf_first);
     const Iter end_coll(ranking_last, pdf_last);
     std::sort(begin_coll, end_coll, [&scores_first](const Loc& l, const Loc& r) {
       return scores_first[size_t(l._val1)] < scores_first[size_t(r._val1)];
     });
 
     return S_EXPLORATION_OK;
   }

Member Data Documentation

◆ _bag_size

template<typename W>

int vw_slim::vw_predict< W >::_bag_size

private

Definition at line 232 of file vw_slim_predict.h.

◆ _command_line_arguments

template<typename W>

std::string vw_slim::vw_predict< W >::_command_line_arguments

private

Definition at line 223 of file vw_slim_predict.h.

◆ _epsilon

template<typename W>

float vw_slim::vw_predict< W >::_epsilon

private

Definition at line 230 of file vw_slim_predict.h.

◆ _exploration

template<typename W>

vw_predict_exploration vw_slim::vw_predict< W >::_exploration

private

Definition at line 228 of file vw_slim_predict.h.

◆ _id

template<typename W>

std::string vw_slim::vw_predict< W >::_id

private

Definition at line 221 of file vw_slim_predict.h.

◆ _ignore_linear

template<typename W>

std::array<bool, NUM_NAMESPACES> vw_slim::vw_predict< W >::_ignore_linear

private

Definition at line 225 of file vw_slim_predict.h.

◆ _interactions

template<typename W>

std::vector<std::string> vw_slim::vw_predict< W >::_interactions

private

Definition at line 224 of file vw_slim_predict.h.

◆ _lambda

template<typename W>

float vw_slim::vw_predict< W >::_lambda

private

Definition at line 231 of file vw_slim_predict.h.

◆ _minimum_epsilon

template<typename W>

float vw_slim::vw_predict< W >::_minimum_epsilon

private

Definition at line 229 of file vw_slim_predict.h.

◆ _model_loaded

template<typename W>

bool vw_slim::vw_predict< W >::_model_loaded

private

Definition at line 236 of file vw_slim_predict.h.

◆ _no_constant

template<typename W>

bool vw_slim::vw_predict< W >::_no_constant

private

Definition at line 226 of file vw_slim_predict.h.

◆ _num_bits

template<typename W>

uint32_t vw_slim::vw_predict< W >::_num_bits

private

Definition at line 233 of file vw_slim_predict.h.

◆ _stride_shift

template<typename W>

uint32_t vw_slim::vw_predict< W >::_stride_shift

private

Definition at line 235 of file vw_slim_predict.h.

◆ _version

template<typename W>

std::string vw_slim::vw_predict< W >::_version

private

Definition at line 222 of file vw_slim_predict.h.

◆ _weights

template<typename W>

std::unique_ptr<W> vw_slim::vw_predict< W >::_weights

private

Definition at line 220 of file vw_slim_predict.h.

The documentation for this class was generated from the following file:

/mnt/c/w/linux/vowpal_wabbit/vowpalwabbit/slim/include/vw_slim_predict.h

Public Member Functions

Static Public Member Functions

Private Attributes

Detailed Description

template<typename W> class vw_slim::vw_predict< W >

Constructor & Destructor Documentation

◆ vw_predict()

Member Function Documentation

◆ feature_index_num_bits()

◆ is_cb_explore_adf()

◆ is_csoaa_ldf()

◆ load()

◆ predict() [1/3]

◆ predict() [2/3]

◆ predict() [3/3]

◆ sort_by_scores()

Member Data Documentation

◆ _bag_size

◆ _command_line_arguments

◆ _epsilon

◆ _exploration

◆ _id

◆ _ignore_linear

◆ _interactions

◆ _lambda

◆ _minimum_epsilon

◆ _model_loaded

◆ _no_constant

◆ _num_bits

◆ _stride_shift

◆ _version

◆ _weights

template<typename W>
class vw_slim::vw_predict< W >