#include <netdb.h>
#include "reductions.h"
#include "gd.h"

Classes
struct	mf

Functions
template<bool cache_sub_predictions>
void	predict (mf &data, single_learner &base, example &ec)

void	learn (mf &data, single_learner &base, example &ec)

void	finish (mf &o)

base_learner *	mf_setup (options_i &options, vw &all)

Function Documentation

◆ finish()

void finish ( mf & o )

Definition at line 189 of file mf.cc.

References mf::all, mf::pairs, and vw::pairs.

Referenced by mf_setup().

 {
   // restore global pairs
   o.all->pairs = o.pairs;
 }

◆ learn()

void learn	(	mf &	data,
		single_learner &	base,
		example &	ec
	)

Definition at line 111 of file mf.cc.

References v_array< T >::clear(), copy_array(), features::deep_copy_from(), example_predict::feature_space, example_predict::indices, example::pred, v_array< T >::push_back(), polyprediction::scalar, features::size(), example::updated_prediction, and features::values.

Referenced by mf_setup().

 {
   // predict with current weights
   predict<true>(data, base, ec);
   float predicted = ec.pred.scalar;
 
   // update linear weights
   base.update(ec);
   ec.pred.scalar = ec.updated_prediction;
 
   // store namespace indices
   copy_array(data.indices, ec.indices);
 
   // erase indices
   ec.indices.clear();
   ec.indices.push_back(0);
 
   // update interaction terms
   // looping over all pairs of non-empty namespaces
   for (std::string& i : data.pairs)
   {
     int left_ns = (int)i[0];
     int right_ns = (int)i[1];
 
     if (ec.feature_space[left_ns].size() > 0 && ec.feature_space[right_ns].size() > 0)
     {
       // set example to left namespace only
       ec.indices[0] = left_ns;
 
       // store feature values in left namespace
       data.temp_features.deep_copy_from(ec.feature_space[left_ns]);
 
       for (size_t k = 1; k <= data.rank; k++)
       {
         features& fs = ec.feature_space[left_ns];
         // multiply features in left namespace by r^k * x_r
         for (size_t i = 0; i < fs.size(); ++i) fs.values[i] *= data.sub_predictions[2 * k];
 
         // update l^k using base learner
         base.update(ec, k);
 
         // restore left namespace features (undoing multiply)
         fs.deep_copy_from(data.temp_features);
 
         // compute new l_k * x_l scaling factors
         // base.predict(ec, k);
         // data.sub_predictions[2*k-1] = ec.partial_prediction;
         // ec.pred.scalar = ec.updated_prediction;
       }
 
       // set example to right namespace only
       ec.indices[0] = right_ns;
 
       // store feature values for right namespace
       data.temp_features.deep_copy_from(ec.feature_space[right_ns]);
 
       for (size_t k = 1; k <= data.rank; k++)
       {
         features& fs = ec.feature_space[right_ns];
         // multiply features in right namespace by l^k * x_l
         for (size_t i = 0; i < fs.size(); ++i) fs.values[i] *= data.sub_predictions[2 * k - 1];
 
         // update r^k using base learner
         base.update(ec, k + data.rank);
         ec.pred.scalar = ec.updated_prediction;
 
         // restore right namespace features
         fs.deep_copy_from(data.temp_features);
       }
     }
   }
   // restore namespace indices
   copy_array(ec.indices, data.indices);
 
   // restore original prediction
   ec.pred.scalar = predicted;
 }

◆ mf_setup()

base_learner* mf_setup	(	options_i &	options,
		vw &	all
	)

Definition at line 195 of file mf.cc.

References VW::config::options_i::add_and_parse(), LEARNER::as_singleline(), finish(), LEARNER::init_learner(), learn(), LEARNER::make_base(), VW::config::make_option(), vw::pairs, vw::random_positive_weights, LEARNER::learner< T, E >::set_finish(), setup_base(), and VW::config::options_i::was_supplied().

Referenced by parse_reductions().

 {
   auto data = scoped_calloc_or_throw<mf>();
   option_group_definition new_options("Matrix Factorization Reduction");
   new_options.add(make_option("new_mf", data->rank).keep().help("rank for reduction-based matrix factorization"));
   options.add_and_parse(new_options);
 
   if (!options.was_supplied("new_mf"))
     return nullptr;
 
   data->all = &all;
   // store global pairs in local data structure and clear global pairs
   // for eventual calls to base learner
   data->pairs = all.pairs;
   all.pairs.clear();
 
   all.random_positive_weights = true;
 
   learner<mf, example>& l =
       init_learner(data, as_singleline(setup_base(options, all)), learn, predict<false>, 2 * data->rank + 1);
   l.set_finish(finish);
   return make_base(l);
 }

◆ predict()

template<bool cache_sub_predictions>

void predict	(	mf &	data,
		single_learner &	base,
		example &	ec
	)

Definition at line 50 of file mf.cc.

References mf::all, v_array< T >::clear(), copy_array(), example_predict::feature_space, GD::finalize_prediction(), example_predict::indices, mf::pairs, example::partial_prediction, example::pred, LEARNER::learner< T, E >::predict(), mf::predict_indices, v_array< T >::push_back(), mf::rank, v_array< T >::resize(), polyprediction::scalar, vw::sd, and mf::sub_predictions.

 {
   float prediction = 0;
   if (cache_sub_predictions)
     data.sub_predictions.resize(2 * data.rank + 1);
 
   // predict from linear terms
   base.predict(ec);
 
   // store linear prediction
   if (cache_sub_predictions)
     data.sub_predictions[0] = ec.partial_prediction;
   prediction += ec.partial_prediction;
 
   // store namespace indices
   copy_array(data.predict_indices, ec.indices);
 
   // erase indices
   ec.indices.clear();
   ec.indices.push_back(0);
 
   // add interaction terms to prediction
   for (std::string& i : data.pairs)
   {
     int left_ns = (int)i[0];
     int right_ns = (int)i[1];
 
     if (ec.feature_space[left_ns].size() > 0 && ec.feature_space[right_ns].size() > 0)
     {
       for (size_t k = 1; k <= data.rank; k++)
       {
         ec.indices[0] = left_ns;
 
         // compute l^k * x_l using base learner
         base.predict(ec, k);
         float x_dot_l = ec.partial_prediction;
         if (cache_sub_predictions)
           data.sub_predictions[2 * k - 1] = x_dot_l;
 
         // set example to right namespace only
         ec.indices[0] = right_ns;
 
         // compute r^k * x_r using base learner
         base.predict(ec, k + data.rank);
         float x_dot_r = ec.partial_prediction;
         if (cache_sub_predictions)
           data.sub_predictions[2 * k] = x_dot_r;
 
         // accumulate prediction
         prediction += (x_dot_l * x_dot_r);
       }
     }
   }
   // restore namespace indices and label
   copy_array(ec.indices, data.predict_indices);
 
   // finalize prediction
   ec.partial_prediction = prediction;
   ec.pred.scalar = GD::finalize_prediction(data.all->sd, ec.partial_prediction);
 }

Classes

Functions

Function Documentation

◆ finish()

◆ learn()

◆ mf_setup()

◆ predict()