Vowpal Wabbit
#include "explore_internal.h"
Go to the source code of this file.
Namespaces
exploration
Macros
#define S_EXPLORATION_OK 0
#define E_EXPLORATION_BAD_RANGE 1
#define E_EXPLORATION_PDF_RANKING_SIZE_MISMATCH 2
Functions
template<typename It >
int exploration::generate_epsilon_greedy (float epsilon, uint32_t top_action, It pdf_first, It pdf_last)
Generates epsilon-greedy style exploration distribution. More...
template<typename InputIt , typename OutputIt >
int exploration::generate_softmax (float lambda, InputIt scores_first, InputIt scores_last, OutputIt pdf_first, OutputIt pdf_last)
Generates softmax style exploration distribution. More...
template<typename InputIt , typename OutputIt >
int exploration::generate_bag (InputIt top_actions_first, InputIt top_actions_last, OutputIt pdf_first, OutputIt pdf_last)
Generates an exploration distribution according to votes on actions. More...
template<typename It >
int exploration::enforce_minimum_probability (float minimum_uniform, bool update_zero_elements, It pdf_first, It pdf_last)
Updates the pdf to ensure each action is explored with probability at least minimum_uniform/num_actions. More...
template<typename It >
int exploration::sample_after_normalizing (uint64_t seed, It pdf_first, It pdf_last, uint32_t &chosen_index)
Sample an index from the provided pdf. If the pdf is not normalized it will be updated in-place. More...
template<typename It >
int exploration::sample_after_normalizing (const char *seed, It pdf_first, It pdf_last, uint32_t &chosen_index)
Sample an index from the provided pdf. If the pdf is not normalized it will be updated in-place. More...
template<typename ActionIt >
int exploration::swap_chosen (ActionIt action_first, ActionIt action_last, uint32_t chosen_index)
Swap the first value with the chosen index. More...
#define E_EXPLORATION_BAD_RANGE 1
Definition at line 4 of file explore.h.
Referenced by exploration::enforce_minimum_probability(), exploration::generate_bag(), exploration::generate_epsilon_greedy(), exploration::generate_softmax(), exploration::sample_after_normalizing(), exploration::swap_chosen(), and TEST().
#define E_EXPLORATION_PDF_RANKING_SIZE_MISMATCH 2
Definition at line 5 of file explore.h.
Referenced by vw_slim::vw_predict< W >::sort_by_scores().
#define S_EXPLORATION_OK 0
Definition at line 3 of file explore.h.
Referenced by exploration::enforce_minimum_probability(), exploration::generate_bag(), exploration::generate_epsilon_greedy(), exploration::generate_softmax(), VW::cb_sample_data::learn_or_predict(), exploration::sample_after_normalizing(), vw_slim::vw_predict< W >::sort_by_scores(), exploration::swap_chosen(), and TEST().