cpp/8.8.1/explore_8h_source.html

 #pragma once

 // Integer status codes for the exploration API. The functions declared in
 // namespace exploration all return int; presumably they return one of these
 // values -- confirm against the definitions in explore_internal.h.

 // Success code (by its S_ prefix and "OK" name); value 0.
 #define S_EXPLORATION_OK                             0
 // Error code; by its name it signals an invalid range. The exact triggering
 // conditions are not visible in this header -- see explore_internal.h.
 #define E_EXPLORATION_BAD_RANGE                      1
 // Error code; by its name it signals that a pdf and a ranking differ in size.
 // NOTE(review): no function declared in this header takes both a pdf and a
 // ranking, so confirm where this code is actually produced.
 #define E_EXPLORATION_PDF_RANKING_SIZE_MISMATCH      2

 #include "explore_internal.h"

 /// Public declarations of the exploration function templates. The definitions
 /// are provided by explore_internal.h. Every function returns an int;
 /// presumably one of the S_EXPLORATION_* / E_EXPLORATION_* codes defined at
 /// the top of this header -- confirm against the definitions.
 namespace exploration {
   /// Generates epsilon-greedy style exploration distribution.
   ///
   /// @param epsilon    Exploration parameter of the epsilon-greedy scheme.
   /// @param top_action Index of the top action (assumed to index into the pdf
   ///                   range -- TODO confirm).
   /// @param pdf_first  Iterator to the beginning of the pdf.
   /// @param pdf_last   Iterator to the end of the pdf (presumably one past the
   ///                   last element, as with standard iterator pairs).
   /// @return Integer status code.
   template<typename It>
   int generate_epsilon_greedy(float epsilon, uint32_t top_action, It pdf_first, It pdf_last);

   /// Generates softmax style exploration distribution.
   ///
   /// @param lambda       Softmax parameter applied to the scores (exact scaling
   ///                     semantics are defined in explore_internal.h).
   /// @param scores_first Iterator to the beginning of the input scores.
   /// @param scores_last  Iterator to the end of the input scores.
   /// @param pdf_first    Iterator to the beginning of the output pdf.
   /// @param pdf_last     Iterator to the end of the output pdf.
   /// @return Integer status code.
   template<typename InputIt, typename OutputIt>
   int generate_softmax(float lambda, InputIt scores_first, InputIt scores_last, OutputIt pdf_first, OutputIt pdf_last);

   /// Generates an exploration distribution according to votes on actions.
   ///
   /// @param top_actions_first Iterator to the beginning of the per-action votes.
   /// @param top_actions_last  Iterator to the end of the per-action votes.
   /// @param pdf_first         Iterator to the beginning of the output pdf.
   /// @param pdf_last          Iterator to the end of the output pdf.
   /// @return Integer status code.
   template<typename InputIt, typename OutputIt>
   int generate_bag(InputIt top_actions_first, InputIt top_actions_last, OutputIt pdf_first, OutputIt pdf_last);

   /// Updates the pdf to ensure each action is explored with at least
   /// minimum_uniform/num_actions.
   ///
   /// @param minimum_uniform      Total minimum mass that is divided across the
   ///                             actions (minimum_uniform/num_actions each).
   /// @param update_zero_elements Presumably controls whether entries that are
   ///                             currently zero are also raised -- confirm in
   ///                             explore_internal.h.
   /// @param pdf_first            Iterator to the beginning of the pdf.
   /// @param pdf_last             Iterator to the end of the pdf.
   /// @return Integer status code.
   template<typename It>
   int enforce_minimum_probability(float minimum_uniform, bool update_zero_elements, It pdf_first, It pdf_last);

   /// Sample an index from the provided pdf. If the pdf is not normalized it
   /// will be updated in-place.
   ///
   /// @param seed         Numeric seed for the sampling.
   /// @param pdf_first    Iterator to the beginning of the pdf.
   /// @param pdf_last     Iterator to the end of the pdf.
   /// @param chosen_index Output parameter; receives the sampled index.
   /// @return Integer status code.
   template<typename It>
   int sample_after_normalizing(uint64_t seed, It pdf_first, It pdf_last, uint32_t& chosen_index);

   /// Overload of sample_after_normalizing that takes the seed as a C string.
   /// NOTE(review): how the string is turned into a seed is not visible in this
   /// header; presumably it otherwise behaves like the uint64_t overload.
   ///
   /// @param seed         Seed given as a C string.
   /// @param pdf_first    Iterator to the beginning of the pdf.
   /// @param pdf_last     Iterator to the end of the pdf.
   /// @param chosen_index Output parameter; receives the sampled index.
   /// @return Integer status code.
   template<typename It>
   int sample_after_normalizing(const char* seed, It pdf_first, It pdf_last, uint32_t& chosen_index);

   /// Swap the first value with the chosen index.
   ///
   /// @param action_first Iterator to the beginning of the actions.
   /// @param action_last  Iterator to the end of the actions.
   /// @param chosen_index Index of the element to exchange with the first one.
   /// @return Integer status code.
   template<typename ActionIt>
   int swap_chosen(ActionIt action_first, ActionIt action_last, uint32_t chosen_index);
 }
exploration::generate_bag
int generate_bag(InputIt top_actions_first, InputIt top_actions_last, OutputIt pdf_first, OutputIt pdf_last)
Generates an exploration distribution according to votes on actions.
Definition: explore_internal.h:149

exploration
Definition: explore.h:9

exploration::sample_after_normalizing
int sample_after_normalizing(uint64_t seed, It pdf_first, It pdf_last, uint32_t &chosen_index)
Sample an index from the provided pdf. If the pdf is not normalized, it will be updated in place...
Definition: explore_internal.h:286

exploration::generate_softmax
int generate_softmax(float lambda, InputIt scores_first, InputIt scores_last, OutputIt pdf_first, OutputIt pdf_last)
Generates softmax style exploration distribution.
Definition: explore_internal.h:113

explore_internal.h

exploration::generate_epsilon_greedy
int generate_epsilon_greedy(float epsilon, uint32_t top_action, It pdf_first, It pdf_last)
Generates epsilon-greedy style exploration distribution.
Definition: explore_internal.h:61

exploration::swap_chosen
int swap_chosen(ActionIt action_first, ActionIt action_last, uint32_t chosen_index)
Swap the first value with the value at the chosen index.

exploration::enforce_minimum_probability
int enforce_minimum_probability(float minimum_uniform, bool update_zero_elements, It pdf_first, It pdf_last)
Updates the pdf to ensure each action is explored with probability at least minimum_uniform/num_actions.
Definition: explore_internal.h:226