Vowpal Wabbit
lda_core.cc
1 /*
2 Copyright (c) by respective owners including Yahoo!, Microsoft, and
3 individual contributors. All rights reserved. Released under a BSD (revised)
4 license as described in the file LICENSE.
5  */
6 #ifdef _WIN32
7 #pragma warning(disable : 4996) // generated by inner_product use
8 #endif
9 #include <fstream>
10 #include <vector>
11 #include <queue>
12 #include <algorithm>
13 #include <numeric>
14 #include <cmath>
15 #include "correctedMath.h"
16 #include "vw_versions.h"
17 #include "vw.h"
18 #include "mwt.h"
19 #include <boost/math/special_functions/digamma.hpp>
20 #include <boost/math/special_functions/gamma.hpp>
21 
22 #ifdef _WIN32
23 #define NOMINMAX
24 #include <winsock2.h>
25 #else
26 #include <netdb.h>
27 #endif
28 
29 #include <cstring>
30 #include <cstdio>
31 #include <cassert>
32 #include "no_label.h"
33 #include "gd.h"
34 #include "rand48.h"
35 #include "reductions.h"
36 #include "array_parameters.h"
37 #include <boost/version.hpp>
38 
39 #if BOOST_VERSION >= 105600
40 #include <boost/align/is_aligned.hpp>
41 #endif
42 
43 using namespace VW::config;
44 
45 enum lda_math_mode
46 {
47  USE_SIMD,
48  USE_PRECISE,
49  USE_FAST_APPROX
50 };
51 
52 class index_feature
53 {
54  public:
55  uint32_t document;
56  feature f;
57  bool operator<(const index_feature b) const { return f.weight_index < b.f.weight_index; }
58 };
59 
60 struct lda
61 {
62  size_t topics;
63  float lda_alpha;
64  float lda_rho;
65  float lda_D;
66  float lda_epsilon;
67  size_t minibatch;
68  lda_math_mode mmode;
69 
70  v_array<float> Elogtheta;
71  v_array<float> decay_levels;
72  v_array<float> total_new;
73  v_array<example *> examples;
74  v_array<float> total_lambda;
75  v_array<int> doc_lengths;
76  v_array<float> digammas;
77  v_array<float> v;
78  std::vector<index_feature> sorted_features;
79 
80  bool compute_coherence_metrics;
81 
82  // size by 1 << bits
83  std::vector<uint32_t> feature_counts;
84  std::vector<std::vector<size_t>> feature_to_example_map;
85 
86  bool total_lambda_init;
87 
88  double example_t;
89  vw *all; // regressor, lda
90 
91  static constexpr float underflow_threshold = 1.0e-10f;
92  inline float digamma(float x);
93  inline float lgamma(float x);
94  inline float powf(float x, float p);
95  inline void expdigammify(vw &all, float *gamma);
96  inline void expdigammify_2(vw &all, float *gamma, float *norm);
97 
98  ~lda()
99  {
100  Elogtheta.delete_v();
101  decay_levels.delete_v();
102  total_new.delete_v();
103  examples.delete_v();
104  total_lambda.delete_v();
105  doc_lengths.delete_v();
106  digammas.delete_v();
107  v.delete_v();
108  }
109 };
110 
111 // #define VW_NO_INLINE_SIMD
112 
113 namespace
114 {
115 inline bool is_aligned16(void *ptr)
116 {
117 #if BOOST_VERSION >= 105600
118  return boost::alignment::is_aligned(16, ptr);
119 #else
120  return ((reinterpret_cast<uintptr_t>(ptr) & 0x0f) == 0);
121 #endif
122 }
123 } // namespace
124 
125 namespace ldamath
126 {
127 inline float fastlog2(float x)
128 {
129  uint32_t mx;
130  memcpy(&mx, &x, sizeof(uint32_t));
131  mx = (mx & 0x007FFFFF) | (0x7e << 23);
132 
133  float mx_f;
134  memcpy(&mx_f, &mx, sizeof(float));
135 
136  uint32_t vx;
137  memcpy(&vx, &x, sizeof(uint32_t));
138 
139  float y = static_cast<float>(vx);
140  y *= 1.0f / (float)(1 << 23);
141 
142  return y - 124.22544637f - 1.498030302f * mx_f - 1.72587999f / (0.3520887068f + mx_f);
143 }
144 
145 inline float fastlog(float x) { return 0.69314718f * fastlog2(x); }
146 
147 inline float fastpow2(float p)
148 {
149  float offset = (p < 0) * 1.0f;
150  float clipp = (p < -126.0) ? -126.0f : p;
151  int w = (int)clipp;
152  float z = clipp - w + offset;
153  uint32_t approx = (uint32_t)((1 << 23) * (clipp + 121.2740838f + 27.7280233f / (4.84252568f - z) - 1.49012907f * z));
154 
155  float v;
156  memcpy(&v, &approx, sizeof(uint32_t));
157  return v;
158 }
159 
160 inline float fastexp(float p) { return fastpow2(1.442695040f * p); }
161 
162 inline float fastpow(float x, float p) { return fastpow2(p * fastlog2(x)); }
163 
164 inline float fastlgamma(float x)
165 {
166  float logterm = fastlog(x * (1.0f + x) * (2.0f + x));
167  float xp3 = 3.0f + x;
168 
169  return -2.081061466f - x + 0.0833333f / xp3 - logterm + (2.5f + x) * fastlog(xp3);
170 }
171 
172 inline float fastdigamma(float x)
173 {
174  float twopx = 2.0f + x;
175  float logterm = fastlog(twopx);
176 
177  return -(1.0f + 2.0f * x) / (x * (1.0f + x)) - (13.0f + 6.0f * x) / (12.0f * twopx * twopx) + logterm;
178 }
179 
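// Illustrative sketch (not part of lda_core.cc): the fast* routines above are
// bit-trick/polynomial approximations that trade accuracy for speed.  Assuming the
// boost headers included at the top of this file, a quick spot check against the
// precise versions could look like this (spot_check_fast_math is a hypothetical
// helper, not a VW function):
inline void spot_check_fast_math()
{
  for (float x : {0.5f, 1.0f, 5.0f, 50.0f})
    std::printf("x=%g  digamma err=%g  lgamma err=%g\n", x,
        fastdigamma(x) - static_cast<float>(boost::math::digamma(x)),
        fastlgamma(x) - static_cast<float>(boost::math::lgamma(x)));
}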
180 #if !defined(VW_NO_INLINE_SIMD)
181 
182 #if defined(__SSE2__) || defined(__SSE3__) || defined(__SSE4_1__)
183 
184 // Include headers for the various SSE versions:
185 #if defined(__SSE2__)
186 #include <emmintrin.h>
187 #endif
188 #if defined(__SSE3__)
189 #include <tmmintrin.h>
190 #endif
191 #if defined(__SSE4_1__)
192 #include <smmintrin.h>
193 #endif
194 
195 #define HAVE_SIMD_MATHMODE
196 
197 typedef __m128 v4sf;
198 typedef __m128i v4si;
199 
200 inline v4sf v4si_to_v4sf(v4si x) { return _mm_cvtepi32_ps(x); }
201 
202 inline v4si v4sf_to_v4si(v4sf x) { return _mm_cvttps_epi32(x); }
203 
204 // Extract v[idx]
205 template <const int idx>
206 float v4sf_index(const v4sf x)
207 {
208 #if defined(__SSE4_1__)
209  float ret;
210  uint32_t val;
211 
212  val = _mm_extract_ps(x, idx);
213  // Portably convert uint32_t bit pattern to float. Optimizers will generally
214  // make this disappear.
215  memcpy(&ret, &val, sizeof(uint32_t));
216  return ret;
217 #else
218  return _mm_cvtss_f32(_mm_shuffle_ps(x, x, _MM_SHUFFLE(idx, idx, idx, idx)));
219 #endif
220 }
221 
222 // Specialization for the 0'th element
223 template <>
224 float v4sf_index<0>(const v4sf x)
225 {
226  return _mm_cvtss_f32(x);
227 }
228 
229 inline v4sf v4sfl(const float x) { return _mm_set1_ps(x); }
230 
231 inline v4si v4sil(const uint32_t x) { return _mm_set1_epi32(x); }
232 
233 #ifdef WIN32
234 
235 inline __m128 operator+(const __m128 a, const __m128 b) { return _mm_add_ps(a, b); }
236 
237 inline __m128 operator-(const __m128 a, const __m128 b) { return _mm_sub_ps(a, b); }
238 
239 inline __m128 operator*(const __m128 a, const __m128 b) { return _mm_mul_ps(a, b); }
240 
241 inline __m128 operator/(const __m128 a, const __m128 b) { return _mm_div_ps(a, b); }
242 
243 #endif
244 
245 inline v4sf vfastpow2(const v4sf p)
246 {
247  v4sf ltzero = _mm_cmplt_ps(p, v4sfl(0.0f));
248  v4sf offset = _mm_and_ps(ltzero, v4sfl(1.0f));
249  v4sf lt126 = _mm_cmplt_ps(p, v4sfl(-126.0f));
250  v4sf clipp = _mm_andnot_ps(lt126, p) + _mm_and_ps(lt126, v4sfl(-126.0f));
251  v4si w = v4sf_to_v4si(clipp);
252  v4sf z = clipp - v4si_to_v4sf(w) + offset;
253 
254  const v4sf c_121_2740838 = v4sfl(121.2740838f);
255  const v4sf c_27_7280233 = v4sfl(27.7280233f);
256  const v4sf c_4_84252568 = v4sfl(4.84252568f);
257  const v4sf c_1_49012907 = v4sfl(1.49012907f);
258 
259  v4sf v = v4sfl(1 << 23) * (clipp + c_121_2740838 + c_27_7280233 / (c_4_84252568 - z) - c_1_49012907 * z);
260 
261  return _mm_castsi128_ps(v4sf_to_v4si(v));
262 }
263 
264 inline v4sf vfastexp(const v4sf p)
265 {
266  const v4sf c_invlog_2 = v4sfl(1.442695040f);
267 
268  return vfastpow2(c_invlog_2 * p);
269 }
270 
271 inline v4sf vfastlog2(v4sf x)
272 {
273  v4si vx_i = _mm_castps_si128(x);
274  v4sf mx_f = _mm_castsi128_ps(_mm_or_si128(_mm_and_si128(vx_i, v4sil(0x007FFFFF)), v4sil(0x3f000000)));
275  v4sf y = v4si_to_v4sf(vx_i) * v4sfl(1.1920928955078125e-7f);
276 
277  const v4sf c_124_22551499 = v4sfl(124.22551499f);
278  const v4sf c_1_498030302 = v4sfl(1.498030302f);
279  const v4sf c_1_725877999 = v4sfl(1.72587999f);
280  const v4sf c_0_3520087068 = v4sfl(0.3520887068f);
281 
282  return y - c_124_22551499 - c_1_498030302 * mx_f - c_1_725877999 / (c_0_3520087068 + mx_f);
283 }
284 
285 inline v4sf vfastlog(v4sf x)
286 {
287  const v4sf c_0_69314718 = v4sfl(0.69314718f);
288 
289  return c_0_69314718 * vfastlog2(x);
290 }
291 
292 inline v4sf vfastdigamma(v4sf x)
293 {
294  v4sf twopx = v4sfl(2.0f) + x;
295  v4sf logterm = vfastlog(twopx);
296 
297  return (v4sfl(-48.0f) + x * (v4sfl(-157.0f) + x * (v4sfl(-127.0f) - v4sfl(30.0f) * x))) /
298  (v4sfl(12.0f) * x * (v4sfl(1.0f) + x) * twopx * twopx) +
299  logterm;
300 }
301 
302 void vexpdigammify(vw &all, float *gamma, const float underflow_threshold)
303 {
304  float extra_sum = 0.0f;
305  v4sf sum = v4sfl(0.0f);
306  float *fp;
307  const float *fpend = gamma + all.lda;
308 
309  // Iterate through the initial part of the array that isn't 128-bit SIMD
310  // aligned.
311  for (fp = gamma; fp < fpend && !is_aligned16(fp); ++fp)
312  {
313  extra_sum += *fp;
314  *fp = fastdigamma(*fp);
315  }
316 
317  // Rip through the aligned portion...
318  for (; is_aligned16(fp) && fp + 4 < fpend; fp += 4)
319  {
320  v4sf arg = _mm_load_ps(fp);
321  sum = sum + arg;
322  arg = vfastdigamma(arg);
323  _mm_store_ps(fp, arg);
324  }
325 
326  for (; fp < fpend; ++fp)
327  {
328  extra_sum += *fp;
329  *fp = fastdigamma(*fp);
330  }
331 
332 #if defined(__SSE3__) || defined(__SSE4_1__)
333  // Do two horizontal adds on sum, extract the total from the 0 element:
334  sum = _mm_hadd_ps(sum, sum);
335  sum = _mm_hadd_ps(sum, sum);
336  extra_sum += v4sf_index<0>(sum);
337 #else
338  extra_sum += v4sf_index<0>(sum) + v4sf_index<1>(sum) + v4sf_index<2>(sum) + v4sf_index<3>(sum);
339 #endif
340 
341  extra_sum = fastdigamma(extra_sum);
342  sum = v4sfl(extra_sum);
343 
344  for (fp = gamma; fp < fpend && !is_aligned16(fp); ++fp)
345  {
346  *fp = fmax(underflow_threshold, fastexp(*fp - extra_sum));
347  }
348 
349  for (; is_aligned16(fp) && fp + 4 < fpend; fp += 4)
350  {
351  v4sf arg = _mm_load_ps(fp);
352  arg = arg - sum;
353  arg = vfastexp(arg);
354  arg = _mm_max_ps(v4sfl(underflow_threshold), arg);
355  _mm_store_ps(fp, arg);
356  }
357 
358  for (; fp < fpend; ++fp)
359  {
360  *fp = fmax(underflow_threshold, fastexp(*fp - extra_sum));
361  }
362 }
363 
364 void vexpdigammify_2(vw &all, float *gamma, const float *norm, const float underflow_threshold)
365 {
366  float *fp = gamma;
367  const float *np;
368  const float *fpend = gamma + all.lda;
369 
370  for (np = norm; fp < fpend && !is_aligned16(fp); ++fp, ++np)
371  *fp = fmax(underflow_threshold, fastexp(fastdigamma(*fp) - *np));
372 
373  for (; is_aligned16(fp) && fp + 4 < fpend; fp += 4, np += 4)
374  {
375  v4sf arg = _mm_load_ps(fp);
376  arg = vfastdigamma(arg);
377  v4sf vnorm = _mm_loadu_ps(np);
378  arg = arg - vnorm;
379  arg = vfastexp(arg);
380  arg = _mm_max_ps(v4sfl(underflow_threshold), arg);
381  _mm_store_ps(fp, arg);
382  }
383 
384  for (; fp < fpend; ++fp, ++np) *fp = fmax(underflow_threshold, fastexp(fastdigamma(*fp) - *np));
385 }
386 
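// Illustrative scalar reference (not part of lda_core.cc): ignoring the alignment
// prologue/epilogue, vexpdigammify computes, for each k,
//   gamma[k] = max(underflow_threshold, exp(digamma(gamma[k]) - digamma(sum_j gamma[j])))
// and vexpdigammify_2 subtracts a precomputed norm[k] instead of digamma(sum).
// The equivalent plain loop (expdigammify_scalar is a hypothetical name):
inline void expdigammify_scalar(vw &all, float *gamma, float underflow_threshold)
{
  float sum = 0.f;
  for (size_t k = 0; k < all.lda; k++) sum += gamma[k];  // digamma of the total...
  const float dsum = fastdigamma(sum);
  for (size_t k = 0; k < all.lda; k++)                   // ...is subtracted per element
    gamma[k] = fmax(underflow_threshold, fastexp(fastdigamma(gamma[k]) - dsum));
}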
387 #else
388 // PLACEHOLDER for future ARM NEON code
389 // Also remember to define HAVE_SIMD_MATHMODE
390 #endif
391 
392 #endif // !VW_NO_INLINE_SIMD
393 
394 // Templates for common code shared between the three math modes (SIMD, fast approximations
395 // and accurate).
396 //
397 // The generic template takes a type and a specialization flag, mtype.
398 //
399 // mtype == USE_PRECISE: Use the accurate computation for lgamma, digamma.
400 // mtype == USE_FAST_APPROX: Use the fast approximations for lgamma, digamma.
401 // mtype == USE_SIMD: Use CPU SIMD instructions.
402 //
403 // The generic template is specialized for the particular accuracy setting.
404 
405 // Log gamma:
406 template <typename T, const lda_math_mode mtype>
407 inline T lgamma(T /* x */)
408 {
409  BOOST_STATIC_ASSERT_MSG(true, "ldamath::lgamma is not defined for this type and math mode.");
410 }
411 
412 // Digamma:
413 template <typename T, const lda_math_mode mtype>
414 inline T digamma(T /* x */)
415 {
416  BOOST_STATIC_ASSERT_MSG(true, "ldamath::digamma is not defined for this type and math mode.");
417 }
418 
419 // Exponential
420 template <typename T, lda_math_mode mtype>
421 inline T exponential(T /* x */)
422 {
423  BOOST_STATIC_ASSERT_MSG(true, "ldamath::exponential is not defined for this type and math mode.");
424 }
425 
426 // Powf
427 template <typename T, lda_math_mode mtype>
428 inline T powf(T /* x */, T /* p */)
429 {
430  BOOST_STATIC_ASSERT_MSG(true, "ldamath::powf is not defined for this type and math mode.");
431 }
432 
433 // High accuracy float specializations:
434 
435 template <>
436 inline float lgamma<float, USE_PRECISE>(float x)
437 {
438  return boost::math::lgamma(x);
439 }
440 template <>
441 inline float digamma<float, USE_PRECISE>(float x)
442 {
443  return boost::math::digamma(x);
444 }
445 template <>
446 inline float exponential<float, USE_PRECISE>(float x)
447 {
448  return correctedExp(x);
449 }
450 template <>
451 inline float powf<float, USE_PRECISE>(float x, float p)
452 {
453  return std::pow(x, p);
454 }
455 
456 // Fast approximation float specializations:
457 
458 template <>
459 inline float lgamma<float, USE_FAST_APPROX>(float x)
460 {
461  return fastlgamma(x);
462 }
463 template <>
464 inline float digamma<float, USE_FAST_APPROX>(float x)
465 {
466  return fastdigamma(x);
467 }
468 template <>
469 inline float exponential<float, USE_FAST_APPROX>(float x)
470 {
471  return fastexp(x);
472 }
473 template <>
474 inline float powf<float, USE_FAST_APPROX>(float x, float p)
475 {
476  return fastpow(x, p);
477 }
478 
479 // SIMD specializations:
480 
481 template <>
482 inline float lgamma<float, USE_SIMD>(float x)
483 {
484  return lgamma<float, USE_FAST_APPROX>(x);
485 }
486 template <>
487 inline float digamma<float, USE_SIMD>(float x)
488 {
489  return digamma<float, USE_FAST_APPROX>(x);
490 }
491 template <>
492 inline float exponential<float, USE_SIMD>(float x)
493 {
494  return exponential<float, USE_FAST_APPROX>(x);
495 }
496 template <>
497 inline float powf<float, USE_SIMD>(float x, float p)
498 {
499  return powf<float, USE_FAST_APPROX>(x, p);
500 }
501 
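// Illustrative usage (not part of lda_core.cc): the mtype tag selects an
// implementation at compile time, so switching accuracy costs no runtime branch:
//   float a = lgamma<float, USE_PRECISE>(3.5f);      // boost::math::lgamma
//   float b = lgamma<float, USE_FAST_APPROX>(3.5f);  // fastlgamma
//   float c = powf<float, USE_FAST_APPROX>(2.f, 0.5f);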
502 template <typename T, const lda_math_mode mtype>
503 inline void expdigammify(vw &all, T *gamma, T threshold, T initial)
504 {
505  T sum = digamma<T, mtype>(std::accumulate(gamma, gamma + all.lda, initial));
506 
507  std::transform(gamma, gamma + all.lda, gamma,
508  [sum, threshold](T g) { return fmax(threshold, exponential<T, mtype>(digamma<T, mtype>(g) - sum)); });
509 }
510 template <>
511 inline void expdigammify<float, USE_SIMD>(vw &all, float *gamma, float threshold, float)
512 {
513 #if defined(HAVE_SIMD_MATHMODE)
514  vexpdigammify(all, gamma, threshold);
515 #else
516  // Do something sensible if SIMD math isn't available:
517  expdigammify<float, USE_FAST_APPROX>(all, gamma, threshold, 0.0);
518 #endif
519 }
520 
521 template <typename T, const lda_math_mode mtype>
522 inline void expdigammify_2(vw &all, float *gamma, T *norm, const T threshold)
523 {
524  std::transform(gamma, gamma + all.lda, norm, gamma,
525  [threshold](float g, float n) { return fmax(threshold, exponential<T, mtype>(digamma<T, mtype>(g) - n)); });
526 }
527 template <>
528 inline void expdigammify_2<float, USE_SIMD>(vw &all, float *gamma, float *norm, const float threshold)
529 {
530 #if defined(HAVE_SIMD_MATHMODE)
531  vexpdigammify_2(all, gamma, norm, threshold);
532 #else
533  // Do something sensible if SIMD math isn't available:
534  expdigammify_2<float, USE_FAST_APPROX>(all, gamma, norm, threshold);
535 #endif
536 }
537 
538 } // namespace ldamath
539 
540 float lda::digamma(float x)
541 {
542  switch (mmode)
543  {
544  case USE_FAST_APPROX:
545  // std::cerr << "lda::digamma FAST_APPROX ";
546  return ldamath::digamma<float, USE_FAST_APPROX>(x);
547  case USE_PRECISE:
548  // std::cerr << "lda::digamma PRECISE ";
549  return ldamath::digamma<float, USE_PRECISE>(x);
550  case USE_SIMD:
551  // std::cerr << "lda::digamma SIMD ";
552  return ldamath::digamma<float, USE_SIMD>(x);
553  default:
554  // Should not happen.
555  std::cerr << "lda::digamma: Trampled or invalid math mode, aborting" << std::endl;
556  abort();
557  return 0.0f;
558  }
559 }
560 
561 float lda::lgamma(float x)
562 {
563  switch (mmode)
564  {
565  case USE_FAST_APPROX:
566  // std::cerr << "lda::lgamma FAST_APPROX ";
567  return ldamath::lgamma<float, USE_FAST_APPROX>(x);
568  case USE_PRECISE:
569  // std::cerr << "lda::lgamma PRECISE ";
570  return ldamath::lgamma<float, USE_PRECISE>(x);
571  case USE_SIMD:
572  // std::cerr << "lda::lgamma SIMD ";
573  return ldamath::lgamma<float, USE_SIMD>(x);
574  default:
575  std::cerr << "lda::lgamma: Trampled or invalid math mode, aborting" << std::endl;
576  abort();
577  return 0.0f;
578  }
579 }
580 
581 float lda::powf(float x, float p)
582 {
583  switch (mmode)
584  {
585  case USE_FAST_APPROX:
586  // std::cerr << "lda::powf FAST_APPROX ";
587  return ldamath::powf<float, USE_FAST_APPROX>(x, p);
588  case USE_PRECISE:
589  // std::cerr << "lda::powf PRECISE ";
590  return ldamath::powf<float, USE_PRECISE>(x, p);
591  case USE_SIMD:
592  // std::cerr << "lda::powf SIMD ";
593  return ldamath::powf<float, USE_SIMD>(x, p);
594  default:
595  std::cerr << "lda::powf: Trampled or invalid math mode, aborting" << std::endl;
596  abort();
597  return 0.0f;
598  }
599 }
600 
601 void lda::expdigammify(vw &all, float *gamma)
602 {
603  switch (mmode)
604  {
605  case USE_FAST_APPROX:
606  ldamath::expdigammify<float, USE_FAST_APPROX>(all, gamma, underflow_threshold, 0.0f);
607  break;
608  case USE_PRECISE:
609  ldamath::expdigammify<float, USE_PRECISE>(all, gamma, underflow_threshold, 0.0f);
610  break;
611  case USE_SIMD:
612  ldamath::expdigammify<float, USE_SIMD>(all, gamma, underflow_threshold, 0.0f);
613  break;
614  default:
615  std::cerr << "lda::expdigammify: Trampled or invalid math mode, aborting" << std::endl;
616  abort();
617  }
618 }
619 
620 void lda::expdigammify_2(vw &all, float *gamma, float *norm)
621 {
622  switch (mmode)
623  {
624  case USE_FAST_APPROX:
625  ldamath::expdigammify_2<float, USE_FAST_APPROX>(all, gamma, norm, underflow_threshold);
626  break;
627  case USE_PRECISE:
628  ldamath::expdigammify_2<float, USE_PRECISE>(all, gamma, norm, underflow_threshold);
629  break;
630  case USE_SIMD:
631  ldamath::expdigammify_2<float, USE_SIMD>(all, gamma, norm, underflow_threshold);
632  break;
633  default:
634  std::cerr << "lda::expdigammify_2: Trampled or invalid math mode, aborting" << std::endl;
635  abort();
636  }
637 }
638 
639 static inline float average_diff(vw &all, float *oldgamma, float *newgamma)
640 {
641  float sum;
642  float normalizer;
643 
644  // This warps the normal sense of "inner product", but it accomplishes the same
645  // thing as the "plain old" for loop. clang does a good job of reducing the
646  // common subexpressions.
647  sum = std::inner_product(
648  oldgamma, oldgamma + all.lda, newgamma, 0.0f, [](float accum, float absdiff) { return accum + absdiff; },
649  [](float old_g, float new_g) { return std::abs(old_g - new_g); });
650 
651  normalizer = std::accumulate(newgamma, newgamma + all.lda, 0.0f);
652  return sum / normalizer;
653 }
654 
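// Illustrative reference (not part of lda_core.cc): the inner_product call above is
// equivalent to this plain loop (average_diff_reference is a hypothetical name):
static inline float average_diff_reference(vw &all, float *oldgamma, float *newgamma)
{
  float sum = 0.f;
  float normalizer = 0.f;
  for (size_t k = 0; k < all.lda; k++)
  {
    sum += std::abs(oldgamma[k] - newgamma[k]);  // accumulated |old - new| per topic
    normalizer += newgamma[k];                   // total mass of the new gamma vector
  }
  return sum / normalizer;
}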
655 // Returns E_q[log p(\theta)] - E_q[log q(\theta)].
656 float theta_kl(lda &l, v_array<float> &Elogtheta, float *gamma)
657 {
658  float gammasum = 0;
659  Elogtheta.clear();
660  for (size_t k = 0; k < l.topics; k++)
661  {
662  Elogtheta.push_back(l.digamma(gamma[k]));
663  gammasum += gamma[k];
664  }
665  float digammasum = l.digamma(gammasum);
666  gammasum = l.lgamma(gammasum);
667  float kl = -(l.topics * l.lgamma(l.lda_alpha));
668  kl += l.lgamma(l.lda_alpha * l.topics) - gammasum;
669  for (size_t k = 0; k < l.topics; k++)
670  {
671  Elogtheta[k] -= digammasum;
672  kl += (l.lda_alpha - gamma[k]) * Elogtheta[k];
673  kl += l.lgamma(gamma[k]);
674  }
675 
676  return kl;
677 }
678 
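// Note (not part of lda_core.cc): with q(theta) = Dirichlet(gamma) and
// p(theta) = Dirichlet(alpha), theta_kl above accumulates
//   lgamma(K*alpha) - K*lgamma(alpha) - lgamma(sum_k gamma_k)
//     + sum_k [ lgamma(gamma_k) + (alpha - gamma_k) * (digamma(gamma_k) - digamma(sum_j gamma_j)) ]
// for K = l.topics, i.e. E_q[log p(theta)] - E_q[log q(theta)].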
679 static inline float find_cw(lda &l, float *u_for_w, float *v)
680 {
681  return 1.0f / std::inner_product(u_for_w, u_for_w + l.topics, v, 0.0f);
682 }
683 
684 namespace
685 {
686 // Effectively, these are static and not visible outside the compilation unit.
687 v_array<float> new_gamma = v_init<float>();
688 v_array<float> old_gamma = v_init<float>();
689 } // namespace
690 
691 // Returns an estimate of the part of the variational bound that
692 // doesn't have to do with beta for the entire corpus for the current
693 // setting of lambda based on the document passed in. The value is
694 // divided by the total number of words in the document.  This can be
695 // used as a (possibly very noisy) estimate of held-out likelihood.
696 float lda_loop(lda &l, v_array<float> &Elogtheta, float *v, example *ec, float)
697 {
698  parameters &weights = l.all->weights;
699  new_gamma.clear();
700  old_gamma.clear();
701 
702  for (size_t i = 0; i < l.topics; i++)
703  {
704  new_gamma.push_back(1.f);
705  old_gamma.push_back(0.f);
706  }
707  size_t num_words = 0;
708  for (features &fs : *ec) num_words += fs.size();
709 
710  float xc_w = 0;
711  float score = 0;
712  float doc_length = 0;
713  do
714  {
715  memcpy(v, new_gamma.begin(), sizeof(float) * l.topics);
716  l.expdigammify(*l.all, v);
717 
718  memcpy(old_gamma.begin(), new_gamma.begin(), sizeof(float) * l.topics);
719  memset(new_gamma.begin(), 0, sizeof(float) * l.topics);
720 
721  score = 0;
722  size_t word_count = 0;
723  doc_length = 0;
724  for (features &fs : *ec)
725  {
726  for (features::iterator &f : fs)
727  {
728  float *u_for_w = &(weights[f.index()]) + l.topics + 1;
729  float c_w = find_cw(l, u_for_w, v);
730  xc_w = c_w * f.value();
731  score += -f.value() * log(c_w);
732  size_t max_k = l.topics;
733  for (size_t k = 0; k < max_k; k++, ++u_for_w) new_gamma[k] += xc_w * *u_for_w;
734  word_count++;
735  doc_length += f.value();
736  }
737  }
738  for (size_t k = 0; k < l.topics; k++) new_gamma[k] = new_gamma[k] * v[k] + l.lda_alpha;
739  } while (average_diff(*l.all, old_gamma.begin(), new_gamma.begin()) > l.lda_epsilon);
740 
741  ec->pred.scalars.clear();
742  ec->pred.scalars.resize(l.topics);
743  memcpy(ec->pred.scalars.begin(), new_gamma.begin(), l.topics * sizeof(float));
744  ec->pred.scalars.end() = ec->pred.scalars.begin() + l.topics;
745 
746  score += theta_kl(l, Elogtheta, new_gamma.begin());
747 
748  return score / doc_length;
749 }
750 
751 size_t next_pow2(size_t x)
752 {
753  int i = 0;
754  x = x > 0 ? x - 1 : 0;
755  while (x > 0)
756  {
757  x >>= 1;
758  i++;
759  }
760  return ((size_t)1) << i;
761 }
762 
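// Illustrative values (not part of lda_core.cc) of next_pow2's behavior:
//   next_pow2(0) == 1, next_pow2(1) == 1, next_pow2(5) == 8, next_pow2(8) == 8.
// lda_setup below uses it to round the minibatch size up to a power of two when
// resizing the parser ring.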
763 struct initial_weights
764 {
765  weight _initial;
766  weight _initial_random;
767  bool _random;
768  uint32_t _lda;
769  uint32_t _stride;
770  initial_weights(weight initial, weight initial_random, bool random, uint32_t lda, uint32_t stride)
771  : _initial(initial), _initial_random(initial_random), _random(random), _lda(lda), _stride(stride)
772  {
773  }
774 };
775 
776 template <class T>
777 class set_initial_lda_wrapper
778 {
779  public:
780  static void func(weight &w, initial_weights &iw, uint64_t index)
781  {
782  uint32_t lda = iw._lda;
783  weight initial_random = iw._initial_random;
784  if (iw._random)
785  {
786  weight *pw = &w;
787  for (size_t i = 0; i != lda; ++i, ++index) pw[i] = (float)(-log(merand48(index) + 1e-6) + 1.0f) * initial_random;
788  }
789  (&w)[lda] = iw._initial;
790  }
791 };
792 
793 void save_load(lda &l, io_buf &model_file, bool read, bool text)
794 {
795  vw &all = *(l.all);
796  uint64_t length = (uint64_t)1 << all.num_bits;
797  if (read)
798  {
799  initialize_regressor(all);
800  initial_weights init(all.initial_t, (float)(l.lda_D / all.lda / all.length() * 200), all.random_weights, all.lda,
801  all.weights.stride());
802  if (all.weights.sparse)
803  all.weights.sparse_weights.set_default<initial_weights, set_initial_lda_wrapper<sparse_parameters>>(init);
804  else
805  all.weights.dense_weights.set_default<initial_weights, set_initial_lda_wrapper<dense_parameters>>(init);
806  }
807  if (!model_file.files.empty())
808  {
809  uint64_t i = 0;
810  std::stringstream msg;
811  size_t brw = 1;
812 
813  do
814  {
815  brw = 0;
816  size_t K = all.lda;
817  if (!read && text)
818  msg << i << " ";
819 
820  if (!read || all.model_file_ver >= VERSION_FILE_WITH_HEADER_ID)
821  brw += bin_text_read_write_fixed(model_file, (char *)&i, sizeof(i), "", read, msg, text);
822  else
823  {
824  // support 32bit build models
825  uint32_t j;
826  brw += bin_text_read_write_fixed(model_file, (char *)&j, sizeof(j), "", read, msg, text);
827  i = j;
828  }
829 
830  if (brw != 0)
831  {
832  weight *w = &(all.weights.strided_index(i));
833  for (uint64_t k = 0; k < K; k++)
834  {
835  weight *v = w + k;
836  if (!read && text)
837  msg << *v + l.lda_rho << " ";
838  brw += bin_text_read_write_fixed(model_file, (char *)v, sizeof(*v), "", read, msg, text);
839  }
840  }
841  if (text)
842  {
843  if (!read)
844  msg << "\n";
845  brw += bin_text_read_write_fixed(model_file, nullptr, 0, "", read, msg, text);
846  }
847  if (!read)
848  ++i;
849  } while ((!read && i < length) || (read && brw > 0));
850  }
851 }
852 
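// Note (not part of lda_core.cc): each record written or read above is a feature
// index i followed by K = all.lda per-topic weights; in text mode lda_rho is added
// back before each value is printed.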
853 void return_example(vw &all, example &ec)
854 {
855  all.sd->update(ec.test_only, true, ec.loss, ec.weight, ec.num_features);
856  for (int f : all.final_prediction_sink) MWT::print_scalars(f, ec.pred.scalars, ec.tag);
857 
858  if (all.sd->weighted_examples() >= all.sd->dump_interval && !all.quiet)
859  all.sd->print_update(
860  all.holdout_set_off, all.current_pass, "none", 0, ec.num_features, all.progress_add, all.progress_arg);
861  VW::finish_example(all, ec);
862 }
863 
864 void learn_batch(lda &l)
865 {
866  parameters &weights = l.all->weights;
867  if (l.sorted_features.empty()) // FAST-PASS for real "true"
868  {
869  // This can happen when the socket connection is dropped by the client.
870  // If l.sorted_features is empty, then l.sorted_features[0] does not
871  // exist, so we should not try to take its address in the beginning of
872  // the for loops down there. Since it seems that there's not much to
873  // do in this case, we just return.
874  for (size_t d = 0; d < l.examples.size(); d++)
875  {
876  l.examples[d]->pred.scalars.clear();
877  l.examples[d]->pred.scalars.resize(l.topics);
878  memset(l.examples[d]->pred.scalars.begin(), 0, l.topics * sizeof(float));
879  l.examples[d]->pred.scalars.end() = l.examples[d]->pred.scalars.begin() + l.topics;
880 
881  l.examples[d]->pred.scalars.clear();
882  return_example(*l.all, *l.examples[d]);
883  }
884  l.examples.clear();
885  return;
886  }
887 
888  float eta = -1;
889  float minuseta = -1;
890 
891  if (l.total_lambda.empty())
892  {
893  for (size_t k = 0; k < l.all->lda; k++) l.total_lambda.push_back(0.f);
894  // This part does not work with sparse parameters
895  size_t stride = weights.stride();
896  for (size_t i = 0; i <= weights.mask(); i += stride)
897  {
898  weight *w = &(weights[i]);
899  for (size_t k = 0; k < l.all->lda; k++) l.total_lambda[k] += w[k];
900  }
901  }
902 
903  l.example_t++;
904  l.total_new.clear();
905  for (size_t k = 0; k < l.all->lda; k++) l.total_new.push_back(0.f);
906 
907  size_t batch_size = l.examples.size();
908 
909  sort(l.sorted_features.begin(), l.sorted_features.end());
910 
911  eta = l.all->eta * l.powf((float)l.example_t, -l.all->power_t);
912  minuseta = 1.0f - eta;
913  eta *= l.lda_D / batch_size;
914  l.decay_levels.push_back(l.decay_levels.last() + log(minuseta));
915 
916  l.digammas.clear();
917  float additional = (float)(l.all->length()) * l.lda_rho;
918  for (size_t i = 0; i < l.all->lda; i++) l.digammas.push_back(l.digamma(l.total_lambda[i] + additional));
919 
920  uint64_t last_weight_index = -1;
921  for (index_feature *s = &l.sorted_features[0]; s <= &l.sorted_features.back(); s++)
922  {
923  if (last_weight_index == s->f.weight_index)
924  continue;
925  last_weight_index = s->f.weight_index;
926  // float *weights_for_w = &(weights[s->f.weight_index]);
927  float *weights_for_w = &(weights[s->f.weight_index & weights.mask()]);
928  float decay_component =
929  l.decay_levels.end()[-2] - l.decay_levels.end()[(int)(-1 - l.example_t + *(weights_for_w + l.all->lda))];
930  float decay = fmin(1.0f, correctedExp(decay_component));
931  float *u_for_w = weights_for_w + l.all->lda + 1;
932 
933  *(weights_for_w + l.all->lda) = (float)l.example_t;
934  for (size_t k = 0; k < l.all->lda; k++)
935  {
936  weights_for_w[k] *= decay;
937  u_for_w[k] = weights_for_w[k] + l.lda_rho;
938  }
939 
940  l.expdigammify_2(*l.all, u_for_w, l.digammas.begin());
941  }
942 
943  for (size_t d = 0; d < batch_size; d++)
944  {
945  float score = lda_loop(l, l.Elogtheta, &(l.v[d * l.all->lda]), l.examples[d], l.all->power_t);
946  if (l.all->audit)
947  GD::print_audit_features(*l.all, *l.examples[d]);
948  // If the doc is empty, give it loss of 0.
949  if (l.doc_lengths[d] > 0)
950  {
951  l.all->sd->sum_loss -= score;
952  l.all->sd->sum_loss_since_last_dump -= score;
953  }
954  return_example(*l.all, *l.examples[d]);
955  }
956 
957  // -t there's no need to update weights (especially since it's a noop)
958  if (eta != 0)
959  {
960  for (index_feature *s = &l.sorted_features[0]; s <= &l.sorted_features.back();)
961  {
962  index_feature *next = s + 1;
963  while (next <= &l.sorted_features.back() && next->f.weight_index == s->f.weight_index) next++;
964 
965  float *word_weights = &(weights[s->f.weight_index]);
966  for (size_t k = 0; k < l.all->lda; k++, ++word_weights)
967  {
968  float new_value = minuseta * *word_weights;
969  *word_weights = new_value;
970  }
971 
972  for (; s != next; s++)
973  {
974  float *v_s = &(l.v[s->document * l.all->lda]);
975  float *u_for_w = &(weights[s->f.weight_index]) + l.all->lda + 1;
976  float c_w = eta * find_cw(l, u_for_w, v_s) * s->f.x;
977  word_weights = &(weights[s->f.weight_index]);
978  for (size_t k = 0; k < l.all->lda; k++, ++u_for_w, ++word_weights)
979  {
980  float new_value = *u_for_w * v_s[k] * c_w;
981  l.total_new[k] += new_value;
982  *word_weights += new_value;
983  }
984  }
985  }
986 
987  for (size_t k = 0; k < l.all->lda; k++)
988  {
989  l.total_lambda[k] *= minuseta;
990  l.total_lambda[k] += l.total_new[k];
991  }
992  }
993  l.sorted_features.resize(0);
994 
995  l.examples.clear();
996  l.doc_lengths.clear();
997 }
998 
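// Note (not part of lda_core.cc): learn_batch above is one step of online
// variational Bayes for LDA in the style of Hoffman et al.  With step size
//   rho_t = eta * t^(-power_t),
// each touched topic-word row is decayed by (1 - rho_t) and incremented by
// (lda_D / batch_size) * rho_t times the expected counts from this minibatch;
// decay_levels lets the decay be applied lazily, only when a word is next seen.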
999 void learn(lda &l, LEARNER::single_learner &, example &ec)
1000 {
1001  uint32_t num_ex = (uint32_t)l.examples.size();
1002  l.examples.push_back(&ec);
1003  l.doc_lengths.push_back(0);
1004  for (features &fs : ec)
1005  {
1006  for (features::iterator &f : fs)
1007  {
1008  index_feature temp = {num_ex, feature(f.value(), f.index())};
1009  l.sorted_features.push_back(temp);
1010  l.doc_lengths[num_ex] += (int)f.value();
1011  }
1012  }
1013  if (++num_ex == l.minibatch)
1014  learn_batch(l);
1015 }
1016 
1017 void learn_with_metrics(lda &l, LEARNER::single_learner &base, example &ec)
1018 {
1019  if (l.all->passes_complete == 0)
1020  {
1021  // build feature to example map
1022  uint64_t stride_shift = l.all->weights.stride_shift();
1023  uint64_t weight_mask = l.all->weights.mask();
1024 
1025  for (features &fs : ec)
1026  {
1027  for (features::iterator &f : fs)
1028  {
1029  uint64_t idx = (f.index() & weight_mask) >> stride_shift;
1030  l.feature_counts[idx] += (uint32_t)f.value();
1031  l.feature_to_example_map[idx].push_back(ec.example_counter);
1032  }
1033  }
1034  }
1035 
1036  learn(l, base, ec);
1037 }
1038 
1039 // placeholder
1040 void predict(lda &l, LEARNER::single_learner &base, example &ec) { learn(l, base, ec); }
1041 void predict_with_metrics(lda &l, LEARNER::single_learner &base, example &ec) { learn_with_metrics(l, base, ec); }
1042 
1043 struct word_doc_frequency
1044 {
1045  // feature/word index
1046  uint64_t idx;
1047  // document count
1048  uint32_t count;
1049 };
1050 
1051 // co-occurrence of 2 features/words
1052 struct feature_pair
1053 {
1054  // feature/word 1
1055  uint64_t f1;
1056  // feature/word 2
1057  uint64_t f2;
1058 
1059  feature_pair(uint64_t _f1, uint64_t _f2) : f1(_f1), f2(_f2) {}
1060 };
1061 
1062 template <class T>
1063 void get_top_weights(vw *all, int top_words_count, int topic, std::vector<feature> &output, T &weights)
1064 {
1065  uint64_t length = (uint64_t)1 << all->num_bits;
1066 
1067  // get top features for this topic
1068  auto cmp = [](feature left, feature right) { return left.x > right.x; };
1069  std::priority_queue<feature, std::vector<feature>, decltype(cmp)> top_features(cmp);
1070  typename T::iterator iter = weights.begin();
1071 
1072  for (uint64_t i = 0; i < std::min(static_cast<uint64_t>(top_words_count), length); i++, ++iter)
1073  top_features.push({(&(*iter))[topic], iter.index()});
1074 
1075  for (uint64_t i = top_words_count; i < length; i++, ++iter)
1076  {
1077  weight v = (&(*iter))[topic];
1078  if (v > top_features.top().x)
1079  {
1080  top_features.pop();
1081  top_features.push({v, i});
1082  }
1083  }
1084 
1085  // extract idx and sort descending
1086  output.resize(top_features.size());
1087  for (int i = (int)top_features.size() - 1; i >= 0; i--)
1088  {
1089  output[i] = top_features.top();
1090  top_features.pop();
1091  }
1092 }
1093 
1094 void get_top_weights(vw *all, int top_words_count, int topic, std::vector<feature> &output)
1095 {
1096  if (all->weights.sparse)
1097  get_top_weights(all, top_words_count, topic, output, all->weights.sparse_weights);
1098  else
1099  get_top_weights(all, top_words_count, topic, output, all->weights.dense_weights);
1100 }
1101 
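// Illustrative usage (not part of lda_core.cc) of the wrapper above
// (print_topic_top_words is a hypothetical helper, not a VW function):
inline void print_topic_top_words(vw &all, int topic)
{
  std::vector<feature> top;
  get_top_weights(&all, 10, topic, top);  // ten heaviest words for this topic
  for (const feature &f : top)
    std::printf("%llu:%f ", (unsigned long long)f.weight_index, f.x);
  std::printf("\n");
}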
1102 template <class T>
1103 void compute_coherence_metrics(lda &l, T &weights)
1104 {
1105  uint64_t length = (uint64_t)1 << l.all->num_bits;
1106 
1107  std::vector<std::vector<feature_pair>> topics_word_pairs;
1108  topics_word_pairs.resize(l.topics);
1109 
1110  int top_words_count = 10; // parameterize and check
1111 
1112  for (size_t topic = 0; topic < l.topics; topic++)
1113  {
1114  // get top features for this topic
1115  auto cmp = [](feature &left, feature &right) { return left.x > right.x; };
1116  std::priority_queue<feature, std::vector<feature>, decltype(cmp)> top_features(cmp);
1117  typename T::iterator iter = weights.begin();
1118  for (uint64_t i = 0; i < std::min(static_cast<uint64_t>(top_words_count), length); i++, ++iter)
1119  top_features.push(feature((&(*iter))[topic], iter.index()));
1120 
1121  for (typename T::iterator v = weights.begin(); v != weights.end(); ++v)
1122  if ((&(*v))[topic] > top_features.top().x)
1123  {
1124  top_features.pop();
1125  top_features.push(feature((&(*v))[topic], v.index()));
1126  }
1127 
1128  // extract idx and sort descending
1129  std::vector<uint64_t> top_features_idx;
1130  top_features_idx.resize(top_features.size());
1131  for (int i = (int)top_features.size() - 1; i >= 0; i--)
1132  {
1133  top_features_idx[i] = top_features.top().weight_index;
1134  top_features.pop();
1135  }
1136 
1137  auto &word_pairs = topics_word_pairs[topic];
1138  for (size_t i = 0; i < top_features_idx.size(); i++)
1139  for (size_t j = i + 1; j < top_features_idx.size(); j++)
1140  word_pairs.emplace_back(top_features_idx[i], top_features_idx[j]);
1141  }
1142 
1143  // compress word pairs and create record for storing frequency
1144  std::map<uint64_t, std::vector<word_doc_frequency>> coWordsDFSet;
1145  for (auto &vec : topics_word_pairs)
1146  {
1147  for (auto &wp : vec)
1148  {
1149  auto f1 = wp.f1;
1150  auto f2 = wp.f2;
1151  auto wdf = coWordsDFSet.find(f1);
1152 
1153  if (wdf != coWordsDFSet.end())
1154  {
1155  // http://stackoverflow.com/questions/5377434/does-stdmapiterator-return-a-copy-of-value-or-a-value-itself
1156  // if (wdf->second.find(f2) == wdf->second.end())
1157 
1158  if (std::find_if(wdf->second.begin(), wdf->second.end(),
1159  [&f2](const word_doc_frequency &v) { return v.idx == f2; }) != wdf->second.end())
1160  {
1161  wdf->second.push_back({f2, 0});
1162  // printf(" add %d %d\n", f1, f2);
1163  }
1164  }
1165  else
1166  {
1167  std::vector<word_doc_frequency> vec = {{f2, 0}};
1168  coWordsDFSet.insert(std::make_pair(f1, vec));
1169  // printf(" insert %d %d\n", f1, f2);
1170  }
1171  }
1172  }
1173 
1174  // this.GetWordPairsDocumentFrequency(coWordsDFSet);
1175  for (auto &pair : coWordsDFSet)
1176  {
1177  auto &examples_for_f1 = l.feature_to_example_map[pair.first];
1178  for (auto &wdf : pair.second)
1179  {
1180  auto &examples_for_f2 = l.feature_to_example_map[wdf.idx];
1181 
1182  // assumes examples_for_f1 and examples_for_f2 are ordered
1183  size_t i = 0;
1184  size_t j = 0;
1185  while (i < examples_for_f1.size() && j < examples_for_f2.size())
1186  {
1187  if (examples_for_f1[i] == examples_for_f2[j])
1188  {
1189  wdf.count++;
1190  i++;
1191  j++;
1192  }
1193  else if (examples_for_f2[j] < examples_for_f1[i])
1194  j++;
1195  else
1196  i++;
1197  }
1198  }
1199  }
1200 
1201  float epsilon = 1e-6f; // TODO
1202  float avg_coherence = 0;
1203  for (size_t topic = 0; topic < l.topics; topic++)
1204  {
1205  float coherence = 0;
1206 
1207  for (auto &pairs : topics_word_pairs[topic])
1208  {
1209  auto f1 = pairs.f1;
1210  if (l.feature_counts[f1] == 0)
1211  continue;
1212 
1213  auto f2 = pairs.f2;
1214  auto &co_feature = coWordsDFSet[f1];
1215  auto co_feature_df = std::find_if(
1216  co_feature.begin(), co_feature.end(), [&f2](const word_doc_frequency &v) { return v.idx == f2; });
1217 
1218  if (co_feature_df != co_feature.end())
1219  {
1220  // printf("(%d:%d + eps)/(%d:%d)\n", f2, co_feature_df->count, f1, l.feature_counts[f1]);
1221  coherence += logf((co_feature_df->count + epsilon) / l.feature_counts[f1]);
1222  }
1223  }
1224 
1225  printf("Topic %3d coherence: %f\n", (int)topic, coherence);
1226 
1227  // TODO: expose per topic coherence
1228 
1229  // TODO: good vs. bad topics
1230  avg_coherence += coherence;
1231  }
1232 
1233  avg_coherence /= l.topics;
1234 
1235  printf("Avg topic coherence: %f\n", avg_coherence);
1236 }
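// Note (not part of lda_core.cc): the per-topic score printed above is a
// UMass-style coherence over the topic's top-10 words,
//   C(t) = sum over word pairs (w_i, w_j) of log((#docs containing both + epsilon) / count(w_i)),
// where the shared-document counts come from intersecting feature_to_example_map
// lists and count(w_i) from feature_counts, both filled in learn_with_metrics.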
1237 
1238 void compute_coherence_metrics(lda &l)
1239 {
1240  if (l.all->weights.sparse)
1241  compute_coherence_metrics(l, l.all->weights.sparse_weights);
1242  else
1243  compute_coherence_metrics(l, l.all->weights.dense_weights);
1244 }
1245 
1246 void end_pass(lda &l)
1247 {
1248  if (!l.examples.empty())
1249  learn_batch(l);
1250 
1251  if (l.compute_coherence_metrics && l.all->passes_complete == l.all->numpasses)
1252  {
1253  compute_coherence_metrics(l);
1254  // FASTPASS return;
1255  }
1256 }
1257 
1258 template <class T>
1259 void end_examples(lda &l, T &weights)
1260 {
1261  for (typename T::iterator iter = weights.begin(); iter != weights.end(); ++iter)
1262  {
1263  float decay_component =
1264  l.decay_levels.last() - l.decay_levels.end()[(int)(-1 - l.example_t + (&(*iter))[l.all->lda])];
1265  float decay = fmin(1.f, correctedExp(decay_component));
1266 
1267  weight *wp = &(*iter);
1268  for (size_t i = 0; i < l.all->lda; ++i) wp[i] *= decay;
1269  }
1270 }
1271 
1272 void end_examples(lda &l)
1273 {
1274  if (l.all->weights.sparse)
1275  end_examples(l, l.all->weights.sparse_weights);
1276  else
1277  end_examples(l, l.all->weights.dense_weights);
1278 }
1279 
1280 void finish_example(vw &, lda &, example &) {}
1281 
1282 std::istream &operator>>(std::istream &in, lda_math_mode &mmode)
1283 {
1284  using namespace boost::program_options;
1285 
1286  std::string token;
1287  in >> token;
1288  if (token == "simd")
1289  mmode = USE_SIMD;
1290  else if (token == "accuracy" || token == "precise")
1291  mmode = USE_PRECISE;
1292  else if (token == "fast-approx" || token == "approx")
1293  mmode = USE_FAST_APPROX;
1294  else
1295  throw boost::program_options::invalid_option_value(token);
1296  return in;
1297 }
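// Note (not part of lda_core.cc): this extractor maps the tokens "simd",
// "accuracy"/"precise" and "fast-approx"/"approx" onto lda_math_mode values and
// throws invalid_option_value for anything else, so option parsers that read the
// mode by name via operator>> get a clear error on bad input.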
1298 
1299 LEARNER::base_learner *lda_setup(options_i &options, vw &all)
1300 {
1301  auto ld = scoped_calloc_or_throw<lda>();
1302  option_group_definition new_options("Latent Dirichlet Allocation");
1303  int math_mode;
1304  new_options.add(make_option("lda", ld->topics).keep().help("Run lda with <int> topics"))
1305  .add(make_option("lda_alpha", ld->lda_alpha)
1306  .keep()
1307  .default_value(0.1f)
1308  .help("Prior on sparsity of per-document topic weights"))
1309  .add(make_option("lda_rho", ld->lda_rho)
1310  .keep()
1311  .default_value(0.1f)
1312  .help("Prior on sparsity of topic distributions"))
1313  .add(make_option("lda_D", ld->lda_D).default_value(10000.0f).help("Number of documents"))
1314  .add(make_option("lda_epsilon", ld->lda_epsilon).default_value(0.001f).help("Loop convergence threshold"))
1315  .add(make_option("minibatch", ld->minibatch).default_value(1).help("Minibatch size, for LDA"))
1316  .add(make_option("math-mode", math_mode).default_value(USE_SIMD).help("Math mode: simd, accuracy, fast-approx"))
1317  .add(make_option("metrics", ld->compute_coherence_metrics).help("Compute metrics"));
1318  options.add_and_parse(new_options);
1319 
1320  // Convert from int to corresponding enum value.
1321  ld->mmode = static_cast<lda_math_mode>(math_mode);
1322 
1323  if (!options.was_supplied("lda"))
1324  return nullptr;
1325 
1326  all.lda = (uint32_t)ld->topics;
1327  all.delete_prediction = delete_scalars;
1328  ld->sorted_features = std::vector<index_feature>();
1329  ld->total_lambda_init = false;
1330  ld->all = &all;
1331  ld->example_t = all.initial_t;
1332  if (ld->compute_coherence_metrics)
1333  {
1334  ld->feature_counts.resize((uint32_t)(UINT64_ONE << all.num_bits));
1335  ld->feature_to_example_map.resize((uint32_t)(UINT64_ONE << all.num_bits));
1336  }
1337 
1338  float temp = ceilf(logf((float)(all.lda * 2 + 1)) / logf(2.f));
1339 
1340  all.weights.stride_shift((size_t)temp);
1341  all.random_weights = true;
1342  all.add_constant = false;
1343 
1344  if (all.eta > 1.)
1345  {
1346  std::cerr << "your learning rate is too high, setting it to 1" << std::endl;
1347  all.eta = std::min(all.eta, 1.f);
1348  }
1349 
1350  size_t minibatch2 = next_pow2(ld->minibatch);
1351  if (minibatch2 > all.p->ring_size)
1352  {
1353  bool previous_strict_parse = all.p->strict_parse;
1354  delete all.p;
1355  all.p = new parser{minibatch2, previous_strict_parse};
1356  }
1357 
1358  ld->v.resize(all.lda * ld->minibatch);
1359 
1360  ld->decay_levels.push_back(0.f);
1361 
1362  all.p->lp = no_label::no_label_parser;
1363 
1364  LEARNER::learner<lda, example> &l = init_learner(ld, ld->compute_coherence_metrics ? learn_with_metrics : learn,
1365  ld->compute_coherence_metrics ? predict_with_metrics : predict, UINT64_ONE << all.weights.stride_shift(),
1366  prediction_type::scalars);
1367 
1368  l.set_save_load(save_load);
1369  l.set_finish_example(finish_example);
1370  l.set_end_examples(end_examples);
1371  l.set_end_pass(end_pass);
1372 
1373  return make_base(l);
1374 }
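// Illustrative usage (not part of lda_core.cc): a typical invocation of this
// reduction with the options registered above might be
//   vw --lda 100 --lda_alpha 0.1 --lda_rho 0.1 --lda_D 50000 --minibatch 256 corpus.vw
// which trains 100 topics on minibatches of 256 documents, assuming corpus.vw holds
// one document per line in VW's example format.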
Definition: example.h:76