Diffstat (limited to 'src/neuralNetwork.h')
-rw-r--r-- | src/neuralNetwork.h | 319 |
1 file changed, 159 insertions, 160 deletions
diff --git a/src/neuralNetwork.h b/src/neuralNetwork.h index ef96488..6386a0f 100644 --- a/src/neuralNetwork.h +++ b/src/neuralNetwork.h @@ -3,7 +3,6 @@ #include <vector> #include <boost/shared_ptr.hpp> -//#include <../3rdparty/Eigen/Dense> #include <Eigen/Dense> #include "util.h" @@ -16,191 +15,191 @@ namespace nplm class neuralNetwork { -protected: - boost::shared_ptr<model> m; + protected: + boost::shared_ptr<model> m; -private: - bool normalization; - double weight; + private: + bool normalization; + double weight; - propagator prop; + propagator prop; - std::size_t cache_size; - Eigen::Matrix<int,Dynamic,Dynamic> cache_keys; - std::vector<double> cache_values; - int cache_lookups, cache_hits; + std::size_t cache_size; + Eigen::Matrix<int,Dynamic,Dynamic> cache_keys; + std::vector<double> cache_values; + int cache_lookups, cache_hits; -public: - neuralNetwork() + public: + neuralNetwork() : m(new model()), normalization(false), - weight(1.), - prop(*m, 1), + weight(1.), + prop(*m, 1), cache_size(0) - { - } + { + } - void set_normalization(bool value) { normalization = value; } - void set_log_base(double value) { weight = 1./std::log(value); } - - // This must be called if the underlying model is resized. - void resize() { - if (cache_size) - { - cache_keys.resize(m->ngram_size, cache_size); - cache_keys.fill(-1); - } - prop.resize(); - } + void set_normalization(bool value) { normalization = value; } + void set_log_base(double value) { weight = 1./std::log(value); } - void set_width(int width) + // This must be called if the underlying model is resized. + void resize() { + if (cache_size) { - prop.resize(width); + cache_keys.resize(m->ngram_size, cache_size); + cache_keys.fill(-1); } - - template <typename Derived> - double lookup_ngram(const Eigen::MatrixBase<Derived> &ngram) + prop.resize(); + } + + void set_width(int width) + { + prop.resize(width); + } + + template <typename Derived> + double lookup_ngram(const Eigen::MatrixBase<Derived> &ngram) + { + assert (ngram.rows() == m->ngram_size); + assert (ngram.cols() == 1); + + std::size_t hash; + if (cache_size) { - assert (ngram.rows() == m->ngram_size); - assert (ngram.cols() == 1); - - std::size_t hash; - if (cache_size) - { - // First look in cache - hash = Eigen::hash_value(ngram) % cache_size; // defined in util.h - cache_lookups++; - if (cache_keys.col(hash) == ngram) - { - cache_hits++; - return cache_values[hash]; - } - } - - // Make sure that we're single threaded. 
Multithreading doesn't help, - // and in some cases can hurt quite a lot - int save_threads = omp_get_max_threads(); - omp_set_num_threads(1); - int save_eigen_threads = Eigen::nbThreads(); - Eigen::setNbThreads(1); - #ifdef __INTEL_MKL__ - int save_mkl_threads = mkl_get_max_threads(); - mkl_set_num_threads(1); - #endif - - prop.fProp(ngram.col(0)); - - int output = ngram(m->ngram_size-1, 0); - double log_prob; - - start_timer(3); - if (normalization) - { - Eigen::Matrix<double,Eigen::Dynamic,1> scores(m->output_vocab_size); - if (prop.skip_hidden) - prop.output_layer_node.param->fProp(prop.first_hidden_activation_node.fProp_matrix, scores); - else - prop.output_layer_node.param->fProp(prop.second_hidden_activation_node.fProp_matrix, scores); - double logz = logsum(scores.col(0)); - log_prob = weight * (scores(output, 0) - logz); - } - else - { - if (prop.skip_hidden) - log_prob = weight * prop.output_layer_node.param->fProp(prop.first_hidden_activation_node.fProp_matrix, output, 0); - else - log_prob = weight * prop.output_layer_node.param->fProp(prop.second_hidden_activation_node.fProp_matrix, output, 0); - } - stop_timer(3); - - if (cache_size) - { - // Update cache - cache_keys.col(hash) = ngram; - cache_values[hash] = log_prob; - } - - #ifdef __INTEL_MKL__ - mkl_set_num_threads(save_mkl_threads); - #endif - Eigen::setNbThreads(save_eigen_threads); - omp_set_num_threads(save_threads); - - return log_prob; + // First look in cache + hash = Eigen::hash_value(ngram) % cache_size; // defined in util.h + cache_lookups++; + if (cache_keys.col(hash) == ngram) + { + cache_hits++; + return cache_values[hash]; + } } - // Look up many n-grams in parallel. - template <typename DerivedA, typename DerivedB> - void lookup_ngram(const Eigen::MatrixBase<DerivedA> &ngram, const Eigen::MatrixBase<DerivedB> &log_probs_const) - { - UNCONST(DerivedB, log_probs_const, log_probs); - assert (ngram.rows() == m->ngram_size); - //assert (ngram.cols() <= prop.get_minibatch_size()); - - prop.fProp(ngram); - - if (normalization) - { - Eigen::Matrix<double,Eigen::Dynamic,Eigen::Dynamic> scores(m->output_vocab_size, ngram.cols()); - if (prop.skip_hidden) - prop.output_layer_node.param->fProp(prop.first_hidden_activation_node.fProp_matrix, scores); - else - prop.output_layer_node.param->fProp(prop.second_hidden_activation_node.fProp_matrix, scores); - - // And softmax and loss - Matrix<double,Dynamic,Dynamic> output_probs(m->output_vocab_size, ngram.cols()); - double minibatch_log_likelihood; - SoftmaxLogLoss().fProp(scores.leftCols(ngram.cols()), ngram.row(m->ngram_size-1), output_probs, minibatch_log_likelihood); - for (int j=0; j<ngram.cols(); j++) - { - int output = ngram(m->ngram_size-1, j); - log_probs(0, j) = weight * output_probs(output, j); - } - } - else - { - for (int j=0; j<ngram.cols(); j++) - { - int output = ngram(m->ngram_size-1, j); - if (prop.skip_hidden) - log_probs(0, j) = weight * prop.output_layer_node.param->fProp(prop.first_hidden_activation_node.fProp_matrix, output, j); - else - log_probs(0, j) = weight * prop.output_layer_node.param->fProp(prop.second_hidden_activation_node.fProp_matrix, output, j); - } - } - } + // Make sure that we're single threaded. 
Multithreading doesn't help, + // and in some cases can hurt quite a lot + int save_threads = omp_get_max_threads(); + omp_set_num_threads(1); + int save_eigen_threads = Eigen::nbThreads(); + Eigen::setNbThreads(1); +#ifdef __INTEL_MKL__ + int save_mkl_threads = mkl_get_max_threads(); + mkl_set_num_threads(1); +#endif + + prop.fProp(ngram.col(0)); - int get_order() const { return m->ngram_size; } + int output = ngram(m->ngram_size-1, 0); + double log_prob; - void read(const std::string &filename) + start_timer(3); + if (normalization) { - m->read(filename); - resize(); - // this is faster but takes more memory - //m->premultiply(); + Eigen::Matrix<double,Eigen::Dynamic,1> scores(m->output_vocab_size); + if (prop.skip_hidden) + prop.output_layer_node.param->fProp(prop.first_hidden_activation_node.fProp_matrix, scores); + else + prop.output_layer_node.param->fProp(prop.second_hidden_activation_node.fProp_matrix, scores); + double logz = logsum(scores.col(0)); + log_prob = weight * (scores(output, 0) - logz); } - - void set_cache(std::size_t cache_size) + else { - this->cache_size = cache_size; - cache_keys.resize(m->ngram_size, cache_size); - cache_keys.fill(-1); // clears cache - cache_values.resize(cache_size); - cache_lookups = cache_hits = 0; + if (prop.skip_hidden) + log_prob = weight * prop.output_layer_node.param->fProp(prop.first_hidden_activation_node.fProp_matrix, output, 0); + else + log_prob = weight * prop.output_layer_node.param->fProp(prop.second_hidden_activation_node.fProp_matrix, output, 0); } + stop_timer(3); - double cache_hit_rate() + if (cache_size) { - return static_cast<double>(cache_hits)/cache_lookups; + // Update cache + cache_keys.col(hash) = ngram; + cache_values[hash] = log_prob; } - void premultiply() +#ifdef __INTEL_MKL__ + mkl_set_num_threads(save_mkl_threads); +#endif + Eigen::setNbThreads(save_eigen_threads); + omp_set_num_threads(save_threads); + + return log_prob; + } + + // Look up many n-grams in parallel. 
+ template <typename DerivedA, typename DerivedB> + void lookup_ngram(const Eigen::MatrixBase<DerivedA> &ngram, const Eigen::MatrixBase<DerivedB> &log_probs_const) + { + UNCONST(DerivedB, log_probs_const, log_probs); + assert (ngram.rows() == m->ngram_size); + //assert (ngram.cols() <= prop.get_minibatch_size()); + + prop.fProp(ngram); + + if (normalization) + { + Eigen::Matrix<double,Eigen::Dynamic,Eigen::Dynamic> scores(m->output_vocab_size, ngram.cols()); + if (prop.skip_hidden) + prop.output_layer_node.param->fProp(prop.first_hidden_activation_node.fProp_matrix, scores); + else + prop.output_layer_node.param->fProp(prop.second_hidden_activation_node.fProp_matrix, scores); + + // And softmax and loss + Matrix<double,Dynamic,Dynamic> output_probs(m->output_vocab_size, ngram.cols()); + double minibatch_log_likelihood; + SoftmaxLogLoss().fProp(scores.leftCols(ngram.cols()), ngram.row(m->ngram_size-1), output_probs, minibatch_log_likelihood); + for (int j=0; j<ngram.cols(); j++) + { + int output = ngram(m->ngram_size-1, j); + log_probs(0, j) = weight * output_probs(output, j); + } + } + else + { + for (int j=0; j<ngram.cols(); j++) + { + int output = ngram(m->ngram_size-1, j); + if (prop.skip_hidden) + log_probs(0, j) = weight * prop.output_layer_node.param->fProp(prop.first_hidden_activation_node.fProp_matrix, output, j); + else + log_probs(0, j) = weight * prop.output_layer_node.param->fProp(prop.second_hidden_activation_node.fProp_matrix, output, j); + } + } + } + + int get_order() const { return m->ngram_size; } + + void read(const std::string &filename) + { + m->read(filename); + resize(); + // this is faster but takes more memory + //m->premultiply(); + } + + void set_cache(std::size_t cache_size) + { + this->cache_size = cache_size; + cache_keys.resize(m->ngram_size, cache_size); + cache_keys.fill(-1); // clears cache + cache_values.resize(cache_size); + cache_lookups = cache_hits = 0; + } + + double cache_hit_rate() + { + return static_cast<double>(cache_hits)/cache_lookups; + } + + void premultiply() + { + if (!m->premultiplied) { - if (!m->premultiplied) - { - m->premultiply(); - } + m->premultiply(); } + } }; |
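For orientation, the public interface is unchanged by this reindentation, and a minimal usage sketch of the class follows. The model filename, the word indices, and the trigram order are illustrative assumptions, not taken from this diff; in practice the integer indices would come from the model's vocabulary.

// Usage sketch only: "lm.nnlm" and the word indices below are placeholders,
// and a 3-gram model is assumed; none of these specifics appear in this commit.
#include <cassert>
#include <iostream>
#include <Eigen/Dense>
#include "neuralNetwork.h"

int main()
{
    nplm::neuralNetwork lm;
    lm.read("lm.nnlm");          // load the model; read() calls resize() internally
    lm.set_normalization(true);  // normalize scores with a softmax over the output vocabulary
    lm.set_log_base(10.0);       // report log-probabilities in base 10
    lm.set_cache(1 << 20);       // enable the cache keyed by a hash of the n-gram

    assert(lm.get_order() == 3); // the indices below assume a trigram model

    // Single lookup: a column vector of word indices with ngram_size rows,
    // the word to be scored in the last row.
    Eigen::Matrix<int, Eigen::Dynamic, 1> ngram(3);
    ngram << 12, 7, 345;         // hypothetical vocabulary indices
    double logp = lm.lookup_ngram(ngram);
    std::cout << "log10 p = " << logp
              << "  cache hit rate = " << lm.cache_hit_rate() << std::endl;

    // Batch lookup: one n-gram per column; scores are written into a row vector.
    lm.set_width(2);             // make the propagator wide enough for 2 columns
    Eigen::Matrix<int, Eigen::Dynamic, Eigen::Dynamic> ngrams(3, 2);
    ngrams.col(0) = ngram;
    ngrams.col(1) = ngram;
    Eigen::Matrix<double, 1, Eigen::Dynamic> log_probs(1, 2);
    lm.lookup_ngram(ngrams, log_probs);
    std::cout << "batch log10 p = " << log_probs << std::endl;
    return 0;
}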