FFM CPU
mdymczyk committed Jun 13, 2018
1 parent 665237a commit 1732077
Showing 9 changed files with 229 additions and 115 deletions.
19 changes: 18 additions & 1 deletion src/base/ffm/batching.h
@@ -5,6 +5,7 @@
#pragma once

#include "../../include/data/ffm/data.h"
#include "../../include/solver/ffm_api.h"
#include "../../common/logger.h"

namespace ffm {
@@ -66,6 +67,8 @@ class DatasetBatcher {

DatasetBatcher(int numRows) : numRows(numRows) {}

DatasetBatcher(Dataset<T> &dataset, Params const &params, int rows) : dataset(&dataset), numRows(rows) {}

bool hasNext() const {
return pos < numRows;
}
@@ -78,7 +81,21 @@
pos = 0;
}

-virtual DatasetBatch<T> *nextBatch(int batchSize) {}
+virtual DatasetBatch<T> *nextBatch(int batchSize) {
int actualBatchSize = batchSize <= this->remaining() && batchSize > 0 ? batchSize : this->remaining();

int moveBy = this->dataset->rowPositions[this->pos];
DatasetBatch<T> *batch = new DatasetBatch<T>(this->dataset->features + moveBy,
this->dataset->fields + moveBy,
this->dataset->values + moveBy,
this->dataset->labels + this->pos,
this->dataset->scales + this->pos,
this->dataset->rowPositions + this->pos,
actualBatchSize);
this->pos = this->pos + actualBatchSize;

return batch;
}

bool empty() {
return numRows <= 0;
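The batcher treats the dataset as CSR-style arrays: rowPositions holds, for each row, the offset of its first non-zero in the parallel features/fields/values arrays, so nextBatch only moves pointers and copies nothing. A minimal usage sketch, assuming a populated Dataset<float> data and a Params params (neither is constructed in this diff):

    ffm::DatasetBatcher<float> batcher(data, params, params.numRows);
    while (batcher.hasNext()) {
      ffm::DatasetBatch<float> *batch = batcher.nextBatch(params.batchSize);
      // consume batch->features / batch->fields / batch->values here
      delete batch;  // nextBatch allocates each batch with new
    }
    batcher.reset();  // rewind so a later epoch can re-read the rows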
4 changes: 2 additions & 2 deletions src/base/ffm/ffm.cpp
@@ -26,12 +26,12 @@ int FFM<T>::fit(Dataset<T> &dataset, Dataset<T> &valid_dataset) {
for (; epoch <= this->params.nIter; epoch++) {
log_info(this->params.verbose, "Iteration %d/%d.", epoch, this->params.nIter);
timer.tic();
-T trainingLoss = trainer.trainOneEpoch();
+double trainingLoss = trainer.trainOneEpoch();

log_info(this->params.verbose, "Train log loss = %f", trainingLoss);

if(this->validate()) {
-T validationLoss = trainer.validationLoss();
+double validationLoss = trainer.validationLoss();

log_info(this->params.verbose, "Validation log loss = %f", validationLoss);

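This T → double change (echoed in trainer.h and trainer.cpp below) widens only the loss accumulators: with T = float, summing one log-loss term per row across millions of rows drops low-order bits once the running sum dwarfs each addend. A standalone illustration of the effect, not part of the commit:

    #include <cstdio>

    int main() {
      float f = 0.0f;
      double d = 0.0;
      for (int i = 0; i < 10000000; i++) {  // ten million log(2)-sized loss terms
        f += 0.69314718f;
        d += 0.69314718;
      }
      std::printf("float:  %f\n", f);  // drifts visibly from the true sum 6931471.8
      std::printf("double: %f\n", d);
      return 0;
    }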
6 changes: 3 additions & 3 deletions src/base/ffm/trainer.h
@@ -22,11 +22,11 @@ class Trainer {
void setTrainingDataset(Dataset<T> &dataset);
void setValidationDataset(Dataset<T> &dataset);

-T validationLoss();
+double validationLoss();

-T trainOneEpoch();
+double trainOneEpoch();

-T oneEpoch(std::vector<DatasetBatcher<T> *> dataBatcher, bool update);
+double oneEpoch(std::vector<DatasetBatcher<T> *> dataBatcher, bool update);

void predict(T *predictions);

158 changes: 147 additions & 11 deletions src/cpu/ffm/trainer.cpp
@@ -7,36 +7,172 @@
namespace ffm {

template<typename T>
-Trainer<T>::Trainer(Params &params) : params(params) {
-  // TODO implement
+Trainer<T>::Trainer(Params &params) : params(params), trainDataBatcher(1), validationDataBatcher(1) {
+  this->model = new Model<T>(params);
}

template<typename T>
-Trainer<T>::Trainer(const T* weights, Params &params) : params(params) {
-  // TODO implement
+Trainer<T>::Trainer(const T* weights, Params &params) : params(params),
+                                                         trainDataBatcher(1),
+                                                         validationDataBatcher(1) {
+  this->model = new Model<T>(params, weights);
}

template<typename T>
void Trainer<T>::setTrainingDataset(Dataset<T> &dataset) {
-  // TODO implement
+  DatasetBatcher<T> *batcher = new DatasetBatcher<T>(dataset, params, params.numRows);
+  trainDataBatcher[0] = batcher;
}

template<typename T>
void Trainer<T>::setValidationDataset(Dataset<T> &dataset) {
-  // TODO implement
+  DatasetBatcher<T> *batcher = new DatasetBatcher<T>(dataset, params, params.numRowsVal);
+  validationDataBatcher[0] = batcher;
}

template<typename T>
Trainer<T>::~Trainer() {
delete trainDataBatcher[0];
delete validationDataBatcher[0];
delete model;
}

// Original code at https://github.com/guestwalk/libffm
template<typename T>
inline double wTx(
int start, int end,
const int *__restrict__ features, const int *__restrict__ fields, const T *__restrict__ values, const T r,
T *__restrict__ weights,
int kALIGN, int k, int numFields, float lambda, float eta, T kappa, const bool update) {
int align0 = kALIGN * k;
int align1 = numFields * align0;

double t = 0;
for (int n1 = start; n1 < end; n1++) {
int j1 = features[n1];
int f1 = fields[n1];
T v1 = values[n1];

for (int n2 = n1 + 1; n2 < end; n2++) {
int j2 = features[n2];
int f2 = fields[n2];
T v2 = values[n2];

int idx1 = (int) j1 * align1 + f2 * align0;
int idx2 = (int) j2 * align1 + f1 * align0;
T *w1 = weights + idx1;
T *w2 = weights + idx2;

double v = v1 * v2 * r;

if (update) {
T *wg1 = w1 + 1;
T *wg2 = w2 + 1;

for (int d = 0; d < align0; d += kALIGN) {
T g1 = lambda * w1[d] + kappa * w2[d] * v;
T g2 = lambda * w2[d] + kappa * w1[d] * v;

wg1[d] += g1 * g1;
wg2[d] += g2 * g2;

w1[d] -= eta / std::sqrt(wg1[d]) * g1;
w2[d] -= eta / std::sqrt(wg2[d]) * g2;

}
} else {
for (int d = 0; d < align0; d += kALIGN) {
t += w1[d] * w2[d] * v;
}
}
}
}

return t;
}
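In equations, wTx computes the libffm-style pairwise score over the non-zeros [start, end) of a single row and, when update is true, applies one AdaGrad step per latent coordinate. With the code's names (lambda = λ, eta = η, kappa = κ, r the row scale, and v = v1·v2·r):

    t = \sum_{n_1 < n_2} \langle w_{j_1,f_2}, w_{j_2,f_1} \rangle \, v_1 v_2 \, r

    g_1 = \lambda w_{j_1,f_2} + \kappa v \, w_{j_2,f_1}, \qquad G_1 \mathrel{+}= g_1^2, \qquad w_{j_1,f_2} \mathrel{-}= \frac{\eta}{\sqrt{G_1}} \, g_1

and symmetrically for w_{j_2,f_1}. The kALIGN stride reflects the interleaved weight layout: each weight sits next to its squared-gradient accumulator, which is why wg1 = w1 + 1 and the loop steps by kALIGN.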

template<typename T>
void Trainer<T>::predict(T *predictions) {
-  // TODO implement
+  double loss = 0;

while (this->trainDataBatcher[0]->hasNext()) {
DatasetBatch<T> *batch = this->trainDataBatcher[0]->nextBatch(this->params.batchSize);

T *weightsPtr = this->model->weights.data();

// Convert global row positions to batch-local indexing
int offset = batch->rowPositions[0];
#pragma omp parallel for
for(int row = 0; row < batch->numRows; row++) {
T t = wTx(
batch->rowPositions[row] - offset, batch->rowPositions[row + 1] - offset,
batch->features, batch->fields, batch->values, batch->scales[row],
weightsPtr, 1, params.k, params.numFields, params.regLambda, params.learningRate, (T)0, false);

predictions[row] = 1.0 / (1.0 + std::exp(-t));

}
delete batch;
}

this->trainDataBatcher[0]->reset();
}

template<typename T>
double Trainer<T>::validationLoss() {
return this->oneEpoch(this->validationDataBatcher, false);
}

template<typename T>
-T Trainer<T>::trainOneEpoch() {
-  // TODO implement
+double Trainer<T>::trainOneEpoch() {
return this->oneEpoch(this->trainDataBatcher, true);
}

template<typename T>
double Trainer<T>::oneEpoch(std::vector<DatasetBatcher<T>*> dataBatcher, bool update) {
log_debug(this->params.verbose, "Computing an FFM epoch (update = %s)", update ? "true" : "false");

double loss = 0;

while (dataBatcher[0]->hasNext()) {
DatasetBatch<T> *batch = dataBatcher[0]->nextBatch(this->params.batchSize);

T *weightsPtr = this->model->weights.data();

// Convert global row positions to batch-local indexing
int offset = batch->rowPositions[0];
#pragma omp parallel for schedule(static) reduction(+: loss)
for(int row = 0; row < batch->numRows; row++) {
double t = wTx(
batch->rowPositions[row] - offset, batch->rowPositions[row + 1] - offset,
batch->features, batch->fields, batch->values, batch->scales[row],
weightsPtr, 2, params.k, params.numFields, params.regLambda, params.learningRate, (T)0, false);

int y = batch->labels[row];

T expnyt = std::exp(-y*t);

loss += std::log(1+expnyt);

if (update) {
T kappa = -y * expnyt/(1+expnyt);

wTx(batch->rowPositions[row] - offset, batch->rowPositions[row + 1] - offset,
batch->features, batch->fields, batch->values, batch->scales[row],
weightsPtr, 2, params.k, params.numFields, params.regLambda, params.learningRate, kappa, true);
}
}
delete batch;
}

dataBatcher[0]->reset();

return loss / params.numRows;
}
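With labels y ∈ {−1, +1} (hence expnyt = exp(−y·t) above), the return value is the mean logistic loss; predict() applies the matching logistic link, and kappa is the loss gradient in t:

    L = \frac{1}{N} \sum_{i=1}^{N} \log\!\left(1 + e^{-y_i t_i}\right), \qquad p_i = \frac{1}{1 + e^{-t_i}}, \qquad \kappa_i = \frac{-y_i e^{-y_i t_i}}{1 + e^{-y_i t_i}}

The parallel loop is Hogwild-style, as in the original libffm: the OpenMP reduction protects only loss, while concurrent wTx calls update the shared weights without locks.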

-template class Trainer<float>;
-template class Trainer<double>;
+template
+class Trainer<float>;
+template
+class Trainer<double>;

}
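Taken together, the call sequence mirrors FFM<T>::fit() in ffm.cpp. A sketch, assuming train and valid are populated Dataset<float> instances constructed elsewhere:

    #include <vector>

    ffm::Params params;                  // k, numFields, learningRate, regLambda, nIter, batchSize, ...
    ffm::Trainer<float> trainer(params);
    trainer.setTrainingDataset(train);   // wraps the dataset in a DatasetBatcher
    trainer.setValidationDataset(valid);
    for (int epoch = 1; epoch <= params.nIter; epoch++) {
      double trainLoss = trainer.trainOneEpoch();   // full pass with AdaGrad updates
      double validLoss = trainer.validationLoss();  // full pass, no weight updates
    }
    std::vector<float> preds(params.numRows);
    trainer.predict(preds.data());       // logistic probabilities, one per training row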