Commit 62174c3

Refactor parallel DNN by removing unused structs
1 parent 5f51aa0 commit 62174c3

4 files changed: 4 additions & 240 deletions


benchmark/parallel_dnn/dnn.hpp

Lines changed: 1 addition & 173 deletions
@@ -170,172 +170,6 @@ inline void deactivate(Eigen::MatrixXf& mat, Activation act) {
 }
 
 
-
-struct MNIST {
-
-  // Ctor
-  MNIST() {
-    std::string path = std::experimental::filesystem::current_path();
-    //path = path.substr(0, path.rfind("cpp-taskflow") + 12);
-    //path += "/benchmark/mnist/";
-
-    images = read_mnist_image("./train-images.data");
-    labels = read_mnist_label("./train-labels.data");
-
-    test_images = read_mnist_image("./t10k-images-idx3-ubyte");
-    test_labels = read_mnist_label("./t10k-labels-idx1-ubyte");
-  }
-
-  void add_layer(size_t in_degree, size_t out_degree, Activation act) {
-    acts.emplace_back(act);
-    Ys.emplace_back().resize(batch_size, out_degree);
-    Ws.push_back(Eigen::MatrixXf::Random(in_degree, out_degree));
-    Bs.push_back(Eigen::MatrixXf::Random(1, out_degree));
-
-    dW.emplace_back().resize(in_degree, out_degree);
-    dB.emplace_back().resize(1, out_degree);
-  }
-
-  void forward(size_t layer, const Eigen::MatrixXf& mat) {
-    Ys[layer] = mat * Ws[layer] + Bs[layer].replicate(mat.rows(), 1);
-    activate(Ys[layer], acts[layer]);
-  }
-
-  void loss(const Eigen::VectorXi& labels) {
-    delta = Ys.back();
-    delta = (delta - delta.rowwise().maxCoeff().replicate(1, delta.cols())).array().exp().matrix();
-    delta = delta.cwiseQuotient(delta.rowwise().sum().replicate(1, delta.cols()));
-    for(size_t i=beg_row, j=0; j<batch_size; i++, j++) {
-      delta(j, labels[i]) -= 1.0;
-    }
-  }
-
-  void backward(size_t layer, const Eigen::MatrixXf& Xin) {
-    deactivate(Ys[layer], acts[layer]);
-    delta = delta.cwiseProduct(Ys[layer]);
-    //std::cout << Xin.rows() << "/" << Xin.cols() << " = " << delta.rows() << "/" << delta.cols() << std::endl;
-    dB[layer] = delta.colwise().sum();
-    dW[layer] = Xin.transpose() * delta;
-    //dW[layer] = Xin * delta;
-
-    if(layer > 0) {
-      delta = delta * Ws[layer].transpose();
-    }
-  }
-
-  void update(size_t layer) {
-    Ws[layer] -= lrate*(dW[layer] + decay*Ws[layer]);
-    Bs[layer] -= lrate*(dB[layer] + decay*Bs[layer]);
-  }
-
-  void shuffle(Eigen::MatrixXf& mat, Eigen::VectorXi& vec, const size_t row_num) {
-
-    static thread_local std::mt19937 gen(0);
-
-    Eigen::PermutationMatrix<Eigen::Dynamic, Eigen::Dynamic> p(row_num);
-    p.setIdentity();
-    std::shuffle(p.indices().data(), p.indices().data() + p.indices().size(), gen);
-
-    mat = p * mat;
-    vec = p * vec;
-  }
-
-  void validate() {
-    Eigen::MatrixXf res = test_images;
-    //auto t1 = std::chrono::high_resolution_clock::now();
-    for(size_t i=0; i<acts.size(); i++) {
-      res = res * Ws[i] + Bs[i].replicate(res.rows(), 1);
-      if(acts[i] == Activation::RELU) {
-        relu(res);
-      }
-      else if(acts[i] == Activation::SIGMOID) {
-        sigmoid(res);
-      }
-    }
-    //auto t2 = std::chrono::high_resolution_clock::now();
-    //std::cout << "Infer runtime: " << time_diff(t1, t2) << " ms\n";
-
-    size_t correct_num {0};
-    for(int k=0; k<res.rows(); k++) {
-      int pred;
-      res.row(k).maxCoeff(&pred);
-      if(pred == test_labels[k]) {
-        correct_num++;
-      }
-    }
-    //std::cout << "Accuracy: " << correct_num << '/' << res.rows() << '\n';
-  }
-
-
-  // Parameter functions ------------------------------------------------------
-  auto& epoch_num(unsigned e) {
-    epoch = e;
-    return *this;
-  }
-  auto& batch(size_t b) {
-    batch_size = b;
-    assert(images.rows()%batch_size == 0);
-    return *this;
-  }
-  auto& learning_rate(float l) {
-    lrate = l;
-    return *this;
-  }
-
-  std::vector<Eigen::MatrixXf> Ys;
-  std::vector<Eigen::MatrixXf> Ws;
-  std::vector<Eigen::MatrixXf> Bs;
-  std::vector<Eigen::MatrixXf> dW;
-  std::vector<Eigen::MatrixXf> dB;
-
-  std::vector<Activation> acts;
-
-  // Training images # = 60000 x 784 (28 x 28)
-  Eigen::MatrixXf images;
-  Eigen::VectorXi labels;
-  Eigen::MatrixXf delta;
-
-  // Testing images # = 10000 x 784 (28 x 28)
-  Eigen::MatrixXf test_images;
-  Eigen::VectorXi test_labels;
-
-  int beg_row {0};
-
-  float lrate {0.01f};
-  float decay {0.01f};
-
-  unsigned epoch {0};
-  size_t batch_size {1};
-};
-
-inline auto build_dnn(unsigned epoch) {
-  MNIST dnn;
-  dnn.epoch_num(epoch).batch(60).learning_rate(0.001);
-
-  //dnn.add_layer(784, 64, Activation::RELU);
-  //dnn.add_layer(64, 32, Activation::RELU);
-  //dnn.add_layer(32, 10, Activation::NONE);
-
-  //dnn.add_layer(784, 64, Activation::RELU);
-  //dnn.add_layer(64, 32, Activation::RELU);
-  //dnn.add_layer(32, 16, Activation::RELU);
-  //dnn.add_layer(16, 8, Activation::RELU);
-  //dnn.add_layer(8, 10, Activation::NONE);
-
-  //dnn.add_layer(784, 256, Activation::RELU);
-  //dnn.add_layer(256, 128, Activation::RELU);
-  //dnn.add_layer(128, 64, Activation::RELU);
-  //dnn.add_layer(64, 32, Activation::RELU);
-  //dnn.add_layer(32, 10, Activation::NONE);
-
-  dnn.add_layer(784, 100, Activation::RELU);
-  dnn.add_layer(100, 30, Activation::RELU);
-  dnn.add_layer(30, 10, Activation::NONE);
-
-  return dnn;
-}
-
-
 // ----------------------------------------------------------------------------
 
 struct MNIST_DNN {
@@ -544,11 +378,5 @@ inline void report_runtime(std::chrono::time_point<std::chrono::high_resolution_
 void run_tbb(unsigned, unsigned);
 void run_taskflow(unsigned, unsigned);
 void run_omp(unsigned, unsigned);
-
-//void run_omp(MNIST&, unsigned);
-void run_sequential(MNIST&, unsigned);
-void run_sequential(MNIST_DNN&, unsigned);
-
-//void run_sequential2(MNIST_DNN&, unsigned);
-void run_sequential2(unsigned, unsigned);
+void run_sequential(unsigned, unsigned);
 
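For context on what was removed: MNIST::loss() above is the standard softmax cross-entropy gradient. Subtracting the row maximum keeps exp() from overflowing, and subtracting 1 at each true-label column turns the softmax output directly into d(loss)/d(logits). A minimal standalone sketch, assuming Eigen 3.x; the function name is illustrative, not part of the codebase:

#include <Eigen/Dense>

// d(cross-entropy)/d(logits) for one mini-batch:
// softmax(logits) - one_hot(label), row by row.
Eigen::MatrixXf softmax_xent_grad(const Eigen::MatrixXf& logits,
                                  const Eigen::VectorXi& labels) {
  // Row-wise softmax; shifting by the row max avoids overflow in exp().
  Eigen::MatrixXf d =
      (logits - logits.rowwise().maxCoeff().replicate(1, logits.cols()))
          .array().exp().matrix();
  d = d.cwiseQuotient(d.rowwise().sum().replicate(1, d.cols()));
  // Subtract the one-hot target: gradient of -log(softmax) w.r.t. logits.
  for(int r = 0; r < d.rows(); r++) {
    d(r, labels[r]) -= 1.0f;
  }
  return d;
}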

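Likewise, the removed backward()/update() pair is plain backpropagation with SGD plus L2 weight decay: dW = X^T * delta, dB is the column sums of delta, the error passed to the previous layer is delta * W^T (computed before W changes), and each parameter steps by lrate * (gradient + decay * parameter). A hedged sketch of one layer's step, again assuming Eigen 3.x with illustrative names; unlike the removed code, it assumes the activation derivative has already been folded into delta:

#include <Eigen/Dense>

// One layer of backprop + SGD with L2 weight decay, mirroring the
// removed backward()/update().
void backward_update(Eigen::MatrixXf& W, Eigen::MatrixXf& B,
                     const Eigen::MatrixXf& X, Eigen::MatrixXf& delta,
                     float lrate, float decay) {
  const Eigen::MatrixXf dW = X.transpose() * delta;  // dL/dW
  const Eigen::MatrixXf dB = delta.colwise().sum();  // dL/dB, 1 x out_degree
  delta = delta * W.transpose();  // error for the previous layer, using old W
  W -= lrate * (dW + decay * W);  // SGD step with L2 weight decay
  B -= lrate * (dB + decay * B);
}
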
benchmark/parallel_dnn/omp.cpp

Lines changed: 0 additions & 2 deletions
@@ -124,8 +124,6 @@ void run_omp(unsigned num_epochs, unsigned num_threads) {
 
 
 
-void run_omp(MNIST& D, unsigned num_threads) {
-}
 
 /*
 void run_omp(MNIST& D, unsigned num_threads) {

benchmark/parallel_dnn/seq.cpp

Lines changed: 3 additions & 63 deletions
@@ -1,5 +1,6 @@
 #include "dnn.hpp"
 
+/*
 void run_sequential(MNIST& D, unsigned num_threads) {
 
   const auto iter_num = D.images.rows()/D.batch_size;
@@ -48,71 +49,10 @@ void run_sequential(MNIST& D, unsigned num_threads) {
     D.shuffle(D.images, D.labels, D.images.rows());
   } // End of epoch
 }
+*/
 
 
-
-
-void run_sequential(MNIST_DNN& D, unsigned num_threads) {
-
-  const auto iter_num = IMAGES.rows()/D.batch_size;
-
-  std::cout << D.epoch << std::endl;
-  std::cout << iter_num << std::endl;
-  std::cout << D.batch_size << std::endl;
-  D.epoch = 20;
-
-  for(auto e=0u; e<D.epoch; e++) {
-    for(auto it=0u; it<iter_num; it++) {
-      // Forward propagation
-      for(size_t i=0; i<D.acts.size(); i++) {
-        if(i == 0){
-          D.forward(i, IMAGES.middleRows(D.beg_row, D.batch_size));
-        }
-        else {
-          D.forward(i, D.Ys[i-1]);
-        }
-      }
-
-      // Calculate loss
-      D.loss(LABELS);
-
-      // Backward propagation
-      for(int i=D.acts.size()-1; i>=0; i--) {
-        if(i > 0) {
-          //D.backward(i, D.Ys[i-1].transpose());
-          D.backward(i, D.Ys[i-1]);
-        }
-        else {
-          //D.backward(i, D.images.middleRows(D.beg_row, D.batch_size).transpose());
-          D.backward(i, IMAGES.middleRows(D.beg_row, D.batch_size));
-        }
-      }
-
-      // Update parameters
-      for(int i=D.acts.size()-1; i>=0; i--) {
-        D.update(i);
-      }
-
-      // Get next batch
-      D.beg_row += D.batch_size;
-      if(D.beg_row >= IMAGES.rows()) {
-        D.beg_row = 0;
-      }
-    } // End of iterations
-
-    // Shuffle input
-    shuffle(IMAGES, LABELS);
-
-    D.validate(TEST_IMAGES, TEST_LABELS);
-
-  } // End of epoch
-}
-
-
-
-
-//void run_sequential2(MNIST_DNN& D, unsigned num_threads) {
-void run_sequential2(unsigned num_epochs, unsigned num_threads) {
+
+void run_sequential(unsigned num_epochs, unsigned num_threads) {
 
   MNIST_DNN D;
   init_dnn(D);
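The epoch-end shuffle(IMAGES, LABELS) call in the removed loop (like MNIST::shuffle() in dnn.hpp) uses Eigen's PermutationMatrix trick: shuffle the identity permutation's index array once, then left-multiply both matrices, so images and labels receive the same random row order. A minimal sketch, assuming Eigen 3.x; shuffle_rows is an illustrative name, and the fixed seed matches the removed code's deterministic std::mt19937 gen(0):

#include <Eigen/Dense>
#include <algorithm>
#include <random>

// Shuffle rows of mat and entries of vec with one shared permutation,
// so every image row keeps its label.
void shuffle_rows(Eigen::MatrixXf& mat, Eigen::VectorXi& vec) {
  static thread_local std::mt19937 gen(0);  // fixed seed, as in the removed code
  Eigen::PermutationMatrix<Eigen::Dynamic, Eigen::Dynamic> p(mat.rows());
  p.setIdentity();
  std::shuffle(p.indices().data(),
               p.indices().data() + p.indices().size(), gen);
  mat = p * mat;  // left-multiplying by P permutes rows
  vec = p * vec;
}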

benchmark/parallel_dnn/taskflow.cpp

Lines changed: 0 additions & 2 deletions
@@ -13,8 +13,6 @@ struct TF_DNNTrainingPattern : public tf::Framework {
     dnn.validate(mat, vec);
   }
 
-
-
   void build_task_graph() {
     auto f_task = emplace(
       [&]() { forward_task(dnn, IMAGES, LABELS); }
