From 7672fdc62c50ff7bb13586bee6872a8efd98d966 Mon Sep 17 00:00:00 2001
From: Yimin Jiang
Date: Tue, 19 Nov 2019 18:15:47 +0800
Subject: [PATCH] customer: fallback to fifo (#11)

* customer: refactor and reduce cpu load

* initial change

* improve performance

* improve hash and terminate

* cleaning

* fine-grained mutex

* improvement

* fall back to map_mu_

* customer: fallback to fifo

* clean customer.h

* not functional change

* non-functional change
---
 include/ps/internal/customer.h |  23 --
 src/customer.cc                | 419 +--------------------------------
 src/van.cc                     |   2 +-
 3 files changed, 14 insertions(+), 430 deletions(-)
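The substance of the patch is easiest to see on its own: the server-side receive path (per-worker pull threads, a push thread pool, a profiling thread) is deleted, and Customer::Receiving() falls back to a single FIFO consumer that pops recv_queue_ and dispatches messages strictly in arrival order. The stand-alone sketch below mirrors the shape of that restored loop; Message and Queue are simplified stand-ins for ps-lite's Message and ThreadsafeQueue<Message>, not the real classes.

    #include <condition_variable>
    #include <iostream>
    #include <mutex>
    #include <queue>
    #include <thread>

    // Simplified stand-ins for ps-lite's Message and ThreadsafeQueue<Message>.
    struct Message {
      bool terminate = false;  // plays the role of Control::TERMINATE
      int timestamp = 0;
    };

    class Queue {
     public:
      void Push(Message m) {
        { std::lock_guard<std::mutex> lk(mu_); q_.push(std::move(m)); }
        cv_.notify_one();
      }
      void WaitAndPop(Message* m) {
        std::unique_lock<std::mutex> lk(mu_);
        cv_.wait(lk, [this] { return !q_.empty(); });
        *m = std::move(q_.front());
        q_.pop();
      }
     private:
      std::mutex mu_;
      std::condition_variable cv_;
      std::queue<Message> q_;
    };

    int main() {
      Queue recv_queue;
      auto recv_handle = [](const Message& m) {
        std::cout << "handled message ts=" << m.timestamp << "\n";
      };

      // Single FIFO consumer, the same shape as the restored Receiving().
      std::thread receiver([&] {
        while (true) {
          Message recv;
          recv_queue.WaitAndPop(&recv);
          if (recv.terminate) break;  // ps-lite checks Control::TERMINATE here
          recv_handle(recv);
        }
      });

      for (int i = 0; i < 3; ++i) recv_queue.Push({false, i});
      recv_queue.Push({true, -1});  // unblocks and stops the consumer
      receiver.join();
      return 0;
    }

As in ps-lite, the terminate message is the only way the consumer thread exits; everything else is handled in the order it arrived.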
diff --git a/include/ps/internal/customer.h b/include/ps/internal/customer.h
index f25298b66..bdf70a1c9 100644
--- a/include/ps/internal/customer.h
+++ b/include/ps/internal/customer.h
@@ -14,18 +14,6 @@
 #include "ps/internal/message.h"
 #include "ps/internal/threadsafe_queue.h"
 namespace ps {
-
-/**
- * \brief The structure for profiling
- */
-struct Profile {
-  uint64_t key;
-  int sender;
-  bool is_push;
-  std::string ts;
-  bool is_begin;
-};
-
 /**
  * \brief The object for communication.
  *
@@ -100,14 +88,6 @@ class Customer {
     recv_queue_.Push(recved);
   }
 
-  void ProcessPullRequest(int worker_id);
-  void ProcessPushRequest(int thread_id);
-  void ProcessProfileData();
-  bool IsValidPushpull(const Message& msg);
-  uint64_t GetKeyFromMsg(const Message& msg);
-  void ProcessResponse(int thread_id);
-  std::string GetTimestampNow();
-
  private:
   /**
    * \brief the thread function
@@ -126,9 +106,6 @@ class Customer {
   std::condition_variable tracker_cond_;
   std::vector<std::pair<int, int>> tracker_;
 
-  // for storing profile data
-  ThreadsafeQueue<Profile> pdata_queue_;
-
   DISALLOW_COPY_AND_ASSIGN(Customer);
 };
 
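The header keeps the request tracker: tracker_[t].first is the number of responses expected for the request with timestamp t, tracker_[t].second is the number received so far, and tracker_cond_ lets a caller block until the two match. Below is a minimal sketch of that pattern under the usual ps-lite semantics; only AddResponse and the member declarations appear in this patch, so NewRequest and WaitRequest here are illustrative reconstructions rather than the exact library code.

    #include <condition_variable>
    #include <mutex>
    #include <utility>
    #include <vector>

    // Minimal sketch of ps-lite's tracker pattern (not the real Customer):
    // tracker_[t].first  = responses expected for request timestamp t,
    // tracker_[t].second = responses received so far.
    class Tracker {
     public:
      int NewRequest(int expected) {
        std::lock_guard<std::mutex> lk(mu_);
        tracker_.push_back(std::make_pair(expected, 0));
        return static_cast<int>(tracker_.size()) - 1;  // the timestamp
      }
      void AddResponse(int timestamp, int num = 1) {
        std::lock_guard<std::mutex> lk(mu_);
        tracker_[timestamp].second += num;
        cond_.notify_all();
      }
      void WaitRequest(int timestamp) {
        std::unique_lock<std::mutex> lk(mu_);
        cond_.wait(lk, [this, timestamp] {
          return tracker_[timestamp].first == tracker_[timestamp].second;
        });
      }
     private:
      std::mutex mu_;
      std::condition_variable cond_;
      std::vector<std::pair<int, int>> tracker_;
    };

A caller that registered n expected responses via NewRequest(n) can then call WaitRequest(ts) and wakes only after AddResponse has accumulated n responses for that timestamp.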
diff --git a/src/customer.cc b/src/customer.cc
index 606b0ed63..27d8596b0 100644
--- a/src/customer.cc
+++ b/src/customer.cc
@@ -1,5 +1,5 @@
-/** 
- * Copyright (c) 2015 by Contributors 
+/**
+ * Copyright (c) 2015 by Contributors
  */
 #include "ps/internal/customer.h"
 #include "ps/internal/postoffice.h"
@@ -10,33 +10,15 @@
 #include <...>
 #include <...>
 #include <...>
+
 namespace ps {
 const int Node::kEmpty = std::numeric_limits<int>::max();
 const int Meta::kEmpty = std::numeric_limits<int>::max();
-size_t num_worker, num_server;
-std::mutex mu_;
-std::mutex key_mu_;
-std::vector<std::list<Message> > buffered_push_;
-std::vector<std::list<Message> > buffered_pull_;
-std::unordered_map<uint64_t, std::atomic<bool> > is_push_finished_;
-std::unordered_map<uint64_t, std::set<int> > pull_collected_;
-std::vector<std::list<Message> > worker_buffer_;
-
-std::atomic<int> thread_barrier_{0};
-bool enable_profile_ = false;
 
 Customer::Customer(int app_id, int customer_id, const Customer::RecvHandle& recv_handle)
     : app_id_(app_id), customer_id_(customer_id), recv_handle_(recv_handle) {
   Postoffice::Get()->AddCustomer(this);
   recv_thread_ = std::unique_ptr<std::thread>(new std::thread(&Customer::Receiving, this));
-  // get the number of worker
-  const char *val;
-  val = Environment::Get()->find("DMLC_NUM_WORKER");
-  num_worker = atoi(val);
-  CHECK_GE(num_worker, 1);
-  val = Environment::Get()->find("DMLC_NUM_SERVER");
-  num_server = atoi(val);
-  CHECK_GE(num_server, 1);
 }
 
 Customer::~Customer() {
@@ -71,396 +53,21 @@ void Customer::AddResponse(int timestamp, int num) {
   tracker_[timestamp].second += num;
 }
 
-bool Customer::IsValidPushpull(const Message &msg) {
-  if (!msg.meta.control.empty()) return false;
-  if (msg.meta.simple_app) return false;
-  return true;
-}
-
-uint64_t Customer::GetKeyFromMsg(const Message &msg) { // should check if this is valid push/pull
-  CHECK(IsValidPushpull(msg)) << "Perform key derivation on an invalid message";
-  CHECK_GT(msg.data.size(), 0) << "Invalid data message: msg.data.size() is 0";
-  uint64_t key = 0;
-  uint64_t coef = 1;
-  for (unsigned int i = 0; i < msg.data[0].size(); ++i) {
-    key += coef * (uint8_t) msg.data[0].data()[i];
-    coef *= 256; // 256=2^8 (uint8_t)
-  }
-  return key;
-}
-
-void Customer::ProcessPullRequest(int worker_id) {
-  {
-    std::lock_guard<std::mutex> lock(mu_);
-    LOG(INFO) << "Server inits Pull Thread-" << worker_id;
-    thread_barrier_.fetch_add(1);
-  }
-  std::list<Message> pull_consumer;
-  bool should_stop = false;
-  while (!should_stop) {
-    {
-      std::lock_guard<std::mutex> lock(mu_);
-      CHECK_LE((unsigned int) worker_id, buffered_pull_.size()) << worker_id << ", " << buffered_pull_.size();
-      pull_consumer.splice(pull_consumer.end(), buffered_pull_[worker_id]);
-      buffered_pull_[worker_id].clear();
-    }
-    auto it = pull_consumer.begin();
-    while (it != pull_consumer.end()) {
-      Message &msg = *it;
-      if (!msg.meta.control.empty() && msg.meta.control.cmd == Control::TERMINATE) {
-        if (pull_consumer.size() == 1) {
-          should_stop = true;
-          break;
-        }
-        continue; // should first finish the requests that are still in the buffer
-      }
-      CHECK(!msg.meta.push);
-      uint64_t key = GetKeyFromMsg(msg);
-      std::lock_guard<std::mutex> lock(key_mu_);
-      if (is_push_finished_[key].load() && (pull_collected_[key].find(worker_id) == pull_collected_[key].end())) {
-        pull_collected_[key].insert(worker_id);
-        if (pull_collected_[key].size() == (unsigned int) num_worker) {
-          is_push_finished_[key] = false;
-          pull_collected_[key].clear();
-        }
-        recv_handle_(msg);
-        it = pull_consumer.erase(it);
-        if (enable_profile_) {
-          Profile pdata = {key, msg.meta.sender, false, GetTimestampNow(), false};
-          pdata_queue_.Push(pdata);
-        }
-        break;
-      } else {
-        ++it;
-      }
-    }
-  }
-}
-
-void Customer::ProcessPushRequest(int thread_id) {
-  {
-    std::lock_guard<std::mutex> lock(mu_);
-    LOG(INFO) << "Server inits Push Thread-" << thread_id;
-    thread_barrier_.fetch_add(1);
-  }
-  std::unordered_map<uint64_t, int> push_finished_cnt;
-  std::list<Message> push_consumer;
-  bool should_stop = false;
-  while (!should_stop) {
-    {
-      std::lock_guard<std::mutex> lock(mu_);
-      CHECK_LE((unsigned int) thread_id, buffered_push_.size()) << thread_id << ", " << buffered_push_.size();
-      push_consumer.splice(push_consumer.end(), buffered_push_[thread_id]);
-      buffered_push_[thread_id].clear();
-    }
-    auto it = push_consumer.begin();
-    while (it != push_consumer.end()) {
-      Message &msg = *it;
-
-      if (!msg.meta.control.empty() && msg.meta.control.cmd == Control::TERMINATE) {
-        if (push_consumer.size() == 1) {
-          should_stop = true;
-          break;
-        }
-        continue; // should first finish the requests that are still in the buffer
-      }
-
-      CHECK(msg.meta.push);
-      uint64_t key = GetKeyFromMsg(msg);
-      recv_handle_(msg);
-      if (enable_profile_) {
-        Profile pdata = {key, msg.meta.sender, true, GetTimestampNow(), false};
-        pdata_queue_.Push(pdata);
-      }
-
-      it = push_consumer.erase(it);
-
-      // we probably don't need this, but just in case
-      if (push_finished_cnt.find(key) == push_finished_cnt.end()) push_finished_cnt[key] = 0;
-
-      // we assume the init has already been handled by main thread
-      ++push_finished_cnt[key];
-
-      if ((size_t) push_finished_cnt[key] == num_worker) {
-        std::lock_guard<std::mutex> lock(key_mu_);
-        is_push_finished_[key] = true;
-        push_finished_cnt[key] = 0;
-      }
-
-    }
-  }
-}
-
-void Customer::ProcessProfileData() {
-  LOG(INFO) << "profile thread is inited";
-  bool profile_all = true; // default: profile all keys
-  uint64_t key_to_profile;
-  const char *val;
-  val = Environment::Get()->find("BYTEPS_SERVER_KEY_TO_PROFILE");
-  if (val) {
-    profile_all = false;
-    key_to_profile = atoi(val);
-  }
-
-  std::fstream fout_;
-  val = Environment::Get()->find("BYTEPS_SERVER_PROFILE_OUTPUT_PATH");
-  fout_.open((val ? std::string(val) : "server_profile.json"), std::fstream::out);
-  fout_ << "{\n";
-  fout_ << "\t\"traceEvents\": [\n";
-  bool is_init = true;
-  while (true) {
-    Profile pdata;
-    pdata_queue_.WaitAndPop(&pdata);
-    if (profile_all || key_to_profile==pdata.key) {
-      if (!is_init) {
-        fout_ << ",\n";
-      } else {
-        is_init = false;
-      }
-      fout_ << "\t\t" << "{\"name\": " << "\"" <<(pdata.is_push?"push":"pull") << "-" << pdata.sender << "\"" << ", "
-            << "\"ph\": " << "\"" << (pdata.is_begin?"B":"E") << "\"" << ", "
-            << "\"pid\": " << pdata.key << ", "
-            << "\"tid\": " << pdata.key << ", "
-            << "\"ts\": " << pdata.ts
-            << "}";
-    }
-  }
-  fout_ << "]\n";
-  fout_ << "}";
-  fout_.clear();
-  fout_.flush();
-  fout_.close();
-  LOG(INFO) << "profile thread ended";
-}
-
-void Customer::ProcessResponse(int thread_id) {
-  {
-    std::lock_guard<std::mutex> lock(mu_);
-    LOG(INFO) << "Inits Thread-" << thread_id;
-  }
-  std::list<Message> consumer;
+void Customer::Receiving() {
   while (true) {
-    {
-      std::lock_guard<std::mutex> lock(mu_);
-      consumer.splice(consumer.end(), worker_buffer_[thread_id]);
-      worker_buffer_[thread_id].clear();
-    }
-    auto it = consumer.begin();
-    while (it != consumer.end()) {
-      Message &msg = *it;
-      if (!msg.meta.control.empty() && msg.meta.control.cmd == Control::TERMINATE) { break; }
-      recv_handle_(msg);
-      CHECK(!msg.meta.request); // must be response
+    Message recv;
+    recv_queue_.WaitAndPop(&recv);
+    if (!recv.meta.control.empty()
+        && recv.meta.control.cmd == Control::TERMINATE) {
+      break;
+    }
+    recv_handle_(recv);
+    if (!recv.meta.request) {
       std::lock_guard<std::mutex> lk(tracker_mu_);
-      tracker_[msg.meta.timestamp].second++;
+      tracker_[recv.meta.timestamp].second++;
       tracker_cond_.notify_all();
-      it = consumer.erase(it);
     }
   }
 }
 
-std::string Customer::GetTimestampNow() {
-  std::chrono::microseconds us =
-      std::chrono::duration_cast<std::chrono::microseconds>(std::chrono::system_clock::now().time_since_epoch());
-  std::stringstream temp_stream;
-  std::string ts_string;
-  temp_stream << us.count();
-  temp_stream >> ts_string;
-  return ts_string;
-}
-
-void Customer::Receiving() {
-  const char *val;
-  val = CHECK_NOTNULL(Environment::Get()->find("DMLC_ROLE"));
-  std::string role(val);
-  bool is_server = role == "server";
-  val = Environment::Get()->find("ENABLE_SERVER_MULTIPULL");
-  bool is_server_multi_pull_enabled = val ? atoi(val) : true; // default enabled
-  val = Environment::Get()->find("ENABLE_WORKER_MULTIPULL");
-  bool is_worker_multi_pull_enabled = val ? atoi(val) : false; // default disabled, has bug yet
-  val = Environment::Get()->find("WORKER_THREAD_NUM");
-  int worker_thread_num = val ? atoi(val) : 4;
-  val = Environment::Get()->find("SERVER_PUSH_NTHREADS");
-  int server_push_nthread = val ? atoi(val) : 1;
-  val = Environment::Get()->find("BYTEPS_ENABLE_ASYNC");
-  bool enable_async = val ? atoi(val) : false;
-  if (is_server && enable_async) {
-    is_server_multi_pull_enabled = false;
-  }
-
-  // profiling
-  val = Environment::Get()->find("BYTEPS_SERVER_ENABLE_PROFILE");
-  enable_profile_ = val ? atoi(val) : false;
-  std::thread* profile_thread;
-  if (enable_profile_ && is_server) {
-    LOG(INFO) << "Enable server profiling";
-    profile_thread = new std::thread(&Customer::ProcessProfileData, this);
-  }
-
-  if (is_server && is_server_multi_pull_enabled){ // server multi-thread
-    LOG(INFO) << "Use separate thread to process pull requests from each worker.";
-
-    std::vector<std::thread*> push_thread;
-    for (int i = 0; i < server_push_nthread; ++i) {
-      std::list<Message> buf;
-      buffered_push_.push_back(buf);
-    }
-    CHECK_EQ(buffered_push_.size(), (unsigned int) server_push_nthread);
-    for (int i = 0; i < server_push_nthread; ++i) {
-      std::lock_guard<std::mutex> lock(mu_);
-      auto t = new std::thread(&Customer::ProcessPushRequest, this, i);
-      push_thread.push_back(t);
-    }
-    LOG(INFO) << "Server uses " << server_push_nthread << " threads to process push requests.";
-
-    std::vector<std::thread*> pull_thread;
-    for (size_t i = 0; i < num_worker; ++i) {
-      std::list<Message> buf;
-      buffered_pull_.push_back(buf);
-    }
-    CHECK_EQ(buffered_pull_.size(), (unsigned int) num_worker);
-    for (size_t i = 0; i < num_worker; ++i) {
-      std::lock_guard<std::mutex> lock(mu_);
-      auto t = new std::thread(&Customer::ProcessPullRequest, this, i);
-      pull_thread.push_back(t);
-    }
-
-    while (1) { // wait until all threads have been inited
-      int total_thread_num = num_worker + server_push_nthread;
-      if (thread_barrier_.fetch_add(0) == total_thread_num) break;
-      std::this_thread::sleep_for(std::chrono::nanoseconds(1000));
-    }
-    LOG(INFO) << "All threads inited, ready to process message ";
-
-    std::unordered_map<uint64_t, std::set<int> > init_push_;
-
-    while (true) {
-      Message recv;
-      recv_queue_.WaitAndPop(&recv);
-      if (!recv.meta.control.empty() && recv.meta.control.cmd == Control::TERMINATE) {
-        Message terminate_msg;
-        terminate_msg.meta.control.cmd = Control::TERMINATE;
-        std::lock_guard<std::mutex> lock(mu_);
-        for (auto buf : buffered_push_) {
-          buf.push_back(terminate_msg);
-        }
-        for (auto buf : buffered_pull_) {
-          buf.push_back(terminate_msg);
-        }
-        break;
-      }
-      if (!IsValidPushpull(recv)) {
-        recv_handle_(recv);
-        continue;
-      }
-      uint64_t key = GetKeyFromMsg(recv);
-
-      if (init_push_[key].size() < num_worker) {
-        CHECK(recv.meta.push) << key;
-        // collect all push from each worker
-        int sender = recv.meta.sender;
-        CHECK_EQ(init_push_[key].find(sender), init_push_[key].end())
-            << key << " " << sender;
-
-        init_push_[key].insert(sender);
-        recv_handle_(recv);
-
-        // Reset the push flag, to guarantee that subsequent pulls are blocked.
-        // We might be able to remove this, but just in case the compiler does not work as we expect.
-        if (init_push_[key].size() == num_worker) {
-          std::lock_guard<std::mutex> lock(key_mu_);
-          is_push_finished_[key] = false;
-        }
-
-        continue;
-      }
-      CHECK_EQ(init_push_[key].size(), num_worker);
-
-      if (recv.meta.push) { // push: same key goes to same thread
-        std::lock_guard<std::mutex> lock(mu_);
-        if (enable_profile_) {
-          Profile pdata = {key, recv.meta.sender, true, GetTimestampNow(), true};
-          pdata_queue_.Push(pdata);
-        }
-        buffered_push_[(key/num_server) % server_push_nthread].push_back(recv);
-      } else { // pull
-        std::lock_guard<std::mutex> lock(mu_);
-        if (enable_profile_) {
-          Profile pdata = {key, recv.meta.sender, false, GetTimestampNow(), true};
-          pdata_queue_.Push(pdata);
-        }
-        int worker_id = (recv.meta.sender - 9) / 2; // worker id: 9, 11, 13 ...
-        buffered_pull_[worker_id].push_back(recv);
-      }
-
-    } // while
-
-    // wait until the threads finish
-    for (auto t : push_thread) t->join();
-    for (auto t : pull_thread) t->join();
-    if (profile_thread) profile_thread->join();
-
-  } // server multi-thread
-
-  else if (!is_server && is_worker_multi_pull_enabled) { // worker multithread
-    CHECK_GE(worker_thread_num, 1);
-    LOG(INFO) << "Use multiple threads to process pull responses.";
-    std::vector<std::thread*> worker_thread;
-    for (int i = 0; i < worker_thread_num; ++i) {
-      std::list<Message> buf;
-      worker_buffer_.push_back(buf);
-      auto t = new std::thread(&Customer::ProcessResponse, this, i);
-      worker_thread.push_back(t);
-    }
-    CHECK_EQ((unsigned int) worker_thread_num, worker_buffer_.size());
-    while (true) {
-      Message recv;
-      recv_queue_.WaitAndPop(&recv);
-      if (!recv.meta.control.empty() && recv.meta.control.cmd == Control::TERMINATE) {
-        Message terminate_msg;
-        terminate_msg.meta.control.cmd = Control::TERMINATE;
-        std::lock_guard<std::mutex> lock(mu_);
-        for (auto buf : worker_buffer_) {
-          buf.push_back(terminate_msg);
-        }
-        break;
-      }
-      if (!IsValidPushpull(recv)) {
-        recv_handle_(recv);
-        if (!recv.meta.request) {
-          std::lock_guard<std::mutex> lk(tracker_mu_);
-          tracker_[recv.meta.timestamp].second++;
-          tracker_cond_.notify_all();
-        }
-        continue;
-      }
-      int thread_id = GetKeyFromMsg(recv) % worker_thread_num; // a simple load balanced strategy
-      std::lock_guard<std::mutex> lock(mu_);
-      worker_buffer_[thread_id].push_back(recv);
-    }
-    for (auto t : worker_thread) {
-      t->join();
-    }
-  } // worker multithread
-
-  else { // original
-    LOG(INFO) << "Do not use thread pool for receiving.";
-
-    while (true) {
-      Message recv;
-      recv_queue_.WaitAndPop(&recv);
-      if (!recv.meta.control.empty() && recv.meta.control.cmd == Control::TERMINATE) {
-        break;
-      }
-      recv_handle_(recv);
-      if (!recv.meta.request) {
-        std::lock_guard<std::mutex> lk(tracker_mu_);
-        tracker_[recv.meta.timestamp].second++;
-        tracker_cond_.notify_all();
-      }
-    }
-
-  } // original
-}
-
 } // namespace ps
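Of the helpers deleted above, GetKeyFromMsg deserves one note: its loop is a plain little-endian byte decode of the first data blob, key = data[0]*256^0 + data[1]*256^1 + .... A self-contained equivalent, assuming (as the removed code does) that the blob holds at most eight key bytes, least-significant byte first:

    #include <cassert>
    #include <cstdint>
    #include <cstring>
    #include <vector>

    // Equivalent of the removed GetKeyFromMsg loop: interpret the data
    // bytes as a little-endian integer, least-significant byte first.
    uint64_t DecodeKey(const std::vector<uint8_t>& bytes) {
      uint64_t key = 0;
      uint64_t coef = 1;
      for (size_t i = 0; i < bytes.size(); ++i) {
        key += coef * bytes[i];
        coef *= 256;  // 256 = 2^8, one byte per step
      }
      return key;
    }

    int main() {
      // 0x0302 encoded little-endian: low byte first.
      std::vector<uint8_t> buf = {0x02, 0x03};
      assert(DecodeKey(buf) == 0x0302);
      // On a little-endian machine, a memcpy of up to 8 bytes into a
      // zeroed uint64_t yields the same value as the loop.
      uint64_t via_memcpy = 0;
      std::memcpy(&via_memcpy, buf.data(), buf.size());
      assert(via_memcpy == DecodeKey(buf));
      return 0;
    }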
diff --git a/src/van.cc b/src/van.cc
index 6a217c34e..64f004ed1 100644
--- a/src/van.cc
+++ b/src/van.cc
@@ -165,7 +165,7 @@ void Van::UpdateLocalID(Message* msg, std::unordered_set<int>* deadnodes_set,
   if (msg->meta.sender == Meta::kEmpty) {
     CHECK(is_scheduler_);
     CHECK_EQ(ctrl.node.size(), 1);
-    if (static_cast<int>(nodes->control.node.size()) < num_nodes) {
+    if (static_cast<int>(nodes->control.node.size()) < (int) num_nodes) {
      nodes->control.node.push_back(ctrl.node[0]);
     } else {
       // some node dies and restarts
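The one-line van.cc change only adds a cast so that both operands of the comparison are int: without it, an int compared against an unsigned num_nodes is promoted to unsigned, the classic -Wsign-compare trap. A minimal reproduction, with illustrative variable names:

    #include <cstddef>

    int main() {
      std::size_t num_nodes = 4;  // unsigned, like a container size
      int have = -1;
      // Mixed comparison: 'have' converts to size_t, so (size_t)-1 < 4 is false.
      bool mixed = have < num_nodes;        // -Wsign-compare warns here
      // The patch's fix: cast the unsigned side, keeping the comparison signed.
      bool fixed = have < (int) num_nodes;  // -1 < 4 is true
      return (!mixed && fixed) ? 0 : 1;
    }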