Commit 17b3668

Fix building issue #2

Fan Yu committed Jan 5, 2021
1 parent 8c982d8 commit 17b3668

Showing 4 changed files with 1,402 additions and 260 deletions.
226 changes: 73 additions & 153 deletions HugeCTR/include/parser.hpp
@@ -21,53 +21,13 @@
#include <fstream>
#include <functional>
#include <gpu_resource.hpp>
#include <inference/embedding_feature_combiner.hpp>
#include <learning_rate_scheduler.hpp>
#include <metrics.hpp>
#include <network.hpp>
#include <nlohmann/json.hpp>

namespace HugeCTR {

nlohmann::json read_json_file(const std::string& filename);

struct SolverParser {
// std::string configure_file;
unsigned long long seed; /**< seed of data simulator */
LrPolicy_t lr_policy; /**< the only fixed lr is supported now. */
int display; /**< the interval of loss display. */
int max_iter; /**< the number of iterations for training */
int num_epochs; /**< the number of epochs for training */
int snapshot; /**< the number of iterations for a snapshot */
std::string snapshot_prefix; /**< naming prefix of snapshot file */
int eval_interval; /**< the interval of evaluations */
int eval_batches; /**< the number of batches for evaluations */
int batchsize_eval; /**< batchsize for eval */
int batchsize; /**< batchsize */
std::string model_file; /**< name of model file */
std::vector<std::string> embedding_files; /**< name of embedding file */
std::vector<std::vector<int>> vvgpu; /**< device map */
bool use_mixed_precision;
float scaler;
std::map<metrics::Type, float> metrics_spec;
bool i64_input_key;
bool use_algorithm_search;
bool use_cuda_graph;
SolverParser(const std::string& file);
SolverParser() {}
};
struct InferenceParser {
// std::string configure_file;
size_t max_batchsize; /**< batchsize */
std::string dense_model_file; /**< name of model file */
std::vector<std::string> sparse_model_files; /**< name of embedding file */
bool use_mixed_precision;
float scaler;
bool use_algorithm_search;
bool use_cuda_graph;
InferenceParser(const nlohmann::json& config);
};

/**
* @brief The parser of the configuration file (in JSON format).
*
@@ -91,37 +51,42 @@ class Parser {
const bool use_algorithm_search_;
const bool use_cuda_graph_;

template <typename TypeKey>
void create_pipeline_internal(std::shared_ptr<IDataReader>& data_reader,
std::shared_ptr<IDataReader>& data_reader_eval,
std::vector<std::shared_ptr<IEmbedding>>& embedding,
std::vector<std::unique_ptr<Network>>& network,
const std::shared_ptr<ResourceManager>& resource_manager);

template <typename TypeEmbeddingComp>
void create_pipeline_inference(const InferenceParser& inference_parser,
Tensor2<float>& dense_input,
std::vector<std::shared_ptr<Tensor2<int>>>& rows,
std::vector<std::shared_ptr<Tensor2<float>>>& embeddingvecs,
std::vector<size_t>& embedding_table_slot_size,
std::vector<std::shared_ptr<Layer>>* embedding, Network** network,
const std::shared_ptr<ResourceManager> resource_manager);

public:
std::vector<TensorEntry> tensor_entries;
/**
* Ctor.
* The ctor only verifies the configuration file; it does not create the pipeline.
*/
Parser(const std::string& configure_file, size_t batch_size, size_t batch_size_eval,
bool repeat_dataset, bool i64_input_key = false, bool use_mixed_precision = false,
float scaler = 1.0f, bool use_algorithm_search = true, bool use_cuda_graph = true);

/**
* Ctor.
* Ctor used in the inference stage.
*/
Parser(const nlohmann::json& config);
Parser(const std::string& configure_file,
size_t batch_size,
size_t batch_size_eval,
bool repeat_dataset,
bool i64_input_key = false,
bool use_mixed_precision = false,
float scaler = 1.0f,
bool use_algorithm_search = true,
bool use_cuda_graph = true)
: batch_size_(batch_size),
batch_size_eval_(batch_size_eval),
repeat_dataset_(repeat_dataset),
i64_input_key_(i64_input_key),
use_mixed_precision_(use_mixed_precision),
scaler_(scaler),
use_algorithm_search_(use_algorithm_search),
use_cuda_graph_(use_cuda_graph) {
try {
std::ifstream file(configure_file);
if (!file.is_open()) {
CK_THROW_(Error_t::FileCannotOpen, "file.is_open() failed: " + configure_file);
}
file >> config_;
file.close();
} catch (const std::runtime_error& rt_err) {
std::cerr << rt_err.what() << std::endl;
throw;
}
}

/**
* Create the pipeline, which includes data reader, embedding.
@@ -132,15 +97,14 @@
std::vector<std::unique_ptr<Network>>& network,
const std::shared_ptr<ResourceManager>& resource_manager);

/**
* Create inference pipeline, which only creates network and embedding
*/
void create_pipeline(const InferenceParser& inference_parser, Tensor2<float>& dense_input,
std::vector<std::shared_ptr<Tensor2<int>>>& row,
std::vector<std::shared_ptr<Tensor2<float>>>& embeddingvec,
std::vector<size_t>& embedding_table_slot_size,
std::vector<std::shared_ptr<Layer>>* embedding, Network** network,
const std::shared_ptr<ResourceManager> resource_manager);
template <typename TypeKey>
friend void create_pipeline_internal(std::shared_ptr<IDataReader>& data_reader,
std::shared_ptr<IDataReader>& data_reader_eval,
std::vector<std::shared_ptr<IEmbedding>>& embedding,
std::vector<std::unique_ptr<Network>>& network,
const std::shared_ptr<ResourceManager>& resource_manager,
Parser& parser);

};

std::unique_ptr<LearningRateScheduler> get_learning_rate_scheduler(
@@ -150,6 +114,32 @@ std::unique_ptr<LearningRateScheduler> get_learning_rate_scheduler(
* Solver Parser.
* This class is designed to parse the solver clause of the configuration file.
*/
struct SolverParser {
// std::string configure_file;
unsigned long long seed; /**< seed of data simulator */
LrPolicy_t lr_policy; /**< the only fixed lr is supported now. */
int display; /**< the interval of loss display. */
int max_iter; /**< the number of iterations for training */
int num_epochs; /**< the number of epochs for training */
int snapshot; /**< the number of iterations for a snapshot */
std::string snapshot_prefix; /**< naming prefix of snapshot file */
int eval_interval; /**< the interval of evaluations */
int eval_batches; /**< the number of batches for evaluations */
int batchsize_eval; /**< batchsize for eval */
int batchsize; /**< batchsize */
std::string model_file; /**< name of model file */
std::vector<std::string> embedding_files; /**< name of embedding file */
std::vector<std::vector<int>> vvgpu; /**< device map */
bool use_mixed_precision;
float scaler;
std::map<metrics::Type, float> metrics_spec;
bool i64_input_key;
bool use_algorithm_search;
bool use_cuda_graph;
SolverParser(const std::string& file);
SolverParser() {}
};
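// Illustration, not part of this header: a solver clause of the kind this
// struct is parsed from. The key names mirror the members above, but the
// exact spelling of each key and the concrete values are assumptions.
//
//   "solver": {
//     "lr_policy": "fixed",
//     "display": 1000,
//     "max_iter": 300000,
//     "snapshot": 100000,
//     "snapshot_prefix": "./",
//     "eval_interval": 1000,
//     "eval_batches": 60,
//     "batchsize": 16384,
//     "batchsize_eval": 16384,
//     "gpu": [[0]]
//   }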


template <typename T>
struct SparseInput {
@@ -196,57 +186,16 @@
} \
} while (0)

const std::map<std::string, Layer_t> LAYER_TYPE_MAP = {
{"BatchNorm", Layer_t::BatchNorm},
{"BinaryCrossEntropyLoss", Layer_t::BinaryCrossEntropyLoss},
{"Concat", Layer_t::Concat},
{"CrossEntropyLoss", Layer_t::CrossEntropyLoss},
{"Dropout", Layer_t::Dropout},
{"ELU", Layer_t::ELU},
{"InnerProduct", Layer_t::InnerProduct},
{"Interaction", Layer_t::Interaction},
{"MultiCrossEntropyLoss", Layer_t::MultiCrossEntropyLoss},
{"ReLU", Layer_t::ReLU},
{"Reshape", Layer_t::Reshape},
{"Sigmoid", Layer_t::Sigmoid},
{"Slice", Layer_t::Slice},
{"Multiply", Layer_t::Multiply},
{"FmOrder2", Layer_t::FmOrder2},
{"Add", Layer_t::Add},
{"ReduceSum", Layer_t::ReduceSum},
{"MultiCross", Layer_t::MultiCross},
{"DotProduct", Layer_t::DotProduct}};
const std::map<std::string, Layer_t> LAYER_TYPE_MAP_MP = {
{"BinaryCrossEntropyLoss", Layer_t::BinaryCrossEntropyLoss},
{"Concat", Layer_t::Concat},
{"Cast", Layer_t::Cast},
{"InnerProduct", Layer_t::InnerProduct},
{"FusedInnerProduct", Layer_t::FusedInnerProduct},
{"Interaction", Layer_t::Interaction},
{"Reshape", Layer_t::Reshape},
{"Sigmoid", Layer_t::Sigmoid},
{"Slice", Layer_t::Slice},
{"ReLU", Layer_t::ReLU},
{"Dropout", Layer_t::Dropout},
{"Add", Layer_t::Add}};
const std::map<std::string, Embedding_t> EMBEDDING_TYPE_MAP = {
{"DistributedSlotSparseEmbeddingHash", Embedding_t::DistributedSlotSparseEmbeddingHash},
{"LocalizedSlotSparseEmbeddingHash", Embedding_t::LocalizedSlotSparseEmbeddingHash},
{"LocalizedSlotSparseEmbeddingOneHot", Embedding_t::LocalizedSlotSparseEmbeddingOneHot}};
const std::map<std::string, Initializer_t> INITIALIZER_TYPE_MAP = {
{"Uniform", Initializer_t::Uniform},
{"XavierNorm", Initializer_t::XavierNorm},
{"XavierUniform", Initializer_t::XavierUniform},
{"Zero", Initializer_t::Zero}};

static const std::map<std::string, Optimizer_t> OPTIMIZER_TYPE_MAP = {
{"Adam", Optimizer_t::Adam},
{"MomentumSGD", Optimizer_t::MomentumSGD},
{"Nesterov", Optimizer_t::Nesterov},
{"SGD", Optimizer_t::SGD}};

static const std::map<std::string, Update_t> UPDATE_TYPE_MAP = {
{"Local", Update_t::Local}, {"Global", Update_t::Global}, {"LazyGlobal", Update_t::LazyGlobal}};
{"Local", Update_t::Local},
{"Global", Update_t::Global},
{"LazyGlobal", Update_t::LazyGlobal}};

static const std::map<std::string, Regularizer_t> REGULARIZER_TYPE_MAP = {
{"L1", Regularizer_t::L1},
@@ -286,40 +235,11 @@ inline T get_value_from_json_soft(const nlohmann::json& json, const std::string
}
}
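// Illustration, not part of this header: judging by its name and truncated
// signature, the "_soft" getter falls back to a caller-supplied default when
// the key is absent, e.g.
//   float scaler = get_value_from_json_soft<float>(j_solver, "scaler", 1.f);
// (the default-argument form is an assumption based on the name).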

template <typename Type>
struct get_optimizer_param {
OptParams<Type> operator()(const nlohmann::json& j_optimizer);
};

template <typename TypeKey, typename TypeFP>
struct create_embedding {
void operator()(std::map<std::string, SparseInput<TypeKey>>& sparse_input_map,
std::vector<TensorEntry>* tensor_entries_list,
std::vector<std::shared_ptr<IEmbedding>>& embedding, Embedding_t embedding_type,
const nlohmann::json& config,
const std::shared_ptr<ResourceManager>& resource_manager, size_t batch_size,
size_t batch_size_eval, bool use_mixed_precision, float scaler,
const nlohmann::json& j_layers);

void operator()(const InferenceParser& inference_parser, const nlohmann::json& j_layers_array,
std::vector<std::shared_ptr<Tensor2<int>>>& rows,
std::vector<std::shared_ptr<Tensor2<float>>>& embeddingvecs,
std::vector<size_t>& embedding_table_slot_size,
std::vector<TensorEntry>* tensor_entries,
std::vector<std::shared_ptr<Layer>>* embeddings,
const std::shared_ptr<GPUResource> gpu_resource,
std::shared_ptr<GeneralBuffer2<CudaAllocator>>& blobs_buff);
};

template <typename TypeKey>
struct create_datareader {
void operator()(const nlohmann::json& j,
std::map<std::string, SparseInput<TypeKey>>& sparse_input_map,
std::vector<TensorEntry>* tensor_entries_list,
std::shared_ptr<IDataReader>& data_reader,
std::shared_ptr<IDataReader>& data_reader_eval, size_t batch_size,
size_t batch_size_eval, bool use_mixed_precision, bool repeat_dataset,
const std::shared_ptr<ResourceManager> resource_manager);
};
void parse_data_layer_helper(const nlohmann::json& j, int& label_dim, int& dense_dim,
Check_t& check_type, std::string& source_data,
std::vector<DataReaderSparseParam>& data_reader_sparse_param_array,
std::string& eval_source, std::string& top_strs_label,
std::string& top_strs_dense, std::vector<std::string>& sparse_names,
std::map<std::string, SparseInput<long long>>& sparse_input_map);

} // namespace HugeCTR
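A minimal training-side usage sketch of the class above (not part of this commit). It assumes that create_pipeline mirrors the create_pipeline_internal parameter list shown earlier; the ResourceManager::create factory call, the config path, and the batch sizes are illustrative assumptions:

#include <parser.hpp>

void build_training_pipeline() {
  using namespace HugeCTR;

  // Device map: one node with GPU 0, same shape as SolverParser::vvgpu.
  const std::vector<std::vector<int>> vvgpu{{0}};
  const auto resource_manager = ResourceManager::create(vvgpu, 0ull /* seed */);

  // The ctor only verifies the configuration file; nothing is built yet.
  Parser parser("dlrm_config.json", /* batch_size = */ 16384,
                /* batch_size_eval = */ 16384, /* repeat_dataset = */ true);

  // create_pipeline instantiates the data readers, embeddings, and networks.
  std::shared_ptr<IDataReader> data_reader, data_reader_eval;
  std::vector<std::shared_ptr<IEmbedding>> embeddings;
  std::vector<std::unique_ptr<Network>> networks;
  parser.create_pipeline(data_reader, data_reader_eval, embeddings, networks,
                         resource_manager);
}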
2 changes: 2 additions & 0 deletions HugeCTR/src/inference/embedding_cache.cu
@@ -17,6 +17,8 @@
#include <inference/embedding_cache.hpp>

namespace HugeCTR {
// Temporary interface; should be deleted later
nlohmann::json read_json_file(const std::string& filename);
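// Illustration, not part of this commit: a plausible definition behind this
// forward declaration, mirroring the file-reading logic of the Parser ctor
// (the real definition lives elsewhere and may differ):
//   nlohmann::json read_json_file(const std::string& filename) {
//     nlohmann::json config;
//     std::ifstream file_stream(filename);
//     if (!file_stream.is_open()) {
//       CK_THROW_(Error_t::FileCannotOpen, "Cannot open " + filename);
//     }
//     file_stream >> config;
//     return config;
//   }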

// Kernels to combine the value buffer
__global__ void merge_emb_vec(
2 changes: 2 additions & 0 deletions HugeCTR/src/inference/parameter_server.cpp
@@ -17,6 +17,8 @@
#include <inference/parameter_server.hpp>

namespace HugeCTR {
// Temporary interface; should be deleted later
nlohmann::json read_json_file(const std::string& filename);

template <typename TypeHashKey>
parameter_server<TypeHashKey>::parameter_server(const std::string& framework_name,
