LeetcodeCourageK
diff --git a/‎modelzoo/features/pmem/README.md‎
Lines changed: 3 additions & 3 deletions b/‎modelzoo/features/pmem/README.md‎
Lines changed: 3 additions & 3 deletions
diff --git a/‎modelzoo/features/pmem/benchmark.py‎
Lines changed: 10 additions & 2 deletions b/‎modelzoo/features/pmem/benchmark.py‎
Lines changed: 10 additions & 2 deletions
diff --git a/‎scripts/install_pmem_dependencies.sh‎
Lines changed: 4 additions & 0 deletions b/‎scripts/install_pmem_dependencies.sh‎
Lines changed: 4 additions & 0 deletions
diff --git a/‎tensorflow/core/BUILD‎
Lines changed: 9 additions & 2 deletions b/‎tensorflow/core/BUILD‎
Lines changed: 9 additions & 2 deletions
diff --git a/‎tensorflow/core/framework/allocator.cc‎
Lines changed: 11 additions & 0 deletions b/‎tensorflow/core/framework/allocator.cc‎
Lines changed: 11 additions & 0 deletions
diff --git a/‎tensorflow/core/framework/allocator.h‎
Lines changed: 4 additions & 1 deletion b/‎tensorflow/core/framework/allocator.h‎
Lines changed: 4 additions & 1 deletion
diff --git a/‎tensorflow/core/framework/allocator_registry.cc‎
Lines changed: 24 additions & 0 deletions b/‎tensorflow/core/framework/allocator_registry.cc‎
Lines changed: 24 additions & 0 deletions
diff --git a/‎tensorflow/core/framework/allocator_registry.h‎
Lines changed: 2 additions & 0 deletions b/‎tensorflow/core/framework/allocator_registry.h‎
Lines changed: 2 additions & 0 deletions
diff --git a/‎tensorflow/core/framework/embedding/config.proto‎
Lines changed: 3 additions & 2 deletions b/‎tensorflow/core/framework/embedding/config.proto‎
Lines changed: 3 additions & 2 deletions
diff --git a/‎tensorflow/core/framework/embedding/embedding_config.h‎
Lines changed: 9 additions & 2 deletions b/‎tensorflow/core/framework/embedding/embedding_config.h‎
Lines changed: 9 additions & 2 deletions
@@ -26,15 +26,15 @@ pandas                        1.1.5
   --num_mock_cols=30
   --batch_size=12800 \
   --dim_size=256 \
-  --ev_storage=pmem \
+  --ev_storage=pmem_libpmem \
 
 ## use criteo data
 ./launch.sh \
   --use_mock_data=False \
   --data_dir=${path_to_criteo} \
   --batch_size=12800 \
   --dim_size=256 \
-  --ev_storage=pmem \
+  --ev_storage=pmem_libpmem \
 ```
 
 - Here `num_mock_cols` is the number of columns in mock training data, `mock_vocabulary_size` is 
@@ -44,5 +44,5 @@ would increase the `vocabulary_size` of each column (variable) by a factor of 2.
 - The log files are located at `./bench-ps.log` and `./bench-worker.log` for ps and worker process, respectively.
 - The default embedding variable type is hash table-based Embedding Variable, which does not require a specification on `mock_vocabulary_size` and `vocabulary_amplify_factor`
 - by specifying `--use_ev_var=False`, the benchmark would fallback to use TF's native variable for Embeddings, and users shall provide `mock_vocabulary_size` in mock data scenarios.
-- '--ev_storage=pmem/dram' to select EmbeddingVariable StorageType, Default is 'dram'.
+- Use '--ev_storage=pmem_libpmem/pmem_memkind/dram' to select the EmbeddingVariable StorageType; the default is 'dram'. When using pmem_libpmem, also set the PMEM path and size with '--ev_storage_path=<pmem_path>' (default: /mnt/pmem0/pmem_allocator/) and '--ev_storage_size_gb=<pmem_size>' (default: 512).
 
@@ -29,6 +29,9 @@
 tf.app.flags.DEFINE_boolean("use_xdl_var", False, "")
 tf.app.flags.DEFINE_boolean("trace_timeline", False, "")
 tf.app.flags.DEFINE_string("ev_storage", 'dram', "")
+# PMEM location and capacity (in GB); only read when --ev_storage=pmem_libpmem.
+tf.app.flags.DEFINE_string("ev_storage_path", '/mnt/pmem0/pmem_allocator/', "")
+tf.app.flags.DEFINE_integer("ev_storage_size_gb", 512, "")
 
 def main(_):
   cluster_dict = {}
@@ -96,8 +99,13 @@ def main(_):
           if FLAGS.use_ev_var:
             if FLAGS.ev_storage == "dram":
               ev_option = variables.EmbeddingVariableOption(storage_option=variables.StorageOption(storage_type=config_pb2.StorageType.DRAM))
-            elif FLAGS.ev_storage == "pmem":
-              ev_option = variables.EmbeddingVariableOption(storage_option=variables.StorageOption(storage_type=config_pb2.StorageType.PMEM))
+            elif FLAGS.ev_storage == "pmem_memkind":
+              ev_option = variables.EmbeddingVariableOption(storage_option=variables.StorageOption(storage_type=config_pb2.StorageType.PMEM_MEMKIND))
+            elif FLAGS.ev_storage == "pmem_libpmem":
+              ev_option = variables.EmbeddingVariableOption(storage_option=variables.StorageOption(
+                                                              storage_type=config_pb2.StorageType.PMEM_LIBPMEM, 
+                                                              storage_path=FLAGS.ev_storage_path, 
+                                                              storage_size=FLAGS.ev_storage_size_gb * 1024 * 1024 * 1024))
             fm_w = tf.get_embedding_variable(
                name='fm_w{}'.format(sidx),
                embedding_dim=1,
 
@@ -0,0 +1,4 @@
+#!/bin/bash
+# Install the libpmem and memkind development packages; abort on the first failing step.
+set -euo pipefail
+apt-get update && apt-get install -y libpmem-dev libmemkind-dev
@@ -1014,7 +1014,11 @@ cc_library(
         "framework/type_traits.h",
     ] + select({
         "//tensorflow:with_pmem_support": [
-            "framework/pmem_allocator.cc"
+            "framework/pmem_allocator.cc",
+            "framework/experimental_pmem_allocator.cc",
+            "framework/experimental_pmem_allocator_utils.cc",
+            "framework/experimental_pmem_allocator.h",
+            "framework/experimental_pmem_allocator_utils.h",
         ],
         "//conditions:default": [],
     }),
@@ -1027,7 +1031,8 @@ cc_library(
     linkopts = select({
         "//tensorflow:with_pmem_support": [
             "-L/usr/local/lib",
-            "-lmemkind"
+            "-lmemkind",
+            "-lpmem",
         ],
         "//conditions:default": [],
     }),
@@ -2958,6 +2963,8 @@ tf_cuda_library(
             "framework/allocator.cc",
             "framework/cpu_allocator_impl.cc",
             "framework/pmem_allocator.cc",
+            "framework/experimental_pmem_allocator.*",
+            "framework/experimental_pmem_allocator_utils.*",
             "framework/allocator_registry.cc",
             "framework/tracking_allocator.cc",
             "example/example_parser_configuration.*",
 
@@ -93,6 +93,17 @@ Allocator* pmem_allocator() {
   return pmem_alloc;
 }
 
+// Process-wide experimental (libpmem) allocator. The static below is initialized
+// once, so only the first call's pmem_path/allocator_size reach the registry.
+Allocator* experimental_pmem_allocator(const std::string& pmem_path, size_t allocator_size) {
+  static Allocator* experimental_pmem_alloc =
+      AllocatorFactoryRegistry::singleton()->GetExperimentalPMEMAllocator(pmem_path, allocator_size);
+  const bool wrap_for_stats = experimental_pmem_alloc && cpu_allocator_collect_full_stats &&
+                              !experimental_pmem_alloc->TracksAllocationSizes();
+  if (wrap_for_stats) experimental_pmem_alloc = new TrackingAllocator(experimental_pmem_alloc, true);
+  return experimental_pmem_alloc;
+}
+
 Allocator* ev_allocator() {
   static Allocator* ev_alloc =
       AllocatorFactoryRegistry::singleton()->GetEVAllocator();
 
@@ -337,11 +337,14 @@ Allocator* cpu_allocator_base();
 // call it directly.
 Allocator* cpu_allocator(int numa_node = port::kNUMANoAffinity);
 
-//If use PMEM as allocator, please call this function
+// Call this function to use memkind's PMEM mode as the allocator.
 Allocator* pmem_allocator();
 
 Allocator* ev_allocator();
 
+// Call this function to use the experimental libpmem-based PMEM allocator rooted at pmem_path.
+Allocator* experimental_pmem_allocator(const std::string& pmem_path, size_t allocator_size);
+
 // If 'enable' is true, the default CPU allocator implementation will collect
 // AllocatorStats. By default, it's disabled.
 void EnableCPUAllocatorStats(bool enable);
 
@@ -17,6 +17,7 @@ limitations under the License.
 
 #include "tensorflow/core/framework/allocator_registry.h"
 #include "tensorflow/core/platform/logging.h"
+#include "experimental_pmem_allocator.h"
 
 namespace tensorflow {
 
@@ -87,6 +88,29 @@ Allocator* AllocatorFactoryRegistry::GetAllocator() {
   }
 }
 
+// Returns the cached allocator of the factory named "ExperimentalPMEMAllocator", creating it
+// from pmem_path/pmem_size on first use only. Logs FATAL if no such factory is registered.
+Allocator* AllocatorFactoryRegistry::GetExperimentalPMEMAllocator(const std::string& pmem_path, size_t pmem_size) {
+  mutex_lock l(mu_);
+  first_alloc_made_ = true;
+  FactoryEntry* pmem_entry = nullptr;
+  for (auto& candidate : factories_) {
+    if (candidate.name != "ExperimentalPMEMAllocator") continue;
+    pmem_entry = &candidate;
+    break;
+  }
+  if (pmem_entry == nullptr) {
+    LOG(FATAL) << "No registered Experimental PMEM AllocatorFactory";
+    return nullptr;
+  }
+  if (!pmem_entry->allocator) {
+    auto* pmem_factory = static_cast<ExperimentalPMEMAllocatorFactory*>(pmem_entry->factory.get());
+    pmem_factory->Init(pmem_path, pmem_size);
+    pmem_entry->allocator.reset(pmem_entry->factory->CreateAllocator());
+  }
+  return pmem_entry->allocator.get();
+}
+
 Allocator* AllocatorFactoryRegistry::GetPMEMAllocator() {
   mutex_lock l(mu_);
   first_alloc_made_ = true;
 
@@ -80,6 +80,8 @@ class AllocatorFactoryRegistry {
   //If use PMEMallocator, then factory pick this one
   Allocator* GetPMEMAllocator();
 
+  Allocator* GetExperimentalPMEMAllocator(const std::string& pmem_path, size_t pmem_size);
+
   Allocator* GetEVAllocator();
 
   // Returns 'best fit' SubAllocator.  First look for the highest priority
 
@@ -8,8 +8,9 @@ enum StorageType {
 
   // one level
   DRAM = 1;
-  PMEM = 2;
-  SSD = 3;
+  PMEM_MEMKIND = 2;
+  PMEM_LIBPMEM = 3;
+  SSD = 4;
 
   LEVELDB = 14;
 /*
 
@@ -21,6 +21,7 @@ struct EmbeddingConfig {
   DataType counter_type;
   embedding::StorageType storage_type;
   std::string storage_path;
+  int64 storage_size;
   int64 default_value_dim;
   int normal_fix_flag;
 
@@ -31,7 +32,7 @@ struct EmbeddingConfig {
                   float l2_weight_threshold = -1.0, const std::string& layout = "normal",
                   int64 max_element_size = 0, float false_positive_probability = -1.0,
                   DataType counter_type = DT_UINT64, embedding::StorageType storage_type = embedding::DRAM,
-                  const std::string& storage_path = "",
+                  const std::string& storage_path = "", int64 storage_size = 0,
                   int64 default_value_dim = 4096):
       emb_index(emb_index),
       primary_emb_index(primary_emb_index),
@@ -45,6 +46,7 @@ struct EmbeddingConfig {
       counter_type(counter_type),
       storage_type(storage_type),
       storage_path(storage_path),
+      storage_size(storage_size),
       default_value_dim(default_value_dim),
       normal_fix_flag(0) {
     if ("normal" == layout) {
@@ -106,6 +108,10 @@ struct EmbeddingConfig {
     return storage_path;
   }
 
+  // Returns the storage_size value supplied at construction. Declared const so
+  // it can be called on const configs, matching DebugString().
+  int64 get_storage_size() const { return storage_size; }
+
   std::string DebugString() const {
     return strings::StrCat("opname: ", name,
                            " emb_index: ", emb_index,
@@ -118,7 +124,8 @@ struct EmbeddingConfig {
                            " max_freq: ", max_freq,
                            " l2_weight_threshold: ", l2_weight_threshold,
                            " storage_type: ", storage_type,
-                           " storage_path: ", storage_path);
+                           " storage_path: ", storage_path,
+                           " storage_size: ", storage_size);
   }
 };