
Commit 43d5ebc
This PR contains improvements to KVReplayGenerator:
- binary request generation and replay
- fast forwarding of a trace
- preloading requests into memory
1 parent ff44c3c commit 43d5ebc

File tree: 13 files changed (+668, -93 lines)

cachelib/cachebench/cache/Cache-inl.h

Lines changed: 20 additions & 21 deletions
@@ -116,7 +116,8 @@ Cache<Allocator>::Cache(const CacheConfig& config,
   allocatorConfig_.maxPromotionBatch = config_.maxPromotionBatch;
   allocatorConfig_.minEvictionBatch = config_.minEvictionBatch;
   allocatorConfig_.minPromotionBatch = config_.minPromotionBatch;
-  allocatorConfig_.maxEvictionPromotionHotness = config_.maxEvictionPromotionHotness;
+  allocatorConfig_.maxEvictionPromotionHotness =
+      config_.maxEvictionPromotionHotness;
 
   if (config_.enableItemDestructorCheck) {
     auto removeCB = [&](const typename Allocator::DestructorData& data) {
@@ -647,10 +648,9 @@ double Cache<Allocator>::getNvmBytesWritten() const {
 
 template <typename Allocator>
 Stats Cache<Allocator>::getStats() const {
-
   Stats ret;
   for (TierId tid = 0; tid < cache_->getNumTiers(); tid++) {
-    PoolStats aggregate = cache_->getPoolStats(tid,pools_[0]);
+    PoolStats aggregate = cache_->getPoolStats(tid, pools_[0]);
     auto usageFraction =
         1.0 - (static_cast<double>(aggregate.freeMemoryBytes())) /
                   aggregate.poolUsableSize;
@@ -668,7 +668,8 @@ Stats Cache<Allocator>::getStats() const {
     ret.numItems.push_back(aggregate.numItems());
   }
 
-  std::map<TierId, std::map<PoolId, std::map<ClassId, ACStats>>> allocationClassStats{};
+  std::map<TierId, std::map<PoolId, std::map<ClassId, ACStats>>>
+      allocationClassStats{};
 
   for (size_t pid = 0; pid < pools_.size(); pid++) {
     PoolId poolId = static_cast<PoolId>(pid);
@@ -686,19 +687,14 @@ Stats Cache<Allocator>::getStats() const {
 
   ret.allocationClassStats = allocationClassStats;
 
-  ret.backgndEvicStats.nEvictedItems =
-    cacheStats.evictionStats.numMovedItems;
-  ret.backgndEvicStats.nTraversals =
-    cacheStats.evictionStats.runCount;
-  ret.backgndEvicStats.nClasses =
-    cacheStats.evictionStats.totalClasses;
-  ret.backgndEvicStats.evictionSize =
-    cacheStats.evictionStats.totalBytesMoved;
-
+  ret.backgndEvicStats.nEvictedItems = cacheStats.evictionStats.numMovedItems;
+  ret.backgndEvicStats.nTraversals = cacheStats.evictionStats.runCount;
+  ret.backgndEvicStats.nClasses = cacheStats.evictionStats.totalClasses;
+  ret.backgndEvicStats.evictionSize = cacheStats.evictionStats.totalBytesMoved;
+
   ret.backgndPromoStats.nPromotedItems =
-    cacheStats.promotionStats.numMovedItems;
-  ret.backgndPromoStats.nTraversals =
-    cacheStats.promotionStats.runCount;
+      cacheStats.promotionStats.numMovedItems;
+  ret.backgndPromoStats.nTraversals = cacheStats.promotionStats.runCount;
 
   ret.evictAttempts = cacheStats.evictionAttempts;
   ret.allocAttempts = cacheStats.allocAttempts;
@@ -753,8 +749,10 @@ Stats Cache<Allocator>::getStats() const {
     ret.nvmCounters = cache_->getNvmCacheStatsMap().toMap();
   }
 
-  ret.backgroundEvictionClasses = cache_->getBackgroundMoverClassStats(MoverDir::Evict);
-  ret.backgroundPromotionClasses = cache_->getBackgroundMoverClassStats(MoverDir::Promote);
+  ret.backgroundEvictionClasses =
+      cache_->getBackgroundMoverClassStats(MoverDir::Evict);
+  ret.backgroundPromotionClasses =
+      cache_->getBackgroundMoverClassStats(MoverDir::Promote);
 
   // nvm stats from navy
   if (!isRamOnly() && !navyStats.empty()) {
@@ -877,12 +875,13 @@ void Cache<Allocator>::setStringItem(WriteHandle& handle,
   if (dataSize < 1)
     return;
 
-  auto ptr = reinterpret_cast<char*>(getMemory(handle));
-  std::strncpy(ptr, str.c_str(), dataSize);
+  auto ptr = reinterpret_cast<void*>(getMemory(handle));
+  std::memcpy(ptr, str.c_str(), dataSize);
 
+  auto ptr2 = reinterpret_cast<char*>(getMemory(handle));
   // Make sure the copied string ends with null char
   if (str.size() + 1 > dataSize) {
-    ptr[dataSize - 1] = '\0';
+    ptr2[dataSize - 1] = '\0';
   }
 }
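
Note on the setStringItem change above: std::strncpy stops copying at the first embedded '\0' and zero-pads the rest, while std::memcpy copies raw bytes, so binary payloads survive intact but the terminating null must be written by hand when the value is truncated. A minimal standalone sketch of the resulting copy-and-terminate pattern (the function and parameter names are simplified stand-ins, and the std::min clamp is an extra guard added here, not in the diff, which copies dataSize bytes directly):

#include <algorithm>
#include <cstddef>
#include <cstring>
#include <string>

// Copy a (possibly binary) value into an item payload of dataSize bytes,
// guaranteeing the stored bytes end with '\0' even when truncated.
void copyValue(char* itemMemory, const std::string& str, std::size_t dataSize) {
  if (dataSize < 1) {
    return;
  }
  // memcpy, unlike strncpy, keeps going past embedded '\0' bytes.
  std::memcpy(itemMemory, str.data(), std::min(str.size() + 1, dataSize));
  // Make sure the copied string ends with a null char.
  if (str.size() + 1 > dataSize) {
    itemMemory[dataSize - 1] = '\0';
  }
}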

cachelib/cachebench/cache/Cache.h

Lines changed: 2 additions & 2 deletions
@@ -312,7 +312,7 @@ class Cache {
   // return true if the key was previously detected to be inconsistent. This
   // is useful only when consistency checking is enabled by calling
   // enableConsistencyCheck()
-  bool isInvalidKey(const std::string& key) {
+  bool isInvalidKey(const std::string_view key) {
     return invalidKeys_[key].load(std::memory_order_relaxed);
   }
 
@@ -430,7 +430,7 @@ class Cache {
   // Since this can be accessed from multiple threads, the map is initialized
   // during start up and only the value is updated by flipping the bit
   // atomically.
-  std::unordered_map<std::string, std::atomic<bool>> invalidKeys_;
+  std::unordered_map<std::string_view, std::atomic<bool>> invalidKeys_;
 
   // number of inconsistency detected so far with the operations
   std::atomic<unsigned int> inconsistencyCount_{0};
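
Note on the std::string_view change above: the map entries are now non-owning views, so no key bytes are copied, but every view must point at storage that outlives the map. That holds here because, per the comment, the map is fully populated during start up and only the atomic values flip afterwards, and the replayed requests that own the key bytes stay resident in memory (this PR's preloading change). A self-contained sketch of the pattern, with hypothetical names:

#include <atomic>
#include <cassert>
#include <string>
#include <string_view>
#include <unordered_map>

struct InvalidKeyTracker {
  // Non-owning keys: each view must reference stable backing storage.
  std::unordered_map<std::string_view, std::atomic<bool>> invalid;

  // Populate at startup; operator[] value-initializes the atomic to false.
  void registerKey(std::string_view key) { (void)invalid[key]; }

  // After startup only values flip, so no map-level locking is needed.
  void markInvalid(std::string_view key) {
    invalid.at(key).store(true, std::memory_order_relaxed);
  }

  bool isInvalid(std::string_view key) const {
    auto it = invalid.find(key);
    return it != invalid.end() && it->second.load(std::memory_order_relaxed);
  }
};

int main() {
  static const std::string owned = "user:42";  // outlives the tracker
  InvalidKeyTracker t;
  t.registerKey(owned);
  assert(!t.isInvalid(owned));
  t.markInvalid(owned);
  assert(t.isInvalid(owned));
}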

cachelib/cachebench/runner/AsyncCacheStressor.h

Lines changed: 21 additions & 22 deletions
@@ -222,9 +222,9 @@ class AsyncCacheStressor : public Stressor {
                 ThroughputStats& stats,
                 const Request* req,
                 folly::EventBase* evb,
-                const std::string* key) {
+                const std::string_view& key) {
     ++stats.get;
-    auto lock = chainedItemAcquireSharedLock(*key);
+    auto lock = chainedItemAcquireSharedLock(key);
 
     if (ticker_) {
       ticker_->updateTimeStamp(req->timestamp);
@@ -233,8 +233,7 @@ class AsyncCacheStressor : public Stressor {
     // add a distribution over sequences of requests/access patterns
     // e.g. get-no-set and set-no-get
 
-    auto onReadyFn = [&, req, key = *key,
-                      l = std::move(lock)](auto hdl) mutable {
+    auto onReadyFn = [&, req, key, l = std::move(lock)](auto hdl) mutable {
       auto result = OpResultType::kGetMiss;
 
       if (hdl == nullptr) {
@@ -247,7 +246,7 @@ class AsyncCacheStressor : public Stressor {
         // appropriate here)
         l.unlock();
         auto xlock = chainedItemAcquireUniqueLock(key);
-        setKey(pid, stats, &key, *(req->sizeBegin), req->ttlSecs,
+        setKey(pid, stats, key, *(req->sizeBegin), req->ttlSecs,
                req->admFeatureMap);
       }
     } else {
@@ -260,8 +259,8 @@ class AsyncCacheStressor : public Stressor {
       }
     };
 
-    cache_->recordAccess(*key);
-    auto sf = cache_->asyncFind(*key);
+    cache_->recordAccess(key);
+    auto sf = cache_->asyncFind(key);
     if (sf.isReady()) {
       // If the handle is ready, call onReadyFn directly to process the handle
       onReadyFn(std::move(sf).value());
@@ -283,9 +282,9 @@ class AsyncCacheStressor : public Stressor {
                 ThroughputStats& stats,
                 const Request* req,
                 folly::EventBase* evb,
-                const std::string* key) {
+                const std::string_view& key) {
     ++stats.get;
-    auto lock = chainedItemAcquireUniqueLock(*key);
+    auto lock = chainedItemAcquireUniqueLock(key);
 
     // This was moved outside the lambda, as otherwise gcc-8.x crashes with an
     // internal compiler error here (suspected regression in folly).
@@ -297,7 +296,7 @@ class AsyncCacheStressor : public Stressor {
       ++stats.getMiss;
 
      ++stats.set;
-      wHdl = cache_->allocate(pid, *key, *(req->sizeBegin), req->ttlSecs);
+      wHdl = cache_->allocate(pid, key, *(req->sizeBegin), req->ttlSecs);
       if (!wHdl) {
         ++stats.setFailure;
         return;
@@ -327,7 +326,7 @@ class AsyncCacheStressor : public Stressor {
     };
 
     // Always use asyncFind as findToWrite is sync when using HybridCache
-    auto sf = cache_->asyncFind(*key);
+    auto sf = cache_->asyncFind(key);
     if (sf.isReady()) {
       onReadyFn(std::move(sf).value());
       return;
@@ -345,10 +344,10 @@ class AsyncCacheStressor : public Stressor {
   void asyncUpdate(ThroughputStats& stats,
                    const Request* req,
                    folly::EventBase* evb,
-                   const std::string* key) {
+                   const std::string_view& key) {
     ++stats.get;
     ++stats.update;
-    auto lock = chainedItemAcquireUniqueLock(*key);
+    auto lock = chainedItemAcquireUniqueLock(key);
     if (ticker_) {
       ticker_->updateTimeStamp(req->timestamp);
     }
@@ -363,7 +362,7 @@ class AsyncCacheStressor : public Stressor {
       cache_->updateItemRecordVersion(wHdl);
     };
 
-    auto sf = cache_->asyncFind(*key);
+    auto sf = cache_->asyncFind(key);
     if (sf.isReady()) {
       onReadyFn(std::move(sf).value());
       return;
@@ -457,18 +456,18 @@ class AsyncCacheStressor : public Stressor {
       const auto pid = static_cast<PoolId>(opPoolDist(gen));
       const Request& req(getReq(pid, gen, lastRequestId));
       OpType op = req.getOp();
-      const std::string* key = &(req.key);
-      std::string oneHitKey;
+      std::string_view key = req.key;
+      std::string_view oneHitKey;
       if (op == OpType::kLoneGet || op == OpType::kLoneSet) {
         oneHitKey = Request::getUniqueKey();
-        key = &oneHitKey;
+        key = oneHitKey;
       }
 
       OpResultType result(OpResultType::kNop);
       switch (op) {
       case OpType::kLoneSet:
       case OpType::kSet: {
-        auto lock = chainedItemAcquireUniqueLock(*key);
+        auto lock = chainedItemAcquireUniqueLock(key);
         result = setKey(pid, stats, key, *(req.sizeBegin), req.ttlSecs,
                         req.admFeatureMap);
 
@@ -481,8 +480,8 @@ class AsyncCacheStressor : public Stressor {
       }
       case OpType::kDel: {
         ++stats.del;
-        auto lock = chainedItemAcquireUniqueLock(*key);
-        auto res = cache_->remove(*key);
+        auto lock = chainedItemAcquireUniqueLock(key);
+        auto res = cache_->remove(key);
         if (res == CacheT::RemoveRes::kNotFoundInRam) {
           ++stats.delNotFound;
         }
@@ -532,7 +531,7 @@ class AsyncCacheStressor : public Stressor {
   OpResultType setKey(
       PoolId pid,
       ThroughputStats& stats,
-      const std::string* key,
+      const std::string_view& key,
       size_t size,
       uint32_t ttlSecs,
       const std::unordered_map<std::string, std::string>& featureMap) {
@@ -543,7 +542,7 @@ class AsyncCacheStressor : public Stressor {
     }
 
     ++stats.set;
-    auto it = cache_->allocate(pid, *key, size, ttlSecs);
+    auto it = cache_->allocate(pid, key, size, ttlSecs);
     if (it == nullptr) {
       ++stats.setFailure;
       return OpResultType::kSetFailure;
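
Note: most of the churn in this file is one mechanical change, keys flow through the stressor as std::string_view instead of const std::string*. Besides dropping the dereferences, it makes the async callbacks cheaper: the old onReadyFn captured a full copy of the key string (key = *key), while the new one captures the view by value, a pointer/length pair with no allocation. The view must outlive the callback, which holds because the request that owns the key stays alive until the operation completes. A minimal sketch of the capture pattern (names are hypothetical):

#include <iostream>
#include <string>
#include <string_view>

int main() {
  // Stand-in for Request::key, which outlives the async operation.
  std::string owningKey = "req:12345";

  // Old pattern: the lambda captured a copy of the whole string.
  // New pattern: capture the view by value -- two words, no allocation.
  std::string_view key = owningKey;
  auto onReadyFn = [key](bool hit) {
    std::cout << key << (hit ? " hit" : " miss") << '\n';
  };

  onReadyFn(true);  // safe: owningKey is still alive when the callback runs
}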

cachelib/cachebench/runner/CacheStressor.h

Lines changed: 20 additions & 20 deletions
@@ -325,24 +325,24 @@ class CacheStressor : public Stressor {
       const auto pid = static_cast<PoolId>(opPoolDist(gen));
       const Request& req(getReq(pid, gen, lastRequestId));
       OpType op = req.getOp();
-      const std::string* key = &(req.key);
-      std::string oneHitKey;
+      std::string_view key = req.key;
+      std::string_view oneHitKey;
       if (op == OpType::kLoneGet || op == OpType::kLoneSet) {
         oneHitKey = Request::getUniqueKey();
-        key = &oneHitKey;
+        key = oneHitKey;
       }
 
       OpResultType result(OpResultType::kNop);
       switch (op) {
       case OpType::kLoneSet:
       case OpType::kSet: {
         if (config_.onlySetIfMiss) {
-          auto it = cache_->find(*key);
+          auto it = cache_->find(key);
           if (it != nullptr) {
             continue;
           }
         }
-        auto lock = chainedItemAcquireUniqueLock(*key);
+        auto lock = chainedItemAcquireUniqueLock(key);
         result = setKey(pid, stats, key, *(req.sizeBegin), req.ttlSecs,
                         req.admFeatureMap, req.itemValue);
 
@@ -352,17 +352,17 @@ class CacheStressor : public Stressor {
       case OpType::kGet: {
         ++stats.get;
 
-        auto slock = chainedItemAcquireSharedLock(*key);
-        auto xlock = decltype(chainedItemAcquireUniqueLock(*key)){};
+        auto slock = chainedItemAcquireSharedLock(key);
+        auto xlock = decltype(chainedItemAcquireUniqueLock(key)){};
 
         if (ticker_) {
           ticker_->updateTimeStamp(req.timestamp);
         }
         // TODO currently pure lookaside, we should
         // add a distribution over sequences of requests/access patterns
         // e.g. get-no-set and set-no-get
-        cache_->recordAccess(*key);
-        auto it = cache_->find(*key);
+        cache_->recordAccess(key);
+        auto it = cache_->find(key);
         if (it == nullptr) {
           ++stats.getMiss;
           result = OpResultType::kGetMiss;
@@ -372,7 +372,7 @@ class CacheStressor : public Stressor {
           // upgrade access privledges, (lock_upgrade is not
           // appropriate here)
           slock = {};
-          xlock = chainedItemAcquireUniqueLock(*key);
+          xlock = chainedItemAcquireUniqueLock(key);
           setKey(pid, stats, key, *(req.sizeBegin), req.ttlSecs,
                  req.admFeatureMap, req.itemValue);
         }
@@ -384,22 +384,22 @@ class CacheStressor : public Stressor {
       }
       case OpType::kDel: {
         ++stats.del;
-        auto lock = chainedItemAcquireUniqueLock(*key);
-        auto res = cache_->remove(*key);
+        auto lock = chainedItemAcquireUniqueLock(key);
+        auto res = cache_->remove(key);
         if (res == CacheT::RemoveRes::kNotFoundInRam) {
           ++stats.delNotFound;
         }
         break;
       }
       case OpType::kAddChained: {
         ++stats.get;
-        auto lock = chainedItemAcquireUniqueLock(*key);
-        auto it = cache_->findToWrite(*key);
+        auto lock = chainedItemAcquireUniqueLock(key);
+        auto it = cache_->findToWrite(key);
         if (!it) {
           ++stats.getMiss;
 
           ++stats.set;
-          it = cache_->allocate(pid, *key, *(req.sizeBegin), req.ttlSecs);
+          it = cache_->allocate(pid, key, *(req.sizeBegin), req.ttlSecs);
           if (!it) {
             ++stats.setFailure;
             break;
@@ -430,11 +430,11 @@ class CacheStressor : public Stressor {
       case OpType::kUpdate: {
         ++stats.get;
         ++stats.update;
-        auto lock = chainedItemAcquireUniqueLock(*key);
+        auto lock = chainedItemAcquireUniqueLock(key);
         if (ticker_) {
           ticker_->updateTimeStamp(req.timestamp);
         }
-        auto it = cache_->findToWrite(*key);
+        auto it = cache_->findToWrite(key);
         if (it == nullptr) {
           ++stats.getMiss;
           ++stats.updateMiss;
@@ -445,7 +445,7 @@ class CacheStressor : public Stressor {
       }
       case OpType::kCouldExist: {
         ++stats.couldExistOp;
-        if (!cache_->couldExist(*key)) {
+        if (!cache_->couldExist(key)) {
           ++stats.couldExistOpFalse;
         }
         break;
@@ -480,7 +480,7 @@ class CacheStressor : public Stressor {
   OpResultType setKey(
       PoolId pid,
       ThroughputStats& stats,
-      const std::string* key,
+      const std::string_view& key,
       size_t size,
       uint32_t ttlSecs,
       const std::unordered_map<std::string, std::string>& featureMap,
@@ -492,7 +492,7 @@ class CacheStressor : public Stressor {
     }
 
     ++stats.set;
-    auto it = cache_->allocate(pid, *key, size, ttlSecs);
+    auto it = cache_->allocate(pid, key, size, ttlSecs);
     if (it == nullptr) {
       ++stats.setFailure;
       return OpResultType::kSetFailure;
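
Note on the kGet path above: on a miss the stressor clears the shared lock (slock = {}) and only then takes the unique lock, since, as the code comment says, lock_upgrade is not appropriate here. The drop-then-reacquire leaves a window in which another thread can fill the same key first; that race is benign for the benchmark because the subsequent set simply overwrites the value. A standalone sketch of the pattern, using a single std::shared_mutex as a stand-in for the per-key chained-item lock (all names hypothetical):

#include <mutex>
#include <shared_mutex>
#include <string>
#include <string_view>
#include <unordered_map>

std::shared_mutex gLock;                      // stand-in for the per-key lock
std::unordered_map<std::string, int> gCache;  // toy cache

int getOrFill(std::string_view key, int fillValue) {
  {
    std::shared_lock slock(gLock);  // shared access is enough for the lookup
    auto it = gCache.find(std::string(key));
    if (it != gCache.end()) {
      return it->second;  // hit
    }
  }  // shared lock released here; no atomic upgrade is attempted
  std::unique_lock xlock(gLock);  // reacquire exclusively for the fill
  // Another thread may have filled the key in the gap; emplace is a no-op
  // on duplicates, so the race stays benign.
  return gCache.emplace(std::string(key), fillValue).first->second;
}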

cachelib/cachebench/runner/Stressor.cpp

Lines changed: 3 additions & 0 deletions
@@ -21,6 +21,7 @@
 #include "cachelib/cachebench/runner/CacheStressor.h"
 #include "cachelib/cachebench/runner/FastShutdown.h"
 #include "cachelib/cachebench/runner/IntegrationStressor.h"
+#include "cachelib/cachebench/workload/BinaryKVReplayGenerator.h"
 #include "cachelib/cachebench/workload/KVReplayGenerator.h"
 #include "cachelib/cachebench/workload/OnlineGenerator.h"
 #include "cachelib/cachebench/workload/PieceWiseReplayGenerator.h"
@@ -142,6 +143,8 @@ std::unique_ptr<GeneratorBase> makeGenerator(const StressorConfig& config) {
     return std::make_unique<PieceWiseReplayGenerator>(config);
   } else if (config.generator == "replay") {
     return std::make_unique<KVReplayGenerator>(config);
+  } else if (config.generator == "binary-replay") {
+    return std::make_unique<BinaryKVReplayGenerator>(config);
   } else if (config.generator.empty() || config.generator == "workload") {
     // TODO: Remove the empty() check once we label workload-based configs
     // properly
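
Note: with this branch in place, a cachebench test config selects the new generator through its generator field: "replay" still drives the text-trace KVReplayGenerator, while "binary-replay" drives the new BinaryKVReplayGenerator. A self-contained mirror of the dispatch shape (every type below is a stub for illustration; the real makeGenerator handles additional generators and the workload default rather than throwing):

#include <memory>
#include <stdexcept>
#include <string>

// Stubs standing in for the real cachebench types.
struct StressorConfig {
  std::string generator;
};
struct GeneratorBase {
  virtual ~GeneratorBase() = default;
};
struct KVReplayGenerator : GeneratorBase {
  explicit KVReplayGenerator(const StressorConfig&) {}
};
struct BinaryKVReplayGenerator : GeneratorBase {
  explicit BinaryKVReplayGenerator(const StressorConfig&) {}
};

std::unique_ptr<GeneratorBase> makeGenerator(const StressorConfig& config) {
  if (config.generator == "replay") {
    return std::make_unique<KVReplayGenerator>(config);  // text trace
  }
  if (config.generator == "binary-replay") {
    return std::make_unique<BinaryKVReplayGenerator>(config);  // binary trace
  }
  throw std::invalid_argument("unsupported generator: " + config.generator);
}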
