Internal changes

PiperOrigin-RevId: 837001762
2025-11-26 01:05:06 -08:00 · 2025-11-26 01:05:06 -08:00 · c153d5255b
parent 8696f6dd17
commit c153d5255b
4 changed files with 36 additions and 6 deletions
--- a/BUILD.bazel
+++ b/BUILD.bazel
@ -518,6 +518,18 @@ cc_library(
    ],
 )

+cc_test(
+    name = "kv_cache_test",
+    srcs = ["gemma/kv_cache_test.cc"],
+    deps = [
+        ":configs",
+        ":gemma_args",
+        ":kv_cache",
+        ":threading_context",
+        "//testing/base/public:gunit_main",
+    ],
+)
+
 cc_library(
    name = "gemma_args",
    hdrs = ["gemma/gemma_args.h"],
--- a/gemma/kv_cache.cc
+++ b/gemma/kv_cache.cc
@ -51,7 +51,6 @@ KVCache KVCache::Copy() {
  KVCache copy(kv_cache.Extents(), allocator_);

  CopyMat(kv_cache, copy.kv_cache);
-
  return copy;
 }

@ -59,7 +58,9 @@ std::vector<KVCachePtr> ToKVCachePtrs(const hwy::Span<KVCache>& kv_caches) {
  std::vector<KVCachePtr> ptrs;
  ptrs.reserve(kv_caches.size());
  for (size_t i = 0; i < kv_caches.size(); ++i) {
-    ptrs.push_back(KVCachePtr{.kv_cache = kv_caches[i].kv_cache});
+    ptrs.push_back(KVCachePtr{
+        .kv_cache = kv_caches[i].kv_cache,
+    });
  }
  return ptrs;
 }
--- a/gemma/kv_cache.h
+++ b/gemma/kv_cache.h
@ -17,6 +17,8 @@
 #define THIRD_PARTY_GEMMA_CPP_GEMMA_KV_CACHE_H_

 #include <stddef.h>
+
+#include <optional>
 #include <vector>

 #include "gemma/configs.h"     // ModelConfig
@ -31,19 +33,23 @@ using KV_t = float;
 // A non-owning view of a KVCache.
 struct KVCachePtr {
  bool IsEmpty() const { return kv_cache.Rows() == 0; }
-  size_t SeqLen() const { return kv_cache.Rows(); }
+  size_t SeqLen() const {
+    return kv_cache.Rows();
+  }
+
  MatPtrT<KV_t> kv_cache;
 };

 struct KVCache {
  KVCache(const ModelConfig& config, const InferenceArgs& inference_args,
          const Allocator& allocator);
-
  // Returns a deep copy of the KVCache. Use explicit function instead of
  // copy ctor to make the cost explicit.
  KVCache Copy();

-  size_t SeqLen() const { return kv_cache.Rows(); }
+  size_t SeqLen() const {
+    return kv_cache.Rows();
+  }

  MatStorageT<KV_t> kv_cache;  // [seq_len, layers * kv_heads * qkv_dim * 2]

--- a/gemma/kv_cache_test.cc
+++ b/gemma/kv_cache_test.cc
@ -0,0 +1,11 @@
+#include "gemma/kv_cache.h"
+
+#include "gtest/gtest.h"
+#include "gemma/configs.h"
+#include "gemma/gemma_args.h"
+#include "util/threading_context.h"
+namespace gcpp {
+namespace {
+
+}  // namespace
+}  // namespace gcpp