diff --git a/gemma/gemma.cc b/gemma/gemma.cc index f32cde5..1c07c9e 100644 --- a/gemma/gemma.cc +++ b/gemma/gemma.cc @@ -114,7 +114,7 @@ struct CreateKVCache { KVCache operator()() const { KVCache kv_cache = {}; - const size_t size_cache_pos = CacheLayerSize()(); + const size_t size_cache_pos = CachePosSize()(); if (size_cache_pos != 0) { const size_t seq_len = TConfig::kSeqLen + kPrefillBatchSize; kv_cache.kv_cache = hwy::AllocateAligned(seq_len * size_cache_pos);