mirror of https://github.com/google/gemma.cpp.git
Increase the prefill batch size to 64.
PiperOrigin-RevId: 651754772
This commit is contained in:
parent
df3fb70802
commit
c879133a5a
|
|
@@ -36,7 +36,7 @@ ByteStorageT AllocateSizeof() {
|
||||||
return hwy::AllocateAligned<uint8_t>(sizeof(T));
|
return hwy::AllocateAligned<uint8_t>(sizeof(T));
|
||||||
}
|
}
|
||||||
|
|
||||||
constexpr size_t kPrefillBatchSize = 16;
|
constexpr size_t kPrefillBatchSize = 64;
|
||||||
constexpr size_t kDecodeBatchSize = 1;
|
constexpr size_t kDecodeBatchSize = 1;
|
||||||
constexpr size_t kBatchedQueryBatchSize = 16;
|
constexpr size_t kBatchedQueryBatchSize = 16;
|
||||||
constexpr size_t kMinAdjustedPrefillBatchSize =
|
constexpr size_t kMinAdjustedPrefillBatchSize =
|
||||||
|
|
|
||||||
Loading…
Reference in New Issue