mirror of https://github.com/google/gemma.cpp.git
Increase the prefill batch size to 64.
PiperOrigin-RevId: 651754772
This commit is contained in:
parent
df3fb70802
commit
c879133a5a
|
|
@@ -36,7 +36,7 @@ ByteStorageT AllocateSizeof() {
|
|||
return hwy::AllocateAligned<uint8_t>(sizeof(T));
|
||||
}
|
||||
|
||||
constexpr size_t kPrefillBatchSize = 16;
|
||||
constexpr size_t kPrefillBatchSize = 64;
|
||||
constexpr size_t kDecodeBatchSize = 1;
|
||||
constexpr size_t kBatchedQueryBatchSize = 16;
|
||||
constexpr size_t kMinAdjustedPrefillBatchSize =
|
||||
|
|
|
|||
Loading…
Reference in New Issue