mirror of https://github.com/google/gemma.cpp.git
parent
6721dddf38
commit
79e640a956
|
|
@ -1739,7 +1739,8 @@ void ComputeFlashParams(size_t num_tokens, const size_t target_parallelism,
|
|||
size_t tasks_required = params.back().v_tile_size < k4xNFVTileSize
|
||||
? k4xNFVTileSize
|
||||
: kVTileSize;
|
||||
if (params.back().v_tile_size + tasks_remaining < tasks_required ||
|
||||
if ((params.back().v_tile_size + tasks_remaining < tasks_required &&
|
||||
params.back().v_tile_size > 0) ||
|
||||
params.back().v_tile_size == kVTileSize) {
|
||||
// We don't have enough tasks remaining to fill a tile, or the
|
||||
// current tile is full so start new tile.
|
||||
|
|
|
|||
Loading…
Reference in New Issue