Clean up MTP sampler pointer typing after rebase

This commit is contained in:
Aaron Lee 2025-12-21 17:53:27 -05:00
parent a8dc54672c
commit d10a5a4a5b
5 changed files with 8 additions and 6 deletions

View File

@ -691,4 +691,4 @@ llama_token common_sampler_sample_speculative(struct common_sampler * gsmpl, str
}
return best_id;
}
}

View File

@ -115,3 +115,5 @@ struct common_sampler_deleter {
};
typedef std::unique_ptr<common_sampler, common_sampler_deleter> common_sampler_ptr;
llama_token common_sampler_sample_speculative(struct common_sampler * gsmpl, struct llama_context * ctx, int idx);

View File

@ -361,8 +361,8 @@ llama_tokens common_speculative_gen_draft(
}
llama_tokens mtp_speculative_gen_draft(
struct common_sampler* smpl,
struct llama_context* ctx,
struct common_sampler * smpl,
struct llama_context * ctx,
struct common_speculative_params params,
llama_token id_last,
int32_t n_past,

View File

@ -57,8 +57,8 @@ llama_tokens common_speculative_gen_draft(
* @return std::vector<llama_token> The generated draft tokens.
*/
llama_tokens mtp_speculative_gen_draft(
struct common_sampler* smpl,
struct llama_context* ctx,
struct common_sampler * smpl,
struct llama_context * ctx,
struct common_speculative_params params,
llama_token id_last,
int32_t n_past,

View File

@ -2001,7 +2001,7 @@ struct server_context_impl {
llama_set_draft_input_hidden_state(ctx, llama_get_embeddings_ith(ctx, -1));
draft = mtp_speculative_gen_draft(
slot.smpl,
slot.smpl.get(),
ctx,
params_spec,
slot.sampled,