server : reconnect the backend_sampling setting in the WebUI

This commit is contained in:
Georgi Gerganov 2025-12-10 15:42:02 +02:00
parent 81cb5783c8
commit 0ecee8be37
No known key found for this signature in database
GPG Key ID: 449E073F9DC10735
4 changed files with 6 additions and 2 deletions

Binary file not shown.

View File

@@ -208,10 +208,11 @@ task_params server_task::params_from_json_cmpl(
params.sampling.seed = json_value(data, "seed", defaults.sampling.seed);
params.sampling.n_probs = json_value(data, "n_probs", defaults.sampling.n_probs);
params.sampling.min_keep = json_value(data, "min_keep", defaults.sampling.min_keep);
params.sampling.backend_sampling = json_value(data, "backend_sampling", defaults.sampling.backend_sampling);
params.post_sampling_probs = json_value(data, "post_sampling_probs", defaults.post_sampling_probs);
const bool request_backend_sampling = json_value(data, "backend_sampling", defaults.sampling.backend_sampling);
params.sampling.backend_sampling = defaults.sampling.backend_sampling && request_backend_sampling;
printf("params.sampling.backend_sampling = %d\n", params.sampling.backend_sampling);
printf("defaults.sampling.backend_sampling = %d\n", defaults.sampling.backend_sampling);
params.speculative.n_min = json_value(data, "speculative.n_min", defaults.speculative.n_min);
params.speculative.n_max = json_value(data, "speculative.n_max", defaults.speculative.n_max);

View File

@@ -1401,6 +1401,7 @@ class ChatStore {
if (hasValue(currentConfig.dry_penalty_last_n))
apiOptions.dry_penalty_last_n = Number(currentConfig.dry_penalty_last_n);
if (currentConfig.samplers) apiOptions.samplers = currentConfig.samplers;
if (currentConfig.backend_sampling) apiOptions.backend_sampling = currentConfig.backend_sampling;
if (currentConfig.custom) apiOptions.custom = currentConfig.custom;
return apiOptions;

View File

@@ -149,6 +149,7 @@ export interface ApiLlamaCppServerProps {
reasoning_in_content: boolean;
thinking_forced_open: boolean;
samplers: string[];
backend_sampling: boolean;
'speculative.n_max': number;
'speculative.n_min': number;
'speculative.p_min': number;
@@ -311,6 +312,7 @@ export interface ApiSlotData {
reasoning_in_content: boolean;
thinking_forced_open: boolean;
samplers: string[];
backend_sampling: boolean;
'speculative.n_max': number;
'speculative.n_min': number;
'speculative.p_min': number;