#pragma once #include "chat.h" #include "nlohmann/json.hpp" #include #include #include #include #include using json = nlohmann::ordered_json; // ============================================================================ // Parameters for template application // ============================================================================ struct template_params { json messages; json tools; bool add_generation_prompt = false; bool enable_thinking = true; std::optional extra_context = std::nullopt; }; struct diff_split { std::string prefix; std::string suffix; std::string left; std::string right; bool operator==(struct diff_split & other) const { return prefix == other.prefix && suffix == other.suffix && left == other.left && right == other.right; } }; // Result of compare_variants containing diff and original outputs struct compare_variants_result { diff_split diff; std::string output_A; std::string output_B; }; // ============================================================================ // Marker Registry: All markers extracted via differential analysis // ============================================================================ // Markers extracted from differential analysis of template outputs // Each marker is derived from a specific comparison in the analysis matrix struct marker_registry { // === Reasoning markers (from Phase 1: R1-R3) === std::string reasoning_start; // e.g., "", "[THINK]", "<|START_THINKING|>", "" std::string reasoning_end; // e.g., "", "[BEGIN FINAL RESPONSE]", "<|END_THINKING|>" // === Content markers (from Phase 2: C1-C2) === std::string content_start; // e.g., "", ">>>all\n", "" std::string content_end; // e.g., "", "" // === Tool section markers (from Phase 3: T1-T2) === std::string tool_section_start; // e.g., "", "[TOOL_CALLS]", "" std::string tool_section_end; // e.g., "", "" std::string per_call_start; // e.g., "<|tool_call_begin|>", "" (for multi-call templates) std::string per_call_end; // e.g., "<|tool_call_end|>", "" std::string call_separator; // e.g., ",", "\n", "" (between multiple calls) // === Function markers (from Phase 3: T3-T5) === std::string func_name_prefix; // e.g., "", "\"", ":0" std::string func_close; // e.g., "", "" (for tag-based) std::string args_start; // e.g., "{", "<|tool_call_argument_begin|>" std::string args_end; // e.g., "}", "" // === Argument markers (from Phase 4: A1-A3, for tagged args format) === std::string arg_name_prefix; // e.g., "", "\"" std::string arg_name_suffix; // e.g., ">", "", "\":" std::string arg_value_prefix; // e.g., "", "", "" std::string arg_value_suffix; // e.g., "", "", "" std::string arg_separator; // e.g., "", "\n", "," // === Call ID markers (for non-JSON formats with tool call IDs) === std::string call_id_prefix; // e.g., "[CALL_ID]" (marker before call ID value) std::string call_id_suffix; // e.g., "" (marker after call ID value, before next section) // === Special markers === std::string code_block_marker; // e.g., "Action:" (for markdown code block format) std::string code_block_language; // e.g., "json" std::string function_namespace; // e.g., "functions." (for prefixed-indexed format) }; // ============================================================================ // Analysis Result Enums // ============================================================================ // Reasoning handling mode (derived from R1-R3 comparisons) enum class reasoning_mode { NONE, // No reasoning markers detected TAG_BASED, // Standard tag-based: ... DELIMITER, // Delimiter-based: [BEGIN FINAL RESPONSE] (reasoning ends at delimiter) FORCED_OPEN, // Template ends with open reasoning tag (empty start, non-empty end) FORCED_CLOSED,// Template ends with open reasoning tag on enabled thinking but // with both opened and closed tag for disabled thinking TOOLS_ONLY // Only reason on tool calls, not on normal content }; inline std::ostream & operator<<(std::ostream & os, const reasoning_mode & mode) { switch (mode) { case reasoning_mode::NONE: return os << "NONE"; case reasoning_mode::TAG_BASED: return os << "TAG_BASED"; case reasoning_mode::DELIMITER: return os << "DELIMITER"; case reasoning_mode::FORCED_OPEN: return os << "FORCED_OPEN"; case reasoning_mode::FORCED_CLOSED: return os << "FORCED_CLOSED"; case reasoning_mode::TOOLS_ONLY: return os << "TOOLS_ONLY"; default: return os << "UNKNOWN"; } } // Content wrapping mode (derived from C1 comparison) enum class content_mode { PLAIN, // No content markers ALWAYS_WRAPPED, // Content always wrapped with markers WRAPPED_WITH_REASONING, // Content wrapped only when reasoning present }; inline std::ostream & operator<<(std::ostream & os, const content_mode & mode) { switch (mode) { case content_mode::PLAIN: return os << "PLAIN"; case content_mode::ALWAYS_WRAPPED: return os << "ALWAYS_WRAPPED"; case content_mode::WRAPPED_WITH_REASONING: return os << "WRAPPED_WITH_REASONING"; default: return os << "UNKNOWN"; } } // Call ID position in tool calls (for non-JSON formats) enum class call_id_position { NONE, // No call ID support detected PRE_FUNC_NAME, // Call ID before function name: [CALL_ID]id[FUNC]name{args} BETWEEN_FUNC_AND_ARGS, // Call ID between function and args: [FUNC]name[CALL_ID]id{args} POST_ARGS, // Call ID after arguments: [FUNC]name{args}[CALL_ID]id }; inline std::ostream & operator<<(std::ostream & os, const call_id_position & pos) { switch (pos) { case call_id_position::NONE: return os << "NONE"; case call_id_position::PRE_FUNC_NAME: return os << "PRE_FUNC_NAME"; case call_id_position::BETWEEN_FUNC_AND_ARGS: return os << "BETWEEN_FUNC_AND_ARGS"; case call_id_position::POST_ARGS: return os << "POST_ARGS"; default: return os << "UNKNOWN"; } } // Tool call format classification (derived from T1-T5, A1-A3 comparisons) enum class tool_format { NONE, // No tool support detected JSON_NATIVE, // Pure JSON: {"name": "X", "arguments": {...}} TAG_WITH_JSON, // Tag-based with JSON args: {...} BRACKET_TAG, // Bracket-tag: [TOOL_CALLS]name[CALL_ID]id[ARGS]{...} PREFIXED_INDEXED, // Prefixed-indexed: functions.X:0{...} RECIPIENT_BASED, // Recipient routing: >>>func_name\n{...} TAG_WITH_TAGGED, // Tag-based with tagged args: value MARKDOWN_BLOCK, // Markdown code block: Action:\n```json\n[...]\n``` }; inline std::ostream & operator<<(std::ostream & os, const tool_format & format) { switch (format) { case tool_format::NONE: return os << "NONE"; case tool_format::JSON_NATIVE: return os << "JSON_NATIVE"; case tool_format::TAG_WITH_JSON: return os << "TAG_WITH_JSON"; case tool_format::BRACKET_TAG: return os << "BRACKET_TAG"; case tool_format::PREFIXED_INDEXED: return os << "PREFIXED_INDEXED"; case tool_format::RECIPIENT_BASED: return os << "RECIPIENT_BASED"; case tool_format::TAG_WITH_TAGGED: return os << "TAG_WITH_TAGGED"; case tool_format::MARKDOWN_BLOCK: return os << "MARKDOWN_BLOCK"; default: return os << "UNKNOWN"; } } // Complete result of differential analysis struct diff_analysis_result { // Classification results reasoning_mode reasoning = reasoning_mode::NONE; content_mode content = content_mode::PLAIN; tool_format tools = tool_format::NONE; // All extracted markers marker_registry markers; // JSON field names (for JSON-based formats) bool fun_name_is_key = false; std::string function_field = "function"; std::string name_field = "name"; std::string args_field = "arguments"; std::string id_field; std::string gen_id_field; std::vector parameter_order; // Call ID position (for non-JSON formats) call_id_position call_id_pos = call_id_position::NONE; // Flags bool supports_tools = false; bool supports_parallel_calls = false; bool requires_nonnull_content = false; bool tools_array_wrapped = false; // Tool calls wrapped in JSON array [...] // Preserved tokens for tokenizer (union of all non-empty markers) std::vector preserved_tokens; }; // Performs systematic differential analysis on chat templates // Uses comparison matrix to extract markers without heuristics class differential_analyzer { public: // Main entry point: Run full differential analysis on a template static diff_analysis_result analyze(const common_chat_template & tmpl); // Phase-specific analysis (can be called individually for testing) static void analyze_reasoning(const common_chat_template & tmpl, diff_analysis_result & result); static void analyze_content(const common_chat_template & tmpl, diff_analysis_result & result); static void analyze_tools(const common_chat_template & tmpl, diff_analysis_result & result); static void analyze_arguments(const common_chat_template & tmpl, diff_analysis_result & result); // Factorized differential comparison function (public for testing) // Takes base params and a single modifier lambda to create variant B // Returns compare_variants_result containing diff and both outputs, or std::nullopt on failure static std::optional compare_variants( const common_chat_template & tmpl, const template_params & params_A, const std::function & params_modifier); private: // Comparison helpers (implement the comparison matrix from the plan) // R1: Extract reasoning markers by comparing with/without reasoning_content static void compare_reasoning_presence(const common_chat_template & tmpl, diff_analysis_result & result); // R2: Detect forced-open reasoning by comparing enable_thinking=false vs true static void compare_thinking_enabled(const common_chat_template & tmpl, diff_analysis_result & result); // R3: Detect reasoning scope (content-only vs with tools) static void compare_reasoning_scope(const common_chat_template & tmpl, diff_analysis_result & result); // C1: Extract content markers by comparing different content values static void compare_content_values(const common_chat_template & tmpl, diff_analysis_result & result); // T1: Analyze the tool calls static void analyze_tool_calls(const common_chat_template & tmpl, diff_analysis_result & result); // Analyzes a tool call section to determine the format used (pure JSON, function name markers, or full markers) static void analyze_tool_call_format(const std::string & haystack, const std::string & fun_name_needle, const std::string & arg_name_needle, diff_analysis_result & result); // Helper functions to handle the two branches of analyze_tool_call_format static void analyze_tool_call_format_json_native(const std::string & clean_haystack, const std::string & fun_name_needle, const std::string & arg_name_needle, diff_analysis_result & result); static void analyze_tool_call_format_non_json(const std::string & clean_haystack, const std::string & fun_name_needle, diff_analysis_result & result); // T2: Check if markers are per call or per section static void check_per_call_markers(const common_chat_template & tmpl, diff_analysis_result & result); // T3: Extract call separator; also outputs second_call_content for per-call detection static void extract_call_separator(const common_chat_template & tmpl, diff_analysis_result & result, std::string & second_call_content); // T4: Analyze function name format and extract markers static void extract_function_markers(const common_chat_template & tmpl, diff_analysis_result & result); // T5: Extract argument separator static void extract_argument_separator(const common_chat_template & tmpl, diff_analysis_result & result); // T6: Extract args container markers static void extract_args_markers(const common_chat_template & tmpl, diff_analysis_result & result); // A1: Extract argument name markers static void extract_argument_name_markers(const common_chat_template & tmpl, diff_analysis_result & result); // A2: Extract argument value markers static void extract_argument_value_markers(const common_chat_template & tmpl, diff_analysis_result & result); // T7: Extract call ID markers (for non-JSON formats) static void extract_call_id_markers(const common_chat_template & tmpl, diff_analysis_result & result); // Classify tool format based on extracted markers static void classify_tool_format(diff_analysis_result & result); // Classification helpers static void collect_preserved_tokens(diff_analysis_result & result); // Utility: Apply template with given parameters static std::string apply_template(const common_chat_template & tmpl, const template_params & params); }; enum segment_type { TEXT, MARKER }; inline std::ostream & operator<<(std::ostream & os, const segment_type & type) { switch (type) { case segment_type::TEXT: return os << "TEXT"; case segment_type::MARKER: return os << "MARKER"; default: return os << "UNKNOWN"; } } struct segment { segment_type type; std::string value; segment(segment_type type, std::string value) : type(type), value(std::move(value)) {} };