From e79e8d02d53b757a71388ccd4303467603f63027 Mon Sep 17 00:00:00 2001
From: Georgi Gerganov <ggerganov@gmail.com>
Date: Sat, 31 Jan 2026 18:58:27 +0200
Subject: [PATCH] examples: add task summary table to llama-eval-new.py

---
 examples/llama-eval/llama-eval-new.py | 12 ++++++++++++
 1 file changed, 12 insertions(+)

diff --git a/examples/llama-eval/llama-eval-new.py b/examples/llama-eval/llama-eval-new.py
index f307b1eb31..0dae28116a 100755
--- a/examples/llama-eval/llama-eval-new.py
+++ b/examples/llama-eval/llama-eval-new.py
@@ -208,6 +208,18 @@ class Processor:
         print(f"Max tokens: {self.n_predict}")
         print()
 
+        # Print task summary table
+        print("Tasks:")
+        print("  Task ID         Dataset    Prompt (first 40 chars)                        Expected    Status")
+        for i in range(min(n_cases, len(self.dataset.questions))):
+            question = self.dataset.get_question(i)
+            case_id = f"aime_{self.dataset.split}_{question['id']}"
+            prompt = question["problem"]
+            gold = self.dataset.get_answer(question)
+            truncated_prompt = prompt[:40] + "..." if len(prompt) > 40 else prompt
+            print(f"  {case_id:<15} AIME2025   {truncated_prompt:<40}    {gold:<10} pending")
+        print()
+
         task_states: Dict[str, List[TaskState]] = {task: [] for task in self.eval_state.tasks}
         total = 0
         correct = 0