From c2619c18bfff3cda751213c49f6628ff3e09ec35 Mon Sep 17 00:00:00 2001 From: Georgi Gerganov Date: Sat, 31 Jan 2026 16:38:46 +0200 Subject: [PATCH] examples: use cached dataset path to avoid HF Hub requests --- examples/llama-eval/llama-eval-new.py | 9 ++++++++- 1 file changed, 8 insertions(+), 1 deletion(-) diff --git a/examples/llama-eval/llama-eval-new.py b/examples/llama-eval/llama-eval-new.py index 1026ecee44..d1dd3c048d 100755 --- a/examples/llama-eval/llama-eval-new.py +++ b/examples/llama-eval/llama-eval-new.py @@ -51,7 +51,14 @@ class AimeDataset: def _load_dataset(self): print(f"Loading AIME dataset (split: {self.split})...") from datasets import load_dataset - ds = load_dataset("AI-MO/aimo-validation-aime", split=self.split) + + cache_path = cache_dir / "AI-MO___aimo-validation-aime" / "default" / "0.0.0" + if cache_path.exists(): + print(f"Using cached dataset from {cache_path}") + ds = load_dataset("AI-MO/aimo-validation-aime", split=self.split, cache_dir=str(cache_path)) + else: + ds = load_dataset("AI-MO/aimo-validation-aime", split=self.split) + self.questions = list(ds) print(f"AIME dataset loaded: {len(self.questions)} questions")