From 69aebcb031026f71861465a4e82abae334988a52 Mon Sep 17 00:00:00 2001 From: GrS-AA <171042778+GrS-AA@users.noreply.github.com> Date: Tue, 4 Nov 2025 11:46:17 +0000 Subject: [PATCH 1/5] hardcoded date for consistency in tests --- src/template_formatting/formatter.py | 2 ++ 1 file changed, 2 insertions(+) diff --git a/src/template_formatting/formatter.py b/src/template_formatting/formatter.py index ccf5a206..6f25841f 100644 --- a/src/template_formatting/formatter.py +++ b/src/template_formatting/formatter.py @@ -323,6 +323,8 @@ def format( # type: ignore[override] "continue_final_message": is_prefill, } ) + if "date_string" not in template_kwargs: + template_kwargs["date_string"] = "1 Jan 2025" # hardcoded date for consistency in tests return self.tokenizer.apply_chat_template(hf_chat, **template_kwargs) From 9fda5c5f0664ba8079f64a7b5445e4cf80170c65 Mon Sep 17 00:00:00 2001 From: GrS-AA <171042778+GrS-AA@users.noreply.github.com> Date: Tue, 4 Nov 2025 11:47:26 +0000 Subject: [PATCH 2/5] update changelog --- CHANGELOG.md | 1 + 1 file changed, 1 insertion(+) diff --git a/CHANGELOG.md b/CHANGELOG.md index 38d47b92..f978a9b0 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -34,6 +34,7 @@ - Fix: W&B integration respects WANDB_ARTIFACT_DIR. In addition, new env var WANDB_CACHE_SKIP controls cache use. - Dropped support for S3 storages without proper SSL certificates. - Added support for W&B artifacts on local storage which don't need to be downloaded and may be earlier available. 
+- Hardcoded a date in template formatting application for consistency in eval results ## 0.2.2 From 6a9c9ec1c33393b0ce175e055b25aae82825a08b Mon Sep 17 00:00:00 2001 From: GrS-AA <171042778+GrS-AA@users.noreply.github.com> Date: Tue, 4 Nov 2025 11:52:30 +0000 Subject: [PATCH 3/5] update changelog --- CHANGELOG.md | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index f978a9b0..743b7100 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -34,7 +34,7 @@ - Fix: W&B integration respects WANDB_ARTIFACT_DIR. In addition, new env var WANDB_CACHE_SKIP controls cache use. - Dropped support for S3 storages without proper SSL certificates. - Added support for W&B artifacts on local storage which don't need to be downloaded and may be earlier available. -- Hardcoded a date in template formatting application for consistency in eval results +- Hardcoded a date in template formatting application for consistency in eval results. ## 0.2.2 From 5f6188bad25276cf63c019ee4597b0978e38ca04 Mon Sep 17 00:00:00 2001 From: GrS-AA <171042778+GrS-AA@users.noreply.github.com> Date: Tue, 4 Nov 2025 11:55:23 +0000 Subject: [PATCH 4/5] fix ruff --- src/template_formatting/formatter.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/template_formatting/formatter.py b/src/template_formatting/formatter.py index 6f25841f..30f4d74b 100644 --- a/src/template_formatting/formatter.py +++ b/src/template_formatting/formatter.py @@ -324,7 +324,7 @@ def format( # type: ignore[override] } ) if "date_string" not in template_kwargs: - template_kwargs["date_string"] = "1 Jan 2025" # hardcoded date for consistency in tests + template_kwargs["date_string"] = "1 Jan 2025" # hardcoded date for consistency in tests return self.tokenizer.apply_chat_template(hf_chat, **template_kwargs) From c4a677a1a831a0d2fc5e757cacf711b07a5ad7f4 Mon Sep 17 00:00:00 2001 From: GrS-AA <171042778+GrS-AA@users.noreply.github.com> Date: Wed, 5 Nov 2025 20:16:33 +0000 Subject: 
[PATCH 5/5] use unknown (or default llama4 date TBD) --- src/template_formatting/formatter.py | 5 ++++- 1 file changed, 4 insertions(+), 1 deletion(-) diff --git a/src/template_formatting/formatter.py b/src/template_formatting/formatter.py index 30f4d74b..555c9ce2 100644 --- a/src/template_formatting/formatter.py +++ b/src/template_formatting/formatter.py @@ -324,7 +324,10 @@ def format( # type: ignore[override] } ) if "date_string" not in template_kwargs: - template_kwargs["date_string"] = "1 Jan 2025" # hardcoded date for consistency in tests + # some templates are forcing a date_string, hardcoding one here for consistency in evaluations, e.g. + # https://github.com/huggingface/transformers/blob/main/src/transformers/models/llama4/processing_llama4.py + # template_kwargs["date_string"] = "26 Jul 2024" + template_kwargs["date_string"] = "unknown" return self.tokenizer.apply_chat_template(hf_chat, **template_kwargs)