From 048250e45fa9b10f8d4e0f0c3c0ed7359f87b2f3 Mon Sep 17 00:00:00 2001 From: "Sean (Seok-Won) Yi" Date: Sun, 22 Dec 2024 13:11:28 +0900 Subject: [PATCH 1/7] Updated docstring for _determine_best_metric. --- src/transformers/trainer.py | 1 - 1 file changed, 1 deletion(-) diff --git a/src/transformers/trainer.py b/src/transformers/trainer.py index c878d2b345cc31..812655f879ac85 100755 --- a/src/transformers/trainer.py +++ b/src/transformers/trainer.py @@ -3148,7 +3148,6 @@ def _load_rng_state(self, checkpoint): def _determine_best_metric(self, metrics, trial): """ Determine if the model should be saved based on the evaluation metrics. - If args.metric_for_best_model is not set, the loss is used. Returns: bool: True if a new best metric was found, else False From a90313632a61047b4c0bcac2a9199e32ea1d6007 Mon Sep 17 00:00:00 2001 From: "Sean (Seok-Won) Yi" Date: Sun, 22 Dec 2024 13:11:38 +0900 Subject: [PATCH 2/7] Updated docstring for metric_for_best_model. --- src/transformers/training_args.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/transformers/training_args.py b/src/transformers/training_args.py index 6950e8e66d3ac1..214cdde7b282c0 100644 --- a/src/transformers/training_args.py +++ b/src/transformers/training_args.py @@ -477,7 +477,7 @@ class TrainingArguments: metric_for_best_model (`str`, *optional*): Use in conjunction with `load_best_model_at_end` to specify the metric to use to compare two different models. Must be the name of a metric returned by the evaluation with or without the prefix `"eval_"`. Will - default to `"loss"` if unspecified and `load_best_model_at_end=True` (to use the evaluation loss). + default to `"loss"` if unspecified, `load_best_model_at_end=True`, and `save_strategy!="best"`. If you set this value, `greater_is_better` will default to `True`. Don't forget to set it to `False` if your metric is better when lower. From 84e91d1cf1806c0e73d2143037f929f9338d2cc1 Mon Sep 17 00:00:00 2001 From: "Sean (Seok-Won) Yi" Date: Sun, 22 Dec 2024 13:19:56 +0900 Subject: [PATCH 3/7] Added test case for save strategy. --- tests/trainer/test_trainer.py | 14 +++++++++++++- 1 file changed, 13 insertions(+), 1 deletion(-) diff --git a/tests/trainer/test_trainer.py b/tests/trainer/test_trainer.py index d33be2789761da..c787649edca05e 100644 --- a/tests/trainer/test_trainer.py +++ b/tests/trainer/test_trainer.py @@ -4232,9 +4232,21 @@ def test_save_best_checkpoint(self): save_strategy="best", compute_metrics=AlmostAccuracy(), ) - self.assertIn("`args.metric_for_best_model` must be provided", str(context.exception)) + # Case 4: Metric name not provided and save_best_strategy is "steps" (i.e., not "best"). + with tempfile.TemporaryDirectory() as tmpdir: + with self.assertRaises(ValueError) as context: + trainer = get_regression_trainer( + a=1.5, + b=2.5, + output_dir=tmpdir, + learning_rate=0.1, + eval_strategy="epoch", + save_strategy="steps", + ) + self.assertTrue(trainer.args.metric_for_best_model == "loss") + @require_torch @is_staging_test From 8accf30b892d41f308ae87ff78ae030a235d3400 Mon Sep 17 00:00:00 2001 From: "Sean (Seok-Won) Yi" Date: Sun, 22 Dec 2024 14:18:21 +0900 Subject: [PATCH 4/7] Updated incorrect test case. --- tests/trainer/test_trainer.py | 18 +++++++++--------- 1 file changed, 9 insertions(+), 9 deletions(-) diff --git a/tests/trainer/test_trainer.py b/tests/trainer/test_trainer.py index c787649edca05e..7093ce2745a64d 100644 --- a/tests/trainer/test_trainer.py +++ b/tests/trainer/test_trainer.py @@ -4236,15 +4236,15 @@ def test_save_best_checkpoint(self): # Case 4: Metric name not provided and save_best_strategy is "steps" (i.e., not "best"). with tempfile.TemporaryDirectory() as tmpdir: - with self.assertRaises(ValueError) as context: - trainer = get_regression_trainer( - a=1.5, - b=2.5, - output_dir=tmpdir, - learning_rate=0.1, - eval_strategy="epoch", - save_strategy="steps", - ) + trainer = get_regression_trainer( + a=1.5, + b=2.5, + output_dir=tmpdir, + learning_rate=0.1, + eval_strategy="epoch", + save_strategy="steps", + load_best_model_at_end=True, + ) self.assertTrue(trainer.args.metric_for_best_model == "loss") From 20b276ae29bf574e6d54adb371871da4a2482a06 Mon Sep 17 00:00:00 2001 From: "Sean (Seok-Won) Yi" Date: Sun, 22 Dec 2024 14:23:13 +0900 Subject: [PATCH 5/7] Changed eval_strategy to match save_strategy. --- tests/trainer/test_trainer.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/trainer/test_trainer.py b/tests/trainer/test_trainer.py index 7093ce2745a64d..1ee427902bac35 100644 --- a/tests/trainer/test_trainer.py +++ b/tests/trainer/test_trainer.py @@ -4241,7 +4241,7 @@ def test_save_best_checkpoint(self): b=2.5, output_dir=tmpdir, learning_rate=0.1, - eval_strategy="epoch", + eval_strategy="steps", save_strategy="steps", load_best_model_at_end=True, ) From ce460125e8782a1000ea864c71e22253ceba7e3d Mon Sep 17 00:00:00 2001 From: "Sean (Seok-Won) Yi" Date: Sat, 28 Dec 2024 17:55:29 +0900 Subject: [PATCH 6/7] Separated test cases for metric. --- tests/trainer/test_trainer.py | 7 +++++-- 1 file changed, 5 insertions(+), 2 deletions(-) diff --git a/tests/trainer/test_trainer.py b/tests/trainer/test_trainer.py index 1ee427902bac35..f39adf13e0c0c9 100644 --- a/tests/trainer/test_trainer.py +++ b/tests/trainer/test_trainer.py @@ -4220,7 +4220,9 @@ def test_save_best_checkpoint(self): total=total, ) - # Case 3: Metric name not provided; throw error. + def test_metric_for_best_model_behavior(self): + # Case 1: Metric name not provided when `save_strategy == "best"`. + # Should raise ValueError. with tempfile.TemporaryDirectory() as tmpdir: with self.assertRaises(ValueError) as context: trainer = get_regression_trainer( @@ -4234,7 +4236,8 @@ def test_save_best_checkpoint(self): ) self.assertIn("`args.metric_for_best_model` must be provided", str(context.exception)) - # Case 4: Metric name not provided and save_best_strategy is "steps" (i.e., not "best"). + # Case 2: Metric name not provided when `load_best_model_at_end == True`. + # `metric_for_best_model` should be set to `"loss"` by default. with tempfile.TemporaryDirectory() as tmpdir: trainer = get_regression_trainer( a=1.5, From 422304134b0b7b37dd401ff3db8271c5fa458ed9 Mon Sep 17 00:00:00 2001 From: "Sean (Seok-Won) Yi" Date: Sun, 5 Jan 2025 13:34:12 +0900 Subject: [PATCH 7/7] Allow load_best_model when save_strategy == "best". --- src/transformers/training_args.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/src/transformers/training_args.py b/src/transformers/training_args.py index 88b0c68e5a4047..8f408ede48a120 100644 --- a/src/transformers/training_args.py +++ b/src/transformers/training_args.py @@ -1636,7 +1636,7 @@ def __post_init__(self): self.save_steps = int(self.save_steps) # Sanity checks for load_best_model_at_end: we require save and eval strategies to be compatible. - if self.load_best_model_at_end: + if self.load_best_model_at_end and self.save_strategy != SaveStrategy.BEST: if self.eval_strategy != self.save_strategy: raise ValueError( "--load_best_model_at_end requires the save and eval strategy to match, but found\n- Evaluation "