diff --git a/src/transformers/models/aria/configuration_aria.py b/src/transformers/models/aria/configuration_aria.py index bf2b262c0cc398..b9e1705e6f672d 100644 --- a/src/transformers/models/aria/configuration_aria.py +++ b/src/transformers/models/aria/configuration_aria.py @@ -145,7 +145,7 @@ def __init__( initializer_range=0.02, rms_norm_eps=1e-6, use_cache=True, - pad_token_id=None, + pad_token_id=2, bos_token_id=1, eos_token_id=2, pretraining_tp=1, diff --git a/tests/models/aria/test_modeling_aria.py b/tests/models/aria/test_modeling_aria.py index 988aabb00c45fe..5bc8cb3541fbc6 100644 --- a/tests/models/aria/test_modeling_aria.py +++ b/tests/models/aria/test_modeling_aria.py @@ -298,6 +298,10 @@ def test_feed_forward_chunking(self): def test_initialization(self): pass + @unittest.skip(reason="Unstable test") + def test_dola_decoding_sample(self): + pass + @require_torch class AriaForConditionalGenerationIntegrationTest(unittest.TestCase):