From 4137fc7003d2bbf00abdebc6a97f29cfa75460aa Mon Sep 17 00:00:00 2001 From: Marc Sun Date: Thu, 6 Jun 2024 14:59:53 +0200 Subject: [PATCH 1/2] fix accelerate tests for roberta xl --- .../models/xlm_roberta_xl/modeling_xlm_roberta_xl.py | 2 +- tests/models/xlm_roberta_xl/test_modeling_xlm_roberta_xl.py | 2 ++ 2 files changed, 3 insertions(+), 1 deletion(-) diff --git a/src/transformers/models/xlm_roberta_xl/modeling_xlm_roberta_xl.py b/src/transformers/models/xlm_roberta_xl/modeling_xlm_roberta_xl.py index 7534eb4dad3b..d189086cd89e 100644 --- a/src/transformers/models/xlm_roberta_xl/modeling_xlm_roberta_xl.py +++ b/src/transformers/models/xlm_roberta_xl/modeling_xlm_roberta_xl.py @@ -572,7 +572,7 @@ class XLMRobertaXLPreTrainedModel(PreTrainedModel): config_class = XLMRobertaXLConfig base_model_prefix = "roberta" - _no_split_modules = ["XLMRobertaXLEmbeddings", "XLMRobertaXLSelfAttention"] + _no_split_modules = ["XLMRobertaXLEmbeddings", "XLMRobertaXLLayer"] # Copied from transformers.models.bert.modeling_bert.BertPreTrainedModel._init_weights def _init_weights(self, module): diff --git a/tests/models/xlm_roberta_xl/test_modeling_xlm_roberta_xl.py b/tests/models/xlm_roberta_xl/test_modeling_xlm_roberta_xl.py index d8a37d477909..c1467fef4a20 100644 --- a/tests/models/xlm_roberta_xl/test_modeling_xlm_roberta_xl.py +++ b/tests/models/xlm_roberta_xl/test_modeling_xlm_roberta_xl.py @@ -387,6 +387,8 @@ class XLMRobertaXLModelTest(ModelTesterMixin, GenerationTesterMixin, PipelineTes else {} ) + model_split_percents = [0.5,0.85,0.95] + # TODO: Fix the failed tests def is_pipeline_test_to_skip( self, pipeline_test_casse_name, config_class, model_architecture, tokenizer_name, processor_name From eb51b9b488db9445a84e9b2ba256a942d596abab Mon Sep 17 00:00:00 2001 From: Marc Sun Date: Thu, 6 Jun 2024 15:05:02 +0200 Subject: [PATCH 2/2] style --- tests/models/xlm_roberta_xl/test_modeling_xlm_roberta_xl.py | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/tests/models/xlm_roberta_xl/test_modeling_xlm_roberta_xl.py b/tests/models/xlm_roberta_xl/test_modeling_xlm_roberta_xl.py index c1467fef4a20..22663db27c81 100644 --- a/tests/models/xlm_roberta_xl/test_modeling_xlm_roberta_xl.py +++ b/tests/models/xlm_roberta_xl/test_modeling_xlm_roberta_xl.py @@ -387,7 +387,7 @@ class XLMRobertaXLModelTest(ModelTesterMixin, GenerationTesterMixin, PipelineTes else {} ) - model_split_percents = [0.5,0.85,0.95] + model_split_percents = [0.5, 0.85, 0.95] # TODO: Fix the failed tests def is_pipeline_test_to_skip(