diff --git a/src/transformers/modeling_utils.py b/src/transformers/modeling_utils.py index b629c7ad2ac2..9a050c246e84 100755 --- a/src/transformers/modeling_utils.py +++ b/src/transformers/modeling_utils.py @@ -2746,7 +2746,7 @@ def save_pretrained( if module_map: filename_to_tensors = logging.tqdm(filename_to_tensors, desc="Saving checkpoint shards") for shard_file, tensors in filename_to_tensors: - shard = {tensor: state_dict[tensor] for tensor in tensors} + shard = {tensor: state_dict[tensor].contiguous() for tensor in tensors} # remake shard with onloaded parameters if necessary if module_map: if accelerate_version < version.parse("0.31"):