Skip to content

Commit

Permalink
deprecate warning
Browse files Browse the repository at this point in the history
  • Loading branch information
itazap committed Jul 25, 2024
1 parent 5728ea9 commit ec6f78a
Showing 1 changed file with 4 additions and 0 deletions.
4 changes: 4 additions & 0 deletions src/transformers/tokenization_utils_base.py
Original file line number Diff line number Diff line change
Expand Up @@ -1595,6 +1595,10 @@ def __init__(self, **kwargs):

# By default, do not clean up tokenization spaces for both fast and slow tokenizers
self.clean_up_tokenization_spaces = kwargs.pop("clean_up_tokenization_spaces", False)
warnings.warn(
"The `clean_up_tokenization_spaces` argument will soon be deprecated. It currently defaults to False if not passed.",
FutureWarning,
)

# By default, do not split special tokens for both fast and slow tokenizers
self.split_special_tokens = kwargs.pop("split_special_tokens", False)
Expand Down

0 comments on commit ec6f78a

Please sign in to comment.