diff --git a/examples/summarization/requirements.txt b/examples/summarization/requirements.txt
index 0fbc8285c1..7f9dc2a9c4 100644
--- a/examples/summarization/requirements.txt
+++ b/examples/summarization/requirements.txt
@@ -2,7 +2,7 @@ datasets >= 2.4.0
 sentencepiece != 0.1.92
 protobuf
 rouge-score
-nltk == 3.8.1
+nltk
 py7zr
 torch >= 1.3
 evaluate
diff --git a/examples/summarization/run_summarization.py b/examples/summarization/run_summarization.py
index 2ea2a59528..5ee0d993a8 100755
--- a/examples/summarization/run_summarization.py
+++ b/examples/summarization/run_summarization.py
@@ -80,6 +80,13 @@ def check_optimum_habana_min_version(*a, **b):
     with FileLock(".lock") as lock:
         nltk.download("punkt", quiet=True)
 
+# nltk >= 3.8.2 needs the "punkt_tab" resource; fetch it only when missing, under the same lock as "punkt".
+try:
+    nltk.data.find("tokenizers/punkt_tab")
+except (LookupError, OSError):
+    with FileLock(".lock") as lock:
+        nltk.download("punkt_tab", quiet=True)
+
 # A list of all multilingual tokenizer which require lang attribute.
 MULTILINGUAL_TOKENIZERS = [MBartTokenizer, MBartTokenizerFast, MBart50Tokenizer, MBart50TokenizerFast]
 