diff --git a/haystack/components/preprocessors/sentence_tokenizer.py b/haystack/components/preprocessors/sentence_tokenizer.py index 9619b851fc..2cb77347d3 100644 --- a/haystack/components/preprocessors/sentence_tokenizer.py +++ b/haystack/components/preprocessors/sentence_tokenizer.py @@ -9,7 +9,7 @@ from haystack import logging from haystack.lazy_imports import LazyImport -with LazyImport("Run 'pip install nltk'") as nltk_imports: +with LazyImport("Run 'pip install \"nltk>=3.9.1\"'") as nltk_imports: import nltk logger = logging.getLogger(__name__) diff --git a/pyproject.toml b/pyproject.toml index 1606df3fbf..9a5f15070b 100644 --- a/pyproject.toml +++ b/pyproject.toml @@ -112,7 +112,7 @@ extra-dependencies = [ "openpyxl", # XLSXToDocument "tabulate", # XLSXToDocument - "nltk", # NLTKDocumentSplitter + "nltk>=3.9.1", # NLTKDocumentSplitter # OpenAPI "jsonref", # OpenAPIServiceConnector, OpenAPIServiceToFunctions