# Patch summary (free text ahead of the first "diff --git" header; not part of the patch itself).
#
# Target: VanillaSA._tokenize_text in unimore_bda_6/analysis/vanilla.py.
#
# What the hunk changes:
#   * removes the `language: str = "english"` parameter from the method signature;
#   * calls nltk.word_tokenize(text) without the `language=` keyword argument.
# Unchanged by the hunk: the tokens are still passed through
# nltk.sentiment.util.mark_negation(tokens, shallow=True) and then returned.
#
# NOTE(review): with no `language=` argument, tokenization presumably falls back to
#   NLTK's own default language -- confirm against the installed NLTK version.
# NOTE(review): callers or subclass overrides that still pass `language` (positionally
#   or by keyword) would raise TypeError after this patch -- check call sites outside this hunk.
# NOTE(review): the docstring kept as context still says "using the language of the model";
#   it looks stale once the parameter is gone -- consider rewording it in a follow-up change.
# NOTE(review): line breaks were reconstructed from the diff syntax and the hunk header
#   counts (11 lines on each side); indentation and the exact position of the two blank
#   context lines are assumed -- verify against the target file before applying.
diff --git a/unimore_bda_6/analysis/vanilla.py b/unimore_bda_6/analysis/vanilla.py
index 403b0b0..7323602 100644
--- a/unimore_bda_6/analysis/vanilla.py
+++ b/unimore_bda_6/analysis/vanilla.py
@@ -22,11 +22,11 @@ class VanillaSA(BaseSA, metaclass=abc.ABCMeta):
         super().__init__()
         self.model: nltk.sentiment.SentimentAnalyzer = nltk.sentiment.SentimentAnalyzer()
 
-    def _tokenize_text(self, text: str, language: str = "english") -> list[str]:
+    def _tokenize_text(self, text: str) -> list[str]:
         """
         Convert a text string into a list of tokens, using the language of the model.
         """
-        tokens = nltk.word_tokenize(text, language=language)
+        tokens = nltk.word_tokenize(text)
         nltk.sentiment.util.mark_negation(tokens, shallow=True)
         return tokens
 