# Mirror of https://github.com/Steffo99/unimore-bda-6.git
# Synced 2024-11-23 00:14:19 +00:00
# 30 lines, 670 B, Python
|
from ..vendor.potts import Tokenizer
|
||
|
from .vanilla import VanillaSA, VanillaReviewSA
|
||
|
|
||
|
|
||
|
class PottsSA(VanillaSA):
    """
    A `VanillaSA` whose text tokenization is delegated to Potts' `Tokenizer`.
    """

    def __init__(self) -> None:
        super().__init__()

    def _tokenize_text(self, text: str) -> list[str]:
        """
        Split a text string into a list of tokens.

        A new `Tokenizer` is built with ``preserve_case=False`` on every call, and
        whatever its ``tokenize`` method yields is collected into a list.
        """
        # Built per call, exactly as before: no tokenizer state is kept on the instance.
        potts_tokenizer: Tokenizer = Tokenizer(preserve_case=False)
        return [*potts_tokenizer.tokenize(text)]
|
||
|
|
||
|
|
||
|
class PottsReviewSA(VanillaReviewSA, PottsSA):
    """
    The `Review`-oriented variant of `PottsSA`, combining `VanillaReviewSA` with `PottsSA`.
    """
|
||
|
|
||
|
|
||
|
# Names exported by `from <this module> import *`.
__all__ = ("PottsSA", "PottsReviewSA")
|