bda-6-steffo/unimore_bda_6/analysis/base.py

import abc
import logging

from ..database import DataSet, Text, Category

# Module-level logger, named after this module via `__name__`.
log = logging.getLogger(__name__)


class BaseSentimentAnalyzer(metaclass=abc.ABCMeta):
    """
    Abstract base class for sentiment analyzers implemented in this project.

    Subclasses must implement `.train` and `.use`; `.evaluate` is provided here and is built on top of `.use`.
    """

    @abc.abstractmethod
    def train(self, training_set: DataSet) -> None:
        """
        Train the analyzer with the given training dataset.
        """
        raise NotImplementedError()

    def evaluate(self, test_set: DataSet) -> tuple[int, int]:
        """
        Perform a model evaluation by calling repeatedly `.use` on every text of the test dataset and by comparing its resulting category with the expected category.

        The test dataset is iterated once, and each item is unpacked as a `(text, expected_category)` pair.

        Returns a tuple with the number of correct results and the number of evaluated results, in this order.
        An empty test dataset results in `(0, 0)`.
        """
        evaluated: int = 0
        correct: int = 0

        for text, expected_category in test_set:
            resulting_category = self.use(text)
            evaluated += 1
            if resulting_category == expected_category:
                correct += 1

            # Report progress every 100 evaluated texts.
            # The accuracy is a float percentage, so it must be formatted with `%f`: `%d` would silently truncate it.
            if evaluated % 100 == 0:
                log.debug("%d evaluated, %d correct, %0.2f %% accuracy", evaluated, correct, correct / evaluated * 100)

        return correct, evaluated

    @abc.abstractmethod
    def use(self, text: Text) -> Category:
        """
        Run the model on the given input, returning the category predicted for it.
        """
        raise NotImplementedError()


# Names exported by `from <this module> import *`.
__all__ = ("BaseSentimentAnalyzer",)
Working prototype 2023-02-02 01:56:37 +00:00			`import abc`
New version working nicely 2023-02-03 22:27:44 +00:00			`import logging`
Refactor things to work better 2023-02-02 16:24:11 +00:00
New version working nicely 2023-02-03 22:27:44 +00:00			`from ..database import DataSet, Text, Category`
Refactor things to work better 2023-02-02 16:24:11 +00:00
New version working nicely 2023-02-03 22:27:44 +00:00			`log = logging.getLogger(__name__)`
Working prototype 2023-02-02 01:56:37 +00:00

New version working nicely 2023-02-03 22:27:44 +00:00			`class BaseSentimentAnalyzer(metaclass=abc.ABCMeta):`
Working prototype 2023-02-02 01:56:37 +00:00			`"""`
			`Abstract base class for sentiment analyzers implemented in this project.`
			`"""`

			`@abc.abstractmethod`
New version working nicely 2023-02-03 22:27:44 +00:00			`def train(self, training_set: DataSet) -> None:`
Working prototype 2023-02-02 01:56:37 +00:00			`"""`
New version working nicely 2023-02-03 22:27:44 +00:00			`Train the analyzer with the given training dataset.`
Working prototype 2023-02-02 01:56:37 +00:00			`"""`
			`raise NotImplementedError()`

New version working nicely 2023-02-03 22:27:44 +00:00			`def evaluate(self, test_set: DataSet) -> tuple[int, int]:`
Working prototype 2023-02-02 01:56:37 +00:00			`"""`
New version working nicely 2023-02-03 22:27:44 +00:00			Perform a model evaluation by calling repeatedly `.use` on every text of the test dataset and by comparing its resulting category with the expected category.
Working prototype 2023-02-02 01:56:37 +00:00
New version working nicely 2023-02-03 22:27:44 +00:00			`Returns a tuple with the number of correct results and the number of evaluated results.`
			`"""`
			`evaluated: int = 0`
			`correct: int = 0`
Working prototype 2023-02-02 01:56:37 +00:00
New version working nicely 2023-02-03 22:27:44 +00:00			`for text, expected_category in test_set:`
			`resulting_category = self.use(text)`
			`evaluated += 1`
			`correct += 1 if resulting_category == expected_category else 0`
			`if not evaluated % 100:`
			`log.debug("%d evaluated, %d correct, %0.2d %% accuracy", evaluated, correct, correct / evaluated * 100)`
Working prototype 2023-02-02 01:56:37 +00:00
New version working nicely 2023-02-03 22:27:44 +00:00			`return correct, evaluated`
PEP8 2023-02-03 16:50:40 +00:00
New version working nicely 2023-02-03 22:27:44 +00:00			`@abc.abstractmethod`
			`def use(self, text: Text) -> Category:`
			`"""`
			`Run the model on the given input.`
			`"""`
			`raise NotImplementedError()`
Working prototype 2023-02-02 01:56:37 +00:00

			`__all__ = (`
New version working nicely 2023-02-03 22:27:44 +00:00			`"BaseSentimentAnalyzer",`
Working prototype 2023-02-02 01:56:37 +00:00			`)`