bda-6-steffo/unimore_bda_6/analysis/base.py

import abc
import logging
import dataclasses

from ..database import Text, Category, DatasetFunc

# Module-level logger, named after this module (`__name__`).
log = logging.getLogger(__name__)


@dataclasses.dataclass
class EvaluationResults:
    """
    Totals collected while evaluating a sentiment analyzer on a dataset.

    Instances can represent either a partial (in-progress) or a final tally.
    """

    # Number of evaluated items whose predicted category matched the expected one.
    correct: int
    # Number of items evaluated so far.
    evaluated: int
    # Accumulated per-item score (a sum over the evaluated items, not an average).
    score: float

    def __repr__(self):
        return f"<EvaluationResults: score of {self.score} out of {self.evaluated} evaluated tuples>"

    def _percentage(self, amount: float) -> float:
        """
        Express `amount` as a percentage of the evaluated items.

        Returns `0.0` when nothing has been evaluated, so that formatting an empty result never divides by zero.
        """
        if not self.evaluated:
            return 0.0
        return amount / self.evaluated * 100

    def __str__(self):
        accuracy = self._percentage(self.correct)
        score_accuracy = self._percentage(self.score)
        # `.2f` (two decimals) is intentional: a bare `.2` means "two significant digits" and renders 100.0 as `1e+02`.
        return (
            f"{self.evaluated} evaluated, {self.correct} correct, "
            f"{accuracy:.2f} % accuracy, {self.score:.2f} score, "
            f"{score_accuracy:.2f} scoreaccuracy"
        )


class BaseSentimentAnalyzer(metaclass=abc.ABCMeta):
    """
    Abstract base class for sentiment analyzers implemented in this project.

    Subclasses must implement `.train` and `.use`; `.evaluate` is implemented here on top of `.use`.
    """

    @abc.abstractmethod
    def train(self, dataset_func: DatasetFunc) -> None:
        """
        Train the analyzer with the given training dataset.

        :param dataset_func: Callable providing the training dataset.
        """
        raise NotImplementedError()

    def evaluate(self, dataset_func: DatasetFunc) -> EvaluationResults:
        """
        Perform a model evaluation by calling repeatedly `.use` on every text of the test dataset and by comparing its resulting category with the expected category.

        :param dataset_func: Callable invoked with no arguments; its result is iterated, and every item must expose `.text` and `.category`.
        :return: An `EvaluationResults` with the number of correct results, the number of evaluated results, and the accumulated score.
        """

        evaluated: int = 0
        correct: int = 0
        score: float = 0.0

        for review in dataset_func():
            resulting_category = self.use(review.text)
            evaluated += 1
            if resulting_category == review.category:
                correct += 1
            # Partial credit: 1 for an exact match, decreasing linearly with the distance from the expected category.
            # NOTE(review): the divisor 4 presumably is the maximum distance between two categories - confirm against `Category`.
            score += 1 - (abs(resulting_category - review.category) / 4)
            # Emit a progress report every 100 evaluated items.
            if not evaluated % 100:
                temp_results = EvaluationResults(correct=correct, evaluated=evaluated, score=score)
                # Lazy %-style argument: the results are only rendered to a string if DEBUG logging is enabled.
                log.debug("%s", temp_results)

        return EvaluationResults(correct=correct, evaluated=evaluated, score=score)

    @abc.abstractmethod
    def use(self, text: Text) -> Category:
        """
        Run the model on the given input.

        :param text: The text to categorize.
        :return: The category the model assigns to the text.
        """
        raise NotImplementedError()


class AlreadyTrainedError(Exception):
    """
    Signals that the model was already trained, so it cannot be trained a second time.
    """


class NotTrainedError(Exception):
    """
    Signals that the model has not gone through training yet.
    """


class TrainingFailedError(Exception):
    """
    Signals that training could not be completed; the model should no longer be used.
    """


# Public API of this module: the names exported by a star-import.
# `EvaluationResults` is included because it is the return type of `BaseSentimentAnalyzer.evaluate`.
__all__ = (
    "BaseSentimentAnalyzer",
    "EvaluationResults",
    "AlreadyTrainedError",
    "NotTrainedError",
    "TrainingFailedError",
)
Working prototype 2023-02-02 01:56:37 +00:00			`import abc`
New version working nicely 2023-02-03 22:27:44 +00:00			`import logging`
Getting closer... 2023-02-04 05:14:24 +00:00			`import dataclasses`
Refactor things to work better 2023-02-02 16:24:11 +00:00
back to i have no idea of what's happening, but at least it works 2023-02-07 09:22:09 +00:00			`from ..database import Text, Category, DatasetFunc`
Refactor things to work better 2023-02-02 16:24:11 +00:00
New version working nicely 2023-02-03 22:27:44 +00:00			`log = logging.getLogger(__name__)`
Working prototype 2023-02-02 01:56:37 +00:00

Getting closer... 2023-02-04 05:14:24 +00:00			`@dataclasses.dataclass`
			`class EvaluationResults:`
			`correct: int`
			`evaluated: int`
stuff's working 2023-02-08 09:54:14 +00:00			`score: float`
Getting closer... 2023-02-04 05:14:24 +00:00
			`def __repr__(self):`
stuff's working 2023-02-08 09:54:14 +00:00			`return f"<EvaluationResults: score of {self.score} out of {self.evaluated} evaluated tuples>"`
Getting closer... 2023-02-04 05:14:24 +00:00
			`def __str__(self):`
stuff's working 2023-02-08 09:54:14 +00:00			`return f"{self.evaluated} evaluated, {self.correct} correct, {self.correct / self.evaluated * 100:.2} % accuracy, {self.score:.2} score, {self.score / self.evaluated * 100:.2} scoreaccuracy"`
Getting closer... 2023-02-04 05:14:24 +00:00

New version working nicely 2023-02-03 22:27:44 +00:00			`class BaseSentimentAnalyzer(metaclass=abc.ABCMeta):`
Working prototype 2023-02-02 01:56:37 +00:00			`"""`
			`Abstract base class for sentiment analyzers implemented in this project.`
			`"""`

			`@abc.abstractmethod`
Getting closer... 2023-02-04 05:14:24 +00:00			`def train(self, dataset_func: DatasetFunc) -> None:`
Working prototype 2023-02-02 01:56:37 +00:00			`"""`
New version working nicely 2023-02-03 22:27:44 +00:00			`Train the analyzer with the given training dataset.`
Working prototype 2023-02-02 01:56:37 +00:00			`"""`
			`raise NotImplementedError()`

Getting closer... 2023-02-04 05:14:24 +00:00			`def evaluate(self, dataset_func: DatasetFunc) -> EvaluationResults:`
Working prototype 2023-02-02 01:56:37 +00:00			`"""`
New version working nicely 2023-02-03 22:27:44 +00:00			Perform a model evaluation by calling repeatedly `.use` on every text of the test dataset and by comparing its resulting category with the expected category.
Working prototype 2023-02-02 01:56:37 +00:00
New version working nicely 2023-02-03 22:27:44 +00:00			`Returns a tuple with the number of correct results and the number of evaluated results.`
			`"""`
Getting closer... 2023-02-04 05:14:24 +00:00
New version working nicely 2023-02-03 22:27:44 +00:00			`evaluated: int = 0`
Getting closer... 2023-02-04 05:14:24 +00:00			`correct: int = 0`
stuff's working 2023-02-08 09:54:14 +00:00			`score: float = 0.0`
Working prototype 2023-02-02 01:56:37 +00:00
Getting closer... 2023-02-04 05:14:24 +00:00			`for review in dataset_func():`
			`resulting_category = self.use(review.text)`
New version working nicely 2023-02-03 22:27:44 +00:00			`evaluated += 1`
Getting closer... 2023-02-04 05:14:24 +00:00			`correct += 1 if resulting_category == review.category else 0`
stuff's working 2023-02-08 09:54:14 +00:00			`score += 1 - (abs(resulting_category - review.category) / 4)`
New version working nicely 2023-02-03 22:27:44 +00:00			`if not evaluated % 100:`
stuff's working 2023-02-08 09:54:14 +00:00			`temp_results = EvaluationResults(correct=correct, evaluated=evaluated, score=score)`
			`log.debug(f"{temp_results!s}")`
Working prototype 2023-02-02 01:56:37 +00:00
stuff's working 2023-02-08 09:54:14 +00:00			`return EvaluationResults(correct=correct, evaluated=evaluated, score=score)`
PEP8 2023-02-03 16:50:40 +00:00
New version working nicely 2023-02-03 22:27:44 +00:00			`@abc.abstractmethod`
			`def use(self, text: Text) -> Category:`
			`"""`
			`Run the model on the given input.`
			`"""`
			`raise NotImplementedError()`
Working prototype 2023-02-02 01:56:37 +00:00

stop here for now 2023-02-04 00:36:42 +00:00			`class AlreadyTrainedError(Exception):`
			`"""`
			`This model has already been trained and cannot be trained again.`
			`"""`


			`class NotTrainedError(Exception):`
			`"""`
			`This model has not been trained yet.`
			`"""`


stuff's working 2023-02-08 09:54:14 +00:00			`class TrainingFailedError(Exception):`
			`"""`
			`The model wasn't able to complete the training and should not be used anymore.`
			`"""`


Working prototype 2023-02-02 01:56:37 +00:00			`__all__ = (`
New version working nicely 2023-02-03 22:27:44 +00:00			`"BaseSentimentAnalyzer",`
stop here for now 2023-02-04 00:36:42 +00:00			`"AlreadyTrainedError",`
			`"NotTrainedError",`
stuff's working 2023-02-08 09:54:14 +00:00			`"TrainingFailedError",`
Working prototype 2023-02-02 01:56:37 +00:00			`)`