From e3005ab8b0a63efe85096aafe08bd459d83cf7a0 Mon Sep 17 00:00:00 2001 From: Stefano Pigozzi Date: Wed, 8 Feb 2023 19:46:05 +0100 Subject: [PATCH] enough --- .idea/inspectionProfiles/Project_Default.xml | 1 + .idea/misc.xml | 3 + .idea/runConfigurations/unimore_bda_6.xml | 4 +- poetry.lock | 57 ++++++++- pyproject.toml | 1 + unimore_bda_6/__main__.py | 117 +++++++++--------- unimore_bda_6/analysis/base.py | 65 ++++++---- unimore_bda_6/analysis/nltk_sentiment.py | 16 ++- unimore_bda_6/analysis/tf_text.py | 43 +++++-- unimore_bda_6/config.py | 50 ++++++-- unimore_bda_6/database/cache.py | 8 +- unimore_bda_6/database/connection.py | 5 +- unimore_bda_6/database/datatypes.py | 5 + unimore_bda_6/database/queries.py | 26 ++-- unimore_bda_6/log.py | 6 +- unimore_bda_6/tokenizer/__init__.py | 2 + unimore_bda_6/tokenizer/base.py | 12 +- unimore_bda_6/tokenizer/lower.py | 6 +- unimore_bda_6/tokenizer/nltk_word_tokenize.py | 2 +- unimore_bda_6/tokenizer/plain.py | 16 +++ unimore_bda_6/tokenizer/potts.py | 13 +- 21 files changed, 309 insertions(+), 149 deletions(-) create mode 100644 unimore_bda_6/tokenizer/plain.py diff --git a/.idea/inspectionProfiles/Project_Default.xml b/.idea/inspectionProfiles/Project_Default.xml index 7253287..1c6334f 100644 --- a/.idea/inspectionProfiles/Project_Default.xml +++ b/.idea/inspectionProfiles/Project_Default.xml @@ -40,6 +40,7 @@ diff --git a/.idea/misc.xml b/.idea/misc.xml index 6b0faad..a0e6536 100644 --- a/.idea/misc.xml +++ b/.idea/misc.xml @@ -10,4 +10,7 @@ + + \ No newline at end of file diff --git a/.idea/runConfigurations/unimore_bda_6.xml b/.idea/runConfigurations/unimore_bda_6.xml index 3718006..f2f821f 100644 --- a/.idea/runConfigurations/unimore_bda_6.xml +++ b/.idea/runConfigurations/unimore_bda_6.xml @@ -1,12 +1,12 @@ -