Remove __main__

2024-11-22 07:54:19 +00:00 · 2023-02-02 04:18:46 +01:00 · 2023-02-02 04:18:46 +01:00 · cf37d13cb4
commit cf37d13cb4
parent ce959f18be
1 changed file with 0 additions and 16 deletions
--- a/unimore_bda_6/vendor/potts.py
+++ b/unimore_bda_6/vendor/potts.py
@@ -186,19 +186,3 @@ class Tokenizer:
                pass                    
            s = s.replace(amp, " and ")
        return s
 ###############################################################################
 if __name__ == '__main__':
    tok = Tokenizer(preserve_case=False)
    samples = (
        u"RT @ #happyfuncoding: this is a typical Twitter tweet :-)",
        u"HTML entities &amp; other Web oddities can be an &aacute;cute <em class='grumpy'>pain</em> >:(",
        u"It's perhaps noteworthy that phone numbers like +1 (800) 123-4567, (800) 123-4567, and 123-4567 are treated as words despite their whitespace."
        )
    for s in samples:
        print "======================================================================"
        print s
        tokenized = tok.tokenize(s)
        print "\n".join(tokenized)