no python2 nonsense

2018-05-03 11:35:35 -04:00 · 2018-05-03 11:35:35 -04:00 · 33307aa76f
commit 33307aa76f
parent bb6a336e0e
7 changed files with 11 additions and 44 deletions
--- a/chatter/chatterbot/comparisons.py
+++ b/chatter/chatterbot/comparisons.py
@@ -58,19 +58,14 @@ class LevenshteinDistance(Comparator):
        :rtype: float
        """

-        PYTHON = sys.version_info[0]
-
        # Return 0 if either statement has a falsy text value
        if not statement.text or not other_statement.text:
            return 0

        # Get the lowercase version of both strings
-        if PYTHON < 3:
-            statement_text = unicode(statement.text.lower()) # NOQA
-            other_statement_text = unicode(other_statement.text.lower()) # NOQA
-        else:
-            statement_text = str(statement.text.lower())
-            other_statement_text = str(other_statement.text.lower())
+
+        statement_text = str(statement.text.lower())
+        other_statement_text = str(other_statement.text.lower())

        similarity = SequenceMatcher(
            None,
--- a/chatter/chatterbot/conversation.py
+++ b/chatter/chatterbot/conversation.py
@@ -33,13 +33,6 @@ class Statement(StatementMixin):
        except UnicodeEncodeError:
            pass

-        # Prefer decoded utf8-strings in Python 2.7
-        if sys.version_info[0] < 3:
-            try:
-                text = text.decode('utf-8')
-            except UnicodeEncodeError:
-                pass
-
        self.text = text
        self.tags = kwargs.pop('tags', [])
        self.in_response_to = kwargs.pop('in_response_to', [])
--- a/chatter/chatterbot/ext/sqlalchemy_app/types.py
+++ b/chatter/chatterbot/ext/sqlalchemy_app/types.py
@@ -13,9 +13,4 @@ class UnicodeString(TypeDecorator):
        Coerce Python bytestrings to unicode before
        saving them to the database.
        """
-        import sys
-
-        if sys.version_info[0] < 3:
-            if isinstance(value, str):
-                value = value.decode('utf-8')
        return value
--- a/chatter/chatterbot/input/variable_input_type_adapter.py
+++ b/chatter/chatterbot/input/variable_input_type_adapter.py
@@ -14,10 +14,8 @@ class VariableInputTypeAdapter(InputAdapter):
    def detect_type(self, statement):
        import sys

-        if sys.version_info[0] < 3:
-            string_types = basestring # NOQA
-        else:
-            string_types = str
+
+        string_types = str

        if hasattr(statement, 'text'):
            return self.OBJECT
--- a/chatter/chatterbot/preprocessors.py
+++ b/chatter/chatterbot/preprocessors.py
@@ -30,11 +30,7 @@ def unescape_html(chatbot, statement):
    import sys

    # Replace HTML escape characters
-    if sys.version_info[0] < 3:
-        from HTMLParser import HTMLParser
-        html = HTMLParser()
-    else:
-        import html
+    import html

    statement.text = html.unescape(statement.text)

@@ -49,9 +45,6 @@ def convert_to_ascii(chatbot, statement):
    import unicodedata
    import sys

-    # Normalize unicode characters
-    if sys.version_info[0] < 3:
-        statement.text = unicode(statement.text) # NOQA

    text = unicodedata.normalize('NFKD', statement.text)
    text = text.encode('ascii', 'ignore').decode('utf-8')
--- a/chatter/chatterbot/trainers.py
+++ b/chatter/chatterbot/trainers.py
@@ -393,10 +393,10 @@ class UbuntuCorpusTrainer(Trainer):

        file_kwargs = {}

-        if sys.version_info[0] > 2:
-            # Specify the encoding in Python versions 3 and up
-            file_kwargs['encoding'] = 'utf-8'
-            # WARNING: This might fail to read a unicode corpus file in Python 2.x
+
+        # Always specify the encoding (only Python versions 3 and up are supported)
+        file_kwargs['encoding'] = 'utf-8'
+        # NOTE: Python 2.x, where this might fail to read a unicode corpus file, is no longer supported

        for file in glob.iglob(extracted_corpus_path):
            self.logger.info('Training from: {}'.format(file))
--- a/chatter/chatterbot/utils.py
+++ b/chatter/chatterbot/utils.py
@@ -77,15 +77,8 @@ def input_function():
    """
    import sys

-    if sys.version_info[0] < 3:
-        user_input = str(raw_input()) # NOQA

-        # Avoid problems using format strings with unicode characters
-        if user_input:
-            user_input = user_input.decode('utf-8')
-
-    else:
-        user_input = input() # NOQA
+    user_input = input() # NOQA

    return user_input