Commit 5916caa

Fine-tuning lexer

+ Token changes to be compatible with Python ast module
  - Rename columnno to col_offset
  - col_offset starts from 0, not from 1
  - Add end_col_offset property
+ EOL is always added by splitter
+ Refactoring and cleanup
1 parent 971a569 commit 5916caa
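
For reference, these are the same attribute names and conventions Python's own ast nodes use: col_offset is 0-based and end_col_offset points just past the node. A small standard-library illustration (requires Python 3.8+ for end_col_offset on ast nodes; the parsed expression is arbitrary):

import ast

# The Call node covering the whole expression 'keyword(arg)'.
node = ast.parse('keyword(arg)').body[0].value
print(node.col_offset, node.end_col_offset)   # 0 12 -- 0-based start, exclusive end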

File tree: 5 files changed, +765 -621 lines changed

src/robot/parsing/lexer/readers.py

Lines changed: 17 additions & 17 deletions
@@ -21,7 +21,7 @@
 from .context import TestCaseFileContext, ResourceFileContext
 from .lexers import FileLexer
 from .splitter import Splitter
-from .tokens import EOL, EOS, Token
+from .tokens import EOS, Token


 def get_tokens(source, data_only=False):
@@ -92,7 +92,7 @@ def get_tokens(self):
         statements = self._handle_old_for(self.statements)
         if not self.data_only:
             statements = chain.from_iterable(
-                self._split_trailing_comment_and_empty_lines(s)
+                self._split_trailing_commented_and_empty_lines(s)
                 for s in statements
             )
         # Setting local variables is performance optimization to avoid
@@ -151,36 +151,36 @@ def _get_first_data_token(self, statement):
                 return token
         return None

-    def _split_trailing_comment_and_empty_lines(self, statement):
+    def _split_trailing_commented_and_empty_lines(self, statement):
         lines = list(self._split_to_lines(statement))
-        split_statements = []
+        commented_or_empty = []
         for line in reversed(lines):
-            is_split = False
-            for token in line:
-                if token.type not in (token.IGNORE, token.SEPARATOR):
-                    is_split = token.type in (token.EOL, token.COMMENT)
-                    break
-            if not is_split:
+            if not self._is_commented_or_empty(line):
                 break
-            split_statements.append(line)
+            commented_or_empty.append(line)
             lines.pop()
         yield list(chain.from_iterable(lines))
-        for split in reversed(split_statements):
-            yield split
+        for line in reversed(commented_or_empty):
+            yield line

     def _split_to_lines(self, statement):
         current = []
-        eol = Token.EOL
         for token in statement:
             current.append(token)
-            if token.type == eol:
+            if token.type == Token.EOL:
                 yield current
                 current = []
         if current:
-            if current[-1].type != eol:
-                current.append(EOL.from_token(current[-1]))
             yield current

+    def _is_commented_or_empty(self, line):
+        separator_or_ignore = (Token.SEPARATOR, Token.IGNORE)
+        comment_or_eol = (Token.COMMENT, Token.EOL)
+        for token in line:
+            if token.type not in separator_or_ignore:
+                return token.type in comment_or_eol
+        return False
+

 class TestCaseFileReader(BaseReader):
     context_class = TestCaseFileContext
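
The net effect of this refactoring is easier to see outside the class. Below is a minimal self-contained sketch of the new splitting logic; the Tok namedtuple, the type constants, and the sample lines are stand-ins invented for illustration, not Robot Framework's real Token:

from itertools import chain
from collections import namedtuple

# Stand-in for robot's Token; the real code works on Token instances inside BaseReader.
Tok = namedtuple('Tok', 'type value')
SEPARATOR, IGNORE, COMMENT, EOL, KEYWORD, ARGUMENT = (
    'SEPARATOR', 'IGNORE', 'COMMENT', 'EOL', 'KEYWORD', 'ARGUMENT')

def is_commented_or_empty(line):
    # The first token that is neither a separator nor ignored decides:
    # a comment or a bare EOL means the line carries no data.
    for token in line:
        if token.type not in (SEPARATOR, IGNORE):
            return token.type in (COMMENT, EOL)
    return False

def split_trailing_commented_and_empty_lines(lines):
    trailing = []
    for line in reversed(lines):
        if not is_commented_or_empty(line):
            break
        trailing.append(line)
        lines.pop()
    yield list(chain.from_iterable(lines))    # the statement proper
    for line in reversed(trailing):           # then each trailing line on its own
        yield line

lines = [
    [Tok(KEYWORD, 'Log'), Tok(SEPARATOR, '    '), Tok(ARGUMENT, 'Hello'), Tok(EOL, '\n')],
    [Tok(COMMENT, '# trailing comment'), Tok(EOL, '\n')],
    [Tok(EOL, '\n')],
]
for part in split_trailing_commented_and_empty_lines(lines):
    print([t.type for t in part])
# ['KEYWORD', 'SEPARATOR', 'ARGUMENT', 'EOL']
# ['COMMENT', 'EOL']
# ['EOL']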

src/robot/parsing/lexer/splitter.py

Lines changed: 21 additions & 19 deletions
@@ -43,16 +43,15 @@ def _split_line(self, line, lineno, data_only=False):
             splitter = self._split_from_spaces
         else:
             splitter = self._split_from_pipes
-        columnno = 1
+        offset = 0
         data, sepa = Token.DATA, Token.SEPARATOR
         for value, is_data in splitter(rstrip(line)):
             if is_data or not data_only:
-                yield Token(data if is_data else sepa, value, lineno, columnno)
-            columnno += len(value)
+                yield Token(data if is_data else sepa, value, lineno, offset)
+            offset += len(value)
         if not data_only:
-            trailing_whitespace = re.search(r'\s+$', line, flags=re.UNICODE)
-            if trailing_whitespace:
-                yield Token(Token.EOL, trailing_whitespace.group(), lineno, columnno)
+            trailing_whitespace = re.search(r'\s*$', line, flags=re.UNICODE)
+            yield Token(Token.EOL, trailing_whitespace.group(), lineno, offset)

     def _split_from_spaces(self, line):
         for index, value in enumerate(self._space_splitter.split(line)):
@@ -82,47 +81,50 @@ def _handle_comments(self, tokens):
         has_data = False
         commented = False
         for token in tokens:
-            if token.type == token.DATA:
+            if token.type == Token.DATA:
                 if token.value.startswith('#') or commented:
-                    token.type = token.COMMENT
+                    token.type = Token.COMMENT
                     commented = True
                 elif token.value:
                     has_data = True
         return has_data

     def _handle_continuation(self, tokens):
         for token in tokens:
-            if token.value == '...' and token.type == token.DATA:
-                token.type = token.CONTINUATION
+            if token.value == '...' and token.type == Token.DATA:
+                token.type = Token.CONTINUATION
                 return True
-            elif token.value and token.type != token.SEPARATOR:
+            elif token.value and token.type != Token.SEPARATOR:
                 return False
         return False

     def _remove_trailing_empty(self, tokens):
         for token in reversed(tokens):
-            if not token.value:
+            if not token.value and token.type != Token.EOL:
                 tokens.remove(token)
-            elif token.type == token.DATA:
+            elif token.type == Token.DATA:
                 break

     def _remove_leading_empty(self, tokens):
+        data_or_continuation = (Token.DATA, Token.CONTINUATION)
         for token in list(tokens):
             if not token.value:
                 tokens.remove(token)
-            elif token.type in (token.DATA, token.CONTINUATION):
+            elif token.type in data_or_continuation:
                 break

     def _ensure_data_after_continuation(self, tokens):
-        if not any(t.type == t.DATA for t in tokens):
+        data = Token.DATA
+        if not any(t.type == data for t in tokens):
             cont = self._find_continuation(tokens)
-            data = Token(Token.DATA, '', cont.lineno, cont.columnno + 3)
-            tokens.insert(tokens.index(cont) + 1, data)
+            token = Token(data, '', cont.lineno, cont.end_col_offset)
+            tokens.insert(tokens.index(cont) + 1, token)

     def _find_continuation(self, tokens):
         for token in tokens:
-            if token.type == token.CONTINUATION:
+            if token.type == Token.CONTINUATION:
                 return token

     def _remove_non_data(self, tokens):
-        return [t for t in tokens if t.type == t.DATA]
+        data = Token.DATA
+        return [t for t in tokens if t.type == data]
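
The regex change in _split_line is what implements "EOL is always added by splitter": \s*$ matches the (possibly empty) tail of every line, whereas the old \s+$ only matched when trailing whitespace actually existed. A quick standalone check (the sample strings are made up):

import re

for line in ['Keyword    argument', 'Keyword    argument   ']:
    old = re.search(r'\s+$', line, flags=re.UNICODE)   # old pattern: may not match
    new = re.search(r'\s*$', line, flags=re.UNICODE)   # new pattern: always matches
    print(repr(old.group() if old else None), repr(new.group()))
# 'None' ''    -> an EOL token with an empty value is now emitted
# '   ' '   '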

src/robot/parsing/lexer/tokens.py

Lines changed: 12 additions & 17 deletions
@@ -56,10 +56,10 @@ class Token(object):
     END = 'END'

     SEPARATOR = 'SEPARATOR'
-    EOL = 'EOL'
     COMMENT = 'COMMENT'
     CONTINUATION = 'CONTINUATION'
     IGNORE = 'IGNORE'
+    EOL = 'EOL'
     EOS = 'EOS'
     ERROR = 'ERROR'
     DATA = 'DATA'
@@ -101,32 +101,27 @@ class Token(object):
         KEYWORD_HEADER
     )

-    __slots__ = ['type', 'value', 'lineno', 'columnno', 'error']
+    __slots__ = ['type', 'value', 'lineno', 'col_offset', 'error']

-    def __init__(self, type, value='', lineno=-1, columnno=-1):
+    def __init__(self, type, value='', lineno=-1, col_offset=-1):
         self.type = type
         self.value = value
         self.lineno = lineno
-        self.columnno = columnno
+        self.col_offset = col_offset
         self.error = None

+    @property
+    def end_col_offset(self):
+        if self.col_offset == -1:
+            return -1
+        return self.col_offset + len(self.value)
+
     def __unicode__(self):
         return self.value

     def __repr__(self):
         return 'Token(%s, %r, %s, %s)' % (self.type, self.value,
-                                          self.lineno, self.columnno)
-
-
-class EOL(Token):
-    __slots__ = []
-
-    def __init__(self, value='', lineno=-1, columnno=-1):
-        Token.__init__(self, Token.EOL, value, lineno, columnno)
-
-    @classmethod
-    def from_token(cls, token):
-        return EOL('', token.lineno, token.columnno + len(token.value))
+                                          self.lineno, self.col_offset)


 class EOS(Token):
@@ -137,4 +132,4 @@ def __init__(self, lineno=-1, columnno=-1):

     @classmethod
     def from_token(cls, token):
-        return EOS(token.lineno, token.columnno + len(token.value))
+        return EOS(token.lineno, token.end_col_offset)
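
After these changes a token's position information reads like the attributes on Python ast nodes. A small usage sketch, assuming a Robot Framework checkout that contains this commit (the import path matches the file shown above; released versions may differ):

from robot.parsing.lexer.tokens import Token, EOS

# 'Log' starts at the beginning of its line, so col_offset is 0 rather than 1.
token = Token(Token.DATA, 'Log', lineno=1, col_offset=0)
print(token.col_offset, token.end_col_offset)    # 0 3

# EOS.from_token() now reuses end_col_offset instead of recomputing it.
eos = EOS.from_token(token)
print(eos.lineno, eos.col_offset)                # 1 3

# Tokens created without a position keep the -1 sentinel for both offsets.
print(Token(Token.EOL).col_offset, Token(Token.EOL).end_col_offset)   # -1 -1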
