Robot Framework
lexer.py
# Copyright 2008-2015 Nokia Networks
# Copyright 2016- Robot Framework Foundation
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.

from itertools import chain

from robot.errors import DataError
from robot.utils import get_error_message, FileReader

from .blocklexers import FileLexer
from .context import InitFileContext, TestCaseFileContext, ResourceFileContext
from .tokenizer import Tokenizer
from .tokens import EOS, END, Token


def get_tokens(source, data_only=False, tokenize_variables=False, lang=None):
    """Parses the given source to tokens."""
    lexer = Lexer(TestCaseFileContext(lang=lang), data_only, tokenize_variables)
    lexer.input(source)
    return lexer.get_tokens()


def get_resource_tokens(source, data_only=False, tokenize_variables=False, lang=None):
    """Parses the given source to resource file tokens."""
    lexer = Lexer(ResourceFileContext(lang=lang), data_only, tokenize_variables)
    lexer.input(source)
    return lexer.get_tokens()


def get_init_tokens(source, data_only=False, tokenize_variables=False, lang=None):
    """Parses the given source to init file tokens."""
    lexer = Lexer(InitFileContext(lang=lang), data_only, tokenize_variables)
    lexer.input(source)
    return lexer.get_tokens()
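

# Usage sketch (an illustration added here, not part of the original file).
# ``source`` may be a path, an open file object, or the data as a string.
# In recent Robot Framework releases these functions are also re-exported
# from ``robot.api``:
#
#     from robot.api import get_tokens
#     for token in get_tokens('tests.robot', data_only=True):
#         print(token.type, token.value)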


class Lexer:

    def __init__(self, ctx, data_only=False, tokenize_variables=False):
        self.lexer = FileLexer(ctx)
        self.data_only = data_only
        self.tokenize_variables = tokenize_variables
        self.statements = []

    def input(self, source):
        for statement in Tokenizer().tokenize(self._read(source),
                                              self.data_only):
            # Store all tokens but pass only data tokens to lexer.
            self.statements.append(statement)
            if self.data_only:
                data = statement[:]
            else:
                # Separators, comments, etc. already have type, data doesn't.
                data = [t for t in statement if t.type is None]
            if data:
                self.lexer.input(data)
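
    # Added note (not in the original source): for a row such as
    # ``    Log    message``, the separator tokens already carry
    # ``Token.SEPARATOR`` after tokenization, while the ``Log`` and
    # ``message`` cells still have ``type is None``; only those untyped
    # data tokens are fed to ``FileLexer`` for classification.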

    def _read(self, source):
        try:
            with FileReader(source, accept_text=True) as reader:
                return reader.read()
        except Exception:
            raise DataError(get_error_message())

    def get_tokens(self):
        self.lexer.lex()
        statements = self.statements
        if not self.data_only:
            statements = chain.from_iterable(
                self._split_trailing_commented_and_empty_lines(s)
                for s in statements
            )
        tokens = self._get_tokens(statements)
        if self.tokenize_variables:
            tokens = self._tokenize_variables(tokens)
        return tokens
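
    # Consumption sketch (hypothetical, assuming ``TestCaseFileContext`` can
    # be constructed with its default ``lang``):
    #
    #     lexer = Lexer(TestCaseFileContext())
    #     lexer.input('*** Test Cases ***\n')
    #     tokens = list(lexer.get_tokens())
    #
    # ``get_tokens`` returns a generator, so tokens are produced lazily once
    # the block lexer has classified the stored statements.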

    def _get_tokens(self, statements):
        if self.data_only:
            ignored_types = {None, Token.COMMENT_HEADER, Token.COMMENT}
        else:
            ignored_types = {None}
        inline_if_type = Token.INLINE_IF
        for statement in statements:
            last = None
            inline_if = False
            for token in statement:
                token_type = token.type
                if token_type in ignored_types:
                    continue
                if token._add_eos_before and not (last and last._add_eos_after):
                    yield EOS.from_token(token, before=True)
                yield token
                if token._add_eos_after:
                    yield EOS.from_token(token)
                if token_type == inline_if_type:
                    inline_if = True
                last = token
            if last and not last._add_eos_after:
                yield EOS.from_token(last)
                if inline_if:
                    yield END.from_token(last, virtual=True)
                    yield EOS.from_token(last)
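
    # Behavior sketch (added comment): for a plain statement the loop yields
    # its tokens followed by one ``EOS`` (end of statement) marker. For an
    # inline ``IF``, whose tokens end without an explicit ``END``, a virtual
    # ``END`` token and a final ``EOS`` are appended as well, so the parser
    # sees the same structure as with a block ``IF``.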

    def _split_trailing_commented_and_empty_lines(self, statement):
        lines = self._split_to_lines(statement)
        commented_or_empty = []
        for line in reversed(lines):
            if not self._is_commented_or_empty(line):
                break
            commented_or_empty.append(line)
        if not commented_or_empty:
            return [statement]
        lines = lines[:-len(commented_or_empty)]
        statement = list(chain.from_iterable(lines))
        return [statement] + list(reversed(commented_or_empty))
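
    # Example (hypothetical statement): if the last two lines of a statement
    # are a ``# comment`` line and an empty line, this returns three
    # statements in original order: the statement without those lines, the
    # comment line, and the empty line.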

    def _split_to_lines(self, statement):
        lines = []
        current = []
        for token in statement:
            current.append(token)
            if token.type == Token.EOL:
                lines.append(current)
                current = []
        if current:
            lines.append(current)
        return lines
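
    # Example (added comment): a statement with tokens ``A EOL B EOL C`` is
    # split into ``[[A, EOL], [B, EOL], [C]]``; a trailing line lacking an
    # ``EOL`` token still forms its own line.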

    def _is_commented_or_empty(self, line):
        separator_or_ignore = (Token.SEPARATOR, None)
        comment_or_eol = (Token.COMMENT, Token.EOL)
        for token in line:
            if token.type not in separator_or_ignore:
                return token.type in comment_or_eol
        return False
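
    # Example (added comment): ``SEPARATOR COMMENT EOL`` and a lone ``EOL``
    # count as commented or empty; a line whose first typed token is a
    # keyword call does not, and a line of only separators returns False.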

    def _tokenize_variables(self, tokens):
        for token in tokens:
            for t in token.tokenize_variables():
                yield t
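

# Minimal self-contained demo (an addition for illustration, not part of the
# original module). Passing the data as a string works because ``_read``
# uses ``FileReader(source, accept_text=True)``.
if __name__ == '__main__':
    data = (
        '*** Test Cases ***\n'
        'Example\n'
        '    Log    Hello, world!\n'
    )
    for token in get_tokens(data, data_only=True):
        print(token.type, repr(token.value))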