Source code for Gelatin.compiler.SyntaxCompiler

# Copyright (c) 2010-2017 Samuel Abels
#
# Permission is hereby granted, free of charge, to any person obtaining a copy
# of this software and associated documentation files (the "Software"), to deal
# in the Software without restriction, including without limitation the rights
# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
# copies of the Software, and to permit persons to whom the Software is
# furnished to do so, subject to the following conditions:
#
# The above copyright notice and this permission notice shall be included in all
# copies or substantial portions of the Software.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
# SOFTWARE.
import re
from simpleparse.dispatchprocessor import DispatchProcessor, getString, singleMap
from .Function import Function
from .Grammar import Grammar
from .SkipStatement import SkipStatement
from .WhenStatement import WhenStatement
from .MatchStatement import MatchStatement
from .MatchFieldList import MatchFieldList
from .MatchList import MatchList
from .Number import Number
from .Regex import Regex
from .String import String
from .Context import Context

"""
Indent handling:
    o NEWLINE:
        - If the amount of indent matches the previous line, parse the \n
          and skip all indent.
        - If the amount of indent does NOT match the previous line, parse
          the \n and stay at the beginning of the new line to let INDENT
          or DEDENT figure it out.
    o INDENT: Skips all indent, then looks backward to update the indent
      count. Checks to make sure that the indent was increased.
    o DEDENT: Like INDENT, except it does not check for errors.
"""


[docs]class SyntaxCompiler(DispatchProcessor): """ Processor sub-class defining processing functions for the productions. """
[docs] def __init__(self): self.context = None
[docs] def reset(self): self.context = Context()
def _regex(self, token, buffer): tag, left, right, sublist = token regex = Regex() regex.data = getString(sublist[0], buffer) return regex def _string(self, token, buffer): tag, left, right, sublist = token string = getString(sublist[0], buffer) return String(self.context, string) def _varname(self, token, buffer): varname = getString(token, buffer) return self.context.lexicon[varname] def _number(self, token, buffer): number = getString(token, buffer) return Number(int(number)) def _expression(self, token, buffer): tag = token[0] if tag == 'string': return self._string(token, buffer) elif tag == 'regex': return self._regex(token, buffer) elif tag == 'varname': return self._varname(token, buffer) elif tag == 'number': return self._number(token, buffer) else: raise Exception('BUG: invalid token %s' % tag) def _match_field_list(self, token, buffer, flags): tag, left, right, sublist = token field_list = MatchFieldList(flags) for field in sublist: expression = self._expression(field, buffer) field_list.expressions.append(expression) return field_list def _match_list(self, token, buffer, flags): tag, left, right, sublist = token matchlist = MatchList() for field_list in sublist: field_list = self._match_field_list(field_list, buffer, flags) matchlist.field_lists.append(field_list) return matchlist def _match_stmt(self, token, buffer, flags=0): tag, left, right, sublist = token matcher = MatchStatement() matcher.matchlist = self._match_list(sublist[0], buffer, flags) matcher.statements = self._suite(sublist[1], buffer) return matcher def _when_stmt(self, token, buffer, flags=0): tag, left, right, sublist = token matcher = WhenStatement() matcher.matchlist = self._match_list(sublist[0], buffer, flags) matcher.statements = self._suite(sublist[1], buffer) return matcher def _skip_stmt(self, token, buffer): tag, left, right, sublist = token matcher = SkipStatement() matcher.match = self._expression(sublist[0], buffer) return matcher def _function(self, token, buffer): tag, left, right, sublist = token function = Function() function.name = getString(sublist[0], buffer) if len(sublist) == 1: return function for arg in sublist[1][3]: expression = self._expression(arg, buffer) function.args.append(expression) return function def _inherit(self, token, buffer): tag, left, right, sublist = token return getString(sublist[0], buffer) def _suite(self, token, buffer): tag, left, right, sublist = token statements = [] for token in sublist: tag = token[0] if tag == 'match_stmt': statement = self._match_stmt(token, buffer) elif tag == 'imatch_stmt': statement = self._match_stmt(token, buffer, re.I) elif tag == 'when_stmt': statement = self._when_stmt(token, buffer) elif tag == 'skip_stmt': statement = self._skip_stmt(token, buffer) elif tag == 'function': statement = self._function(token, buffer) else: raise Exception('BUG: invalid token %s' % tag) statements.append(statement) return statements
[docs] def define_stmt(self, token, buffer): tag, left, right, sublist = token name_tup, value_tup = sublist value_tag = value_tup[0] name = getString(name_tup, buffer) value = getString(value_tup, buffer) if value_tag == 'regex': value = self._regex(value_tup, buffer) elif value_tag == 'varname': if value not in self.context.lexicon: _error(buffer, value_tup[1], 'no such variable') value = self.context.lexicon[value] else: raise Exception('BUG: invalid token %s' % value_tag) self.context.lexicon[name] = value
[docs] def grammar_stmt(self, token, buffer): tag, left, right, sublist = token map = singleMap(sublist) grammar = Grammar() grammar.name = getString(map['varname'], buffer) grammar.statements = self._suite(map['suite'], buffer) if 'inherit' in map: grammar.inherit = self._inherit(map['inherit'], buffer) self.context.grammars[grammar.name] = grammar