knipknap/Gelatin

View on GitHub
Gelatin/parser/util.py

Summary

Maintainability
A
0 mins
Test Coverage
# Copyright (c) 2010-2017 Samuel Abels
#
# Permission is hereby granted, free of charge, to any person obtaining a copy
# of this software and associated documentation files (the "Software"), to deal
# in the Software without restriction, including without limitation the rights
# to use, copy, modify, merge, publish, distribute, sublicense, and/or sell
# copies of the Software, and to permit persons to whom the Software is
# furnished to do so, subject to the following conditions:
#
# The above copyright notice and this permission notice shall be included in all
# copies or substantial portions of the Software.
#
# THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
# IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
# FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE
# AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
# LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM,
# OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE
# SOFTWARE.
try:
    import re2 as re
except ImportError:
    import re
from Gelatin import INDENT_WIDTH

whitespace_re = re.compile(' *')


def _format(buffer, end, msg):
    line_start = buffer.rfind('\n', 0, end) + 1
    line_end = buffer.find('\n', line_start)
    line_no = buffer.count('\n', 0, end) + 1
    line = buffer[line_start:line_end]
    offset = end - line_start
    mark = ' ' + ' ' * offset + '^'
    return '%s in line %d:\n%s\n%s' % (msg, line_no, repr(line), mark)


def say(buffer, end, msg):
    print(_format(buffer, end, msg))


def error(buffer, end, msg='Syntax error'):
    msg = _format(buffer, end, msg)
    raise Exception(msg)


def eat_indent(buffer, start, end, expected_indent=None):
    # In Py3, using this may be more efficient:
    # result = whitespace_re.match(buffer, start, end)
    # In Py2/PyRe2, the character count differs from len(str),
    # or str.rfind() if the buffer contains unicode chars.
    result = whitespace_re.match(buffer[start:end])
    if result is None:
        # pyre2 returns None if the start parameter to match() is larger
        # than the length of the buffer.
        return start
    whitespace = result.group(0)
    whitespace_len = len(whitespace)
    indent = whitespace_len / INDENT_WIDTH
    if whitespace_len % INDENT_WIDTH != 0:
        msg = 'indent must be a multiple of %d' % INDENT_WIDTH
        error(buffer, start, msg)
    if expected_indent is None or expected_indent == indent:
        return start + whitespace_len
    return start


def count_indent(buffer, start):
    indent = start - buffer.rfind('\n', 0, start) - 1
    if indent % INDENT_WIDTH != 0:
        msg = 'indent must be a multiple of %d, is %d' % (INDENT_WIDTH, indent)
        error(buffer, start, msg)
    if indent / INDENT_WIDTH > 2:
        msg = 'maximum indent (2 levels) exceeded.'
        error(buffer, start, msg)
    return indent / INDENT_WIDTH