This repo contains code to mirror other repos. It also contains the code that is getting mirrored.
You cannot select more than 25 topics. Topics must start with a letter or number, can include dashes ('-'), and can be up to 35 characters long.

92 lines
2.9 KiB

  1. """This module implements a LALR(1) Parser
  2. """
  3. # Author: Erez Shinan (2017)
  4. # Email : erezshin@gmail.com
  5. from ..exceptions import UnexpectedToken
  6. from ..lexer import Token
  7. from .lalr_analysis import LALR_Analyzer, Shift
  8. class Parser:
  9. def __init__(self, parser_conf, debug=False):
  10. assert all(r.options is None or r.options.priority is None
  11. for r in parser_conf.rules), "LALR doesn't yet support prioritization"
  12. analysis = LALR_Analyzer(parser_conf, debug=debug)
  13. analysis.compute_lookahead()
  14. callbacks = {rule: getattr(parser_conf.callback, rule.alias or rule.origin, None)
  15. for rule in parser_conf.rules}
  16. self._parse_table = analysis.parse_table
  17. self.parser_conf = parser_conf
  18. self.parser = _Parser(analysis.parse_table, callbacks)
  19. self.parse = self.parser.parse
  20. ###{standalone
  21. class _Parser:
  22. def __init__(self, parse_table, callbacks):
  23. self.states = parse_table.states
  24. self.start_state = parse_table.start_state
  25. self.end_state = parse_table.end_state
  26. self.callbacks = callbacks
  27. def parse(self, seq, set_state=None):
  28. token = None
  29. stream = iter(seq)
  30. states = self.states
  31. state_stack = [self.start_state]
  32. value_stack = []
  33. if set_state: set_state(self.start_state)
  34. def get_action(token):
  35. state = state_stack[-1]
  36. try:
  37. return states[state][token.type]
  38. except KeyError:
  39. expected = [s for s in states[state].keys() if s.isupper()]
  40. raise UnexpectedToken(token, expected, state=state)
  41. def reduce(rule):
  42. size = len(rule.expansion)
  43. if size:
  44. s = value_stack[-size:]
  45. del state_stack[-size:]
  46. del value_stack[-size:]
  47. else:
  48. s = []
  49. value = self.callbacks[rule](s)
  50. _action, new_state = states[state_stack[-1]][rule.origin.name]
  51. assert _action is Shift
  52. state_stack.append(new_state)
  53. value_stack.append(value)
  54. # Main LALR-parser loop
  55. for token in stream:
  56. while True:
  57. action, arg = get_action(token)
  58. assert arg != self.end_state
  59. if action is Shift:
  60. state_stack.append(arg)
  61. value_stack.append(token)
  62. if set_state: set_state(arg)
  63. break # next token
  64. else:
  65. reduce(arg)
  66. token = Token.new_borrow_pos('$END', '', token) if token else Token('$END', '', 0, 1, 1)
  67. while True:
  68. _action, arg = get_action(token)
  69. if _action is Shift:
  70. assert arg == self.end_state
  71. val ,= value_stack
  72. return val
  73. else:
  74. reduce(arg)
  75. ###}