earley_common.py 1.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142
  1. """This module implements useful building blocks for the Earley parser
  2. """
  3. class Item:
  4. "An Earley Item, the atom of the algorithm."
  5. __slots__ = ('s', 'rule', 'ptr', 'start', 'is_complete', 'expect', 'previous', 'node', '_hash')
  6. def __init__(self, rule, ptr, start):
  7. self.is_complete = len(rule.expansion) == ptr
  8. self.rule = rule # rule
  9. self.ptr = ptr # ptr
  10. self.start = start # j
  11. self.node = None # w
  12. if self.is_complete:
  13. self.s = rule.origin
  14. self.expect = None
  15. self.previous = rule.expansion[ptr - 1] if ptr > 0 and len(rule.expansion) else None
  16. else:
  17. self.s = (rule, ptr)
  18. self.expect = rule.expansion[ptr]
  19. self.previous = rule.expansion[ptr - 1] if ptr > 0 and len(rule.expansion) else None
  20. self._hash = hash((self.s, self.start, self.rule))
  21. def advance(self):
  22. return Item(self.rule, self.ptr + 1, self.start)
  23. def __eq__(self, other):
  24. return self is other or (self.s == other.s and self.start == other.start and self.rule == other.rule)
  25. def __hash__(self):
  26. return self._hash
  27. def __repr__(self):
  28. before = ( expansion.name for expansion in self.rule.expansion[:self.ptr] )
  29. after = ( expansion.name for expansion in self.rule.expansion[self.ptr:] )
  30. symbol = "{} ::= {}* {}".format(self.rule.origin.name, ' '.join(before), ' '.join(after))
  31. return '%s (%d)' % (symbol, self.start)
  32. # class TransitiveItem(Item):
  33. # ... # removed at commit 4c1cfb2faf24e8f8bff7112627a00b94d261b420