From 255ef0d973a140b5be07cb4d97c5bf8f8e20788e Mon Sep 17 00:00:00 2001
From: Erez Shinan <erezshin+git@gmail.com>
Date: Sun, 1 Apr 2018 00:06:31 +0300
Subject: [PATCH 01/19] Added error message for the alias syntax in terminals
 (Issue #97)

---
 lark/load_grammar.py | 7 ++++++-
 tests/test_parser.py | 6 ++++++
 2 files changed, 12 insertions(+), 1 deletion(-)

diff --git a/lark/load_grammar.py b/lark/load_grammar.py
index 1637514..2e8b893 100644
--- a/lark/load_grammar.py
+++ b/lark/load_grammar.py
@@ -402,6 +402,8 @@ class TokenTreeToPattern(Transformer):
             assert len(args) == 2
         return PatternRE('(?:%s)%s' % (inner.to_regexp(), op), inner.flags)
 
+    def alias(self, t):
+        raise GrammarError("Aliasing not allowed in terminals (You used -> in the wrong place)")
 
 def _interleave(l, item):
     for e in l:
@@ -455,6 +457,9 @@ class Grammar:
                         exp.children[i] = Token(sym.type, new_terminal_names[sym])
 
         for name, (tree, priority) in term_defs:   # TODO transfer priority to rule?
+            if any(tree.find_data('alias')):
+                raise GrammarError("Aliasing not allowed in terminals (You used -> in the wrong place)")
+
             if name.startswith('_'):
                 options = RuleOptions(filter_out=True, priority=-priority)
             else:
@@ -516,7 +521,7 @@ class Grammar:
 
             for expansion, alias in expansions:
                 if alias and name.startswith('_'):
-                    raise Exception("Rule %s is marked for expansion (it starts with an underscore) and isn't allowed to have aliases (alias=%s)" % (name, alias))
+                    raise GrammarError("Rule %s is marked for expansion (it starts with an underscore) and isn't allowed to have aliases (alias=%s)" % (name, alias))
 
                 rule = Rule(name, expansion, alias, options)
                 compiled_rules.append(rule)
diff --git a/tests/test_parser.py b/tests/test_parser.py
index 89b9d69..a948bd5 100644
--- a/tests/test_parser.py
+++ b/tests/test_parser.py
@@ -822,6 +822,12 @@ def _make_parser_test(LEXER, PARSER):
                 """
             self.assertRaises( GrammarError, _Lark, g)
 
+        def test_alias_in_terminal(self):
+            g = """start: TERM
+                TERM: "a" -> alias
+                """
+            self.assertRaises( GrammarError, _Lark, g)
+
         @unittest.skipIf(LEXER==None, "TODO: Fix scanless parsing or get rid of it") # TODO
         def test_line_and_column(self):
             g = r"""!start: "A" bc "D"

From 25c3c51b1c6c096b6e4bcfe63d543fece572b72d Mon Sep 17 00:00:00 2001
From: Erez Shinan <erezshin+git@gmail.com>
Date: Thu, 5 Apr 2018 15:40:33 +0300
Subject: [PATCH 02/19] Fixed bug in Earley: A tree builder optimization
 clashed with explicit ambiguity

---
 lark/lark.py               |  2 +-
 lark/parse_tree_builder.py | 22 ++++++++++++++++++----
 tests/test_parser.py       | 24 ++++++++++++++++++++++++
 3 files changed, 43 insertions(+), 5 deletions(-)

diff --git a/lark/lark.py b/lark/lark.py
index fb5e04f..2660bd7 100644
--- a/lark/lark.py
+++ b/lark/lark.py
@@ -172,7 +172,7 @@ class Lark:
     def _build_parser(self):
         self.parser_class = get_frontend(self.options.parser, self.options.lexer)
 
-        self._parse_tree_builder = ParseTreeBuilder(self.rules, self.options.tree_class, self.options.propagate_positions, self.options.keep_all_tokens)
+        self._parse_tree_builder = ParseTreeBuilder(self.rules, self.options.tree_class, self.options.propagate_positions, self.options.keep_all_tokens, self.options.parser!='lalr')
         callback = self._parse_tree_builder.create_callback(self.options.transformer)
         if self.profiler:
             for f in dir(callback):
diff --git a/lark/parse_tree_builder.py b/lark/parse_tree_builder.py
index e84b01d..7c74178 100644
--- a/lark/parse_tree_builder.py
+++ b/lark/parse_tree_builder.py
@@ -57,6 +57,19 @@ class ChildFilter:
         self.node_builder = node_builder
         self.to_include = to_include
 
+    def __call__(self, children):
+        filtered = []
+        for i, to_expand in self.to_include:
+            if to_expand:
+                filtered += children[i].children
+            else:
+                filtered.append(children[i])
+
+        return self.node_builder(filtered)
+
+class ChildFilterLALR(ChildFilter):
+    "Optimized childfilter for LALR (assumes no duplication in parse tree, so it's safe to change it)"
+
     def __call__(self, children):
         filtered = []
         for i, to_expand in self.to_include:
@@ -73,21 +86,22 @@ class ChildFilter:
 def _should_expand(sym):
     return not is_terminal(sym) and sym.startswith('_')
 
-def maybe_create_child_filter(expansion, filter_out):
+def maybe_create_child_filter(expansion, filter_out, ambiguous):
     to_include = [(i, _should_expand(sym)) for i, sym in enumerate(expansion) if sym not in filter_out]
 
     if len(to_include) < len(expansion) or any(to_expand for i, to_expand in to_include):
-        return partial(ChildFilter, to_include)
+        return partial(ChildFilter if ambiguous else ChildFilterLALR, to_include)
 
 
 class Callback(object):
     pass
 
 class ParseTreeBuilder:
-    def __init__(self, rules, tree_class, propagate_positions=False, keep_all_tokens=False):
+    def __init__(self, rules, tree_class, propagate_positions=False, keep_all_tokens=False, ambiguous=False):
         self.tree_class = tree_class
         self.propagate_positions = propagate_positions
         self.always_keep_all_tokens = keep_all_tokens
+        self.ambiguous = ambiguous
 
         self.rule_builders = list(self._init_builders(rules))
 
@@ -107,7 +121,7 @@ class ParseTreeBuilder:
             wrapper_chain = filter(None, [
                 create_token and partial(CreateToken, create_token),
                 (expand_single_child and not rule.alias) and ExpandSingleChild,
-                maybe_create_child_filter(rule.expansion, () if keep_all_tokens else filter_out),
+                maybe_create_child_filter(rule.expansion, () if keep_all_tokens else filter_out, self.ambiguous),
                 self.propagate_positions and PropagatePositions,
             ])
 
diff --git a/tests/test_parser.py b/tests/test_parser.py
index a948bd5..47d0e3d 100644
--- a/tests/test_parser.py
+++ b/tests/test_parser.py
@@ -293,6 +293,30 @@ def _make_full_earley_test(LEXER):
             self.assertEqual(res, expected)
 
 
+        def test_explicit_ambiguity(self):
+            grammar = r"""
+            start: NAME+
+
+            NAME: /\w+/
+
+            %ignore " "
+            """
+
+            text = """cat"""
+
+            parser = Lark(grammar, start='start', ambiguity='explicit')
+            tree = parser.parse(text)
+            self.assertEqual(tree.data, '_ambig')
+
+            combinations = {tuple(str(s) for s in t.children) for t in tree.children}
+            self.assertEqual(combinations, {
+                ('cat',),
+                ('ca', 't'),
+                ('c', 'at'),
+                ('c', 'a' ,'t')
+            })
+
+
 
 
 

From 4f2330fc9b75869fcb5d887bcfca349af8e5ca20 Mon Sep 17 00:00:00 2001
From: Erez Shinan <erezshin+git@gmail.com>
Date: Thu, 5 Apr 2018 16:09:42 +0300
Subject: [PATCH 03/19] Fixed bug in Earley prioritization

---
 lark/parsers/resolve_ambig.py |  6 +-----
 tests/test_parser.py          | 40 +++++++++++++++++++++++------------
 2 files changed, 28 insertions(+), 18 deletions(-)

diff --git a/lark/parsers/resolve_ambig.py b/lark/parsers/resolve_ambig.py
index 9c859b5..456c6a9 100644
--- a/lark/parsers/resolve_ambig.py
+++ b/lark/parsers/resolve_ambig.py
@@ -9,11 +9,7 @@ from ..tree import Tree, Visitor_NoRecurse
 # Author: Erez Sh
 
 def _compare_rules(rule1, rule2):
-    c = -compare( len(rule1.expansion), len(rule2.expansion))
-    if rule1.origin.startswith('__'):   # XXX hack! We should set priority in parser, not here
-        c = -c
-    return c
-
+    return -compare( len(rule1.expansion), len(rule2.expansion))
 
 def _sum_priority(tree):
     p = 0
diff --git a/tests/test_parser.py b/tests/test_parser.py
index 47d0e3d..d4d63ca 100644
--- a/tests/test_parser.py
+++ b/tests/test_parser.py
@@ -187,17 +187,22 @@ def _make_full_earley_test(LEXER):
             l.parse(program)
 
 
-        def test_earley_scanless3(self):
-            "Tests prioritization and disambiguation for pseudo-terminals (there should be only one result)"
+        # XXX Fails for scanless mode
+        # XXX Decided not to fix, because
+        #       a) It's a subtle bug
+        #       b) Scanless is intended for deprecation
+        #
+        # def test_earley_scanless3(self):
+        #     "Tests prioritization and disambiguation for pseudo-terminals (there should be only one result)"
 
-            grammar = """
-            start: A A
-            A: "a"+
-            """
+        #     grammar = """
+        #     start: A A
+        #     A: "a"+
+        #     """
 
-            l = Lark(grammar, parser='earley', lexer=LEXER)
-            res = l.parse("aaa")
-            self.assertEqual(res.children, ['aa', 'a'])
+        #     l = Lark(grammar, parser='earley', lexer=LEXER)
+        #     res = l.parse("aaa")
+        #     self.assertEqual(res.children, ['aa', 'a'])
 
         def test_earley_scanless4(self):
             grammar = """
@@ -293,15 +298,12 @@ def _make_full_earley_test(LEXER):
             self.assertEqual(res, expected)
 
 
-        def test_explicit_ambiguity(self):
+        def test_explicit_ambiguity2(self):
             grammar = r"""
             start: NAME+
-
             NAME: /\w+/
-
             %ignore " "
             """
-
             text = """cat"""
 
             parser = Lark(grammar, start='start', ambiguity='explicit')
@@ -316,6 +318,18 @@ def _make_full_earley_test(LEXER):
                 ('c', 'a' ,'t')
             })
 
+        def test_term_ambig_resolve(self):
+            grammar = r"""
+            !start: NAME+
+            NAME: /\w+/
+            %ignore " "
+            """
+            text = """foo bar"""
+
+            parser = Lark(grammar)
+            tree = parser.parse(text)
+            self.assertEqual(tree.children, ['foo', 'bar'])
+
 
 
 

From eb6e809ffcf30b0e65ded939032dd6b223d2eb78 Mon Sep 17 00:00:00 2001
From: Erez Shinan <erezshin+git@gmail.com>
Date: Thu, 5 Apr 2018 16:15:22 +0300
Subject: [PATCH 04/19] Version bump

---
 lark/__init__.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/lark/__init__.py b/lark/__init__.py
index 1875820..af6f7b5 100644
--- a/lark/__init__.py
+++ b/lark/__init__.py
@@ -4,4 +4,4 @@ from .lexer import UnexpectedInput, LexError
 from .lark import Lark
 from .utils import inline_args
 
-__version__ = "0.5.5"
+__version__ = "0.5.6"

From ba0dc789a32fe21bb731132cec9a12b8ae6cb036 Mon Sep 17 00:00:00 2001
From: Erez Shinan <erezshin+git@gmail.com>
Date: Sat, 7 Apr 2018 12:21:51 +0300
Subject: [PATCH 05/19] Significantly better memory performance (Thanks
 @drslump!)

Added __slots__ to RulePtr and Token, resulting in significantly lower memory consumption.

As suggested by @drslump.
---
 lark/lexer.py                    | 2 ++
 lark/parsers/grammar_analysis.py | 2 ++
 2 files changed, 4 insertions(+)

diff --git a/lark/lexer.py b/lark/lexer.py
index bcf09f1..0a46ee1 100644
--- a/lark/lexer.py
+++ b/lark/lexer.py
@@ -25,6 +25,8 @@ class UnexpectedInput(LexError):
         self.considered_rules = considered_rules
 
 class Token(Str):
+    __slots__ = ('type', 'pos_in_stream', 'value', 'line', 'column', 'end_line', 'end_column')
+
     def __new__(cls, type_, value, pos_in_stream=None, line=None, column=None):
         self = super(Token, cls).__new__(cls, value)
         self.type = type_
diff --git a/lark/parsers/grammar_analysis.py b/lark/parsers/grammar_analysis.py
index 9ad49ce..5cbd697 100644
--- a/lark/parsers/grammar_analysis.py
+++ b/lark/parsers/grammar_analysis.py
@@ -5,6 +5,8 @@ from ..grammar import Rule
 
 
 class RulePtr(object):
+    __slots__ = ('rule', 'index')
+
     def __init__(self, rule, index):
         assert isinstance(rule, Rule)
         assert index <= len(rule.expansion)

From b951b5f79cf1ac79ad70e44d7038bf214ece7d2b Mon Sep 17 00:00:00 2001
From: Erez Shinan <erezshin+git@gmail.com>
Date: Sat, 7 Apr 2018 14:55:17 +0300
Subject: [PATCH 06/19] Significant reduction in memory consumption (Saving
 only parse-table instead of analysis instance)

---
 lark/parser_frontends.py    | 4 ++--
 lark/parsers/earley.py      | 6 +++---
 lark/parsers/lalr_parser.py | 3 ++-
 lark/tools/standalone.py    | 2 +-
 4 files changed, 8 insertions(+), 7 deletions(-)

diff --git a/lark/parser_frontends.py b/lark/parser_frontends.py
index c4a6f9b..a36252c 100644
--- a/lark/parser_frontends.py
+++ b/lark/parser_frontends.py
@@ -15,9 +15,9 @@ class WithLexer:
 
     def init_contextual_lexer(self, lexer_conf, parser_conf):
         self.lexer_conf = lexer_conf
-        d = {idx:t.keys() for idx, t in self.parser.analysis.parse_table.states.items()}
+        states = {idx:list(t.keys()) for idx, t in self.parser._parse_table.states.items()}
         always_accept = lexer_conf.postlex.always_accept if lexer_conf.postlex else ()
-        self.lexer = ContextualLexer(lexer_conf.tokens, d, ignore=lexer_conf.ignore, always_accept=always_accept, user_callbacks=lexer_conf.callbacks)
+        self.lexer = ContextualLexer(lexer_conf.tokens, states, ignore=lexer_conf.ignore, always_accept=always_accept, user_callbacks=lexer_conf.callbacks)
 
     def lex(self, text):
         stream = self.lexer.lex(text)
diff --git a/lark/parsers/earley.py b/lark/parsers/earley.py
index 2b04a1e..d119e41 100644
--- a/lark/parsers/earley.py
+++ b/lark/parsers/earley.py
@@ -145,16 +145,16 @@ class Column:
 
 class Parser:
     def __init__(self, parser_conf, term_matcher, resolve_ambiguity=None):
-        self.analysis = GrammarAnalyzer(parser_conf)
+        analysis = GrammarAnalyzer(parser_conf)
         self.parser_conf = parser_conf
         self.resolve_ambiguity = resolve_ambiguity
 
-        self.FIRST = self.analysis.FIRST
+        self.FIRST = analysis.FIRST
         self.postprocess = {}
         self.predictions = {}
         for rule in parser_conf.rules:
             self.postprocess[rule] = rule.alias if callable(rule.alias) else getattr(parser_conf.callback, rule.alias)
-            self.predictions[rule.origin] = [x.rule for x in self.analysis.expand_rule(rule.origin)]
+            self.predictions[rule.origin] = [x.rule for x in analysis.expand_rule(rule.origin)]
 
         self.term_matcher = term_matcher
 
diff --git a/lark/parsers/lalr_parser.py b/lark/parsers/lalr_parser.py
index f4e0942..a20db07 100644
--- a/lark/parsers/lalr_parser.py
+++ b/lark/parsers/lalr_parser.py
@@ -11,11 +11,12 @@ class Parser:
     def __init__(self, parser_conf):
         assert all(r.options is None or r.options.priority is None
                    for r in parser_conf.rules), "LALR doesn't yet support prioritization"
-        self.analysis = analysis = LALR_Analyzer(parser_conf)
+        analysis = LALR_Analyzer(parser_conf)
         analysis.compute_lookahead()
         callbacks = {rule: getattr(parser_conf.callback, rule.alias or rule.origin, None)
                           for rule in parser_conf.rules}
 
+        self._parse_table = analysis.parse_table
         self.parser_conf = parser_conf
         self.parser = _Parser(analysis.parse_table, callbacks)
         self.parse = self.parser.parse
diff --git a/lark/tools/standalone.py b/lark/tools/standalone.py
index cf29cee..61ce94e 100644
--- a/lark/tools/standalone.py
+++ b/lark/tools/standalone.py
@@ -126,7 +126,7 @@ def _get_token_type(token_type):
 
 class ParserAtoms:
     def __init__(self, parser):
-        self.parse_table = parser.analysis.parse_table
+        self.parse_table = parser._parse_table
 
     def print_python(self):
         print('class ParseTable: pass')

From b9e1e444c9adea3e964a25aa58141bb6bf27c90b Mon Sep 17 00:00:00 2001
From: Erez Shinan <erezshin+git@gmail.com>
Date: Sat, 7 Apr 2018 15:13:12 +0300
Subject: [PATCH 07/19] Added SlottedTree

---
 lark/load_grammar.py | 38 +++++++++++++++++++-------------------
 lark/tree.py         |  2 ++
 2 files changed, 21 insertions(+), 19 deletions(-)

diff --git a/lark/load_grammar.py b/lark/load_grammar.py
index 2e8b893..a6b2d82 100644
--- a/lark/load_grammar.py
+++ b/lark/load_grammar.py
@@ -14,7 +14,7 @@ from .parsers.lalr_parser import UnexpectedToken
 from .common import is_terminal, GrammarError, LexerConf, ParserConf, PatternStr, PatternRE, TokenDef
 from .grammar import RuleOptions, Rule
 
-from .tree import Tree as T, Transformer, InlineTransformer, Visitor
+from .tree import Tree, Transformer, InlineTransformer, Visitor, SlottedTree as ST
 
 __path__ = os.path.dirname(__file__)
 IMPORT_PATHS = [os.path.join(__path__, 'grammars')]
@@ -145,14 +145,14 @@ class EBNF_to_BNF(InlineTransformer):
         new_name = '__%s_%s_%d' % (self.prefix, type_, self.i)
         self.i += 1
         t = Token('RULE', new_name, -1)
-        tree = T('expansions', [T('expansion', [expr]), T('expansion', [t, expr])])
+        tree = ST('expansions', [ST('expansion', [expr]), ST('expansion', [t, expr])])
         self.new_rules.append((new_name, tree, self.rule_options))
         self.rules_by_expr[expr] = t
         return t
 
     def expr(self, rule, op, *args):
         if op.value == '?':
-            return T('expansions', [rule, T('expansion', [])])
+            return ST('expansions', [rule, ST('expansion', [])])
         elif op.value == '+':
             # a : b c+ d
             #   -->
@@ -165,7 +165,7 @@ class EBNF_to_BNF(InlineTransformer):
             # a : b _c? d
             # _c : _c c | c;
             new_name = self._add_recurse_rule('star', rule)
-            return T('expansions', [new_name, T('expansion', [])])
+            return ST('expansions', [new_name, ST('expansion', [])])
         elif op.value == '~':
             if len(args) == 1:
                 mn = mx = int(args[0])
@@ -173,7 +173,7 @@ class EBNF_to_BNF(InlineTransformer):
                 mn, mx = map(int, args)
                 if mx < mn:
                     raise GrammarError("Bad Range for %s (%d..%d isn't allowed)" % (rule, mn, mx))
-            return T('expansions', [T('expansion', [rule] * n) for n in range(mn, mx+1)])
+            return ST('expansions', [ST('expansion', [rule] * n) for n in range(mn, mx+1)])
         assert False, op
 
 
@@ -183,7 +183,7 @@ class SimplifyRule_Visitor(Visitor):
     def _flatten(tree):
         while True:
             to_expand = [i for i, child in enumerate(tree.children)
-                         if isinstance(child, T) and child.data == tree.data]
+                         if isinstance(child, Tree) and child.data == tree.data]
             if not to_expand:
                 break
             tree.expand_kids_by_index(*to_expand)
@@ -203,9 +203,9 @@ class SimplifyRule_Visitor(Visitor):
             self._flatten(tree)
 
             for i, child in enumerate(tree.children):
-                if isinstance(child, T) and child.data == 'expansions':
+                if isinstance(child, Tree) and child.data == 'expansions':
                     tree.data = 'expansions'
-                    tree.children = [self.visit(T('expansion', [option if i==j else other
+                    tree.children = [self.visit(ST('expansion', [option if i==j else other
                                                                 for j, other in enumerate(tree.children)]))
                                      for option in set(child.children)]
                     break
@@ -217,7 +217,7 @@ class SimplifyRule_Visitor(Visitor):
         if rule.data == 'expansions':
             aliases = []
             for child in tree.children[0].children:
-                aliases.append(T('alias', [child, alias_name]))
+                aliases.append(ST('alias', [child, alias_name]))
             tree.data = 'expansions'
             tree.children = aliases
 
@@ -239,7 +239,7 @@ class RuleTreeToText(Transformer):
 
 class CanonizeTree(InlineTransformer):
     def maybe(self, expr):
-        return T('expr', [expr, Token('OP', '?', -1)])
+        return ST('expr', [expr, Token('OP', '?', -1)])
 
     def tokenmods(self, *args):
         if len(args) == 1:
@@ -353,7 +353,7 @@ def _literal_to_pattern(literal):
 
 class PrepareLiterals(InlineTransformer):
     def literal(self, literal):
-        return T('pattern', [_literal_to_pattern(literal)])
+        return ST('pattern', [_literal_to_pattern(literal)])
 
     def range(self, start, end):
         assert start.type == end.type == 'STRING'
@@ -361,13 +361,13 @@ class PrepareLiterals(InlineTransformer):
         end = end.value[1:-1]
         assert len(start) == len(end) == 1, (start, end, len(start), len(end))
         regexp = '[%s-%s]' % (start, end)
-        return T('pattern', [PatternRE(regexp)])
+        return ST('pattern', [PatternRE(regexp)])
 
 class SplitLiterals(InlineTransformer):
     def pattern(self, p):
         if isinstance(p, PatternStr) and len(p.value)>1:
-            return T('expansion', [T('pattern', [PatternStr(ch, flags=p.flags)]) for ch in p.value])
-        return T('pattern', [p])
+            return ST('expansion', [ST('pattern', [PatternStr(ch, flags=p.flags)]) for ch in p.value])
+        return ST('pattern', [p])
 
 class TokenTreeToPattern(Transformer):
     def pattern(self, ps):
@@ -408,14 +408,14 @@ class TokenTreeToPattern(Transformer):
 def _interleave(l, item):
     for e in l:
         yield e
-        if isinstance(e, T):
+        if isinstance(e, Tree):
             if e.data in ('literal', 'range'):
                 yield item
         elif is_terminal(e):
             yield item
 
 def _choice_of_rules(rules):
-    return T('expansions', [T('expansion', [Token('RULE', name)]) for name in rules])
+    return ST('expansions', [ST('expansion', [Token('RULE', name)]) for name in rules])
 
 class Grammar:
     def __init__(self, rule_defs, token_defs, ignore):
@@ -442,9 +442,9 @@ class Grammar:
                     if r == start:
                         exp.children = [expr] + exp.children
                 for exp in tree.find_data('expr'):
-                    exp.children[0] = T('expansion', list(_interleave(exp.children[:1], expr)))
+                    exp.children[0] = ST('expansion', list(_interleave(exp.children[:1], expr)))
 
-            _ignore_tree = T('expr', [_choice_of_rules(terms_to_ignore.values()), Token('OP', '?')])
+            _ignore_tree = ST('expr', [_choice_of_rules(terms_to_ignore.values()), Token('OP', '?')])
             rule_defs.append(('__ignore', _ignore_tree, None))
 
         # Convert all tokens to rules
@@ -584,7 +584,7 @@ class GrammarLoader:
 
         rules = [options_from_rule(name, x) for name, x in RULES.items()]
         rules = [Rule(r, x.split(), None, o) for r, xs, o in rules for x in xs]
-        callback = ParseTreeBuilder(rules, T).create_callback()
+        callback = ParseTreeBuilder(rules, ST).create_callback()
         lexer_conf = LexerConf(tokens, ['WS', 'COMMENT'])
 
         parser_conf = ParserConf(rules, callback, 'start')
diff --git a/lark/tree.py b/lark/tree.py
index 68eaf42..d496d75 100644
--- a/lark/tree.py
+++ b/lark/tree.py
@@ -99,6 +99,8 @@ class Tree(object):
         self.data = data
         self.children = children
 
+class SlottedTree(Tree):
+    __slots__ = 'data', 'children', 'rule'
 
 
 ###{standalone

From 61afbed17a4ad9af6024854b2ec32bfb7f330682 Mon Sep 17 00:00:00 2001
From: Erez Shinan <erezshin+git@gmail.com>
Date: Sat, 7 Apr 2018 15:17:37 +0300
Subject: [PATCH 08/19] A minor style fix (a possible memory usage improvement)

---
 lark/parsers/grammar_analysis.py | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/lark/parsers/grammar_analysis.py b/lark/parsers/grammar_analysis.py
index 5cbd697..f34d5c1 100644
--- a/lark/parsers/grammar_analysis.py
+++ b/lark/parsers/grammar_analysis.py
@@ -136,7 +136,8 @@ class GrammarAnalyzer(object):
                     if not is_terminal(new_r):
                         yield new_r
 
-        _ = list(bfs([rule], _expand_rule))
+        for _ in bfs([rule], _expand_rule):
+            pass
 
         return fzset(init_ptrs)
 

From 138f1d5d76d1a98e2489cb12503ec907fb6f6ed5 Mon Sep 17 00:00:00 2001
From: Parker <6646825+psboyce@users.noreply.github.com>
Date: Sat, 14 Apr 2018 23:10:28 -0600
Subject: [PATCH 09/19] Fix order of members when pickling Token

I found this while porting Token to C, essentially the value and pos_in_stream members of Token were swapped in ``__reduce__``, which means running ``pickle.loads`` and ``pickle.dumps`` would result in unpickled tokens whose value was the original's position in stream, and vice versa. In my C extension this caused a TypeError exception, but the behavior will have to be corrected in both.
---
 lark/lexer.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/lark/lexer.py b/lark/lexer.py
index 0a46ee1..938d22b 100644
--- a/lark/lexer.py
+++ b/lark/lexer.py
@@ -41,7 +41,7 @@ class Token(Str):
         return cls(type_, value, borrow_t.pos_in_stream, line=borrow_t.line, column=borrow_t.column)
 
     def __reduce__(self):
-        return (self.__class__, (self.type, self.pos_in_stream, self.value, self.line, self.column, ))
+        return (self.__class__, (self.type, self.value, self.pos_in_stream, self.line, self.column, ))
 
     def __repr__(self):
         return 'Token(%s, %r)' % (self.type, self.value)

From e69d567bce7376fd968471f3907c0d99bb9a46d3 Mon Sep 17 00:00:00 2001
From: DrSlump <drslump@pollinimini.net>
Date: Sun, 15 Apr 2018 12:42:13 +0200
Subject: [PATCH 10/19] example driven parser errors

---
 lark/common.py              | 30 ++++++++++++++++++++++++++++--
 lark/parsers/lalr_parser.py |  4 +---
 2 files changed, 29 insertions(+), 5 deletions(-)

diff --git a/lark/common.py b/lark/common.py
index 7611a2c..4091136 100644
--- a/lark/common.py
+++ b/lark/common.py
@@ -17,12 +17,13 @@ class ParseError(Exception):
     pass
 
 class UnexpectedToken(ParseError):
-    def __init__(self, token, expected, seq, index, considered_rules=None):
+    def __init__(self, token, expected, seq, index, considered_rules=None, state=None):
         self.token = token
         self.expected = expected
         self.line = getattr(token, 'line', '?')
         self.column = getattr(token, 'column', '?')
         self.considered_rules = considered_rules
+        self.state = state
 
         try:
             context = ' '.join(['%r(%s)' % (t.value, t.type) for t in seq[index:index+5]])
@@ -36,7 +37,32 @@ class UnexpectedToken(ParseError):
 
         super(UnexpectedToken, self).__init__(message)
 
-
+    def match_examples(self, parse_fn, examples):
+        """ Given a parser instance and a dictionary mapping some label with
+            some malformed syntax examples, it'll return the label for the
+            example that bests matches the current error.
+        """
+        if not self.state:
+            return None
+
+        candidate = None
+        for label,example in examples.items():
+            if not isinstance(example, (tuple, list)):
+                example = [example]
+
+            for malformed in example:
+                try:
+                    parse_fn(malformed)
+                except UnexpectedToken as ut:
+                    if ut.state == self.state:
+                        if ut.token == self.token:
+                            return label
+                        elif not candidate:
+                            candidate = label
+                except:
+                    pass
+
+        return candidate
 ###}
 
 
diff --git a/lark/parsers/lalr_parser.py b/lark/parsers/lalr_parser.py
index a20db07..baea614 100644
--- a/lark/parsers/lalr_parser.py
+++ b/lark/parsers/lalr_parser.py
@@ -2,7 +2,6 @@
 """
 # Author: Erez Shinan (2017)
 # Email : erezshin@gmail.com
-
 from ..common import UnexpectedToken
 
 from .lalr_analysis import LALR_Analyzer, Shift
@@ -47,8 +46,7 @@ class _Parser:
                 return states[state][key]
             except KeyError:
                 expected = states[state].keys()
-
-                raise UnexpectedToken(token, expected, seq, i)
+                raise UnexpectedToken(token, expected, seq, i, state=state)
 
         def reduce(rule):
             size = len(rule.expansion)

From 880f42dd1273f30f76f9f2c9ab116b26d923a684 Mon Sep 17 00:00:00 2001
From: Erez Shinan <erezshin+git@gmail.com>
Date: Wed, 18 Apr 2018 12:33:47 +0300
Subject: [PATCH 11/19] Corrections to PR and added get_context

---
 lark/common.py | 22 +++++++++++++---------
 1 file changed, 13 insertions(+), 9 deletions(-)

diff --git a/lark/common.py b/lark/common.py
index 4091136..84a4139 100644
--- a/lark/common.py
+++ b/lark/common.py
@@ -1,7 +1,7 @@
 import re
 import sys
 
-from .utils import get_regexp_width
+from .utils import get_regexp_width, STRING_TYPE
 
 Py36 = (sys.version_info[:2] >= (3, 6))
 
@@ -42,27 +42,31 @@ class UnexpectedToken(ParseError):
             some malformed syntax examples, it'll return the label for the
             example that bests matches the current error.
         """
-        if not self.state:
-            return None
+        assert self.state, "Not supported for this exception"
 
         candidate = None
-        for label,example in examples.items():
-            if not isinstance(example, (tuple, list)):
-                example = [example]
+        for label, example in examples.items():
+            assert not isinstance(example, STRING_TYPE)
 
             for malformed in example:
                 try:
                     parse_fn(malformed)
                 except UnexpectedToken as ut:
                     if ut.state == self.state:
-                        if ut.token == self.token:
+                        if ut.token == self.token:  # Try exact match first
                             return label
                         elif not candidate:
                             candidate = label
-                except:
-                    pass
 
         return candidate
+
+    def get_context(self, text, span=10):
+        pos = self.token.pos_in_stream
+        start = max(pos - span, 0)
+        end = pos + span
+        before = text[start:pos].rsplit('\n', 1)[-1]
+        after = text[pos:end].split('\n', 1)[0]
+        return before + after + '\n' + ' ' * len(before) + '^\n'
 ###}
 
 

From 599b80e30af85fb49f0621ff5d6c808770584c22 Mon Sep 17 00:00:00 2001
From: Erez Shinan <erezshin+git@gmail.com>
Date: Wed, 18 Apr 2018 12:37:57 +0300
Subject: [PATCH 12/19] Added example for error reporting with LALR

---
 examples/README.md               |  1 +
 examples/error_reporting_lalr.py | 81 ++++++++++++++++++++++++++++++++
 2 files changed, 82 insertions(+)
 create mode 100644 examples/error_reporting_lalr.py

diff --git a/examples/README.md b/examples/README.md
index 88d3bb0..3fbe3ea 100644
--- a/examples/README.md
+++ b/examples/README.md
@@ -10,6 +10,7 @@
 
 ### Advanced
 
+- [error\_reporting\_lalr.py](error_reporting_lalr.py) - A demonstration of example-driven error reporting with the LALR parser
 - [python\_parser.py](python_parser.py) - A fully-working Python 2 & 3 parser (but not production ready yet!)
 - [conf.py](conf.py) - Demonstrates the power of LALR's contextual lexer on a toy configuration language
 - [reconstruct\_json.py](reconstruct_json.py) - Demonstrates the experimental text-reconstruction feature
diff --git a/examples/error_reporting_lalr.py b/examples/error_reporting_lalr.py
new file mode 100644
index 0000000..a1055fd
--- /dev/null
+++ b/examples/error_reporting_lalr.py
@@ -0,0 +1,81 @@
+#
+# This demonstrates example-driven error reporting with the LALR parser
+#
+
+from lark import Lark, UnexpectedToken
+
+from .json_parser import json_grammar   # Using the grammar from the json_parser example
+
+json_parser = Lark(json_grammar, parser='lalr')
+
+class JsonSyntaxError(SyntaxError):
+    def __str__(self):
+        context, line, column = self.args
+        return '%s at line %s, column %s.\n\n%s' % (self.label, line, column, context)
+
+class JsonMissingValue(JsonSyntaxError):
+    label = 'Missing Value'
+
+class JsonMissingOpening(JsonSyntaxError):
+    label = 'Missing Opening'
+
+class JsonMissingClosing(JsonSyntaxError):
+    label = 'Missing Closing'
+
+class JsonMissingComma(JsonSyntaxError):
+    label = 'Missing Comma'
+
+class JsonTrailingComma(JsonSyntaxError):
+    label = 'Trailing Comma'
+
+
+def parse(json_text):
+    try:
+        j = json_parser.parse(json_text)
+    except UnexpectedToken as ut:
+        exc_class = ut.match_examples(json_parser.parse, {
+            JsonMissingValue: ['{"foo": }'],
+            JsonMissingOpening: ['{"foo": ]}',
+                                 '{"foor": }}'],
+            JsonMissingClosing: ['{"foo": [}',
+                                 '{',
+                                 '{"a": 1',
+                                 '[1'],
+            JsonMissingComma: ['[1 2]',
+                               '[false 1]',
+                               '["b" 1]',
+                               '{"a":true 1:4}',
+                               '{"a":1 1:4}',
+                               '{"a":"b" 1:4}'],
+            JsonTrailingComma: ['[,]',
+                                '[1,]',
+                                '[1,2,]',
+                                '{"foo":1,}',
+                                '{"foo":false,"bar":true,}']
+        })
+        if not exc_class:
+            raise
+        raise exc_class(ut.get_context(json_text), ut.line, ut.column)
+
+
+def test():
+    try:
+        parse('{"key":')
+    except JsonMissingValue:
+        pass
+
+    try:
+        parse('{"key": "value"')
+    except JsonMissingClosing:
+        pass
+
+    try:
+        parse('{"key": ] ')
+    except JsonMissingOpening:
+        pass
+
+
+if __name__ == '__main__':
+    test()
+
+

From 9848cac9f0b1e988214d12b1d4cd8972a2b5444f Mon Sep 17 00:00:00 2001
From: Erez Shinan <erezshin+git@gmail.com>
Date: Wed, 18 Apr 2018 13:27:49 +0300
Subject: [PATCH 13/19] Improved Lark's error reporting for grammar syntax
 errors (Based on PR #129)

---
 lark/load_grammar.py | 22 +++++++++++++++-------
 1 file changed, 15 insertions(+), 7 deletions(-)

diff --git a/lark/load_grammar.py b/lark/load_grammar.py
index a6b2d82..43d1bf5 100644
--- a/lark/load_grammar.py
+++ b/lark/load_grammar.py
@@ -600,14 +600,22 @@ class GrammarLoader:
         except UnexpectedInput as e:
             raise GrammarError("Unexpected input %r at line %d column %d in %s" % (e.context, e.line, e.column, name))
         except UnexpectedToken as e:
-            if e.expected == ['_COLON']:
-                raise GrammarError("Missing colon at line %s column %s" % (e.line, e.column))
-            elif e.expected == ['RULE']:
-                raise GrammarError("Missing alias at line %s column %s" % (e.line, e.column))
+            context = e.get_context(grammar_text)
+            error = e.match_examples(self.parser.parse, {
+                'Unclosed parenthesis': ['a: (\n'],
+                'Umatched closing parenthesis': ['a: )\n', 'a: [)\n', 'a: (]\n'],
+                'Expecting rule or token definition (missing colon)': ['a\n', 'a->\n', 'A->\n', 'a A\n'],
+                'Alias expects lowercase name': ['a: -> "a"\n'],
+                'Unexpected colon': ['a::\n', 'a: b:\n', 'a: B:\n', 'a: "a":\n'],
+                'Misplaced operator': ['a: b??', 'a: b(?)', 'a:+\n', 'a:?\n', 'a:*\n', 'a:|*\n'],
+                'Expecting option ("|") or a new rule or token definition': ['a:a\n()\n'],
+                '%import expects a name': ['%import "a"\n'],
+                '%ignore expects a value': ['%ignore %import\n'],
+            })
+            if error:
+                raise GrammarError("%s at line %s column %s\n\n%s" % (error, e.line, e.column, context))
             elif 'STRING' in e.expected:
-                raise GrammarError("Expecting a value at line %s column %s" % (e.line, e.column))
-            elif e.expected == ['_OR']:
-                raise GrammarError("Newline without starting a new option (Expecting '|') at line %s column %s" % (e.line, e.column))
+                raise GrammarError("Expecting a value at line %s column %s\n\n%s" % (e.line, e.column, context))
             raise
 
         # Extract grammar items

From f5550b30403996bb5d1f24abc5b36c8e58b0c84f Mon Sep 17 00:00:00 2001
From: Ramon Klass <tier@schokokeks.org>
Date: Thu, 19 Apr 2018 16:57:43 +0200
Subject: [PATCH 14/19] Implemented a new visitor class (Interpreter) that
 works top-down (PR #130)

It emulates antlr's visitor behavior for a dynamic evaluation order of subtrees
---
 lark/tree.py        | 24 ++++++++++++++++++++++++
 tests/test_trees.py | 33 ++++++++++++++++++++++++++++++++-
 2 files changed, 56 insertions(+), 1 deletion(-)

diff --git a/lark/tree.py b/lark/tree.py
index d496d75..e6d5ed7 100644
--- a/lark/tree.py
+++ b/lark/tree.py
@@ -174,6 +174,30 @@ class Visitor_NoRecurse(Visitor):
         return tree
 
 
+from functools import wraps
+def visit_children_decor(func):
+    @wraps(func)
+    def inner(cls, tree):
+        values = cls.visit_children(tree)
+        return func(cls, values)
+    return inner
+
+class Interpreter(object):
+
+    def visit(self, tree):
+        return getattr(self, tree.data)(tree)
+
+    def visit_children(self, tree):
+        return [self.visit(child) if isinstance(child, Tree) else child
+                for child in tree.children]
+
+    def __getattr__(self, name):
+        return self.__default__
+
+    def __default__(self, tree):
+        self.visit_children(tree)
+
+
 class Transformer_NoRecurse(Transformer):
     def transform(self, tree):
         subtrees = list(tree.iter_subtrees())
diff --git a/tests/test_trees.py b/tests/test_trees.py
index c90cc7d..c83b5ef 100644
--- a/tests/test_trees.py
+++ b/tests/test_trees.py
@@ -5,7 +5,7 @@ from unittest import TestCase
 import copy
 import pickle
 
-from lark.tree import Tree
+from lark.tree import Tree, Interpreter, visit_children_decor
 
 
 class TestTrees(TestCase):
@@ -21,6 +21,37 @@ class TestTrees(TestCase):
         assert pickle.loads(data) == s
 
 
+    def test_interp(self):
+        t = Tree('a', [Tree('b', []), Tree('c', []), 'd'])
+
+        class Interp1(Interpreter):
+            def a(self, tree):
+                return self.visit_children(tree) + ['e']
+
+            def b(self, tree):
+                return 'B'
+
+            def c(self, tree):
+                return 'C'
+
+        self.assertEqual(Interp1().visit(t), list('BCde'))
+
+        class Interp2(Interpreter):
+            @visit_children_decor
+            def a(self, values):
+                return values + ['e']
+
+            def b(self, tree):
+                return 'B'
+
+            def c(self, tree):
+                return 'C'
+
+        self.assertEqual(Interp2().visit(t), list('BCde'))
+
+
+
+
 if __name__ == '__main__':
     unittest.main()
 

From 4c89d69d97f00da0c0ab043508ad2843ad230954 Mon Sep 17 00:00:00 2001
From: Erez Shinan <erez27+git@gmail.com>
Date: Mon, 23 Apr 2018 10:20:43 +0300
Subject: [PATCH 15/19] Update README.md

---
 README.md | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/README.md b/README.md
index 9e077cf..619be58 100644
--- a/README.md
+++ b/README.md
@@ -165,3 +165,5 @@ If you're interested in taking one of these on, let me know and I will provide m
 If you have any questions or want my assistance, you can email me at erezshin at gmail com.
 
 I'm also available for contract work.
+
+ -- [Erez](https://github.com/erezsh)

From 1854b81ebcdd05bf53175fa57615964d03218f56 Mon Sep 17 00:00:00 2001
From: Ramon Klass <tier@schokokeks.org>
Date: Tue, 24 Apr 2018 00:14:03 +0200
Subject: [PATCH 16/19] interpreter: default behavior changed to return the
 values instead of discarding them, added test showcasing the behavior

---
 lark/tree.py        | 2 +-
 tests/test_trees.py | 8 ++++++++
 2 files changed, 9 insertions(+), 1 deletion(-)

diff --git a/lark/tree.py b/lark/tree.py
index e6d5ed7..ad086d2 100644
--- a/lark/tree.py
+++ b/lark/tree.py
@@ -195,7 +195,7 @@ class Interpreter(object):
         return self.__default__
 
     def __default__(self, tree):
-        self.visit_children(tree)
+        return self.visit_children(tree)
 
 
 class Transformer_NoRecurse(Transformer):
diff --git a/tests/test_trees.py b/tests/test_trees.py
index c83b5ef..6017386 100644
--- a/tests/test_trees.py
+++ b/tests/test_trees.py
@@ -49,6 +49,14 @@ class TestTrees(TestCase):
 
         self.assertEqual(Interp2().visit(t), list('BCde'))
 
+        class Interp3(Interpreter):
+            def b(self, tree):
+                return 'B'
+
+            def c(self, tree):
+                return 'C'
+
+        self.assertEqual(Interp3().visit(t), list('BCd'))
 
 
 

From 0f0776c0fa552aa74708570a7fa86f4bb6d54921 Mon Sep 17 00:00:00 2001
From: Erez Shinan <erezshin+git@gmail.com>
Date: Tue, 24 Apr 2018 15:36:53 +0300
Subject: [PATCH 17/19] BUGIX in lexer: Embedding strings overwrote priority
 (Issue #121)

---
 lark/lexer.py        |  2 ++
 tests/test_parser.py | 12 ++++++++++++
 2 files changed, 14 insertions(+)

diff --git a/lark/lexer.py b/lark/lexer.py
index 938d22b..19e1be4 100644
--- a/lark/lexer.py
+++ b/lark/lexer.py
@@ -143,6 +143,8 @@ def _create_unless(tokens):
     for retok in tokens_by_type.get(PatternRE, []):
         unless = [] # {}
         for strtok in tokens_by_type.get(PatternStr, []):
+            if strtok.priority > retok.priority:
+                continue
             s = strtok.pattern.value
             m = re.match(retok.pattern.to_regexp(), s)
             if m and m.group(0) == s:
diff --git a/tests/test_parser.py b/tests/test_parser.py
index d4d63ca..5c68bec 100644
--- a/tests/test_parser.py
+++ b/tests/test_parser.py
@@ -1173,6 +1173,18 @@ def _make_parser_test(LEXER, PARSER):
             self.assertRaises((ParseError, UnexpectedInput), l.parse, u'ABB')
             self.assertRaises((ParseError, UnexpectedInput), l.parse, u'AAAABB')
 
+        @unittest.skipIf(PARSER=='earley', "Priority not handled correctly right now")  # TODO XXX
+        def test_priority_vs_embedded(self):
+            g = """
+            A.2: "a"
+            WORD: ("a".."z")+
+
+            start: (A | WORD)+
+            """
+            l = _Lark(g)
+            t = l.parse('abc')
+            self.assertEqual(t.children, ['a', 'bc'])
+            self.assertEqual(t.children[0].type, 'A')
 
 
 

From 51644a6c584eb9833af71c40198fdc5d8a99c904 Mon Sep 17 00:00:00 2001
From: Erez Shinan <erezshin+git@gmail.com>
Date: Wed, 25 Apr 2018 19:06:33 +0300
Subject: [PATCH 18/19] Added examples/lark.g - Reference implementation of the
 Lark grammar (inspired by issue #116)

---
 examples/README.md       |  1 +
 examples/lark.g          | 49 ++++++++++++++++++++++++++++++++++++++++
 examples/lark_grammar.py | 18 +++++++++++++++
 lark/grammars/common.g   |  1 +
 lark/load_grammar.py     |  8 ++++++-
 5 files changed, 76 insertions(+), 1 deletion(-)
 create mode 100644 examples/lark.g
 create mode 100644 examples/lark_grammar.py

diff --git a/examples/README.md b/examples/README.md
index 3fbe3ea..25bf504 100644
--- a/examples/README.md
+++ b/examples/README.md
@@ -7,6 +7,7 @@
 - [indented\_tree.py](indented\_tree.py) - A demonstration of parsing indentation ("whitespace significant" language)
 - [fruitflies.py](fruitflies.py) - A demonstration of ambiguity
 - [turtle\_dsl.py](turtle_dsl.py) - Implements a LOGO-like toy language for Python's turtle, with interpreter.
+- [lark\_grammar.py](lark_grammar.py) - A reference implementation of the Lark grammar (using LALR(1) + standard lexer)
 
 ### Advanced
 
diff --git a/examples/lark.g b/examples/lark.g
new file mode 100644
index 0000000..1fbf592
--- /dev/null
+++ b/examples/lark.g
@@ -0,0 +1,49 @@
+start: (_item | _NL)*
+
+_item: rule
+     | token
+     | statement
+
+rule: RULE priority? ":" expansions _NL
+token: TOKEN priority? ":" expansions _NL
+
+priority: "." NUMBER
+
+statement: "%ignore" expansions _NL                -> ignore
+         | "%import" import_args ["->" TOKEN] _NL  -> import
+
+import_args: name ("." name)*
+
+?expansions: alias (_VBAR alias)*
+
+?alias: expansion ["->" RULE]
+
+?expansion: expr*
+
+?expr: atom [OP | "~" NUMBER [".." NUMBER]]
+
+?atom: "(" expansions ")"
+     | "[" expansions "]" -> maybe
+     | STRING ".." STRING -> literal_range
+     | name
+     | (REGEXP | STRING) -> literal
+
+name: RULE
+    | TOKEN
+
+_VBAR: _NL? "|"
+OP: /[+*][?]?|[?](?![a-z])/
+RULE: /!?[_?]?[a-z][_a-z0-9]*/
+TOKEN: /_?[A-Z][_A-Z0-9]*/
+STRING: _STRING "i"?
+REGEXP: /\/(?!\/)(\\\/|\\\\|[^\/\n])*?\/[imslux]*/
+_NL: /(\r?\n)+\s*/
+
+%import common.ESCAPED_STRING -> _STRING
+%import common.INT -> NUMBER
+%import common.WS_INLINE
+
+COMMENT: "//" /[^\n]/*
+
+%ignore WS_INLINE
+%ignore COMMENT
diff --git a/examples/lark_grammar.py b/examples/lark_grammar.py
new file mode 100644
index 0000000..88fc4cf
--- /dev/null
+++ b/examples/lark_grammar.py
@@ -0,0 +1,18 @@
+from lark import Lark
+
+parser = Lark(open('examples/lark.g'), parser="lalr")
+
+grammar_files = [
+    'examples/python2.g',
+    'examples/python3.g',
+    'examples/lark.g',
+    'lark/grammars/common.g',
+]
+
+def test():
+    for grammar_file in grammar_files:
+        tree = parser.parse(open(grammar_file).read())
+    print("All grammars parsed successfully")
+
+if __name__ == '__main__':
+    test()
diff --git a/lark/grammars/common.g b/lark/grammars/common.g
index 2bd02d0..8bc8079 100644
--- a/lark/grammars/common.g
+++ b/lark/grammars/common.g
@@ -20,6 +20,7 @@ SIGNED_NUMBER: ["+"|"-"] NUMBER
 //
 // Strings
 //
+//STRING: /"(\\\"|\\\\|[^"\n])*?"i?/
 STRING_INNER: ("\\\""|/[^"]/)
 ESCAPED_STRING: "\"" STRING_INNER* "\""
 
diff --git a/lark/load_grammar.py b/lark/load_grammar.py
index 43d1bf5..13aeff0 100644
--- a/lark/load_grammar.py
+++ b/lark/load_grammar.py
@@ -122,7 +122,7 @@ RULES = {
     'statement': ['ignore', 'import'],
     'ignore': ['_IGNORE expansions _NL'],
     'import': ['_IMPORT import_args _NL',
-               '_IMPORT import_args _TO TOKEN'],
+               '_IMPORT import_args _TO TOKEN _NL'],
     'import_args': ['_import_args'],
     '_import_args': ['name', '_import_args _DOT name'],
 
@@ -375,6 +375,7 @@ class TokenTreeToPattern(Transformer):
         return p
 
     def expansion(self, items):
+        assert items
         if len(items) == 1:
             return items[0]
         if len({i.flags for i in items}) > 1:
@@ -486,6 +487,11 @@ class Grammar:
 
         # Convert token-trees to strings/regexps
         transformer = PrepareLiterals() * TokenTreeToPattern()
+        for name, (token_tree, priority) in token_defs:
+            for t in token_tree.find_data('expansion'):
+                if not t.children:
+                    raise GrammarError("Tokens cannot be empty (%s)" % name)
+
         tokens = [TokenDef(name, transformer.transform(token_tree), priority)
                   for name, (token_tree, priority) in token_defs]
 

From 0a40137ac79d9bfbc477e2d4c443b8503d3e28da Mon Sep 17 00:00:00 2001
From: Erez Shinan <erez27+git@gmail.com>
Date: Wed, 25 Apr 2018 19:09:50 +0300
Subject: [PATCH 19/19] Update README.md

---
 examples/README.md | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/examples/README.md b/examples/README.md
index 25bf504..0951c86 100644
--- a/examples/README.md
+++ b/examples/README.md
@@ -7,7 +7,7 @@
 - [indented\_tree.py](indented\_tree.py) - A demonstration of parsing indentation ("whitespace significant" language)
 - [fruitflies.py](fruitflies.py) - A demonstration of ambiguity
 - [turtle\_dsl.py](turtle_dsl.py) - Implements a LOGO-like toy language for Python's turtle, with interpreter.
-- [lark\_grammar.py](lark_grammar.py) - A reference implementation of the Lark grammar (using LALR(1) + standard lexer)
+- [lark\_grammar.py](lark_grammar.py) + [lark.g](lark.g) - A reference implementation of the Lark grammar (using LALR(1) + standard lexer)
 
 ### Advanced