# -*- coding: utf-8 -*-
#######################################################################
# Name: test_peg_parser
# Purpose: Test for parser constructed using PEG textual grammars.
# Author: Igor R. Dejanović
# Copyright: (c) 2014-2017 Igor R. Dejanović
# License: MIT License
#######################################################################

import pytest  # noqa
from arpeggio import Sequence, NonTerminal, NoMatch
from arpeggio.peg import ParserPEG
from arpeggio.cleanpeg import ParserPEG as ParserPEGClean

# Calculator grammar in the classic PEG notation (``<-`` and ``;``).
# The ``//`` comments are line comments, so every rule must start on its
# own line; otherwise the comment would swallow the rule that follows it.
grammar = r'''
    // This is a comment
    number <- r'\d*\.\d*|\d+';
    factor <- ("+" / "-")?
              (number / "(" expression ")");
    // This is another comment
    term <- factor (( "*" / "/") factor)*;
    expression <- term (("+" / "-") term)*;
    calc <- expression+ EOF;
    // And final comment at the end of file
'''

# The same grammar in the "clean" PEG notation: ``=`` instead of ``<-`` and
# no rule-terminating ``;``.
clean_grammar = grammar.replace('<-', '=').replace(';', '')

# Expression shared by the parsing tests below.
_EXPRESSION = "4+5*7/3.45*-45*(2.56+32)/-56*(2-1.34)"

# Expected ``str()`` of the parse tree; identical for the full and the
# reduced tree.
_EXPECTED_STR = "4 | + | 5 | * | 7 | / | 3.45 | * | - | 45 | * | ( | 2.56 | + | 32 | ) | / | - | 56 | * | ( | 2 | - | 1.34 | ) | "  # noqa

# NOTE(review): the expected ``repr()`` strings below are reproduced exactly
# as they appear in the (whitespace-collapsed) source.  If the collapse
# squeezed runs of spaces inside these literals, they must be re-synced
# with the actual ``repr()`` output of the parse tree -- TODO confirm.
_EXPECTED_REPR_FULL = "[ [ [ [ number '4' [0] ] ], '+' [1], [ [ number '5' [2] ], '*' [3], [ number '7' [4] ], '/' [5], [ number '3.45' [6] ], '*' [10], [ '-' [11], number '45' [12] ], '*' [14], [ '(' [15], [ [ [ number '2.56' [16] ] ], '+' [20], [ [ number '32' [21] ] ] ], ')' [23] ], '/' [24], [ '-' [25], number '56' [26] ], '*' [28], [ '(' [29], [ [ [ number '2' [30] ] ], '-' [31], [ [ number '1.34' [32] ] ] ], ')' [36] ] ] ], EOF [37] ]"  # noqa
_EXPECTED_REPR_REDUCED = "[ [ number '4' [0], '+' [1], [ number '5' [2], '*' [3], number '7' [4], '/' [5], number '3.45' [6], '*' [10], [ '-' [11], number '45' [12] ], '*' [14], [ '(' [15], [ number '2.56' [16], '+' [20], number '32' [21] ], ')' [23] ], '/' [24], [ '-' [25], number '56' [26] ], '*' [28], [ '(' [29], [ number '2' [30], '-' [31], number '1.34' [32] ], ')' [36] ] ] ], EOF [37] ]"  # noqa


@pytest.mark.parametrize('parser', [ParserPEG(grammar, 'calc'),
                                    ParserPEGClean(clean_grammar, 'calc')])
def test_construct_parser(parser):
    """Check the parser model built from the textual grammar.

    The root of the model must be the ``calc`` rule, it must be a
    ``Sequence`` and its first sub-expression must be named ``OneOrMore``.
    """
    assert parser.parser_model.rule_name == 'calc'
    assert isinstance(parser.parser_model, Sequence)
    assert parser.parser_model.nodes[0].name == 'OneOrMore'


@pytest.mark.parametrize('parser', [ParserPEG(grammar, 'calc'),
                                    ParserPEGClean(clean_grammar, 'calc')])
def test_parse_input(parser):
    """Parse an arithmetic expression and check the resulting tree.

    Both the ``str()`` and the ``repr()`` of the non-reduced parse tree
    are compared against the expected strings.
    """
    result = parser.parse(_EXPRESSION)

    assert isinstance(result, NonTerminal)
    assert str(result) == _EXPECTED_STR
    assert repr(result) == _EXPECTED_REPR_FULL


@pytest.mark.parametrize('parser', [ParserPEG(grammar, 'calc',
                                              reduce_tree=True),
                                    ParserPEGClean(clean_grammar, 'calc',
                                                   reduce_tree=True)])
def test_reduce_tree(parser):
    """Parse the same expression with parsers created with
    ``reduce_tree=True`` and check the resulting tree.

    ``str()`` is expected to match the non-reduced case, while ``repr()``
    is compared against the expected reduced-tree string.
    """
    result = parser.parse(_EXPRESSION)

    assert isinstance(result, NonTerminal)
    assert str(result) == _EXPECTED_STR
    assert repr(result) == _EXPECTED_REPR_REDUCED


def test_unordered_group():
    """Check a group marked with the ``#`` suffix in the PEG grammar.

    The group members ``("a" "b")`` and ``"c"`` are accepted in either
    order, but ``"a" "b"`` itself may not be split apart.
    """
    # Local name deliberately differs from the module-level ``grammar``.
    unordered_grammar = """
    g <- (("a" "b") "c" )#;
    """

    parser = ParserPEG(unordered_grammar, 'g', reduce_tree=True)

    r = parser.parse("c a b")
    assert isinstance(r, NonTerminal)

    r = parser.parse("a b c")
    assert isinstance(r, NonTerminal)

    with pytest.raises(NoMatch):
        parser.parse("a c b")