X-Git-Url: https://git.phdru.name/?a=blobdiff_plain;f=parser%2Fparser.py;h=e214698a60d156e3721ba851ca1371a17feba260;hb=b4b7ad7bdf38bc6cb84d0f29cbae0df6e46a0eda;hp=1fb9903c62ee93794a22925678df963c728d4f2c;hpb=9d22f4f705db6a30fa2d49fdc074b901ec3cb3dc;p=phdru.name%2Fcgi-bin%2Fblog-ru%2Fsearch-tags.git diff --git a/parser/parser.py b/parser/parser.py index 1fb9903..e214698 100644 --- a/parser/parser.py +++ b/parser/parser.py @@ -4,9 +4,11 @@ from ply import lex, yacc literals = '()' -tokens = ('NAME', 'AND_OP', 'OR_OP', 'NOT_OP') +tokens = ('OP_WORD', 'NAME', 'AND_OP', 'OR_OP', 'NOT_OP', 'SP1') -t_NAME = '[a-z][a-z0-9_]*' +t_OP_WORD = '(AND|and|OR|or|NOT|not)' + +t_NAME = '([a-z][a-z0-9_]*)' t_AND_OP = '&' @@ -14,7 +16,7 @@ t_OR_OP = r'\|' t_NOT_OP = '!' -t_ignore = '[ \t]+' +t_SP1 = '[ \t]+' def t_error(t): """Avoid warnings on stderr""" @@ -26,28 +28,85 @@ def p_expression_name(p): p[0] = ('NAME', p[1]) def p_expression_and_and(p): - """expression : expression AND_OP AND_OP expression""" - p[0] = ('AND', p[1], p[4]) + """expression : expression SP0 AND_OP AND_OP SP0 expression""" + p[0] = ('AND', p[1], p[6]) def p_expression_and(p): - """expression : expression AND_OP expression""" - p[0] = ('AND', p[1], p[3]) - -def p_expression_not(p): - """expression : NOT_OP expression""" - p[0] = ('NOT', p[2]) + """expression : expression SP0 AND_OP SP0 expression""" + p[0] = ('AND', p[1], p[5]) + +def p_expression_op_word(p): + """expression : l_expression op_word r_expression""" + if p[2] in ('AND', 'and'): + p[0] = ('AND', p[1], p[3]) + elif p[2] in ('OR', 'or'): + p[0] = ('OR', p[1], p[3]) + else: + raise ValueError(p) def p_expression_or_or(p): - """expression : expression OR_OP OR_OP expression""" - p[0] = ('OR', p[1], p[4]) + """expression : expression SP0 OR_OP OR_OP SP0 expression""" + p[0] = ('OR', p[1], p[6]) def p_expression_or(p): - """expression : expression OR_OP expression""" - p[0] = ('OR', p[1], p[3]) + """expression : expression SP0 OR_OP SP0 expression""" + p[0] = ('OR', p[1], p[5]) + +def p_expression_not(p): + """expression : NOT_OP SP0 expression""" + p[0] = ('NOT', p[3]) + +def p_expression_not_word(p): + """expression : op_word r_expression""" + if p[1] in ('NOT', 'not'): + p[0] = ('NOT', p[2]) + else: + raise ValueError(p) + +def p_expression_in_parens(p): + """expression : expression_parens""" + p[0] = p[1] + +def p_l_expression(p): + """l_expression : expression_parens + | expression SP1 + """ + if len(p) == 2: + p[0] = p[1] + elif len(p) == 3: + p[0] = p[1] + else: + raise ValueError(p) + +def p_r_expression(p): + """r_expression : expression_parens + | SP1 expression + """ + if len(p) == 2: + p[0] = p[1] + elif len(p) == 3: + p[0] = p[2] + else: + raise ValueError(p) def p_expression_parens(p): - """expression : '(' expression ')'""" - p[0] = ('PARENS', p[2]) + """expression_parens : '(' SP0 expression SP0 ')'""" + p[0] = ('PARENS', p[3]) + +def p_op_word(p): + """op_word : OP_WORD""" + if p[1] in ('AND', 'and', 'OR', 'or', 'NOT', 'not'): + p[0] = p[1] + else: + raise SyntaxError + +def p_SP0(p): + """SP0 : SP1 + | empty + """ + +def p_empty(p): + """empty :""" def p_error(p): """Avoid warnings on stderr"""