使用 PLY 解析按行定义的命令字符串

# Grammar rules for the line-oriented command language. They are written as
# methods (note ``self``) of the parser class that is handed to ply.yacc.
#
# NOTE: PLY uses each function's docstring as the grammar specification and
# only recognises ``|`` as an alternative separator when it starts its own
# line, so every alternative is kept on a separate line.


def p_command(self, p):
    '''command : tokens NEWLINE
               | NEWLINE'''
    print("found command:", list(p))
    # A real command has two right-hand symbols (tokens + NEWLINE), giving
    # len(p) == 3; a bare NEWLINE is an empty line and carries no value.
    p[0] = p[1] if len(p) == 3 else None


def p_tokens(self, p):
    '''tokens : type_a_tokens
              | type_b_tokens
              | type_c_tokens'''
    # Pass the matched command type straight through.
    p[0] = p[1]


def p_type_a_tokens(self, p):
    '''type_a_tokens : STRING STRING QUANTITY STRING STRING'''
    p[0] = "TypeA"


def p_type_b_tokens(self, p):
    '''type_b_tokens : STRING STRING STRING STRING STRING STRING'''
    p[0] = "TypeB"


def p_type_c_tokens(self, p):
    '''type_c_tokens : STRING STRING QUANTITY QUANTITY QUANTITY'''
    p[0] = "TypeC"

from ply import lex, yacc


class InputParser(object):
    """Line-oriented command parser built on PLY (lex + yacc).

    Every non-empty input line must match one of three fixed token shapes,
    reported as "TypeA", "TypeB" or "TypeC". A ``#`` starts a comment that
    runs to the end of the line. Parsed command types are collected in
    ``self.commands`` in input order.
    """

    # top level tokens
    tokens = [
        'QUANTITY',
        'STRING',
        'NEWLINE',
    ]

    # Explicit start symbol: the input is a list of commands, not just one.
    start = 'command_list'

    # number with an optional exponent or a single-letter suffix (GMkmunpf)
    t_QUANTITY = r'[+-]?(\d+\.\d*|\d*\.\d+|\d+)([eE][+-]?\d*\.?\d*|[GMkmunpf])?'
    t_STRING = r'[a-zA-Z_][a-zA-Z_0-9]*'

    # ignored characters
    t_ignore = ' \t'

    # ignore comments
    t_ignore_COMMENT = r'\#.*'

    def __init__(self, **kwargs):
        """Build the lexer and parser; ``kwargs`` are passed to both builders."""
        # command types collected by the most recent parse() call
        self.commands = []
        self.lexer = lex.lex(module=self, **kwargs)
        self.parser = yacc.yacc(module=self, **kwargs)

    # detect new lines
    def t_newline(self, t):
        r'\n+'
        # keep line numbers accurate for error messages
        t.lexer.lineno += len(t.value)
        # generate newline token; it must be returned, otherwise PLY
        # silently discards it and no command can ever be terminated
        t.type = "NEWLINE"
        return t

    # error handling
    def t_error(self, t):
        # anything that gets past the other filters
        print("Illegal character '%s' on line %i at position %i" %
              (t.value[0], t.lexer.lineno, t.lexpos))

        # skip forward a character
        t.lexer.skip(1)

    # root rule: one or more commands (each command is one input line)
    def p_command_list(self, p):
        '''command_list : command
                        | command_list command'''
        # The newest command is the right-most symbol. Do not use p[-1]:
        # negative indices on a PLY production read the parser stack.
        command = p[len(p) - 1]
        # empty lines produce None and are not recorded
        if command is not None:
            self.commands.append(command)

    # match commands on their own lines
    def p_command(self, p):
        '''command : tokens NEWLINE
                   | NEWLINE'''
        print("found command:", list(p))
        # len(p) == 3 means "tokens NEWLINE"; a lone NEWLINE is an empty line
        p[0] = p[1] if len(p) == 3 else None

    def p_tokens(self, p):
        '''tokens : type_a_tokens
                  | type_b_tokens
                  | type_c_tokens'''
        p[0] = p[1]

    def p_type_a_tokens(self, p):
        '''type_a_tokens : STRING STRING QUANTITY STRING STRING'''
        print("found type a")
        p[0] = "TypeA"

    def p_type_b_tokens(self, p):
        '''type_b_tokens : STRING STRING STRING STRING STRING STRING'''
        print("found type b")
        p[0] = "TypeB"

    def p_type_c_tokens(self, p):
        '''type_c_tokens : STRING STRING QUANTITY QUANTITY QUANTITY'''
        print("found type c")
        p[0] = "TypeC"

    def p_error(self, p):
        # p is None when the input ends in the middle of a rule
        if p:
            error_msg = "syntax error '%s'" % p.value
        else:
            error_msg = "syntax error at end of file"

        print(error_msg)

    def parse(self, text):
        """Parse ``text`` and return the list of recognised command types."""
        # start from a clean slate so the same instance can be reused
        self.commands = []
        self.lexer.lineno = 1

        # every command must be terminated by NEWLINE; tolerate input whose
        # last line lacks the trailing newline
        if not text.endswith("\n"):
            text += "\n"

        self.parser.parse(text, lexer=self.lexer)
        return self.commands


if __name__ == "__main__":
    parser = InputParser()
    parser.parse("""
a b 5.5 c d # TypeA
e f 1.6 g h # TypeA
i j k l m n # TypeB
# empty line
o p -1 2.0 3e4 # TypeC
""")

1条回答

网友

1楼 · 发布于 2024-04-24 06:13:45

问题在于第一条规则比较特殊：它是解析器的起始规则。由于上面的第一条规则无法匹配连续的两条命令（位于相邻的两行上），所以解析失败了。

我通过在p_command上方添加一个新的根规则来修复它，它可以采用单个command（当文件只包含一个命令时）或一个命令列表（command_list）：

# Root grammar rule: the input is either a single command or an existing
# command list followed by one more command. Each reduction records the
# newly matched command in self.commands.
def p_command_list(self, p):
    '''command_list : command
                    | command_list command'''
    # With two right-hand symbols (len(p) == 3) the new command is p[2];
    # otherwise it is the lone command at p[1].
    newest_index = 2 if len(p) == 3 else 1
    self.commands.append(p[newest_index])

（我还向类添加了一个commands字段来保存解析后的命令）

这样就可以处理多条被“合并”在一起的命令，就像我的输入文件中出现的那样。

相关问题更多 >

编程相关推荐

热门问题

热门文章