使用pyparsing匹配纯文本

import pyparsing as pp

# Marker that separates the structured parts from the surrounding plain text.
struct = pp.Regex(r'specialStructure')

# Plain text: everything up to the next marker, or, when no marker
# follows, everything up to (and including) the end of the input.
txt = pp.SkipTo(struct) | pp.SkipTo(pp.StringEnd(), include=True)

# The input is an arbitrary interleaving of markers and plain text.
# NOTE(review): SkipTo can succeed without consuming any input (e.g. at
# the very end of the string) -- confirm that ZeroOrMore cannot keep
# repeating such an empty match.
grammar = pp.ZeroOrMore(struct | txt)

# `s` is the text to parse; it is not defined in this snippet and must be
# supplied by the surrounding code.
result = grammar.parseString(s)

import pyparsing as pp

# Sample input: plain text wrapped around two levels of nested structure.
s = """ some plain text nestedStructureBegin here we are inside a nested structure nestedStructureBegin bla bla nestedStructureEnd nestedStructureEnd some bla bla again. """

# Recursive grammar: declared first so `struct` can refer to it before its
# definition is filled in below.
grammar = pp.Forward()

# Delimiters of a nested structure; both are dropped from the results.
begin = pp.Regex(r'nestedStructureBegin').suppress()
end = pp.Regex(r'nestedStructureEnd').suppress()

# A structure is a delimited region whose content is parsed recursively
# and kept in its own group.
struct = begin + pp.Group(grammar) + end
keyword = begin | end

# Plain text: everything up to the next delimiter, or, when none follows,
# everything up to (and including) the end of the input.
# NOTE(review): SkipTo(keyword) can succeed without consuming input when a
# delimiter starts at the current position -- confirm that ZeroOrMore
# cannot keep repeating such an empty match.
txt = pp.SkipTo(keyword) | pp.SkipTo(pp.StringEnd(), include=True)

# `<<=` is the in-place form for filling in a Forward; unlike `<<` it
# cannot be split apart by a following `|` through operator precedence.
grammar <<= pp.ZeroOrMore(struct | txt)

# Debug aid: print the tokens each time a structure or a text run matches.
for parser in [struct, txt]:
    parser.addParseAction(lambda toks: print(toks))

result = grammar.parseString(s)

1条回答

网友

1楼 · 发布于 2024-09-28 23:51:52

我找到了一个即使在嵌套结构中也能很好工作的解决方案。其思路是逐字符解析输入，然后使用pp.Combine重建原始的纯文本输入：

import pyparsing as pp

# Sample input: free text surrounding two levels of begin/end nesting.
s = """
some plain text
begin
   we are inside a nested structure
   begin
      some more depth
   end
end
and finally some more bla bla...
"""

# Recursive grammar: declared first so `block` can refer to it before its
# definition is filled in below.
grammar = pp.Forward()

# Block delimiters. The \b anchors restrict each match to a whole word, so
# text that merely contains the letters (e.g. "friend", "beginning") is not
# mistaken for a delimiter. Both delimiters are dropped from the results.
begin = pp.Regex(r'\bbegin\b').suppress()
end = pp.Regex(r'\bend\b').suppress()
keyword = begin | end

# A block is a delimited region whose content is parsed recursively and
# kept in its own group.
block = begin + pp.Group(grammar) + end

# Plain text is consumed one character at a time; [\s\S] accepts any single
# character (newlines included), and the negative lookahead stops the run
# as soon as a delimiter starts at the current position.
char = ~keyword + pp.Regex(r'[\s\S]')
chars = pp.OneOrMore(char)

# Combine joins the single-character matches back into one string token.
txt = pp.Combine(chars)

# `<<=` is the in-place form for filling in a Forward; unlike `<<` it
# cannot be split apart by a following `|` through operator precedence.
grammar <<= pp.ZeroOrMore(block | txt)

result = grammar.parseString(s)

相关问题更多 >

编程相关推荐

热门问题

热门文章