# tpegs.nim
  1. discard """
  2. targets: "c cpp js"
  3. output: '''
  4. PEG AST traversal output
  5. ------------------------
  6. pkNonTerminal: Sum @(2, 3)
  7. pkSequence: (Product (('+' / '-') Product)*)
  8. pkNonTerminal: Product @(3, 7)
  9. pkSequence: (Value (('*' / '/') Value)*)
  10. pkNonTerminal: Value @(4, 5)
  11. pkOrderedChoice: (([0-9] [0-9]*) / ('(' Expr ')'))
  12. pkSequence: ([0-9] [0-9]*)
  13. pkCharChoice: [0-9]
  14. pkGreedyRepSet: [0-9]*
  15. pkSequence: ('(' Expr ')')
  16. pkChar: '('
  17. pkNonTerminal: Expr @(1, 4)
  18. pkNonTerminal: Sum @(2, 3)
  19. pkChar: ')'
  20. pkGreedyRep: (('*' / '/') Value)*
  21. pkSequence: (('*' / '/') Value)
  22. pkOrderedChoice: ('*' / '/')
  23. pkChar: '*'
  24. pkChar: '/'
  25. pkNonTerminal: Value @(4, 5)
  26. pkGreedyRep: (('+' / '-') Product)*
  27. pkSequence: (('+' / '-') Product)
  28. pkOrderedChoice: ('+' / '-')
  29. pkChar: '+'
  30. pkChar: '-'
  31. pkNonTerminal: Product @(3, 7)
  32. Event parser output
  33. -------------------
  34. @[5.0]
  35. +
  36. @[5.0, 3.0]
  37. @[8.0]
  38. /
  39. @[8.0, 2.0]
  40. @[4.0]
  41. -
  42. @[4.0, 7.0]
  43. -*
  44. @[4.0, 7.0, 22.0]
  45. @[4.0, 154.0]
  46. -
  47. @[-150.0]
  48. '''
  49. """
  50. when defined(nimHasEffectsOf):
  51. {.experimental: "strictEffects".}
  52. import std/[strutils, streams, pegs, assertions]
  53. const
  54. indent = " "
  55. let
  56. pegAst = """
  57. Expr <- Sum
  58. Sum <- Product (('+' / '-')Product)*
  59. Product <- Value (('*' / '/')Value)*
  60. Value <- [0-9]+ / '(' Expr ')'
  61. """.peg
  62. txt = "(5+3)/2-7*22"
  63. block:
  64. var
  65. outp = newStringStream()
  66. processed: seq[string] = @[]
  67. proc prt(outp: Stream, kind: PegKind, s: string; level: int = 0) =
  68. outp.writeLine indent.repeat(level) & "$1: $2" % [$kind, s]
  69. proc recLoop(p: Peg, level: int = 0) =
  70. case p.kind
  71. of pkEmpty..pkWhitespace:
  72. discard
  73. of pkTerminal, pkTerminalIgnoreCase, pkTerminalIgnoreStyle:
  74. outp.prt(p.kind, $p, level)
  75. of pkChar, pkGreedyRepChar:
  76. outp.prt(p.kind, $p, level)
  77. of pkCharChoice, pkGreedyRepSet:
  78. outp.prt(p.kind, $p, level)
  79. of pkNonTerminal:
  80. outp.prt(p.kind,
  81. "$1 @($3, $4)" % [p.nt.name, $p.nt.rule.kind, $p.nt.line, $p.nt.col], level)
  82. if not(p.nt.name in processed):
  83. processed.add p.nt.name
  84. p.nt.rule.recLoop level+1
  85. of pkBackRef..pkBackRefIgnoreStyle:
  86. outp.prt(p.kind, $p, level)
  87. else:
  88. outp.prt(p.kind, $p, level)
  89. for s in items(p):
  90. s.recLoop level+1
  91. pegAst.recLoop
  92. echo "PEG AST traversal output"
  93. echo "------------------------"
  94. echo outp.data
  95. block:
  96. var
  97. pStack {.threadvar.}: seq[string]
  98. valStack {.threadvar.}: seq[float]
  99. opStack {.threadvar.}: string
  100. let
  101. parseArithExpr = pegAst.eventParser:
  102. pkNonTerminal:
  103. enter:
  104. pStack.add p.nt.name
  105. leave:
  106. pStack.setLen pStack.high
  107. if length > 0:
  108. let matchStr = s.substr(start, start+length-1)
  109. case p.nt.name
  110. of "Value":
  111. try:
  112. valStack.add matchStr.parseFloat
  113. echo valStack
  114. except ValueError:
  115. discard
  116. of "Sum", "Product":
  117. try:
  118. let val {.used.} = matchStr.parseFloat
  119. except ValueError:
  120. if valStack.len > 1 and opStack.len > 0:
  121. valStack[^2] = case opStack[^1]
  122. of '+': valStack[^2] + valStack[^1]
  123. of '-': valStack[^2] - valStack[^1]
  124. of '*': valStack[^2] * valStack[^1]
  125. else: valStack[^2] / valStack[^1]
  126. valStack.setLen valStack.high
  127. echo valStack
  128. opStack.setLen opStack.high
  129. echo opStack
  130. pkChar:
  131. leave:
  132. if length == 1 and "Value" != pStack[^1]:
  133. let matchChar = s[start]
  134. opStack.add matchChar
  135. echo opStack
  136. echo "Event parser output"
  137. echo "-------------------"
  138. let pLen = parseArithExpr(txt)
  139. doAssert txt.len == pLen
  140. import std/importutils
  141. block:
  142. proc pegsTest() =
  143. privateAccess(NonTerminal)
  144. privateAccess(Captures)
  145. if "test" =~ peg"s <- {{\ident}}": # bug #19104
  146. doAssert matches[0] == "test"
  147. doAssert matches[1] == "test", $matches[1]
  148. doAssert escapePeg("abc''def'") == r"'abc'\x27\x27'def'\x27"
  149. doAssert match("(a b c)", peg"'(' @ ')'")
  150. doAssert match("W_HI_Le", peg"\y 'while'")
  151. doAssert(not match("W_HI_L", peg"\y 'while'"))
  152. doAssert(not match("W_HI_Le", peg"\y v'while'"))
  153. doAssert match("W_HI_Le", peg"y'while'")
  154. doAssert($ +digits == $peg"\d+")
  155. doAssert "0158787".match(peg"\d+")
  156. doAssert "ABC 0232".match(peg"\w+\s+\d+")
  157. doAssert "ABC".match(peg"\d+ / \w+")
  158. var accum: seq[string] = @[]
  159. for word in split("00232this02939is39an22example111", peg"\d+"):
  160. accum.add(word)
  161. doAssert(accum == @["this", "is", "an", "example"])
  162. doAssert matchLen("key", ident) == 3
  163. var pattern = sequence(ident, *whitespace, term('='), *whitespace, ident)
  164. doAssert matchLen("key1= cal9", pattern) == 11
  165. var ws = newNonTerminal("ws", 1, 1)
  166. ws.rule = *whitespace
  167. var expr = newNonTerminal("expr", 1, 1)
  168. expr.rule = sequence(capture(ident), *sequence(
  169. nonterminal(ws), term('+'), nonterminal(ws), nonterminal(expr)))
  170. var c: Captures
  171. var s = "a+b + c +d+e+f"
  172. doAssert rawMatch(s, expr.rule, 0, c) == len(s)
  173. var a = ""
  174. for i in 0..c.ml-1:
  175. a.add(substr(s, c.matches[i][0], c.matches[i][1]))
  176. doAssert a == "abcdef"
  177. #echo expr.rule
  178. #const filename = "lib/devel/peg/grammar.txt"
  179. #var grammar = parsePeg(newFileStream(filename, fmRead), filename)
  180. #echo "a <- [abc]*?".match(grammar)
  181. doAssert find("_____abc_______", term("abc"), 2) == 5
  182. doAssert match("_______ana", peg"A <- 'ana' / . A")
  183. doAssert match("abcs%%%", peg"A <- ..A / .A / '%'")
  184. var matches: array[0..MaxSubpatterns-1, string]
  185. if "abc" =~ peg"{'a'}'bc' 'xyz' / {\ident}":
  186. doAssert matches[0] == "abc"
  187. else:
  188. doAssert false
  189. var g2 = peg"""S <- A B / C D
  190. A <- 'a'+
  191. B <- 'b'+
  192. C <- 'c'+
  193. D <- 'd'+
  194. """
  195. doAssert($g2 == "((A B) / (C D))")
  196. doAssert match("cccccdddddd", g2)
  197. doAssert("var1=key; var2=key2".replacef(peg"{\ident}'='{\ident}", "$1<-$2$2") ==
  198. "var1<-keykey; var2<-key2key2")
  199. doAssert("var1=key; var2=key2".replace(peg"{\ident}'='{\ident}", "$1<-$2$2") ==
  200. "$1<-$2$2; $1<-$2$2")
  201. doAssert "var1=key; var2=key2".endsWith(peg"{\ident}'='{\ident}")
  202. if "aaaaaa" =~ peg"'aa' !. / ({'a'})+":
  203. doAssert matches[0] == "a"
  204. else:
  205. doAssert false
  206. if match("abcdefg", peg"c {d} ef {g}", matches, 2):
  207. doAssert matches[0] == "d"
  208. doAssert matches[1] == "g"
  209. else:
  210. doAssert false
  211. accum = @[]
  212. for x in findAll("abcdef", peg".", 3):
  213. accum.add(x)
  214. doAssert(accum == @["d", "e", "f"])
  215. for x in findAll("abcdef", peg"^{.}", 3):
  216. doAssert x == "d"
  217. if "f(a, b)" =~ peg"{[0-9]+} / ({\ident} '(' {@} ')')":
  218. doAssert matches[0] == "f"
  219. doAssert matches[1] == "a, b"
  220. else:
  221. doAssert false
  222. doAssert match("eine übersicht und außerdem", peg"(\letter \white*)+")
  223. # ß is not a lower cased letter?!
  224. doAssert match("eine übersicht und auerdem", peg"(\lower \white*)+")
  225. doAssert match("EINE ÜBERSICHT UND AUSSERDEM", peg"(\upper \white*)+")
  226. doAssert(not match("456678", peg"(\letter)+"))
  227. doAssert("var1 = key; var2 = key2".replacef(
  228. peg"\skip(\s*) {\ident}'='{\ident}", "$1<-$2$2") ==
  229. "var1<-keykey;var2<-key2key2")
  230. doAssert match("prefix/start", peg"^start$", 7)
  231. if "foo" =~ peg"{'a'}?.*":
  232. doAssert matches[0].len == 0
  233. else: doAssert false
  234. if "foo" =~ peg"{''}.*":
  235. doAssert matches[0] == ""
  236. else: doAssert false
  237. if "foo" =~ peg"{'foo'}":
  238. doAssert matches[0] == "foo"
  239. else: doAssert false
  240. let empty_test = peg"^\d*"
  241. let str = "XYZ"
  242. doAssert(str.find(empty_test) == 0)
  243. doAssert(str.match(empty_test))
  244. proc handleMatches(m: int, n: int, c: openArray[string]): string =
  245. result = ""
  246. if m > 0:
  247. result.add ", "
  248. result.add case n:
  249. of 2: toLowerAscii(c[0]) & ": '" & c[1] & "'"
  250. of 1: toLowerAscii(c[0]) & ": ''"
  251. else: ""
  252. doAssert("Var1=key1;var2=Key2; VAR3".
  253. replace(peg"{\ident}('='{\ident})* ';'* \s*",
  254. handleMatches) == "var1: 'key1', var2: 'Key2', var3: ''")
  255. doAssert "test1".match(peg"""{@}$""")
  256. doAssert "test2".match(peg"""{(!$ .)*} $""")
  257. doAssert "abbb".match(peg"{a} {b} $2 $^1")
  258. doAssert "abBA".match(peg"{a} {b} i$2 i$^2")
  259. doAssert "abba".match(peg"{a} {b} $^1 {} $^1")
  260. block:
  261. let grammar = peg"""
  262. program <- {''} stmt* $
  263. stmt <- call / block
  264. call <- 'call()' EOL
  265. EOL <- \n / $
  266. block <- 'block:' \n indBody
  267. indBody <- {$^1 ' '+} stmt ($^1 stmt)* {}
  268. """
  269. let program = """
  270. call()
  271. block:
  272. block:
  273. call()
  274. call()
  275. call()
  276. call()
  277. """
  278. var c: Captures
  279. doAssert program.len == program.rawMatch(grammar, 0, c)
  280. doAssert c.ml == 1
  281. pegsTest()
  282. static:
  283. pegsTest()