rstast.nim 9.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319
  1. #
  2. #
  3. # Nim's Runtime Library
  4. # (c) Copyright 2012 Andreas Rumpf
  5. #
  6. # See the file "copying.txt", included in this
  7. # distribution, for details about the copyright.
  8. #
  9. ## This module implements an AST for the `reStructuredText`:idx: parser.
  10. ##
  11. ## **Note:** Import ``packages/docutils/rstast`` to use this module
  12. import strutils, json
  13. type
  14. RstNodeKind* = enum ## the possible node kinds of an PRstNode
  15. rnInner, # an inner node or a root
  16. rnHeadline, # a headline
  17. rnOverline, # an over- and underlined headline
  18. rnTransition, # a transition (the ------------- <hr> thingie)
  19. rnParagraph, # a paragraph
  20. rnBulletList, # a bullet list
  21. rnBulletItem, # a bullet item
  22. rnEnumList, # an enumerated list
  23. rnEnumItem, # an enumerated item
  24. rnDefList, # a definition list
  25. rnDefItem, # an item of a definition list consisting of ...
  26. rnDefName, # ... a name part ...
  27. rnDefBody, # ... and a body part ...
  28. rnFieldList, # a field list
  29. rnField, # a field item
  30. rnFieldName, # consisting of a field name ...
  31. rnFieldBody, # ... and a field body
  32. rnOptionList, rnOptionListItem, rnOptionGroup, rnOption, rnOptionString,
  33. rnOptionArgument, rnDescription, rnLiteralBlock, rnQuotedLiteralBlock,
  34. rnLineBlock, # the | thingie
  35. rnLineBlockItem, # sons of the | thing
  36. rnBlockQuote, # text just indented
  37. rnTable, rnGridTable, rnTableRow, rnTableHeaderCell, rnTableDataCell,
  38. rnLabel, # used for footnotes and other things
  39. rnFootnote, # a footnote
  40. rnCitation, # similar to footnote
  41. rnStandaloneHyperlink, rnHyperlink, rnRef, rnDirective, # a directive
  42. rnDirArg, rnRaw, rnTitle, rnContents, rnImage, rnFigure, rnCodeBlock,
  43. rnRawHtml, rnRawLatex,
  44. rnContainer, # ``container`` directive
  45. rnIndex, # index directve:
  46. # .. index::
  47. # key
  48. # * `file#id <file#id>`_
  49. # * `file#id <file#id>'_
  50. rnSubstitutionDef, # a definition of a substitution
  51. rnGeneralRole, # Inline markup:
  52. rnSub, rnSup, rnIdx,
  53. rnEmphasis, # "*"
  54. rnStrongEmphasis, # "**"
  55. rnTripleEmphasis, # "***"
  56. rnInterpretedText, # "`"
  57. rnInlineLiteral, # "``"
  58. rnSubstitutionReferences, # "|"
  59. rnSmiley, # some smiley
  60. rnLeaf # a leaf; the node's text field contains the
  61. # leaf val
  62. PRstNode* = ref RstNode ## an RST node
  63. RstNodeSeq* = seq[PRstNode]
  64. RstNode* {.acyclic, final.} = object ## an RST node's description
  65. kind*: RstNodeKind ## the node's kind
  66. text*: string ## valid for leafs in the AST; and the title of
  67. ## the document or the section
  68. level*: int ## valid for some node kinds
  69. sons*: RstNodeSeq ## the node's sons
  70. proc len*(n: PRstNode): int =
  71. result = len(n.sons)
  72. proc newRstNode*(kind: RstNodeKind): PRstNode =
  73. new(result)
  74. result.sons = @[]
  75. result.kind = kind
  76. proc newRstNode*(kind: RstNodeKind, s: string): PRstNode =
  77. result = newRstNode(kind)
  78. result.text = s
  79. proc lastSon*(n: PRstNode): PRstNode =
  80. result = n.sons[len(n.sons)-1]
  81. proc add*(father, son: PRstNode) =
  82. add(father.sons, son)
  83. proc add*(father: PRstNode; s: string) =
  84. add(father.sons, newRstNode(rnLeaf, s))
  85. proc addIfNotNil*(father, son: PRstNode) =
  86. if son != nil: add(father, son)
  87. type
  88. RenderContext {.pure.} = object
  89. indent: int
  90. verbatim: int
  91. proc renderRstToRst(d: var RenderContext, n: PRstNode,
  92. result: var string) {.gcsafe.}
  93. proc renderRstSons(d: var RenderContext, n: PRstNode, result: var string) =
  94. for i in countup(0, len(n) - 1):
  95. renderRstToRst(d, n.sons[i], result)
  96. proc renderRstToRst(d: var RenderContext, n: PRstNode, result: var string) =
  97. # this is needed for the index generation; it may also be useful for
  98. # debugging, but most code is already debugged...
  99. const
  100. lvlToChar: array[0..8, char] = ['!', '=', '-', '~', '`', '<', '*', '|', '+']
  101. if n == nil: return
  102. var ind = spaces(d.indent)
  103. case n.kind
  104. of rnInner:
  105. renderRstSons(d, n, result)
  106. of rnHeadline:
  107. result.add("\n")
  108. result.add(ind)
  109. let oldLen = result.len
  110. renderRstSons(d, n, result)
  111. let headlineLen = result.len - oldLen
  112. result.add("\n")
  113. result.add(ind)
  114. result.add repeat(lvlToChar[n.level], headlineLen)
  115. of rnOverline:
  116. result.add("\n")
  117. result.add(ind)
  118. var headline = ""
  119. renderRstSons(d, n, headline)
  120. let lvl = repeat(lvlToChar[n.level], headline.len - d.indent)
  121. result.add(lvl)
  122. result.add("\n")
  123. result.add(headline)
  124. result.add("\n")
  125. result.add(ind)
  126. result.add(lvl)
  127. of rnTransition:
  128. result.add("\n\n")
  129. result.add(ind)
  130. result.add repeat('-', 78-d.indent)
  131. result.add("\n\n")
  132. of rnParagraph:
  133. result.add("\n\n")
  134. result.add(ind)
  135. renderRstSons(d, n, result)
  136. of rnBulletItem:
  137. inc(d.indent, 2)
  138. var tmp = ""
  139. renderRstSons(d, n, tmp)
  140. if tmp.len > 0:
  141. result.add("\n")
  142. result.add(ind)
  143. result.add("* ")
  144. result.add(tmp)
  145. dec(d.indent, 2)
  146. of rnEnumItem:
  147. inc(d.indent, 4)
  148. var tmp = ""
  149. renderRstSons(d, n, tmp)
  150. if tmp.len > 0:
  151. result.add("\n")
  152. result.add(ind)
  153. result.add("(#) ")
  154. result.add(tmp)
  155. dec(d.indent, 4)
  156. of rnOptionList, rnFieldList, rnDefList, rnDefItem, rnLineBlock, rnFieldName,
  157. rnFieldBody, rnStandaloneHyperlink, rnBulletList, rnEnumList:
  158. renderRstSons(d, n, result)
  159. of rnDefName:
  160. result.add("\n\n")
  161. result.add(ind)
  162. renderRstSons(d, n, result)
  163. of rnDefBody:
  164. inc(d.indent, 2)
  165. if n.sons[0].kind != rnBulletList:
  166. result.add("\n")
  167. result.add(ind)
  168. result.add(" ")
  169. renderRstSons(d, n, result)
  170. dec(d.indent, 2)
  171. of rnField:
  172. var tmp = ""
  173. renderRstToRst(d, n.sons[0], tmp)
  174. var L = max(tmp.len + 3, 30)
  175. inc(d.indent, L)
  176. result.add "\n"
  177. result.add ind
  178. result.add ':'
  179. result.add tmp
  180. result.add ':'
  181. result.add spaces(L - tmp.len - 2)
  182. renderRstToRst(d, n.sons[1], result)
  183. dec(d.indent, L)
  184. of rnLineBlockItem:
  185. result.add("\n")
  186. result.add(ind)
  187. result.add("| ")
  188. renderRstSons(d, n, result)
  189. of rnBlockQuote:
  190. inc(d.indent, 2)
  191. renderRstSons(d, n, result)
  192. dec(d.indent, 2)
  193. of rnRef:
  194. result.add("`")
  195. renderRstSons(d, n, result)
  196. result.add("`_")
  197. of rnHyperlink:
  198. result.add('`')
  199. renderRstToRst(d, n.sons[0], result)
  200. result.add(" <")
  201. renderRstToRst(d, n.sons[1], result)
  202. result.add(">`_")
  203. of rnGeneralRole:
  204. result.add('`')
  205. renderRstToRst(d, n.sons[0],result)
  206. result.add("`:")
  207. renderRstToRst(d, n.sons[1],result)
  208. result.add(':')
  209. of rnSub:
  210. result.add('`')
  211. renderRstSons(d, n, result)
  212. result.add("`:sub:")
  213. of rnSup:
  214. result.add('`')
  215. renderRstSons(d, n, result)
  216. result.add("`:sup:")
  217. of rnIdx:
  218. result.add('`')
  219. renderRstSons(d, n, result)
  220. result.add("`:idx:")
  221. of rnEmphasis:
  222. result.add("*")
  223. renderRstSons(d, n, result)
  224. result.add("*")
  225. of rnStrongEmphasis:
  226. result.add("**")
  227. renderRstSons(d, n, result)
  228. result.add("**")
  229. of rnTripleEmphasis:
  230. result.add("***")
  231. renderRstSons(d, n, result)
  232. result.add("***")
  233. of rnInterpretedText:
  234. result.add('`')
  235. renderRstSons(d, n, result)
  236. result.add('`')
  237. of rnInlineLiteral:
  238. inc(d.verbatim)
  239. result.add("``")
  240. renderRstSons(d, n, result)
  241. result.add("``")
  242. dec(d.verbatim)
  243. of rnSmiley:
  244. result.add(n.text)
  245. of rnLeaf:
  246. if d.verbatim == 0 and n.text == "\\":
  247. result.add("\\\\") # XXX: escape more special characters!
  248. else:
  249. result.add(n.text)
  250. of rnIndex:
  251. result.add("\n\n")
  252. result.add(ind)
  253. result.add(".. index::\n")
  254. inc(d.indent, 3)
  255. if n.sons[2] != nil: renderRstSons(d, n.sons[2], result)
  256. dec(d.indent, 3)
  257. of rnContents:
  258. result.add("\n\n")
  259. result.add(ind)
  260. result.add(".. contents::")
  261. else:
  262. result.add("Error: cannot render: " & $n.kind)
  263. proc renderRstToRst*(n: PRstNode, result: var string) =
  264. ## renders `n` into its string representation and appends to `result`.
  265. var d: RenderContext
  266. renderRstToRst(d, n, result)
  267. proc renderRstToJsonNode(node: PRstNode): JsonNode =
  268. result =
  269. %[
  270. (key: "kind", val: %($node.kind)),
  271. (key: "level", val: %BiggestInt(node.level))
  272. ]
  273. if node.text.len > 0:
  274. result.add("text", %node.text)
  275. if len(node.sons) > 0:
  276. var accm = newSeq[JsonNode](len(node.sons))
  277. for i, son in node.sons:
  278. accm[i] = renderRstToJsonNode(son)
  279. result.add("sons", %accm)
  280. proc renderRstToJson*(node: PRstNode): string =
  281. ## Writes the given RST node as JSON that is in the form
  282. ## ::
  283. ## {
  284. ## "kind":string node.kind,
  285. ## "text":optional string node.text,
  286. ## "level":optional int node.level,
  287. ## "sons":optional node array
  288. ## }
  289. renderRstToJsonNode(node).pretty