123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173 |
- #
- #
- # Nim's Runtime Library
- # (c) Copyright 2010 Andreas Rumpf
- #
- # See the file "copying.txt", included in this
- # distribution, for details about the copyright.
- #
- ## This module parses an XML document and creates its XML tree representation.
- import streams, parsexml, strtabs, xmltree
- type
- XmlError* = object of ValueError ## Exception that is raised
- ## for invalid XML.
- errors*: seq[string] ## All detected parsing errors.
- proc raiseInvalidXml(errors: seq[string]) =
- var e: ref XmlError
- new(e)
- e.msg = errors[0]
- e.errors = errors
- raise e
- proc addNode(father, son: XmlNode) =
- if son != nil: add(father, son)
- proc parse(x: var XmlParser, errors: var seq[string]): XmlNode {.gcsafe.}
- proc untilElementEnd(x: var XmlParser, result: XmlNode,
- errors: var seq[string]) =
- while true:
- case x.kind
- of xmlElementEnd:
- if x.elementName == result.tag:
- next(x)
- else:
- errors.add(errorMsg(x, "</" & result.tag & "> expected"))
- # do not skip it here!
- break
- of xmlEof:
- errors.add(errorMsg(x, "</" & result.tag & "> expected"))
- break
- else:
- result.addNode(parse(x, errors))
- proc parse(x: var XmlParser, errors: var seq[string]): XmlNode =
- case x.kind
- of xmlComment:
- result = newComment(x.charData)
- next(x)
- of xmlCharData, xmlWhitespace:
- result = newText(x.charData)
- next(x)
- of xmlPI, xmlSpecial:
- # we just ignore processing instructions for now
- next(x)
- of xmlError:
- errors.add(errorMsg(x))
- next(x)
- of xmlElementStart: ## ``<elem>``
- result = newElement(x.elementName)
- next(x)
- untilElementEnd(x, result, errors)
- of xmlElementEnd:
- errors.add(errorMsg(x, "unexpected ending tag: " & x.elementName))
- of xmlElementOpen:
- result = newElement(x.elementName)
- next(x)
- result.attrs = newStringTable()
- while true:
- case x.kind
- of xmlAttribute:
- result.attrs[x.attrKey] = x.attrValue
- next(x)
- of xmlElementClose:
- next(x)
- break
- of xmlError:
- errors.add(errorMsg(x))
- next(x)
- break
- else:
- errors.add(errorMsg(x, "'>' expected"))
- next(x)
- break
- untilElementEnd(x, result, errors)
- of xmlAttribute, xmlElementClose:
- errors.add(errorMsg(x, "<some_tag> expected"))
- next(x)
- of xmlCData:
- result = newCData(x.charData)
- next(x)
- of xmlEntity:
- ## &entity;
- result = newEntity(x.entityName)
- next(x)
- of xmlEof: discard
- proc parseXml*(s: Stream, filename: string,
- errors: var seq[string]): XmlNode =
- ## Parses the XML from stream ``s`` and returns a ``XmlNode``. Every
- ## occurred parsing error is added to the ``errors`` sequence.
- var x: XmlParser
- open(x, s, filename, {reportComments})
- while true:
- x.next()
- case x.kind
- of xmlElementOpen, xmlElementStart:
- result = parse(x, errors)
- break
- of xmlComment, xmlWhitespace, xmlSpecial, xmlPI: discard # just skip it
- of xmlError:
- errors.add(errorMsg(x))
- else:
- errors.add(errorMsg(x, "<some_tag> expected"))
- break
- close(x)
- proc parseXml*(s: Stream): XmlNode =
- ## Parses the XML from stream ``s`` and returns a ``XmlNode``. All parsing
- ## errors are turned into an ``XmlError`` exception.
- var errors: seq[string] = @[]
- result = parseXml(s, "unknown_xml_doc", errors)
- if errors.len > 0: raiseInvalidXml(errors)
- proc parseXml*(str: string): XmlNode =
- ## Parses the XML from string ``str`` and returns a ``XmlNode``. All parsing
- ## errors are turned into an ``XmlError`` exception.
- parseXml(newStringStream(str))
- proc loadXml*(path: string, errors: var seq[string]): XmlNode =
- ## Loads and parses XML from file specified by ``path``, and returns
- ## a ``XmlNode``. Every occurred parsing error is added to the ``errors``
- ## sequence.
- var s = newFileStream(path, fmRead)
- if s == nil: raise newException(IOError, "Unable to read file: " & path)
- result = parseXml(s, path, errors)
- proc loadXml*(path: string): XmlNode =
- ## Loads and parses XML from file specified by ``path``, and returns
- ## a ``XmlNode``. All parsing errors are turned into an ``XmlError``
- ## exception.
- var errors: seq[string] = @[]
- result = loadXml(path, errors)
- if errors.len > 0: raiseInvalidXml(errors)
- when isMainModule:
- when not defined(testing):
- import os
- var errors: seq[string] = @[]
- var x = loadXml(paramStr(1), errors)
- for e in items(errors): echo e
- var f: File
- if open(f, "xmltest.txt", fmWrite):
- f.write($x)
- f.close()
- else:
- quit("cannot write test.txt")
- else:
- block: # correctly parse ../../tests/testdata/doc1.xml
- let filePath = "tests/testdata/doc1.xml"
- var errors: seq[string] = @[]
- var xml = loadXml(filePath, errors)
- assert(errors.len == 0, "The file tests/testdata/doc1.xml should be parsed without errors.")
- block bug1518:
- var err: seq[string] = @[]
- assert $parsexml(newStringStream"<tag>One & two</tag>", "temp.xml", err) == "<tag>One & two</tag>"
|