NimYAML/test/testEventParser.nim

258 lines
8.6 KiB
Nim
Raw Normal View History

# NimYAML - YAML implementation in Nim
# (c) Copyright 2016 Felix Krause
#
# See the file "copying.txt", included in this
# distribution, for details about the copyright.
import "../yaml"
2016-12-05 18:22:51 +00:00
import lexbase, streams, tables, strutils
type
2016-04-02 15:48:22 +00:00
LexerToken = enum
plusStr, minusStr, plusDoc, minusDoc, plusMap, minusMap, plusSeq, minusSeq,
2016-12-05 18:22:51 +00:00
eqVal, eqAli, chevTag, andAnchor, starAnchor, quotContent, colonContent,
explDirEnd, explDocEnd, noToken
2016-09-20 19:53:38 +00:00
2016-04-02 15:48:22 +00:00
StreamPos = enum
beforeStream, inStream, afterStream
2016-04-02 15:48:22 +00:00
EventLexer = object of BaseLexer
content: string
2016-09-20 19:53:38 +00:00
2016-04-02 15:48:22 +00:00
EventStreamError = object of Exception
proc nextToken(lex: var EventLexer): LexerToken =
2016-04-02 15:48:22 +00:00
while true:
case lex.buf[lex.bufpos]
2016-04-02 15:48:22 +00:00
of ' ', '\t': lex.bufpos.inc()
of '\r': lex.bufpos = lex.handleCR(lex.bufpos)
of '\l': lex.bufpos = lex.handleLF(lex.bufpos)
else: break
if lex.buf[lex.bufpos] == EndOfFile: return noToken
case lex.buf[lex.bufpos]
2016-12-05 18:22:51 +00:00
of ':', '"', '\'', '|', '>':
2016-04-02 15:48:22 +00:00
let t = if lex.buf[lex.bufpos] == ':': colonContent else: quotContent
lex.content = ""
lex.bufpos.inc()
while true:
case lex.buf[lex.bufpos]
of EndOfFile: break
of '\c':
lex.bufpos = lex.handleCR(lex.bufpos)
break
of '\l':
lex.bufpos = lex.handleLF(lex.bufpos)
break
of '\\':
lex.bufpos.inc()
2016-04-02 15:48:22 +00:00
case lex.buf[lex.bufpos]
of 'n': lex.content.add('\l')
of 'r': lex.content.add('\r')
of '0': lex.content.add('\0')
of 'b': lex.content.add('\b')
of 't': lex.content.add('\t')
of '\\': lex.content.add('\\')
else: raise newException(EventStreamError,
2016-04-02 15:48:22 +00:00
"Unknown escape character: " & lex.buf[lex.bufpos])
else: lex.content.add(lex.buf[lex.bufpos])
lex.bufpos.inc()
result = t
of '<':
lex.content = ""
lex.bufpos.inc()
while lex.buf[lex.bufpos] != '>':
lex.content.add(lex.buf[lex.bufpos])
lex.bufpos.inc()
if lex.buf[lex.bufpos] == EndOfFile:
raise newException(EventStreamError, "Unclosed tag URI!")
result = chevTag
lex.bufpos.inc()
of '&':
lex.content = ""
lex.bufpos.inc()
while lex.buf[lex.bufpos] notin {' ', '\t', '\r', '\l', EndOfFile}:
lex.content.add(lex.buf[lex.bufpos])
lex.bufpos.inc()
result = andAnchor
2016-12-05 18:22:51 +00:00
of '*':
lex.content = ""
lex.bufpos.inc()
while lex.buf[lex.bufpos] notin {' ', '\t', '\r', '\l', EndOfFile}:
lex.content.add(lex.buf[lex.bufpos])
lex.bufpos.inc()
result = starAnchor
2016-04-02 15:48:22 +00:00
else:
lex.content = ""
while lex.buf[lex.bufpos] notin {' ', '\t', '\r', '\l', EndOfFile}:
lex.content.add(lex.buf[lex.bufpos])
lex.bufpos.inc()
case lex.content
of "+STR": result = plusStr
of "-STR": result = minusStr
of "+DOC": result = plusDoc
of "-DOC": result = minusDoc
of "+MAP": result = plusMap
of "-MAP": result = minusMap
of "+SEQ": result = plusSeq
of "-SEQ": result = minusSeq
of "=VAL": result = eqVal
of "=ALI": result = eqAli
2016-12-05 18:22:51 +00:00
of "---": result = explDirEnd
of "...": result = explDocEnd
2016-04-02 15:48:22 +00:00
else: raise newException(EventStreamError, "Invalid token: " & lex.content)
template assertInStream() {.dirty.} =
2016-04-02 15:48:22 +00:00
if streamPos != inStream:
raise newException(EventStreamError, "Missing +STR")
template assertInEvent(name: string) {.dirty.} =
2016-04-02 15:48:22 +00:00
if not inEvent:
raise newException(EventStreamError, "Illegal token: " & name)
template yieldEvent() {.dirty.} =
2016-04-02 15:48:22 +00:00
if inEvent:
yield curEvent
inEvent = false
template setTag(t: TagId) {.dirty.} =
2016-04-02 15:48:22 +00:00
case curEvent.kind
of yamlStartSeq: curEvent.seqTag = t
of yamlStartMap: curEvent.mapTag = t
of yamlScalar: curEvent.scalarTag = t
else: discard
template setAnchor(a: AnchorId) {.dirty.} =
2016-04-02 15:48:22 +00:00
case curEvent.kind
of yamlStartSeq: curEvent.seqAnchor = a
of yamlStartMap: curEvent.mapAnchor = a
of yamlScalar: curEvent.scalarAnchor = a
of yamlAlias: curEvent.aliasTarget = a
else: discard
template curTag(): TagId =
2016-04-02 15:48:22 +00:00
var foo: TagId
case curEvent.kind
of yamlStartSeq: foo = curEvent.seqTag
of yamlStartMap: foo = curEvent.mapTag
of yamlScalar: foo = curEvent.scalarTag
else: raise newException(EventStreamError,
$curEvent.kind & " may not have a tag")
foo
template setCurTag(val: TagId) =
2016-04-02 15:48:22 +00:00
case curEvent.kind
of yamlStartSeq: curEvent.seqTag = val
of yamlStartMap: curEvent.mapTag = val
of yamlScalar: curEvent.scalarTag = val
else: raise newException(EventStreamError,
$curEvent.kind & " may not have a tag")
template curAnchor(): AnchorId =
2016-04-02 15:48:22 +00:00
var foo: AnchorId
case curEvent.kind
of yamlStartSeq: foo = curEvent.seqAnchor
of yamlStartMap: foo = curEvent.mapAnchor
of yamlScalar: foo = curEvent.scalarAnchor
of yamlAlias: foo = curEvent.aliasTarget
else: raise newException(EventStreamError,
$curEvent.kind & "may not have an anchor")
foo
template setCurAnchor(val: AnchorId) =
2016-04-02 15:48:22 +00:00
case curEvent.kind
of yamlStartSeq: curEvent.seqAnchor = val
of yamlStartMap: curEvent.mapAnchor = val
of yamlScalar: curEvent.scalarAnchor = val
of yamlAlias: curEvent.aliasTarget = val
else: raise newException(EventStreamError,
$curEvent.kind & " may not have an anchor")
2016-09-20 19:53:38 +00:00
template eventStart(k: YamlStreamEventKind) {.dirty.} =
2016-04-02 15:48:22 +00:00
assertInStream()
yieldEvent()
curEvent = YamlStreamEvent(kind: k)
2016-04-02 15:48:22 +00:00
setTag(yTagQuestionMark)
setAnchor(yAnchorNone)
inEvent = true
proc parseEventStream*(input: Stream, tagLib: TagLibrary): YamlStream =
2016-04-02 15:48:22 +00:00
var backend = iterator(): YamlStreamEvent =
var lex: EventLexer
lex.open(input)
var
inEvent = false
curEvent: YamlStreamEvent
streamPos: StreamPos = beforeStream
2016-04-02 15:48:22 +00:00
anchors = initTable[string, AnchorId]()
nextAnchorId = 0.AnchorId
while lex.buf[lex.bufpos] != EndOfFile:
let token = lex.nextToken()
case token
of plusStr:
if streamPos != beforeStream:
raise newException(EventStreamError, "Illegal +STR")
streamPos = inStream
of minusStr:
if streamPos != inStream:
raise newException(EventStreamError, "Illegal -STR")
if inEvent: yield curEvent
inEvent = false
streamPos = afterStream
of plusDoc: eventStart(yamlStartDoc)
of minusDoc: eventStart(yamlEndDoc)
of plusMap: eventStart(yamlStartMap)
of minusMap: eventStart(yamlEndMap)
of plusSeq: eventStart(yamlStartSeq)
of minusSeq: eventStart(yamlEndSeq)
of eqVal: eventStart(yamlScalar)
of eqAli: eventStart(yamlAlias)
of chevTag:
assertInEvent("tag")
if curTag() != yTagQuestionMark:
raise newException(EventStreamError,
"Duplicate tag in " & $curEvent.kind)
try:
setCurTag(tagLib.tags[lex.content])
except KeyError: setCurTag(tagLib.registerUri(lex.content))
of andAnchor:
assertInEvent("anchor")
if curAnchor() != yAnchorNone:
raise newException(EventStreamError,
"Duplicate anchor in " & $curEvent.kind)
2016-12-05 18:22:51 +00:00
anchors[lex.content] = nextAnchorId
setCurAnchor(nextAnchorId)
nextAnchorId = (AnchorId)(((int)nextAnchorId) + 1)
of starAnchor:
assertInEvent("alias")
if curEvent.kind != yamlAlias:
raise newException(EventStreamError, "Unexpected alias: " &
escape(lex.content))
elif curEvent.aliasTarget != yAnchorNone:
raise newException(EventStreamError, "Duplicate alias target: " &
escape(lex.content))
2016-04-02 15:48:22 +00:00
else:
2016-12-05 18:22:51 +00:00
curEvent.aliasTarget = anchors[lex.content]
2016-04-02 15:48:22 +00:00
of quotContent:
assertInEvent("scalar content")
if curTag() == yTagQuestionMark: setCurTag(yTagExclamationMark)
if curEvent.kind != yamlScalar:
raise newException(EventStreamError,
"scalar content in non-scalar tag")
curEvent.scalarContent = lex.content
of colonContent:
assertInEvent("scalar content")
curEvent.scalarContent = lex.content
if curEvent.kind != yamlScalar:
raise newException(EventStreamError,
"scalar content in non-scalar tag")
2016-12-05 18:22:51 +00:00
of explDirEnd:
assertInEvent("explicit directives end")
if curEvent.kind != yamlStartDoc:
raise newException(EventStreamError,
"Unexpected explicit directives end")
of explDocEnd:
if curEvent.kind != yamlEndDoc:
raise newException(EventStreamError,
"Unexpected explicit document end")
2016-04-02 15:48:22 +00:00
of noToken: discard
result = initYamlStream(backend)