vmdef.nim 8.3 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262
  1. #
  2. #
  3. # The Nim Compiler
  4. # (c) Copyright 2013 Andreas Rumpf
  5. #
  6. # See the file "copying.txt", included in this
  7. # distribution, for details about the copyright.
  8. #
  9. ## This module contains the type definitions for the new evaluation engine.
  10. ## An instruction is 1-3 int32s in memory, it is a register based VM.
  11. import ast, idents, options, modulegraphs, lineinfos
  12. const
  13. byteExcess* = 128 # we use excess-K for immediates
  14. wordExcess* = 32768
  15. MaxLoopIterations* = 10_000_000 # max iterations of all loops
  16. type
  17. TRegister* = range[0..255]
  18. TDest* = range[-1 .. 255]
  19. TInstr* = distinct uint32
  20. TOpcode* = enum
  21. opcEof, # end of code
  22. opcRet, # return
  23. opcYldYoid, # yield with no value
  24. opcYldVal, # yield with a value
  25. opcAsgnInt,
  26. opcAsgnFloat,
  27. opcAsgnRef,
  28. opcAsgnComplex,
  29. opcCastIntToFloat32, # int and float must be of the same byte size
  30. opcCastIntToFloat64, # int and float must be of the same byte size
  31. opcCastFloatToInt32, # int and float must be of the same byte size
  32. opcCastFloatToInt64, # int and float must be of the same byte size
  33. opcFastAsgnComplex,
  34. opcNodeToReg,
  35. opcLdArr, # a = b[c]
  36. opcWrArr, # a[b] = c
  37. opcLdObj, # a = b.c
  38. opcWrObj, # a.b = c
  39. opcAddrReg,
  40. opcAddrNode,
  41. opcLdDeref,
  42. opcWrDeref,
  43. opcWrStrIdx,
  44. opcLdStrIdx, # a = b[c]
  45. opcAddInt,
  46. opcAddImmInt,
  47. opcSubInt,
  48. opcSubImmInt,
  49. opcLenSeq,
  50. opcLenStr,
  51. opcIncl, opcInclRange, opcExcl, opcCard, opcMulInt, opcDivInt, opcModInt,
  52. opcAddFloat, opcSubFloat, opcMulFloat, opcDivFloat,
  53. opcShrInt, opcShlInt, opcAshrInt,
  54. opcBitandInt, opcBitorInt, opcBitxorInt, opcAddu, opcSubu, opcMulu,
  55. opcDivu, opcModu, opcEqInt, opcLeInt, opcLtInt, opcEqFloat,
  56. opcLeFloat, opcLtFloat, opcLeu, opcLtu,
  57. opcEqRef, opcEqNimNode, opcSameNodeType,
  58. opcXor, opcNot, opcUnaryMinusInt, opcUnaryMinusFloat, opcBitnotInt,
  59. opcEqStr, opcLeStr, opcLtStr, opcEqSet, opcLeSet, opcLtSet,
  60. opcMulSet, opcPlusSet, opcMinusSet, opcSymdiffSet, opcConcatStr,
  61. opcContainsSet, opcRepr, opcSetLenStr, opcSetLenSeq,
  62. opcIsNil, opcOf, opcIs,
  63. opcSubStr, opcParseFloat, opcConv, opcCast,
  64. opcQuit, opcInvalidField,
  65. opcNarrowS, opcNarrowU,
  66. opcSignExtend,
  67. opcAddStrCh,
  68. opcAddStrStr,
  69. opcAddSeqElem,
  70. opcRangeChck,
  71. opcNAdd,
  72. opcNAddMultiple,
  73. opcNKind,
  74. opcNSymKind,
  75. opcNIntVal,
  76. opcNFloatVal,
  77. opcNSymbol,
  78. opcNIdent,
  79. opcNGetType,
  80. opcNStrVal,
  81. opcNSigHash,
  82. opcNGetSize,
  83. opcNSetIntVal,
  84. opcNSetFloatVal, opcNSetSymbol, opcNSetIdent, opcNSetType, opcNSetStrVal,
  85. opcNNewNimNode, opcNCopyNimNode, opcNCopyNimTree, opcNDel, opcGenSym,
  86. opcNccValue, opcNccInc, opcNcsAdd, opcNcsIncl, opcNcsLen, opcNcsAt,
  87. opcNctPut, opcNctLen, opcNctGet, opcNctHasNext, opcNctNext, opcNodeId,
  88. opcSlurp,
  89. opcGorge,
  90. opcParseExprToAst,
  91. opcParseStmtToAst,
  92. opcQueryErrorFlag,
  93. opcNError,
  94. opcNWarning,
  95. opcNHint,
  96. opcNGetLineInfo, opcNSetLineInfo,
  97. opcEqIdent,
  98. opcStrToIdent,
  99. opcGetImpl,
  100. opcGetImplTransf
  101. opcEcho,
  102. opcIndCall, # dest = call regStart, n; where regStart = fn, arg1, ...
  103. opcIndCallAsgn, # dest = call regStart, n; where regStart = fn, arg1, ...
  104. opcRaise,
  105. opcNChild,
  106. opcNSetChild,
  107. opcCallSite,
  108. opcNewStr,
  109. opcTJmp, # jump Bx if A != 0
  110. opcFJmp, # jump Bx if A == 0
  111. opcJmp, # jump Bx
  112. opcJmpBack, # jump Bx; resulting from a while loop
  113. opcBranch, # branch for 'case'
  114. opcTry,
  115. opcExcept,
  116. opcFinally,
  117. opcFinallyEnd,
  118. opcNew,
  119. opcNewSeq,
  120. opcLdNull, # dest = nullvalue(types[Bx])
  121. opcLdNullReg,
  122. opcLdConst, # dest = constants[Bx]
  123. opcAsgnConst, # dest = copy(constants[Bx])
  124. opcLdGlobal, # dest = globals[Bx]
  125. opcLdGlobalAddr, # dest = addr(globals[Bx])
  126. opcLdImmInt, # dest = immediate value
  127. opcNBindSym, opcNDynBindSym,
  128. opcSetType, # dest.typ = types[Bx]
  129. opcTypeTrait,
  130. opcMarshalLoad, opcMarshalStore,
  131. opcSymOwner,
  132. opcSymIsInstantiationOf
  133. TBlock* = object
  134. label*: PSym
  135. fixups*: seq[TPosition]
  136. TEvalMode* = enum ## reason for evaluation
  137. emRepl, ## evaluate because in REPL mode
  138. emConst, ## evaluate for 'const' according to spec
  139. emOptimize, ## evaluate for optimization purposes (same as
  140. ## emConst?)
  141. emStaticExpr, ## evaluate for enforced compile time eval
  142. ## ('static' context)
  143. emStaticStmt ## 'static' as an expression
  144. TSandboxFlag* = enum ## what the evaluation engine should allow
  145. allowCast, ## allow unsafe language feature: 'cast'
  146. allowInfiniteLoops ## allow endless loops
  147. TSandboxFlags* = set[TSandboxFlag]
  148. TSlotKind* = enum # We try to re-use slots in a smart way to
  149. # minimize allocations; however the VM supports arbitrary
  150. # temporary slot usage. This is required for the parameter
  151. # passing implementation.
  152. slotEmpty, # slot is unused
  153. slotFixedVar, # slot is used for a fixed var/result (requires copy then)
  154. slotFixedLet, # slot is used for a fixed param/let
  155. slotTempUnknown, # slot but type unknown (argument of proc call)
  156. slotTempInt, # some temporary int
  157. slotTempFloat, # some temporary float
  158. slotTempStr, # some temporary string
  159. slotTempComplex, # some complex temporary (s.node field is used)
  160. slotTempPerm # slot is temporary but permanent (hack)
  161. PProc* = ref object
  162. blocks*: seq[TBlock] # blocks; temp data structure
  163. sym*: PSym
  164. slots*: array[TRegister, tuple[inUse: bool, kind: TSlotKind]]
  165. maxSlots*: int
  166. VmArgs* = object
  167. ra*, rb*, rc*: Natural
  168. slots*: pointer
  169. currentException*: PNode
  170. currentLineInfo*: TLineInfo
  171. VmCallback* = proc (args: VmArgs) {.closure.}
  172. PCtx* = ref TCtx
  173. TCtx* = object of TPassContext # code gen context
  174. code*: seq[TInstr]
  175. debug*: seq[TLineInfo] # line info for every instruction; kept separate
  176. # to not slow down interpretation
  177. globals*: PNode #
  178. constants*: PNode # constant data
  179. types*: seq[PType] # some instructions reference types (e.g. 'except')
  180. currentExceptionA*, currentExceptionB*: PNode
  181. exceptionInstr*: int # index of instruction that raised the exception
  182. prc*: PProc
  183. module*: PSym
  184. callsite*: PNode
  185. mode*: TEvalMode
  186. features*: TSandboxFlags
  187. traceActive*: bool
  188. loopIterations*: int
  189. comesFromHeuristic*: TLineInfo # Heuristic for better macro stack traces
  190. callbacks*: seq[tuple[key: string, value: VmCallback]]
  191. errorFlag*: string
  192. cache*: IdentCache
  193. config*: ConfigRef
  194. graph*: ModuleGraph
  195. oldErrorCount*: int
  196. TPosition* = distinct int
  197. PEvalContext* = PCtx
  198. proc newCtx*(module: PSym; cache: IdentCache; g: ModuleGraph): PCtx =
  199. PCtx(code: @[], debug: @[],
  200. globals: newNode(nkStmtListExpr), constants: newNode(nkStmtList), types: @[],
  201. prc: PProc(blocks: @[]), module: module, loopIterations: MaxLoopIterations,
  202. comesFromHeuristic: unknownLineInfo(), callbacks: @[], errorFlag: "",
  203. cache: cache, config: g.config, graph: g)
  204. proc refresh*(c: PCtx, module: PSym) =
  205. c.module = module
  206. c.prc = PProc(blocks: @[])
  207. c.loopIterations = MaxLoopIterations
  208. proc registerCallback*(c: PCtx; name: string; callback: VmCallback): int {.discardable.} =
  209. result = c.callbacks.len
  210. c.callbacks.add((name, callback))
  211. const
  212. firstABxInstr* = opcTJmp
  213. largeInstrs* = { # instructions which use 2 int32s instead of 1:
  214. opcSubStr, opcConv, opcCast, opcNewSeq, opcOf,
  215. opcMarshalLoad, opcMarshalStore}
  216. slotSomeTemp* = slotTempUnknown
  217. relativeJumps* = {opcTJmp, opcFJmp, opcJmp, opcJmpBack}
  218. # flag is used to signal opcSeqLen if node is NimNode.
  219. const nimNodeFlag* = 16
  220. template opcode*(x: TInstr): TOpcode = TOpcode(x.uint32 and 0xff'u32)
  221. template regA*(x: TInstr): TRegister = TRegister(x.uint32 shr 8'u32 and 0xff'u32)
  222. template regB*(x: TInstr): TRegister = TRegister(x.uint32 shr 16'u32 and 0xff'u32)
  223. template regC*(x: TInstr): TRegister = TRegister(x.uint32 shr 24'u32)
  224. template regBx*(x: TInstr): int = (x.uint32 shr 16'u32).int
  225. template jmpDiff*(x: TInstr): int = regBx(x) - wordExcess