parse.scm 18 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353
  1. ;;; ECMAScript for Guile
  2. ;; Copyright (C) 2009, 2010 Free Software Foundation, Inc.
  3. ;;;; This library is free software; you can redistribute it and/or
  4. ;;;; modify it under the terms of the GNU Lesser General Public
  5. ;;;; License as published by the Free Software Foundation; either
  6. ;;;; version 3 of the License, or (at your option) any later version.
  7. ;;;;
  8. ;;;; This library is distributed in the hope that it will be useful,
  9. ;;;; but WITHOUT ANY WARRANTY; without even the implied warranty of
  10. ;;;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
  11. ;;;; Lesser General Public License for more details.
  12. ;;;;
  13. ;;;; You should have received a copy of the GNU Lesser General Public
  14. ;;;; License along with this library; if not, write to the Free Software
  15. ;;;; Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
  16. ;;; Code:
  17. (define-module (language ecmascript parse)
  18. #:use-module (system base lalr)
  19. #:use-module (language ecmascript tokenize)
  20. #:export (read-ecmascript read-ecmascript/1 make-parser))
  21. (define* (syntax-error message #:optional token)
  22. (if (lexical-token? token)
  23. (throw 'syntax-error #f message
  24. (and=> (lexical-token-source token)
  25. source-location->source-properties)
  26. (or (lexical-token-value token)
  27. (lexical-token-category token))
  28. #f)
  29. (throw 'syntax-error #f message #f token #f)))
  30. (define (read-ecmascript port)
  31. (let ((parse (make-parser)))
  32. (parse (make-tokenizer port) syntax-error)))
  33. (define (read-ecmascript/1 port)
  34. (let ((parse (make-parser)))
  35. (parse (make-tokenizer/1 port) syntax-error)))
  36. (define *eof-object*
  37. (call-with-input-string "" read-char))
  38. (define (make-parser)
  39. ;; Return a fresh ECMAScript parser. Parsers produced by `lalr-scm' are now
  40. ;; stateful (e.g., they won't invoke the tokenizer any more once it has
  41. ;; returned `*eoi*'), hence the need to instantiate new parsers.
  42. (lalr-parser
  43. ;; terminal (i.e. input) token types
  44. (lbrace rbrace lparen rparen lbracket rbracket dot semicolon comma <
  45. > <= >= == != === !== + - * % ++ -- << >> >>> & bor ^ ! ~ && or ?
  46. colon = += -= *= %= <<= >>= >>>= &= bor= ^= / /=
  47. break else new var case finally return void catch for switch while
  48. continue function this with default if throw delete in try do
  49. instanceof typeof null true false
  50. Identifier StringLiteral NumericLiteral RegexpLiteral)
  51. (Program (SourceElements) : $1
  52. (*eoi*) : *eof-object*)
  53. ;;
  54. ;; Verily, here we define statements. Expressions are defined
  55. ;; afterwards.
  56. ;;
  57. (SourceElement (Statement) : $1
  58. (FunctionDeclaration) : $1)
  59. (FunctionDeclaration (function Identifier lparen rparen lbrace FunctionBody rbrace) : `(var (,$2 (lambda () ,$6)))
  60. (function Identifier lparen FormalParameterList rparen lbrace FunctionBody rbrace) : `(var (,$2 (lambda ,$4 ,$7))))
  61. (FunctionExpression (function lparen rparen lbrace FunctionBody rbrace) : `(lambda () ,$5)
  62. (function Identifier lparen rparen lbrace FunctionBody rbrace) : `(lambda () ,$6)
  63. (function lparen FormalParameterList rparen lbrace FunctionBody rbrace) : `(lambda ,$3 ,$6)
  64. (function Identifier lparen FormalParameterList rparen lbrace FunctionBody rbrace) : `(lambda ,$4 ,$7))
  65. (FormalParameterList (Identifier) : `(,$1)
  66. (FormalParameterList comma Identifier) : `(,@$1 ,$3))
  67. (SourceElements (SourceElement) : $1
  68. (SourceElements SourceElement) : (if (and (pair? $1) (eq? (car $1) 'begin))
  69. `(begin ,@(cdr $1) ,$2)
  70. `(begin ,$1 ,$2)))
  71. (FunctionBody (SourceElements) : $1
  72. () : '(begin))
  73. (Statement (Block) : $1
  74. (VariableStatement) : $1
  75. (EmptyStatement) : $1
  76. (ExpressionStatement) : $1
  77. (IfStatement) : $1
  78. (IterationStatement) : $1
  79. (ContinueStatement) : $1
  80. (BreakStatement) : $1
  81. (ReturnStatement) : $1
  82. (WithStatement) : $1
  83. (LabelledStatement) : $1
  84. (SwitchStatement) : $1
  85. (ThrowStatement) : $1
  86. (TryStatement) : $1)
  87. (Block (lbrace StatementList rbrace) : `(block ,$2))
  88. (StatementList (Statement) : $1
  89. (StatementList Statement) : (if (and (pair? $1) (eq? (car $1) 'begin))
  90. `(begin ,@(cdr $1) ,$2)
  91. `(begin ,$1 ,$2)))
  92. (VariableStatement (var VariableDeclarationList) : `(var ,@$2))
  93. (VariableDeclarationList (VariableDeclaration) : `(,$1)
  94. (VariableDeclarationList comma VariableDeclaration) : `(,@$1 ,$2))
  95. (VariableDeclarationListNoIn (VariableDeclarationNoIn) : `(,$1)
  96. (VariableDeclarationListNoIn comma VariableDeclarationNoIn) : `(,@$1 ,$2))
  97. (VariableDeclaration (Identifier) : `(,$1)
  98. (Identifier Initialiser) : `(,$1 ,$2))
  99. (VariableDeclarationNoIn (Identifier) : `(,$1)
  100. (Identifier Initialiser) : `(,$1 ,$2))
  101. (Initialiser (= AssignmentExpression) : $2)
  102. (InitialiserNoIn (= AssignmentExpressionNoIn) : $2)
  103. (EmptyStatement (semicolon) : '(begin))
  104. (ExpressionStatement (Expression semicolon) : $1)
  105. (IfStatement (if lparen Expression rparen Statement else Statement) : `(if ,$3 ,$5 ,$7)
  106. (if lparen Expression rparen Statement) : `(if ,$3 ,$5))
  107. (IterationStatement (do Statement while lparen Expression rparen semicolon) : `(do ,$2 ,$5)
  108. (while lparen Expression rparen Statement) : `(while ,$3 ,$5)
  109. (for lparen semicolon semicolon rparen Statement) : `(for #f #f #f ,$6)
  110. (for lparen semicolon semicolon Expression rparen Statement) : `(for #f #f ,$5 ,$7)
  111. (for lparen semicolon Expression semicolon rparen Statement) : `(for #f ,$4 #f ,$7)
  112. (for lparen semicolon Expression semicolon Expression rparen Statement) : `(for #f ,$4 ,$6 ,$8)
  113. (for lparen ExpressionNoIn semicolon semicolon rparen Statement) : `(for ,$3 #f #f ,$7)
  114. (for lparen ExpressionNoIn semicolon semicolon Expression rparen Statement) : `(for ,$3 #f ,$6 ,$8)
  115. (for lparen ExpressionNoIn semicolon Expression semicolon rparen Statement) : `(for ,$3 ,$5 #f ,$8)
  116. (for lparen ExpressionNoIn semicolon Expression semicolon Expression rparen Statement) : `(for ,$3 ,$5 ,$7 ,$9)
  117. (for lparen var VariableDeclarationListNoIn semicolon semicolon rparen Statement) : `(for (var ,@$4) #f #f ,$8)
  118. (for lparen var VariableDeclarationListNoIn semicolon semicolon Expression rparen Statement) : `(for (var ,@$4) #f ,$7 ,$9)
  119. (for lparen var VariableDeclarationListNoIn semicolon Expression semicolon rparen Statement) : `(for (var ,@$4) ,$6 #f ,$9)
  120. (for lparen var VariableDeclarationListNoIn semicolon Expression semicolon Expression rparen Statement) : `(for (var ,@$4) ,$6 ,$8 ,$10)
  121. (for lparen LeftHandSideExpression in Expression rparen Statement) : `(for-in ,$3 ,$5 ,$7)
  122. (for lparen var VariableDeclarationNoIn in Expression rparen Statement) : `(begin (var ,$4) (for-in (ref ,@$4) ,$6 ,$8)))
  123. (ContinueStatement (continue Identifier semicolon) : `(continue ,$2)
  124. (continue semicolon) : `(continue))
  125. (BreakStatement (break Identifier semicolon) : `(break ,$2)
  126. (break semicolon) : `(break))
  127. (ReturnStatement (return Expression semicolon) : `(return ,$2)
  128. (return semicolon) : `(return))
  129. (WithStatement (with lparen Expression rparen Statement) : `(with ,$3 ,$5))
  130. (SwitchStatement (switch lparen Expression rparen CaseBlock) : `(switch ,$3 ,@$5))
  131. (CaseBlock (lbrace rbrace) : '()
  132. (lbrace CaseClauses rbrace) : $2
  133. (lbrace CaseClauses DefaultClause rbrace) : `(,@$2 ,@$3)
  134. (lbrace DefaultClause rbrace) : `(,$2)
  135. (lbrace DefaultClause CaseClauses rbrace) : `(,@$2 ,@$3))
  136. (CaseClauses (CaseClause) : `(,$1)
  137. (CaseClauses CaseClause) : `(,@$1 ,$2))
  138. (CaseClause (case Expression colon) : `(case ,$2)
  139. (case Expression colon StatementList) : `(case ,$2 ,$4))
  140. (DefaultClause (default colon) : `(default)
  141. (default colon StatementList) : `(default ,$3))
  142. (LabelledStatement (Identifier colon Statement) : `(label ,$1 ,$3))
  143. (ThrowStatement (throw Expression semicolon) : `(throw ,$2))
  144. (TryStatement (try Block Catch) : `(try ,$2 ,$3 #f)
  145. (try Block Finally) : `(try ,$2 #f ,$3)
  146. (try Block Catch Finally) : `(try ,$2 ,$3 ,$4))
  147. (Catch (catch lparen Identifier rparen Block) : `(catch ,$3 ,$5))
  148. (Finally (finally Block) : `(finally ,$2))
  149. ;;
  150. ;; As promised, expressions. We build up to Expression bottom-up, so
  151. ;; as to get operator precedence right.
  152. ;;
  153. (PrimaryExpression (this) : 'this
  154. (null) : 'null
  155. (true) : 'true
  156. (false) : 'false
  157. (Identifier) : `(ref ,$1)
  158. (StringLiteral) : `(string ,$1)
  159. (RegexpLiteral) : `(regexp ,$1)
  160. (NumericLiteral) : `(number ,$1)
  161. (dot NumericLiteral) : `(number ,(string->number (string-append "." (number->string $2))))
  162. (ArrayLiteral) : $1
  163. (ObjectLiteral) : $1
  164. (lparen Expression rparen) : $2)
  165. (ArrayLiteral (lbracket rbracket) : '(array)
  166. (lbracket Elision rbracket) : '(array ,@$2)
  167. (lbracket ElementList rbracket) : `(array ,@$2)
  168. (lbracket ElementList comma rbracket) : `(array ,@$2)
  169. (lbracket ElementList comma Elision rbracket) : `(array ,@$2))
  170. (ElementList (AssignmentExpression) : `(,$1)
  171. (Elision AssignmentExpression) : `(,@$1 ,$2)
  172. (ElementList comma AssignmentExpression) : `(,@$1 ,$3)
  173. (ElementList comma Elision AssignmentExpression) : `(,@$1 ,@$3 ,$4))
  174. (Elision (comma) : '((number 0))
  175. (Elision comma) : `(,@$1 (number 0)))
  176. (ObjectLiteral (lbrace rbrace) : `(object)
  177. (lbrace PropertyNameAndValueList rbrace) : `(object ,@$2))
  178. (PropertyNameAndValueList (PropertyName colon AssignmentExpression) : `((,$1 ,$3))
  179. (PropertyNameAndValueList comma PropertyName colon AssignmentExpression) : `(,@$1 (,$3 ,$5)))
  180. (PropertyName (Identifier) : $1
  181. (StringLiteral) : (string->symbol $1)
  182. (NumericLiteral) : $1)
  183. (MemberExpression (PrimaryExpression) : $1
  184. (FunctionExpression) : $1
  185. (MemberExpression lbracket Expression rbracket) : `(aref ,$1 ,$3)
  186. (MemberExpression dot Identifier) : `(pref ,$1 ,$3)
  187. (new MemberExpression Arguments) : `(new ,$2 ,$3))
  188. (NewExpression (MemberExpression) : $1
  189. (new NewExpression) : `(new ,$2 ()))
  190. (CallExpression (MemberExpression Arguments) : `(call ,$1 ,$2)
  191. (CallExpression Arguments) : `(call ,$1 ,$2)
  192. (CallExpression lbracket Expression rbracket) : `(aref ,$1 ,$3)
  193. (CallExpression dot Identifier) : `(pref ,$1 ,$3))
  194. (Arguments (lparen rparen) : '()
  195. (lparen ArgumentList rparen) : $2)
  196. (ArgumentList (AssignmentExpression) : `(,$1)
  197. (ArgumentList comma AssignmentExpression) : `(,@$1 ,$3))
  198. (LeftHandSideExpression (NewExpression) : $1
  199. (CallExpression) : $1)
  200. (PostfixExpression (LeftHandSideExpression) : $1
  201. (LeftHandSideExpression ++) : `(postinc ,$1)
  202. (LeftHandSideExpression --) : `(postdec ,$1))
  203. (UnaryExpression (PostfixExpression) : $1
  204. (delete UnaryExpression) : `(delete ,$2)
  205. (void UnaryExpression) : `(void ,$2)
  206. (typeof UnaryExpression) : `(typeof ,$2)
  207. (++ UnaryExpression) : `(preinc ,$2)
  208. (-- UnaryExpression) : `(predec ,$2)
  209. (+ UnaryExpression) : `(+ ,$2)
  210. (- UnaryExpression) : `(- ,$2)
  211. (~ UnaryExpression) : `(~ ,$2)
  212. (! UnaryExpression) : `(! ,$2))
  213. (MultiplicativeExpression (UnaryExpression) : $1
  214. (MultiplicativeExpression * UnaryExpression) : `(* ,$1 ,$3)
  215. (MultiplicativeExpression / UnaryExpression) : `(/ ,$1 ,$3)
  216. (MultiplicativeExpression % UnaryExpression) : `(% ,$1 ,$3))
  217. (AdditiveExpression (MultiplicativeExpression) : $1
  218. (AdditiveExpression + MultiplicativeExpression) : `(+ ,$1 ,$3)
  219. (AdditiveExpression - MultiplicativeExpression) : `(- ,$1 ,$3))
  220. (ShiftExpression (AdditiveExpression) : $1
  221. (ShiftExpression << MultiplicativeExpression) : `(<< ,$1 ,$3)
  222. (ShiftExpression >> MultiplicativeExpression) : `(>> ,$1 ,$3)
  223. (ShiftExpression >>> MultiplicativeExpression) : `(>>> ,$1 ,$3))
  224. (RelationalExpression (ShiftExpression) : $1
  225. (RelationalExpression < ShiftExpression) : `(< ,$1 ,$3)
  226. (RelationalExpression > ShiftExpression) : `(> ,$1 ,$3)
  227. (RelationalExpression <= ShiftExpression) : `(<= ,$1 ,$3)
  228. (RelationalExpression >= ShiftExpression) : `(>= ,$1 ,$3)
  229. (RelationalExpression instanceof ShiftExpression) : `(instanceof ,$1 ,$3)
  230. (RelationalExpression in ShiftExpression) : `(in ,$1 ,$3))
  231. (RelationalExpressionNoIn (ShiftExpression) : $1
  232. (RelationalExpressionNoIn < ShiftExpression) : `(< ,$1 ,$3)
  233. (RelationalExpressionNoIn > ShiftExpression) : `(> ,$1 ,$3)
  234. (RelationalExpressionNoIn <= ShiftExpression) : `(<= ,$1 ,$3)
  235. (RelationalExpressionNoIn >= ShiftExpression) : `(>= ,$1 ,$3)
  236. (RelationalExpressionNoIn instanceof ShiftExpression) : `(instanceof ,$1 ,$3))
  237. (EqualityExpression (RelationalExpression) : $1
  238. (EqualityExpression == RelationalExpression) : `(== ,$1 ,$3)
  239. (EqualityExpression != RelationalExpression) : `(!= ,$1 ,$3)
  240. (EqualityExpression === RelationalExpression) : `(=== ,$1 ,$3)
  241. (EqualityExpression !== RelationalExpression) : `(!== ,$1 ,$3))
  242. (EqualityExpressionNoIn (RelationalExpressionNoIn) : $1
  243. (EqualityExpressionNoIn == RelationalExpressionNoIn) : `(== ,$1 ,$3)
  244. (EqualityExpressionNoIn != RelationalExpressionNoIn) : `(!= ,$1 ,$3)
  245. (EqualityExpressionNoIn === RelationalExpressionNoIn) : `(=== ,$1 ,$3)
  246. (EqualityExpressionNoIn !== RelationalExpressionNoIn) : `(!== ,$1 ,$3))
  247. (BitwiseANDExpression (EqualityExpression) : $1
  248. (BitwiseANDExpression & EqualityExpression) : `(& ,$1 ,$3))
  249. (BitwiseANDExpressionNoIn (EqualityExpressionNoIn) : $1
  250. (BitwiseANDExpressionNoIn & EqualityExpressionNoIn) : `(& ,$1 ,$3))
  251. (BitwiseXORExpression (BitwiseANDExpression) : $1
  252. (BitwiseXORExpression ^ BitwiseANDExpression) : `(^ ,$1 ,$3))
  253. (BitwiseXORExpressionNoIn (BitwiseANDExpressionNoIn) : $1
  254. (BitwiseXORExpressionNoIn ^ BitwiseANDExpressionNoIn) : `(^ ,$1 ,$3))
  255. (BitwiseORExpression (BitwiseXORExpression) : $1
  256. (BitwiseORExpression bor BitwiseXORExpression) : `(bor ,$1 ,$3))
  257. (BitwiseORExpressionNoIn (BitwiseXORExpressionNoIn) : $1
  258. (BitwiseORExpressionNoIn bor BitwiseXORExpressionNoIn) : `(bor ,$1 ,$3))
  259. (LogicalANDExpression (BitwiseORExpression) : $1
  260. (LogicalANDExpression && BitwiseORExpression) : `(and ,$1 ,$3))
  261. (LogicalANDExpressionNoIn (BitwiseORExpressionNoIn) : $1
  262. (LogicalANDExpressionNoIn && BitwiseORExpressionNoIn) : `(and ,$1 ,$3))
  263. (LogicalORExpression (LogicalANDExpression) : $1
  264. (LogicalORExpression or LogicalANDExpression) : `(or ,$1 ,$3))
  265. (LogicalORExpressionNoIn (LogicalANDExpressionNoIn) : $1
  266. (LogicalORExpressionNoIn or LogicalANDExpressionNoIn) : `(or ,$1 ,$3))
  267. (ConditionalExpression (LogicalORExpression) : $1
  268. (LogicalORExpression ? AssignmentExpression colon AssignmentExpression) : `(if ,$1 ,$3 ,$5))
  269. (ConditionalExpressionNoIn (LogicalORExpressionNoIn) : $1
  270. (LogicalORExpressionNoIn ? AssignmentExpressionNoIn colon AssignmentExpressionNoIn) : `(if ,$1 ,$3 ,$5))
  271. (AssignmentExpression (ConditionalExpression) : $1
  272. (LeftHandSideExpression AssignmentOperator AssignmentExpression) : `(,$2 ,$1 ,$3))
  273. (AssignmentExpressionNoIn (ConditionalExpressionNoIn) : $1
  274. (LeftHandSideExpression AssignmentOperator AssignmentExpressionNoIn) : `(,$2 ,$1 ,$3))
  275. (AssignmentOperator (=) : '=
  276. (*=) : '*=
  277. (/=) : '/=
  278. (%=) : '%=
  279. (+=) : '+=
  280. (-=) : '-=
  281. (<<=) : '<<=
  282. (>>=) : '>>=
  283. (>>>=) : '>>>=
  284. (&=) : '&=
  285. (^=) : '^=
  286. (bor=) : 'bor=)
  287. (Expression (AssignmentExpression) : $1
  288. (Expression comma AssignmentExpression) : `(begin ,$1 ,$3))
  289. (ExpressionNoIn (AssignmentExpressionNoIn) : $1
  290. (ExpressionNoIn comma AssignmentExpressionNoIn) : `(begin ,$1 ,$3))))