mirror of
https://git.savannah.gnu.org/git/guile.git
synced 2025-04-30 11:50:28 +02:00
* module/language/ecmascript/tokenize.scm: Use `make-lexical-token' and related procedures instead of pairs as tokens passed to the parser. Pass source location information in the form of `source-location' objects. * module/language/ecmascript/parse.scm (read-ecmascript, read-ecmascript/1): Instantiate a new parser at each call. (parse-ecmascript): Rename to... (make-parser): ... this. Change `->' to `:' in the grammar syntax. * module/language/ecmascript/parse-lalr.scm: Remove. * module/Makefile.am (ECMASCRIPT_LANG_SOURCES): Remove `language/ecmascript/parse-lalr.scm'.
343 lines
18 KiB
Scheme
343 lines
18 KiB
Scheme
;;; ECMAScript for Guile
|
|
|
|
;; Copyright (C) 2009, 2010 Free Software Foundation, Inc.
|
|
|
|
;;;; This library is free software; you can redistribute it and/or
|
|
;;;; modify it under the terms of the GNU Lesser General Public
|
|
;;;; License as published by the Free Software Foundation; either
|
|
;;;; version 3 of the License, or (at your option) any later version.
|
|
;;;;
|
|
;;;; This library is distributed in the hope that it will be useful,
|
|
;;;; but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
;;;; MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the GNU
|
|
;;;; Lesser General Public License for more details.
|
|
;;;;
|
|
;;;; You should have received a copy of the GNU Lesser General Public
|
|
;;;; License along with this library; if not, write to the Free Software
|
|
;;;; Foundation, Inc., 51 Franklin Street, Fifth Floor, Boston, MA 02110-1301 USA
|
|
|
|
;;; Code:
|
|
|
|
(define-module (language ecmascript parse)
|
|
#:use-module (system base lalr)
|
|
#:use-module (language ecmascript tokenize)
|
|
#:export (read-ecmascript read-ecmascript/1 make-parser))
|
|
|
|
(define (syntax-error message . args)
|
|
(apply throw 'SyntaxError message args))
|
|
|
|
(define (read-ecmascript port)
|
|
(let ((parse (make-parser)))
|
|
(parse (make-tokenizer port) syntax-error)))
|
|
|
|
(define (read-ecmascript/1 port)
|
|
(let ((parse (make-parser)))
|
|
(parse (make-tokenizer/1 port) syntax-error)))
|
|
|
|
(define *eof-object*
|
|
(call-with-input-string "" read-char))
|
|
|
|
(define (make-parser)
|
|
;; Return a fresh ECMAScript parser. Parsers produced by `lalr-scm' are now
|
|
;; stateful (e.g., they won't invoke the tokenizer any more once it has
|
|
;; returned `*eoi*'), hence the need to instantiate new parsers.
|
|
|
|
(lalr-parser
|
|
;; terminal (i.e. input) token types
|
|
(lbrace rbrace lparen rparen lbracket rbracket dot semicolon comma <
|
|
> <= >= == != === !== + - * % ++ -- << >> >>> & bor ^ ! ~ && or ?
|
|
colon = += -= *= %= <<= >>= >>>= &= bor= ^= / /=
|
|
|
|
break else new var case finally return void catch for switch while
|
|
continue function this with default if throw delete in try do
|
|
instanceof typeof null true false
|
|
|
|
Identifier StringLiteral NumericLiteral RegexpLiteral)
|
|
|
|
|
|
(Program (SourceElements) : $1
|
|
(*eoi*) : *eof-object*)
|
|
|
|
;;
|
|
;; Verily, here we define statements. Expressions are defined
|
|
;; afterwards.
|
|
;;
|
|
|
|
(SourceElement (Statement) : $1
|
|
(FunctionDeclaration) : $1)
|
|
|
|
(FunctionDeclaration (function Identifier lparen rparen lbrace FunctionBody rbrace) : `(var (,$2 (lambda () ,$6)))
|
|
(function Identifier lparen FormalParameterList rparen lbrace FunctionBody rbrace) : `(var (,$2 (lambda ,$4 ,$7))))
|
|
(FunctionExpression (function lparen rparen lbrace FunctionBody rbrace) : `(lambda () ,$5)
|
|
(function Identifier lparen rparen lbrace FunctionBody rbrace) : `(lambda () ,$6)
|
|
(function lparen FormalParameterList rparen lbrace FunctionBody rbrace) : `(lambda ,$3 ,$6)
|
|
(function Identifier lparen FormalParameterList rparen lbrace FunctionBody rbrace) : `(lambda ,$4 ,$7))
|
|
(FormalParameterList (Identifier) : `(,$1)
|
|
(FormalParameterList comma Identifier) : `(,@$1 ,$3))
|
|
(SourceElements (SourceElement) : $1
|
|
(SourceElements SourceElement) : (if (and (pair? $1) (eq? (car $1) 'begin))
|
|
`(begin ,@(cdr $1) ,$2)
|
|
`(begin ,$1 ,$2)))
|
|
(FunctionBody (SourceElements) : $1)
|
|
|
|
(Statement (Block) : $1
|
|
(VariableStatement) : $1
|
|
(EmptyStatement) : $1
|
|
(ExpressionStatement) : $1
|
|
(IfStatement) : $1
|
|
(IterationStatement) : $1
|
|
(ContinueStatement) : $1
|
|
(BreakStatement) : $1
|
|
(ReturnStatement) : $1
|
|
(WithStatement) : $1
|
|
(LabelledStatement) : $1
|
|
(SwitchStatement) : $1
|
|
(ThrowStatement) : $1
|
|
(TryStatement) : $1)
|
|
|
|
(Block (lbrace StatementList rbrace) : `(block ,$2))
|
|
(StatementList (Statement) : $1
|
|
(StatementList Statement) : (if (and (pair? $1) (eq? (car $1) 'begin))
|
|
`(begin ,@(cdr $1) ,$2)
|
|
`(begin ,$1 ,$2)))
|
|
|
|
(VariableStatement (var VariableDeclarationList) : `(var ,@$2))
|
|
(VariableDeclarationList (VariableDeclaration) : `(,$1)
|
|
(VariableDeclarationList comma VariableDeclaration) : `(,@$1 ,$2))
|
|
(VariableDeclarationListNoIn (VariableDeclarationNoIn) : `(,$1)
|
|
(VariableDeclarationListNoIn comma VariableDeclarationNoIn) : `(,@$1 ,$2))
|
|
(VariableDeclaration (Identifier) : `(,$1)
|
|
(Identifier Initialiser) : `(,$1 ,$2))
|
|
(VariableDeclarationNoIn (Identifier) : `(,$1)
|
|
(Identifier Initialiser) : `(,$1 ,$2))
|
|
(Initialiser (= AssignmentExpression) : $2)
|
|
(InitialiserNoIn (= AssignmentExpressionNoIn) : $2)
|
|
|
|
(EmptyStatement (semicolon) : '(begin))
|
|
|
|
(ExpressionStatement (Expression semicolon) : $1)
|
|
|
|
(IfStatement (if lparen Expression rparen Statement else Statement) : `(if ,$3 ,$5 ,$7)
|
|
(if lparen Expression rparen Statement) : `(if ,$3 ,$5))
|
|
|
|
(IterationStatement (do Statement while lparen Expression rparen semicolon) : `(do ,$2 ,$5)
|
|
|
|
(while lparen Expression rparen Statement) : `(while ,$3 ,$5)
|
|
|
|
(for lparen semicolon semicolon rparen Statement) : `(for #f #f #f ,$6)
|
|
(for lparen semicolon semicolon Expression rparen Statement) : `(for #f #f ,$5 ,$7)
|
|
(for lparen semicolon Expression semicolon rparen Statement) : `(for #f ,$4 #f ,$7)
|
|
(for lparen semicolon Expression semicolon Expression rparen Statement) : `(for #f ,$4 ,$6 ,$8)
|
|
|
|
(for lparen ExpressionNoIn semicolon semicolon rparen Statement) : `(for ,$3 #f #f ,$7)
|
|
(for lparen ExpressionNoIn semicolon semicolon Expression rparen Statement) : `(for ,$3 #f ,$6 ,$8)
|
|
(for lparen ExpressionNoIn semicolon Expression semicolon rparen Statement) : `(for ,$3 ,$5 #f ,$8)
|
|
(for lparen ExpressionNoIn semicolon Expression semicolon Expression rparen Statement) : `(for ,$3 ,$5 ,$7 ,$9)
|
|
|
|
(for lparen var VariableDeclarationListNoIn semicolon semicolon rparen Statement) : `(for (var ,@$4) #f #f ,$8)
|
|
(for lparen var VariableDeclarationListNoIn semicolon semicolon Expression rparen Statement) : `(for (var ,@$4) #f ,$7 ,$9)
|
|
(for lparen var VariableDeclarationListNoIn semicolon Expression semicolon rparen Statement) : `(for (var ,@$4) ,$6 #f ,$9)
|
|
(for lparen var VariableDeclarationListNoIn semicolon Expression semicolon Expression rparen Statement) : `(for (var ,@$4) ,$6 ,$8 ,$10)
|
|
|
|
(for lparen LeftHandSideExpression in Expression rparen Statement) : `(for-in ,$3 ,$5 ,$7)
|
|
(for lparen var VariableDeclarationNoIn in Expression rparen Statement) : `(begin (var ,$4) (for-in (ref ,@$4) ,$6 ,$8)))
|
|
|
|
(ContinueStatement (continue Identifier semicolon) : `(continue ,$2)
|
|
(continue semicolon) : `(continue))
|
|
|
|
(BreakStatement (break Identifier semicolon) : `(break ,$2)
|
|
(break semicolon) : `(break))
|
|
|
|
(ReturnStatement (return Expression semicolon) : `(return ,$2)
|
|
(return semicolon) : `(return))
|
|
|
|
(WithStatement (with lparen Expression rparen Statement) : `(with ,$3 ,$5))
|
|
|
|
(SwitchStatement (switch lparen Expression rparen CaseBlock) : `(switch ,$3 ,@$5))
|
|
(CaseBlock (lbrace rbrace) : '()
|
|
(lbrace CaseClauses rbrace) : $2
|
|
(lbrace CaseClauses DefaultClause rbrace) : `(,@$2 ,@$3)
|
|
(lbrace DefaultClause rbrace) : `(,$2)
|
|
(lbrace DefaultClause CaseClauses rbrace) : `(,@$2 ,@$3))
|
|
(CaseClauses (CaseClause) : `(,$1)
|
|
(CaseClauses CaseClause) : `(,@$1 ,$2))
|
|
(CaseClause (case Expression colon) : `(case ,$2)
|
|
(case Expression colon StatementList) : `(case ,$2 ,$4))
|
|
(DefaultClause (default colon) : `(default)
|
|
(default colon StatementList) : `(default ,$3))
|
|
|
|
(LabelledStatement (Identifier colon Statement) : `(label ,$1 ,$3))
|
|
|
|
(ThrowStatement (throw Expression semicolon) : `(throw ,$2))
|
|
|
|
(TryStatement (try Block Catch) : `(try ,$2 ,$3 #f)
|
|
(try Block Finally) : `(try ,$2 #f ,$3)
|
|
(try Block Catch Finally) : `(try ,$2 ,$3 ,$4))
|
|
(Catch (catch lparen Identifier rparen Block) : `(catch ,$3 ,$5))
|
|
(Finally (finally Block) : `(finally ,$2))
|
|
|
|
;;
|
|
;; As promised, expressions. We build up to Expression bottom-up, so
|
|
;; as to get operator precedence right.
|
|
;;
|
|
|
|
(PrimaryExpression (this) : 'this
|
|
(null) : 'null
|
|
(true) : 'true
|
|
(false) : 'false
|
|
(Identifier) : `(ref ,$1)
|
|
(StringLiteral) : `(string ,$1)
|
|
(RegexpLiteral) : `(regexp ,$1)
|
|
(NumericLiteral) : `(number ,$1)
|
|
(ArrayLiteral) : $1
|
|
(ObjectLiteral) : $1
|
|
(lparen Expression rparen) : $2)
|
|
|
|
(ArrayLiteral (lbracket rbracket) : '(array)
|
|
(lbracket Elision rbracket) : '(array ,@$2)
|
|
(lbracket ElementList rbracket) : `(array ,@$2)
|
|
(lbracket ElementList comma rbracket) : `(array ,@$2)
|
|
(lbracket ElementList comma Elision rbracket) : `(array ,@$2))
|
|
(ElementList (AssignmentExpression) : `(,$1)
|
|
(Elision AssignmentExpression) : `(,@$1 ,$2)
|
|
(ElementList comma AssignmentExpression) : `(,@$1 ,$3)
|
|
(ElementList comma Elision AssignmentExpression) : `(,@$1 ,@$3 ,$4))
|
|
(Elision (comma) : '((number 0))
|
|
(Elision comma) : `(,@$1 (number 0)))
|
|
|
|
(ObjectLiteral (lbrace rbrace) : `(object)
|
|
(lbrace PropertyNameAndValueList rbrace) : `(object ,@$2))
|
|
(PropertyNameAndValueList (PropertyName colon AssignmentExpression) : `((,$1 ,$3))
|
|
(PropertyNameAndValueList comma PropertyName colon AssignmentExpression) : `(,@$1 (,$3 ,$5)))
|
|
(PropertyName (Identifier) : $1
|
|
(StringLiteral) : (string->symbol $1)
|
|
(NumericLiteral) : $1)
|
|
|
|
(MemberExpression (PrimaryExpression) : $1
|
|
(FunctionExpression) : $1
|
|
(MemberExpression lbracket Expression rbracket) : `(aref ,$1 ,$3)
|
|
(MemberExpression dot Identifier) : `(pref ,$1 ,$3)
|
|
(new MemberExpression Arguments) : `(new ,$2 ,$3))
|
|
|
|
(NewExpression (MemberExpression) : $1
|
|
(new NewExpression) : `(new ,$2 ()))
|
|
|
|
(CallExpression (MemberExpression Arguments) : `(call ,$1 ,$2)
|
|
(CallExpression Arguments) : `(call ,$1 ,$2)
|
|
(CallExpression lbracket Expression rbracket) : `(aref ,$1 ,$3)
|
|
(CallExpression dot Identifier) : `(pref ,$1 ,$3))
|
|
(Arguments (lparen rparen) : '()
|
|
(lparen ArgumentList rparen) : $2)
|
|
(ArgumentList (AssignmentExpression) : `(,$1)
|
|
(ArgumentList comma AssignmentExpression) : `(,@$1 ,$3))
|
|
|
|
(LeftHandSideExpression (NewExpression) : $1
|
|
(CallExpression) : $1)
|
|
|
|
(PostfixExpression (LeftHandSideExpression) : $1
|
|
(LeftHandSideExpression ++) : `(postinc ,$1)
|
|
(LeftHandSideExpression --) : `(postdec ,$1))
|
|
|
|
(UnaryExpression (PostfixExpression) : $1
|
|
(delete UnaryExpression) : `(delete ,$2)
|
|
(void UnaryExpression) : `(void ,$2)
|
|
(typeof UnaryExpression) : `(typeof ,$2)
|
|
(++ UnaryExpression) : `(preinc ,$2)
|
|
(-- UnaryExpression) : `(predec ,$2)
|
|
(+ UnaryExpression) : `(+ ,$2)
|
|
(- UnaryExpression) : `(- ,$2)
|
|
(~ UnaryExpression) : `(~ ,$2)
|
|
(! UnaryExpression) : `(! ,$2))
|
|
|
|
(MultiplicativeExpression (UnaryExpression) : $1
|
|
(MultiplicativeExpression * UnaryExpression) : `(* ,$1 ,$3)
|
|
(MultiplicativeExpression / UnaryExpression) : `(/ ,$1 ,$3)
|
|
(MultiplicativeExpression % UnaryExpression) : `(% ,$1 ,$3))
|
|
|
|
(AdditiveExpression (MultiplicativeExpression) : $1
|
|
(AdditiveExpression + MultiplicativeExpression) : `(+ ,$1 ,$3)
|
|
(AdditiveExpression - MultiplicativeExpression) : `(- ,$1 ,$3))
|
|
|
|
(ShiftExpression (AdditiveExpression) : $1
|
|
(ShiftExpression << MultiplicativeExpression) : `(<< ,$1 ,$3)
|
|
(ShiftExpression >> MultiplicativeExpression) : `(>> ,$1 ,$3)
|
|
(ShiftExpression >>> MultiplicativeExpression) : `(>>> ,$1 ,$3))
|
|
|
|
(RelationalExpression (ShiftExpression) : $1
|
|
(RelationalExpression < ShiftExpression) : `(< ,$1 ,$3)
|
|
(RelationalExpression > ShiftExpression) : `(> ,$1 ,$3)
|
|
(RelationalExpression <= ShiftExpression) : `(<= ,$1 ,$3)
|
|
(RelationalExpression >= ShiftExpression) : `(>= ,$1 ,$3)
|
|
(RelationalExpression instanceof ShiftExpression) : `(instanceof ,$1 ,$3)
|
|
(RelationalExpression in ShiftExpression) : `(in ,$1 ,$3))
|
|
|
|
(RelationalExpressionNoIn (ShiftExpression) : $1
|
|
(RelationalExpressionNoIn < ShiftExpression) : `(< ,$1 ,$3)
|
|
(RelationalExpressionNoIn > ShiftExpression) : `(> ,$1 ,$3)
|
|
(RelationalExpressionNoIn <= ShiftExpression) : `(<= ,$1 ,$3)
|
|
(RelationalExpressionNoIn >= ShiftExpression) : `(>= ,$1 ,$3)
|
|
(RelationalExpressionNoIn instanceof ShiftExpression) : `(instanceof ,$1 ,$3))
|
|
|
|
(EqualityExpression (RelationalExpression) : $1
|
|
(EqualityExpression == RelationalExpression) : `(== ,$1 ,$3)
|
|
(EqualityExpression != RelationalExpression) : `(!= ,$1 ,$3)
|
|
(EqualityExpression === RelationalExpression) : `(=== ,$1 ,$3)
|
|
(EqualityExpression !== RelationalExpression) : `(!== ,$1 ,$3))
|
|
|
|
(EqualityExpressionNoIn (RelationalExpressionNoIn) : $1
|
|
(EqualityExpressionNoIn == RelationalExpressionNoIn) : `(== ,$1 ,$3)
|
|
(EqualityExpressionNoIn != RelationalExpressionNoIn) : `(!= ,$1 ,$3)
|
|
(EqualityExpressionNoIn === RelationalExpressionNoIn) : `(=== ,$1 ,$3)
|
|
(EqualityExpressionNoIn !== RelationalExpressionNoIn) : `(!== ,$1 ,$3))
|
|
|
|
(BitwiseANDExpression (EqualityExpression) : $1
|
|
(BitwiseANDExpression & EqualityExpression) : `(& ,$1 ,$3))
|
|
(BitwiseANDExpressionNoIn (EqualityExpressionNoIn) : $1
|
|
(BitwiseANDExpressionNoIn & EqualityExpressionNoIn) : `(& ,$1 ,$3))
|
|
|
|
(BitwiseXORExpression (BitwiseANDExpression) : $1
|
|
(BitwiseXORExpression ^ BitwiseANDExpression) : `(^ ,$1 ,$3))
|
|
(BitwiseXORExpressionNoIn (BitwiseANDExpressionNoIn) : $1
|
|
(BitwiseXORExpressionNoIn ^ BitwiseANDExpressionNoIn) : `(^ ,$1 ,$3))
|
|
|
|
(BitwiseORExpression (BitwiseXORExpression) : $1
|
|
(BitwiseORExpression bor BitwiseXORExpression) : `(bor ,$1 ,$3))
|
|
(BitwiseORExpressionNoIn (BitwiseXORExpressionNoIn) : $1
|
|
(BitwiseORExpressionNoIn bor BitwiseXORExpressionNoIn) : `(bor ,$1 ,$3))
|
|
|
|
(LogicalANDExpression (BitwiseORExpression) : $1
|
|
(LogicalANDExpression && BitwiseORExpression) : `(and ,$1 ,$3))
|
|
(LogicalANDExpressionNoIn (BitwiseORExpressionNoIn) : $1
|
|
(LogicalANDExpressionNoIn && BitwiseORExpressionNoIn) : `(and ,$1 ,$3))
|
|
|
|
(LogicalORExpression (LogicalANDExpression) : $1
|
|
(LogicalORExpression or LogicalANDExpression) : `(or ,$1 ,$3))
|
|
(LogicalORExpressionNoIn (LogicalANDExpressionNoIn) : $1
|
|
(LogicalORExpressionNoIn or LogicalANDExpressionNoIn) : `(or ,$1 ,$3))
|
|
|
|
(ConditionalExpression (LogicalORExpression) : $1
|
|
(LogicalORExpression ? AssignmentExpression colon AssignmentExpression) : `(if ,$1 ,$3 ,$5))
|
|
(ConditionalExpressionNoIn (LogicalORExpressionNoIn) : $1
|
|
(LogicalORExpressionNoIn ? AssignmentExpressionNoIn colon AssignmentExpressionNoIn) : `(if ,$1 ,$3 ,$5))
|
|
|
|
(AssignmentExpression (ConditionalExpression) : $1
|
|
(LeftHandSideExpression AssignmentOperator AssignmentExpression) : `(,$2 ,$1 ,$3))
|
|
(AssignmentExpressionNoIn (ConditionalExpressionNoIn) : $1
|
|
(LeftHandSideExpression AssignmentOperator AssignmentExpressionNoIn) : `(,$2 ,$1 ,$3))
|
|
(AssignmentOperator (=) : '=
|
|
(*=) : '*=
|
|
(/=) : '/=
|
|
(%=) : '%=
|
|
(+=) : '+=
|
|
(-=) : '-=
|
|
(<<=) : '<<=
|
|
(>>=) : '>>=
|
|
(>>>=) : '>>>=
|
|
(&=) : '&=
|
|
(^=) : '^=
|
|
(bor=) : 'bor=)
|
|
|
|
(Expression (AssignmentExpression) : $1
|
|
(Expression comma AssignmentExpression) : `(begin ,$1 ,$3))
|
|
(ExpressionNoIn (AssignmentExpressionNoIn) : $1
|
|
(ExpressionNoIn comma AssignmentExpressionNoIn) : `(begin ,$1 ,$3))))
|