jashkenas--coffeescript/lib/coffee_script/grammar.y

469 lines
18 KiB
Plaintext
Raw Normal View History

2009-12-13 22:07:16 +00:00
class Parser
2010-01-06 06:27:58 +00:00
# Declare terminal tokens produced by the lexer.
token IF ELSE UNLESS
token NUMBER STRING REGEX
token TRUE FALSE YES NO ON OFF
token IDENTIFIER PROPERTY_ACCESS PROTOTYPE_ACCESS SOAK_ACCESS
2010-01-06 02:40:36 +00:00
token CODE PARAM NEW RETURN
2009-12-14 15:00:31 +00:00
token TRY CATCH FINALLY THROW
2009-12-15 04:11:28 +00:00
token BREAK CONTINUE
token FOR IN OF BY WHEN WHILE
token SWITCH LEADING_WHEN
2009-12-24 19:50:44 +00:00
token DELETE INSTANCEOF TYPEOF
token SUPER EXTENDS
token ARGUMENTS
token NEWLINE
token COMMENT
2009-12-15 14:11:27 +00:00
token JS
token INDENT OUTDENT
2009-12-13 22:07:16 +00:00
2009-12-17 01:19:52 +00:00
# Declare order of operations.
2009-12-13 22:07:16 +00:00
prechigh
2010-01-05 03:19:45 +00:00
left '?'
2010-01-06 02:40:36 +00:00
nonassoc UMINUS NOT '!' '!!' '~' '++' '--'
2009-12-13 22:07:16 +00:00
left '*' '/' '%'
left '+' '-'
left '<<' '>>' '>>>'
left '&' '|' '^'
2009-12-13 22:07:16 +00:00
left '<=' '<' '>' '>='
right '==' '!=' IS ISNT
2009-12-13 22:07:16 +00:00
left '&&' '||' AND OR
right '-=' '+=' '/=' '*=' '%='
2009-12-24 19:50:44 +00:00
right DELETE INSTANCEOF TYPEOF
left '.'
2009-12-29 04:08:02 +00:00
right INDENT
left OUTDENT
right WHEN LEADING_WHEN IN OF BY
2010-01-12 22:45:06 +00:00
right THROW FOR NEW SUPER
left EXTENDS
left '||=' '&&=' '?='
right ASSIGN RETURN
2010-01-14 01:59:57 +00:00
right '=>' '==>' UNLESS IF ELSE WHILE
2009-12-13 22:07:16 +00:00
preclow
rule
# All parsing will end in this rule, being the trunk of the AST.
Root:
/* nothing */ { result = Expressions.new }
| Terminator { result = Expressions.new }
| Expressions { result = val[0] }
| Block Terminator { result = val[0] }
2009-12-13 22:07:16 +00:00
;
# Any list of expressions or method body, seperated by line breaks or semis.
2009-12-13 22:07:16 +00:00
Expressions:
Expression { result = Expressions.wrap(val) }
| Expressions Terminator Expression { result = val[0] << val[2] }
2009-12-14 04:25:31 +00:00
| Expressions Terminator { result = val[0] }
2009-12-13 22:07:16 +00:00
;
2010-01-06 06:27:58 +00:00
# All types of expressions in our language. The basic unit of CoffeeScript
# is the expression.
2009-12-13 22:07:16 +00:00
Expression:
Value
2009-12-13 22:07:16 +00:00
| Call
| Code
| Operation
| Assign
2009-12-13 22:07:16 +00:00
| If
2009-12-14 15:00:31 +00:00
| Try
| Throw
2009-12-13 23:37:29 +00:00
| Return
| While
| For
2009-12-16 03:30:27 +00:00
| Switch
| Extends
| Splat
| Existence
| Comment
2009-12-13 22:07:16 +00:00
;
2010-01-06 06:27:58 +00:00
# A block of expressions. Note that the Rewriter will convert some postfix
# forms into blocks for us, by altering the token stream.
Block:
2009-12-29 04:08:02 +00:00
INDENT Expressions OUTDENT { result = val[1] }
| INDENT OUTDENT { result = Expressions.new }
;
2010-01-06 06:27:58 +00:00
# Tokens that can terminate an expression.
2009-12-13 22:07:16 +00:00
Terminator:
"\n"
| ";"
;
2010-01-06 06:27:58 +00:00
# All hard-coded values. These can be printed straight to JavaScript.
2009-12-13 22:07:16 +00:00
Literal:
NUMBER { result = LiteralNode.new(val[0]) }
| STRING { result = LiteralNode.new(val[0]) }
2009-12-15 14:11:27 +00:00
| JS { result = LiteralNode.new(val[0]) }
2009-12-13 23:37:29 +00:00
| REGEX { result = LiteralNode.new(val[0]) }
2009-12-15 04:11:28 +00:00
| BREAK { result = LiteralNode.new(val[0]) }
| CONTINUE { result = LiteralNode.new(val[0]) }
| ARGUMENTS { result = LiteralNode.new(val[0]) }
| TRUE { result = LiteralNode.new(Value.new(true)) }
| FALSE { result = LiteralNode.new(Value.new(false)) }
| YES { result = LiteralNode.new(Value.new(true)) }
| NO { result = LiteralNode.new(Value.new(false)) }
| ON { result = LiteralNode.new(Value.new(true)) }
| OFF { result = LiteralNode.new(Value.new(false)) }
2009-12-13 22:07:16 +00:00
;
2010-01-06 06:27:58 +00:00
# Assignment to a variable (or index).
2009-12-13 22:07:16 +00:00
Assign:
2009-12-29 04:08:02 +00:00
Value ASSIGN Expression { result = AssignNode.new(val[0], val[2]) }
2009-12-13 22:07:16 +00:00
;
2010-01-06 06:27:58 +00:00
# Assignment within an object literal (can be quoted).
2009-12-13 22:07:16 +00:00
AssignObj:
2009-12-29 04:08:02 +00:00
IDENTIFIER ASSIGN Expression { result = AssignNode.new(ValueNode.new(val[0]), val[2], :object) }
| STRING ASSIGN Expression { result = AssignNode.new(ValueNode.new(LiteralNode.new(val[0])), val[2], :object) }
| Comment { result = val[0] }
2009-12-13 22:07:16 +00:00
;
# A return statement.
2009-12-13 23:37:29 +00:00
Return:
RETURN Expression { result = ReturnNode.new(val[1]) }
| RETURN { result = ReturnNode.new(ValueNode.new(Value.new('null'))) }
2009-12-13 23:37:29 +00:00
;
# A comment.
Comment:
COMMENT { result = CommentNode.new(val[0]) }
;
2009-12-13 22:07:16 +00:00
# Arithmetic and logical operators
# For Ruby's Operator precedence, see:
# https://www.cs.auckland.ac.nz/references/ruby/ProgrammingRuby/language.html
Operation:
'!' Expression { result = OpNode.new(val[0], val[1]) }
| '!!' Expression { result = OpNode.new(val[0], val[1]) }
| '-' Expression = UMINUS { result = OpNode.new(val[0], val[1]) }
| NOT Expression { result = OpNode.new(val[0], val[1]) }
| '~' Expression { result = OpNode.new(val[0], val[1]) }
| '--' Expression { result = OpNode.new(val[0], val[1]) }
| '++' Expression { result = OpNode.new(val[0], val[1]) }
| DELETE Expression { result = OpNode.new(val[0], val[1]) }
| TYPEOF Expression { result = OpNode.new(val[0], val[1]) }
| Expression '--' { result = OpNode.new(val[1], val[0], nil, true) }
| Expression '++' { result = OpNode.new(val[1], val[0], nil, true) }
| Expression '*' Expression { result = OpNode.new(val[1], val[0], val[2]) }
| Expression '/' Expression { result = OpNode.new(val[1], val[0], val[2]) }
| Expression '%' Expression { result = OpNode.new(val[1], val[0], val[2]) }
| Expression '+' Expression { result = OpNode.new(val[1], val[0], val[2]) }
| Expression '-' Expression { result = OpNode.new(val[1], val[0], val[2]) }
| Expression '<<' Expression { result = OpNode.new(val[1], val[0], val[2]) }
| Expression '>>' Expression { result = OpNode.new(val[1], val[0], val[2]) }
| Expression '>>>' Expression { result = OpNode.new(val[1], val[0], val[2]) }
| Expression '&' Expression { result = OpNode.new(val[1], val[0], val[2]) }
| Expression '|' Expression { result = OpNode.new(val[1], val[0], val[2]) }
| Expression '^' Expression { result = OpNode.new(val[1], val[0], val[2]) }
| Expression '<=' Expression { result = OpNode.new(val[1], val[0], val[2]) }
| Expression '<' Expression { result = OpNode.new(val[1], val[0], val[2]) }
| Expression '>' Expression { result = OpNode.new(val[1], val[0], val[2]) }
| Expression '>=' Expression { result = OpNode.new(val[1], val[0], val[2]) }
| Expression '==' Expression { result = OpNode.new(val[1], val[0], val[2]) }
| Expression '!=' Expression { result = OpNode.new(val[1], val[0], val[2]) }
| Expression IS Expression { result = OpNode.new(val[1], val[0], val[2]) }
| Expression ISNT Expression { result = OpNode.new(val[1], val[0], val[2]) }
| Expression '&&' Expression { result = OpNode.new(val[1], val[0], val[2]) }
| Expression '||' Expression { result = OpNode.new(val[1], val[0], val[2]) }
| Expression AND Expression { result = OpNode.new(val[1], val[0], val[2]) }
| Expression OR Expression { result = OpNode.new(val[1], val[0], val[2]) }
| Expression '?' Expression { result = OpNode.new(val[1], val[0], val[2]) }
| Expression '-=' Expression { result = OpNode.new(val[1], val[0], val[2]) }
| Expression '+=' Expression { result = OpNode.new(val[1], val[0], val[2]) }
| Expression '/=' Expression { result = OpNode.new(val[1], val[0], val[2]) }
| Expression '*=' Expression { result = OpNode.new(val[1], val[0], val[2]) }
| Expression '%=' Expression { result = OpNode.new(val[1], val[0], val[2]) }
| Expression '||=' Expression { result = OpNode.new(val[1], val[0], val[2]) }
| Expression '&&=' Expression { result = OpNode.new(val[1], val[0], val[2]) }
| Expression '?=' Expression { result = OpNode.new(val[1], val[0], val[2]) }
| Expression INSTANCEOF Expression { result = OpNode.new(val[1], val[0], val[2]) }
2010-01-06 04:29:43 +00:00
| Expression IN Expression { result = OpNode.new(val[1], val[0], val[2]) }
2009-12-29 04:08:02 +00:00
;
2010-01-06 06:27:58 +00:00
# The existence operator.
Existence:
Expression '?' { result = ExistenceNode.new(val[0]) }
;
2009-12-29 04:08:02 +00:00
# Function definition.
Code:
2010-01-14 01:59:57 +00:00
ParamList FuncGlyph Block { result = CodeNode.new(val[0], val[2], val[1]) }
| FuncGlyph Block { result = CodeNode.new([], val[1], val[0]) }
;
# The symbols to signify functions, and bound functions.
FuncGlyph:
'=>' { result = :func }
| '==>' { result = :boundfunc }
2009-12-17 14:07:42 +00:00
;
# The parameters to a function definition.
2009-12-13 22:07:16 +00:00
ParamList:
2009-12-31 22:50:12 +00:00
Param { result = val }
| ParamList "," Param { result = val[0] << val[2] }
;
2010-01-06 06:27:58 +00:00
# A Parameter (or ParamSplat) in a function definition.
2009-12-31 22:50:12 +00:00
Param:
PARAM
| PARAM "." "." "." { result = SplatNode.new(val[0]) }
;
2010-01-06 06:27:58 +00:00
# A regular splat.
Splat:
Expression "." "." "." { result = SplatNode.new(val[0]) }
2009-12-13 22:07:16 +00:00
;
# Expressions that can be treated as values.
2009-12-14 15:00:31 +00:00
Value:
IDENTIFIER { result = ValueNode.new(val[0]) }
| Literal { result = ValueNode.new(val[0]) }
| Array { result = ValueNode.new(val[0]) }
| Object { result = ValueNode.new(val[0]) }
| Parenthetical { result = ValueNode.new(val[0]) }
| Range { result = ValueNode.new(val[0]) }
2009-12-14 15:00:31 +00:00
| Value Accessor { result = val[0] << val[1] }
| Invocation Accessor { result = ValueNode.new(val[0], [val[1]]) }
2009-12-14 01:29:44 +00:00
;
# Accessing into an object or array, through dot or index notation.
2009-12-14 01:29:44 +00:00
Accessor:
PROPERTY_ACCESS IDENTIFIER { result = AccessorNode.new(val[1]) }
| PROTOTYPE_ACCESS IDENTIFIER { result = AccessorNode.new(val[1], :prototype) }
| SOAK_ACCESS IDENTIFIER { result = AccessorNode.new(val[1], :soak) }
2009-12-14 01:29:44 +00:00
| Index { result = val[0] }
2009-12-26 08:16:40 +00:00
| Range { result = SliceNode.new(val[0]) }
2009-12-14 01:29:44 +00:00
;
# Indexing into an object or array.
2009-12-14 01:29:44 +00:00
Index:
2009-12-15 16:36:24 +00:00
"[" Expression "]" { result = IndexNode.new(val[1]) }
2009-12-13 22:07:16 +00:00
;
# An object literal.
2009-12-13 22:07:16 +00:00
Object:
"{" AssignList "}" { result = ObjectNode.new(val[1]) }
;
# Assignment within an object literal (comma or newline separated).
2009-12-13 22:07:16 +00:00
AssignList:
/* nothing */ { result = [] }
2009-12-13 22:07:16 +00:00
| AssignObj { result = val }
| AssignList "," AssignObj { result = val[0] << val[2] }
| AssignList Terminator AssignObj { result = val[0] << val[2] }
| AssignList ","
Terminator AssignObj { result = val[0] << val[3] }
| INDENT AssignList OUTDENT { result = val[1] }
2009-12-13 22:07:16 +00:00
;
# All flavors of function call (instantiation, super, and regular).
2009-12-13 22:07:16 +00:00
Call:
2009-12-14 04:59:12 +00:00
Invocation { result = val[0] }
2009-12-14 15:00:31 +00:00
| NEW Invocation { result = val[1].new_instance }
2009-12-17 14:07:42 +00:00
| Super { result = val[0] }
2009-12-14 04:45:18 +00:00
;
# Extending an object's prototype.
Extends:
Value EXTENDS Value { result = ExtendsNode.new(val[0], val[2]) }
;
# A generic function invocation.
2009-12-14 04:45:18 +00:00
Invocation:
Value Arguments { result = CallNode.new(val[0], val[1]) }
| Invocation Arguments { result = CallNode.new(val[0], val[1]) }
;
2010-01-06 06:27:58 +00:00
# The list of arguments to a function invocation.
Arguments:
"(" ArgList ")" { result = val[1] }
| "(" ArgList ")" Code { result = val[1] << val[3] }
2009-12-13 22:07:16 +00:00
;
# Calling super.
2009-12-17 14:07:42 +00:00
Super:
SUPER "(" ArgList ")" { result = CallNode.new(Value.new('super'), val[2]) }
2009-12-17 14:07:42 +00:00
;
# The range literal.
Range:
"[" Expression
"." "." Expression "]" { result = RangeNode.new(val[1], val[4]) }
| "[" Expression
"." "." "." Expression "]" { result = RangeNode.new(val[1], val[5], true) }
;
# The array literal.
2009-12-13 22:07:16 +00:00
Array:
"[" ArgList "]" { result = ArrayNode.new(val[1]) }
2009-12-13 22:07:16 +00:00
;
# A list of arguments to a method call, or as the contents of an array.
2009-12-13 22:07:16 +00:00
ArgList:
/* nothing */ { result = [] }
| Expression { result = val }
| INDENT Expression { result = [val[1]] }
| ArgList "," Expression { result = val[0] << val[2] }
2009-12-14 01:29:44 +00:00
| ArgList Terminator Expression { result = val[0] << val[2] }
| ArgList "," Terminator Expression { result = val[0] << val[3] }
| ArgList "," INDENT Expression { result = val[0] << val[3] }
| ArgList OUTDENT { result = val[0] }
2009-12-13 22:07:16 +00:00
;
# Just simple, comma-separated, required arguments (no fancy syntax).
SimpleArgs:
Expression { result = val[0] }
| SimpleArgs "," Expression { result = ([val[0]] << val[2]).flatten }
;
2009-12-18 03:22:35 +00:00
# Try/catch/finally exception handling blocks.
2009-12-14 15:00:31 +00:00
Try:
TRY Block Catch { result = TryNode.new(val[1], val[2][0], val[2][1]) }
2009-12-30 05:22:27 +00:00
| TRY Block FINALLY Block { result = TryNode.new(val[1], nil, nil, val[3]) }
| TRY Block Catch
2009-12-29 04:08:02 +00:00
FINALLY Block { result = TryNode.new(val[1], val[2][0], val[2][1], val[4]) }
2009-12-24 07:01:39 +00:00
;
# A catch clause.
Catch:
2009-12-30 05:22:27 +00:00
CATCH IDENTIFIER Block { result = [val[1], val[2]] }
;
2009-12-18 03:22:35 +00:00
# Throw an exception.
Throw:
THROW Expression { result = ThrowNode.new(val[1]) }
2009-12-14 15:00:31 +00:00
;
2009-12-18 03:22:35 +00:00
# Parenthetical expressions.
2009-12-14 04:25:00 +00:00
Parenthetical:
"(" Expression ")" { result = ParentheticalNode.new(val[1], val[0].line) }
2009-12-14 04:25:00 +00:00
;
2009-12-18 03:22:35 +00:00
# The while loop. (there is no do..while).
While:
WHILE Expression Block { result = WhileNode.new(val[1], val[2]) }
2010-01-09 16:51:32 +00:00
| WHILE Expression { result = WhileNode.new(val[1], nil) }
| Expression WHILE Expression { result = WhileNode.new(val[2], Expressions.wrap(val[0])) }
;
2009-12-18 03:22:35 +00:00
# Array comprehensions, including guard and current index.
# Looks a little confusing, check nodes.rb for the arguments to ForNode.
For:
Expression FOR
2010-01-01 16:54:59 +00:00
ForVariables ForSource { result = ForNode.new(val[0], val[3], val[2][0], val[2][1]) }
| FOR ForVariables ForSource Block { result = ForNode.new(val[3], val[2], val[1][0], val[1][1]) }
;
2009-12-25 21:40:57 +00:00
# An array comprehension has variables for the current element and index.
ForVariables:
IDENTIFIER { result = val }
| IDENTIFIER "," IDENTIFIER { result = [val[0], val[2]] }
;
2009-12-25 21:40:57 +00:00
# The source of the array comprehension can optionally be filtered.
ForSource:
2010-01-01 16:54:59 +00:00
IN Expression { result = {:source => val[1]} }
| OF Expression { result = {:source => val[1], :object => true} }
2010-01-01 16:54:59 +00:00
| ForSource
WHEN Expression { result = val[0].merge(:filter => val[2]) }
| ForSource
BY Expression { result = val[0].merge(:step => val[2]) }
;
# Switch/When blocks.
2009-12-16 03:30:27 +00:00
Switch:
2009-12-29 04:08:02 +00:00
SWITCH Expression INDENT
Whens OUTDENT { result = val[3].rewrite_condition(val[1]) }
| SWITCH Expression INDENT
Whens ELSE Block OUTDENT { result = val[3].rewrite_condition(val[1]).add_else(val[5]) }
2009-12-16 03:30:27 +00:00
;
# The inner list of whens.
Whens:
When { result = val[0] }
| Whens When { result = val[0] << val[1] }
2009-12-16 03:30:27 +00:00
;
# An individual when.
When:
LEADING_WHEN SimpleArgs Block { result = IfNode.new(val[1], val[2], nil, {:statement => true}) }
| LEADING_WHEN SimpleArgs Block
Terminator { result = IfNode.new(val[1], val[2], nil, {:statement => true}) }
| Comment Terminator When { result = val[2].add_comment(val[0]) }
2009-12-16 03:30:27 +00:00
;
2010-01-06 06:27:58 +00:00
# The most basic form of "if".
2009-12-29 04:08:02 +00:00
IfBlock:
IF Expression Block { result = IfNode.new(val[1], val[2]) }
2009-12-29 04:08:02 +00:00
;
# An elsif portion of an if-else block.
ElsIf:
ELSE IfBlock { result = val[1].force_statement }
;
# Multiple elsifs can be chained together.
ElsIfs:
ElsIf { result = val[0] }
| ElsIfs ElsIf { result = val[0].add_else(val[1]) }
;
# Terminating else bodies are strictly optional.
ElseBody
/* nothing */ { result = nil }
| ELSE Block { result = val[1] }
;
# All the alternatives for ending an if-else block.
IfEnd:
ElseBody { result = val[0] }
| ElsIfs ElseBody { result = val[0].add_else(val[1]) }
;
# The full complement of if blocks, including postfix one-liner ifs and unlesses.
If:
2009-12-29 04:08:02 +00:00
IfBlock IfEnd { result = val[0].add_else(val[1]) }
| Expression IF Expression { result = IfNode.new(val[2], Expressions.wrap(val[0]), nil, {:statement => true}) }
| Expression UNLESS Expression { result = IfNode.new(val[2], Expressions.wrap(val[0]), nil, {:statement => true, :invert => true}) }
;
2009-12-13 22:07:16 +00:00
end
---- header
module CoffeeScript
2009-12-13 22:07:16 +00:00
---- inner
2009-12-18 03:22:35 +00:00
# Lex and parse a CoffeeScript.
2009-12-17 15:04:43 +00:00
def parse(code)
2009-12-18 03:22:35 +00:00
# Uncomment the following line to enable grammar debugging, in combination
# with the -g flag in the Rake build task.
2009-12-13 22:07:16 +00:00
# @yydebug = true
@tokens = Lexer.new.tokenize(code)
do_parse
end
2009-12-18 03:22:35 +00:00
# Retrieve the next token from the list.
2009-12-13 22:07:16 +00:00
def next_token
@tokens.shift
2009-12-17 15:04:43 +00:00
end
2009-12-18 03:22:35 +00:00
# Raise a custom error class that knows about line numbers.
2009-12-17 15:04:43 +00:00
def on_error(error_token_id, error_value, value_stack)
raise ParseError.new(token_to_str(error_token_id), error_value, value_stack)
end
---- footer
end