mirror of
https://github.com/haml/haml.git
synced 2022-11-09 12:33:31 -05:00
191 lines
5.7 KiB
Ruby
191 lines
5.7 KiB
Ruby
require 'strscan'
|
|
|
|
module Sass
|
|
module Script
|
|
# The lexical analyzer for SassScript.
|
|
# It takes a raw string and converts it to individual tokens
|
|
# that are easier to parse.
|
|
class Lexer
|
|
# A struct containing information about an individual token.
|
|
#
|
|
# `type`: \[{Symbol}\]
|
|
# : The type of token.
|
|
#
|
|
# `value`: \[{Object}\]
|
|
# : The Ruby object corresponding to the value of the token.
|
|
#
|
|
# `line`: \[{Fixnum}\]
|
|
# : The line of the source file on which the token appears.
|
|
#
|
|
# `offset`: \[{Fixnum}\]
|
|
# : The number of bytes into the line the SassScript token appeared.
|
|
Token = Struct.new(:type, :value, :line, :offset)
|
|
|
|
# A hash from operator strings to the corresponding token types.
|
|
OPERATORS = {
|
|
'+' => :plus,
|
|
'-' => :minus,
|
|
'*' => :times,
|
|
'/' => :div,
|
|
'%' => :mod,
|
|
'=' => :single_eq,
|
|
'(' => :lparen,
|
|
')' => :rparen,
|
|
',' => :comma,
|
|
'and' => :and,
|
|
'or' => :or,
|
|
'not' => :not,
|
|
'==' => :eq,
|
|
'!=' => :neq,
|
|
'>=' => :gte,
|
|
'<=' => :lte,
|
|
'>' => :gt,
|
|
'<' => :lt,
|
|
'#{' => :begin_interpolation,
|
|
'}' => :end_interpolation,
|
|
}
|
|
|
|
# A list of operator strings ordered with longer names first
|
|
# so that `>` and `<` don't clobber `>=` and `<=`.
|
|
OP_NAMES = OPERATORS.keys.sort_by {|o| -o.size}
|
|
|
|
# A hash of regular expressions that are used for tokenizing.
|
|
REGULAR_EXPRESSIONS = {
|
|
:whitespace => /\s*/,
|
|
:variable => /!(\w+)/,
|
|
:ident => /(\\.|[^\s\\+\-*\/%(),=!])+/,
|
|
:string_end => /((?:\\.|\#(?!\{)|[^"\\#])*)(?:"|(?=#\{))/,
|
|
:number => /(-)?(?:(\d*\.\d+)|(\d+))([a-zA-Z%]+)?/,
|
|
:color => /\##{"([0-9a-fA-F]{1,2})" * 3}|(#{Color::HTML4_COLORS.keys.join("|")})/,
|
|
:bool => /(true|false)\b/,
|
|
:op => %r{(#{Regexp.union(*OP_NAMES.map{|s| Regexp.new(Regexp.escape(s) + (s =~ /\w$/ ? '(?:\b|$)' : ''))})})}
|
|
}
|
|
|
|
# @param str [String, StringScanner] The source text to lex
|
|
# @param line [Fixnum] The line on which the SassScript appears.
|
|
# Used for error reporting
|
|
# @param offset [Fixnum] The number of characters in on which the SassScript appears.
|
|
# Used for error reporting
|
|
def initialize(str, line, offset, filename)
|
|
@scanner = str.is_a?(StringScanner) ? str : StringScanner.new(str)
|
|
@line = line
|
|
@offset = offset
|
|
@filename = filename
|
|
@prev = nil
|
|
end
|
|
|
|
# Moves the lexer forward one token.
|
|
#
|
|
# @return [Token] The token that was moved past
|
|
def next
|
|
@tok ||= read_token
|
|
@tok, tok = nil, @tok
|
|
@prev = tok
|
|
return tok
|
|
end
|
|
|
|
# Returns the next token without moving the lexer forward.
|
|
#
|
|
# @return [Token] The next token
|
|
def peek
|
|
@tok ||= read_token
|
|
end
|
|
|
|
# @return [Boolean] Whether or not there's more source text to lex.
|
|
def done?
|
|
whitespace unless after_interpolation?
|
|
@scanner.eos? && @tok.nil?
|
|
end
|
|
|
|
private
|
|
|
|
def read_token
|
|
return if done?
|
|
|
|
value = token
|
|
unless value
|
|
raise SyntaxError.new("Syntax error in '#{@scanner.string}' at character #{current_position}.")
|
|
end
|
|
Token.new(value.first, value.last, @line, last_match_position)
|
|
end
|
|
|
|
def whitespace
|
|
@scanner.scan(REGULAR_EXPRESSIONS[:whitespace])
|
|
end
|
|
|
|
def token
|
|
return string('') if after_interpolation?
|
|
variable || string || number || color || bool || op || ident
|
|
end
|
|
|
|
def variable
|
|
return unless @scanner.scan(REGULAR_EXPRESSIONS[:variable])
|
|
[:const, @scanner[1]]
|
|
end
|
|
|
|
def ident
|
|
return unless s = @scanner.scan(REGULAR_EXPRESSIONS[:ident])
|
|
[:ident, s.gsub(/\\(.)/, '\1')]
|
|
end
|
|
|
|
def string(start_char = '"')
|
|
return unless @scanner.scan(/#{start_char}#{REGULAR_EXPRESSIONS[:string_end]}/)
|
|
[:string, Script::String.new(@scanner[1].gsub(/\\([^0-9a-f])/, '\1').gsub(/\\([0-9a-f]{1,4})/, "\\\\\\1"))]
|
|
end
|
|
|
|
def begin_interpolation
|
|
@scanner.scan
|
|
end
|
|
|
|
def number
|
|
return unless @scanner.scan(REGULAR_EXPRESSIONS[:number])
|
|
value = @scanner[2] ? @scanner[2].to_f : @scanner[3].to_i
|
|
value = -value if @scanner[1]
|
|
[:number, Script::Number.new(value, Array(@scanner[4]))]
|
|
end
|
|
|
|
def color
|
|
return unless @scanner.scan(REGULAR_EXPRESSIONS[:color])
|
|
value = if @scanner[4]
|
|
color = Color::HTML4_COLORS[@scanner[4].downcase]
|
|
else
|
|
(1..3).map {|i| @scanner[i]}.map {|num| num.ljust(2, num).to_i(16)}
|
|
end
|
|
[:color, Script::Color.new(value)]
|
|
end
|
|
|
|
def bool
|
|
return unless s = @scanner.scan(REGULAR_EXPRESSIONS[:bool])
|
|
[:bool, Script::Bool.new(s == 'true')]
|
|
end
|
|
|
|
def op
|
|
prev_chr = @scanner.string[@scanner.pos - 1].chr
|
|
return unless op = @scanner.scan(REGULAR_EXPRESSIONS[:op])
|
|
if @prev && op == '-' && prev_chr !~ /\s/ &&
|
|
[:bool, :ident, :const].include?(@prev.type)
|
|
warn(<<END)
|
|
DEPRECATION WARNING:
|
|
On line #{@line}, character #{last_match_position}#{" of '#{@filename}'" if @filename}
|
|
- will be allowed as part of variable names in version 2.4.
|
|
Please add whitespace to separate it from the previous token.
|
|
END
|
|
end
|
|
|
|
[OPERATORS[op]]
|
|
end
|
|
|
|
def current_position
|
|
@offset + @scanner.pos + 1
|
|
end
|
|
|
|
def last_match_position
|
|
current_position - @scanner.matched_size
|
|
end
|
|
|
|
def after_interpolation?
|
|
@prev && @prev.type == :end_interpolation
|
|
end
|
|
end
|
|
end
|
|
end
|