# -*- coding: utf-8 -*- #
module Rouge
module Lexers
class SML < RegexLexer
# Lexer metadata: display title, description, primary tag and alias, plus the
# filename globs and MIME types declared for Standard ML sources.
title "SML"
desc 'Standard ML'
tag 'sml'
aliases 'ml'
filenames '*.sml', '*.sig', '*.fun'
mimetypes 'text/x-standardml', 'application/x-standardml'
# Alphanumeric reserved words of Standard ML, as a memoized Set of Strings.
#
# @return [Set<String>] the same Set instance on every call
def self.keywords
  return @keywords if @keywords

  # Core-language reserved words.
  core_words = %w[
    abstype and andalso as case datatype do else end exception
    fn fun handle if in infix infixr let local nonfix of op open
    orelse raise rec then type val with withtype while
  ]
  # Reserved words added by the module language.
  module_words = %w[
    eqtype functor include sharing sig signature struct structure
    where
  ]

  @keywords = Set.new(core_words + module_words)
end
# Symbolic tokens that are reserved and therefore lexed as punctuation rather
# than as ordinary symbolic identifiers. Memoized.
#
# @return [Set<String>]
def self.symbolic_reserved
  @symbolic_reserved ||= Set[':', '|', '=', '=>', '->', '#', ':>']
end
# Alphanumeric identifier: one or more word characters or primes (').
# Interpolated into many of the state rules below.
id = /[\w']+/i
# Symbolic identifier: one or more characters drawn from the operator set.
# Also interpolated into the state rules below.
symbol = %r([!%&$#/:<=>?@\\~`^|*+-]+)
# Content-based detection score for this lexer. No heuristic is implemented,
# so every input scores zero.
#
# @param text [String] candidate source text (unused)
# @return [Integer] always 0
def self.analyze_text(text)
  0
end
# Whitespace and comment openers; mixed into most of the other states.
state :whitespace do
rule /\s+/m, Text
# `(*` opens a comment and enters :comment, which handles nesting.
rule /[(][*]/, Comment, :comment
end
# Bracket and block-keyword bookkeeping, mixed into :main and :main_fun.
# Openers push a state and closers pop one, so the state stack follows the
# nesting of the source.
state :delimiters do
  # An opening bracket starts a nested :main; any closing bracket pops.
  rule /[(\[{]/, Punctuation, :main
  rule /[)\]}]/, Punctuation, :pop!

  # The token must be emitted inside the block: when `rule` is given a block,
  # the block is the whole callback and a positional token argument is not
  # emitted, which would drop the keyword text from the output.
  # Two pushes, presumably because each of these constructs is later closed
  # by two of the popping keywords below (in/end, then/else).
  rule /\b(let|if|local)\b(?!')/ do
    token Keyword::Reserved
    push; push
  end

  # These constructs have a single closing keyword, hence a single push.
  rule /\b(struct|sig|while)\b(?!')/ do
    token Keyword::Reserved
    push
  end

  # Closing keywords each pop one level. `(?!')` keeps identifiers such as
  # end' from being treated as keywords.
  rule /\b(do|else|end|in|then)\b(?!')/, Keyword::Reserved, :pop!
end
# Token for an identifier that is immediately followed by a dot.
# A reserved word is not valid in that position and is flagged as an error;
# anything else is a namespace (structure) name.
#
# @param id [String] the identifier text before the dot
# @return the token type to emit
def token_for_id_with_dot(id)
  return Error if self.class.keywords.include?(id)

  Name::Namespace
end
# Token for the last component of a dotted path. Reserved words, whether
# alphanumeric or symbolic, are flagged as errors; anything else is a Name.
#
# @param id [String] the identifier text
# @return the token type to emit
def token_for_final_id(id)
  lexer = self.class
  reserved = lexer.keywords.include?(id) || lexer.symbolic_reserved.include?(id)
  reserved ? Error : Name
end
# Token for a free-standing identifier or symbol: reserved words become
# keywords, reserved symbols become punctuation, everything else is a Name.
#
# @param id [String] the identifier or symbol text
# @return the token type to emit
def token_for_id(id)
  lexer = self.class
  return Keyword::Reserved if lexer.keywords.include?(id)
  return Punctuation if lexer.symbolic_reserved.include?(id)

  Name
end
# Rules shared by the expression-like states: punctuation, literals, record
# selectors, declaration keywords that open a dedicated sub-state, and
# identifiers. Rule order matters: earlier rules win.
state :core do
# Single-character punctuation, the wildcard `_`, and the `...` ellipsis.
rule /[()\[\]{},;_]|[.][.][.]/, Punctuation
# Character literal (#"...") and string literal openers.
rule /#"/, Str::Char, :char
rule /"/, Str::Double, :string
# Numeric literals. `~` is the negation sign; `0w` prefixes word literals.
# Hex forms come first so the leading 0 is not taken as a decimal integer,
# and floats come before plain integers for the same reason.
rule /~?0x[0-9a-fA-F]+/, Num::Hex
rule /0wx[0-9a-fA-F]+/, Num::Hex
rule /0w\d+/, Num::Integer
rule /~?\d+([.]\d+)?[eE]~?\d+/, Num::Float
rule /~?\d+[.]\d+/, Num::Float
rule /~?\d+/, Num::Integer
# `#` followed by a positive number, an identifier, or (after whitespace)
# a symbol is tagged as a label.
rule /#\s*[1-9][0-9]*/, Name::Label
rule /#\s*#{id}/, Name::Label
rule /#\s+#{symbol}/, Name::Label
# Declaration keywords that switch to a state specialised for the name(s)
# that follow them.
rule /\b(datatype|abstype)\b(?!')/, Keyword::Reserved, :dname
# Zero-width lookahead: :ename consumes the `exception` keyword itself.
rule(/(?=\bexception\b(?!'))/) { push :ename }
rule /\b(functor|include|open|signature|structure)\b(?!')/,
Keyword::Reserved, :sname
rule /\b(type|eqtype)\b(?!')/, Keyword::Reserved, :tname
# A leading prime marks a type variable.
rule /'#{id}/, Name::Decorator
# Identifier followed by a dot starts a qualified path; :dotted lexes the
# remaining components.
rule /(#{id})([.])/ do |m|
groups(token_for_id_with_dot(m[1]), Punctuation)
push :dotted
end
# Plain identifiers and symbols are classified by token_for_id.
rule id do |m|
token token_for_id(m[0])
end
rule symbol do |m|
token token_for_id(m[0])
end
end
# Remainder of a qualified path, entered from :core after the first `id.`.
state :dotted do
# Further `id.` components keep the lexer in this state.
rule /(#{id})([.])/ do |m|
groups(token_for_id_with_dot(m[1]), Punctuation)
end
# The first identifier or symbol not followed by a dot ends the path and pops.
rule id do |m|
token token_for_id(m[0])
pop!
end
rule symbol do |m|
token token_for_id(m[0])
pop!
end
end
# Entry state. A `#!` line seen here is tagged as a preprocessor comment;
# otherwise an empty match pushes :main, where the real lexing happens.
# NOTE(review): keeping :root beneath :main presumably lets an unbalanced
# closing keyword pop :main without emptying the stack; confirm.
state :root do
rule /#!.*?\n/, Comment::Preproc
rule(//) { push :main }
end
# Default state for declarations and expressions outside a `fun` binding.
state :main do
mixin :whitespace
# `val` / `and` are followed by a value binder, lexed in :vname.
rule /\b(val|and)\b(?!')/, Keyword::Reserved, :vname
# `fun` switches to :main_fun and then enters :fname for the function name.
rule /\b(fun)\b(?!')/ do
token Keyword::Reserved
goto :main_fun
push :fname
end
mixin :delimiters
mixin :core
end
# Variant of :main used after `fun`: here `and` and `|` are followed by a
# function name rather than a value binder.
state :main_fun do
mixin :whitespace
rule /\b(fun|and)\b(?!')/, Keyword::Reserved, :fname
# `val` switches back to :main and lexes its binder in :vname.
rule /\bval\b(?!')/ do
token Keyword::Reserved
goto :main
push :vname
end
# A bar is followed by a function name, lexed in :fname.
rule /[|]/, Punctuation, :fname
# After `case` / `handle` the lexer returns to :main, so the bar rule above
# no longer applies to the bars that follow.
rule /\b(case|handle)\b(?!')/ do
token Keyword::Reserved
goto :main
end
mixin :delimiters
mixin :core
end
# Escape sequences shared by the :string and :char states.
state :has_escapes do
# Backslash followed by one of: \ " a b t n v f r
rule /\\[\\"abtnvfr]/, Str::Escape
# Control escape: \^ followed by a character in the range 0x40-0x5e.
rule /\\\^[\x40-\x5e]/, Str::Escape
# Backslash followed by exactly three decimal digits.
rule /\\[0-9]{3}/, Str::Escape
# \u followed by exactly four hex digits.
rule /\\u\h{4}/, Str::Escape
# Backslash, whitespace, backslash: a gap inside the literal.
rule /\\\s+\\/, Str::Interpol
end
# Body of a double-quoted string literal, entered from :core.
state :string do
# Runs of ordinary characters, then the closing quote, then escapes.
rule /[^"\\]+/, Str::Double
rule /"/, Str::Double, :pop!
mixin :has_escapes
end
# Body of a #"..." character literal, entered from :core. Same shape as
# :string but tagged Str::Char.
state :char do
rule /[^"\\]+/, Str::Char
rule /"/, Str::Char, :pop!
mixin :has_escapes
end
# Mixed into the declaration sub-states so they end when the next reserved
# word appears. The rule is a zero-width lookahead: it pops without consuming
# anything, leaving the keyword for the state underneath.
#
# The lookahead must start with `\b`. A `\w+\b` prefix can never be followed
# by a keyword, because no word boundary exists between two word characters,
# so with that prefix this rule would never fire.
state :breakout do
  rule /(?=\b(#{SML.keywords.to_a.join('|')})\b(?!'))/ do
    pop!
  end
end
# Names following functor/include/open/signature/structure (entered from
# :core). Every identifier is tagged as a namespace; the first thing that is
# not whitespace, a comment or an identifier ends the state.
state :sname do
mixin :whitespace
mixin :breakout
rule id, Name::Namespace
# Empty match: pop without consuming anything.
rule(//) { pop! }
end
# Type-variable annotations that may precede a bound name: a single primed
# type variable, or a parenthesised sequence lexed in :tyvarseq.
state :has_annotations do
rule /'[\w']*/, Name::Decorator
rule /[(]/, Punctuation, :tyvarseq
end
# Function name following `fun`, `and` or `|` (see :main and :main_fun).
# The first identifier or symbol is tagged as the function name, then pops.
state :fname do
mixin :whitespace
mixin :has_annotations
rule id, Name::Function, :pop!
rule symbol, Name::Function, :pop!
end
# Binder following `val` / `and`. A name directly followed by `=` is tagged
# as a variable together with the `=`; a bare name is tagged on its own.
# Every successful match ends the state, as does anything unrecognised.
state :vname do
  mixin :whitespace
  mixin :has_annotations

  # `name =`: the lookahead keeps `=` from being the start of a longer symbol.
  rule /(#{id})(\s*)(=(?!#{symbol}))/m do
    groups Name::Variable, Text, Punctuation
    pop!
  end

  # Symbolic binder. It must pop like the alphanumeric form above; otherwise
  # the lexer stays in :vname and tags the next identifier of the right-hand
  # side as a variable.
  rule /(#{symbol})(\s*)(=(?!#{symbol}))/m do
    groups Name::Variable, Text, Punctuation
    pop!
  end

  rule id, Name::Variable, :pop!
  rule symbol, Name::Variable, :pop!

  # Anything else (for example a pattern that is not a plain name): pop
  # without consuming and let the enclosing state lex it.
  rule(//) { pop! }
end
# Type name following `type` / `eqtype`, also re-entered for `and` and
# `withtype` bindings. Names are tagged Keyword::Type until the `=` that
# starts the right-hand side.
state :tname do
  mixin :whitespace
  mixin :breakout
  # Type-variable annotations come from :has_annotations alone. Repeating its
  # two rules after the mixin would add rules that can never be reached.
  mixin :has_annotations

  # `=` (not the start of a longer symbol) switches to the binding body.
  rule %r(=(?!#{symbol})) do
    token Punctuation
    goto :typbind
  end

  rule id, Keyword::Type
  rule symbol, Keyword::Type
end
# Right-hand side of a type binding, entered from :tname after `=`.
state :typbind do
mixin :whitespace
# `and` starts another binding: go back to :tname for its name.
rule /\b(and)\b(?!')/ do
token Keyword::Reserved
goto :tname
end
mixin :breakout
mixin :core
end
# Datatype name following `datatype` / `abstype`, also re-entered from
# :datbind for `and`.
state :dname do
mixin :whitespace
mixin :breakout
mixin :has_annotations
# `= datatype`: lexed in one step and the state ends, so no constructor
# list is expected.
rule /(=)(\s*)(datatype)\b/ do
groups Punctuation, Text, Keyword::Reserved
pop!
end
# Ordinary `=`: switch to :datbind for the constructor list, with :datcon
# pushed on top to lex the first constructor name.
rule %r(=(?!#{symbol})) do
token Punctuation
goto :datbind
push :datcon
end
rule id, Keyword::Type
rule symbol, Keyword::Type
end
# Constructor list of a datatype binding, entered from :dname after `=`.
state :datbind do
mixin :whitespace
# `and` starts another datatype; `withtype` starts type bindings.
rule /\b(and)\b(?!')/ do
token Keyword::Reserved; goto :dname
end
rule /\b(withtype)\b(?!')/ do
token Keyword::Reserved; goto :tname
end
rule /\bof\b(?!')/, Keyword::Reserved
# A bar followed by a name introduces a further constructor. The symbolic
# form requires whitespace between the bar and the symbol.
rule /([|])(\s*)(#{id})/ do
groups(Punctuation, Text, Name::Class)
end
rule /([|])(\s+)(#{symbol})/ do
groups(Punctuation, Text, Name::Class)
end
mixin :breakout
mixin :core
end
# Exception declaration, pushed from :core by a zero-width lookahead, so the
# `exception` keyword itself is consumed here.
state :ename do
mixin :whitespace
# `exception` or `and` followed by the exception name, which is tagged
# Name::Class. The alphanumeric form requires whitespace before the name.
rule /(exception|and)(\s+)(#{id})/ do
groups Keyword::Reserved, Text, Name::Class
end
rule /(exception|and)(\s*)(#{symbol})/ do
groups Keyword::Reserved, Text, Name::Class
end
rule /\b(of)\b(?!')/, Keyword::Reserved
mixin :breakout
mixin :core
end
# First constructor of a datatype binding, pushed from :dname. One
# identifier or symbol is tagged Name::Class, then the state pops.
state :datcon do
mixin :whitespace
rule id, Name::Class, :pop!
rule symbol, Name::Class, :pop!
end
# Parenthesised sequence entered from :has_annotations after `(`; ends at
# the matching `)`.
state :tyvarseq do
mixin :whitespace
# Primed type variables.
rule /'[\w']*/, Name::Decorator
# Anything else that looks like an identifier is tagged as a plain Name.
rule id, Name
rule /,/, Punctuation
rule /[)]/, Punctuation, :pop!
rule symbol, Name
end
# Body of a (* ... *) comment. Comments nest: each inner `(*` pushes this
# state again and each `*)` pops one level.
state :comment do
# Runs of characters that cannot start or end a delimiter.
rule /[^(*)]+/, Comment::Multiline
rule /[(][*]/ do
token Comment::Multiline; push
end
rule /[*][)]/, Comment::Multiline, :pop!
# A lone `(`, `*` or `)` that is not part of a delimiter.
rule /[(*)]/, Comment::Multiline
end
end
end
end