# -*- coding: utf-8 -*- #
# frozen_string_literal: true
module Rouge
module Lexers
class Clean < RegexLexer
title "Clean"
desc "The Clean programming language (clean.cs.ru.nl)"
tag 'clean'
filenames '*.dcl', '*.icl'
def self.keywords
@keywords ||= Set.new %w(
if otherwise
let in
with where
case of
infix infixl infixr
class instance
generic derive
special
implementation definition system module
from import qualified as
dynamic
code inline foreign export ccall stdcall
)
end
# These are literal patterns common to the ABC intermediate language and
# Clean. Clean has more extensive literal patterns (see :basic below).
state :common_literals do
rule %r/'(?:[^'\\]|\\(?:x[0-9a-fA-F]+|\d+|.))'/, Str::Char
rule %r/[+~-]?\d+\.\d+(?:E[+-]?\d+)?\b/, Num::Float
rule %r/[+~-]?\d+E[+-]?\d+\b/, Num::Float
rule %r/[+~-]?\d+/, Num::Integer
rule %r/"/, Str::Double, :string
end
state :basic do
rule %r/\s+/m, Text::Whitespace
rule %r/\/\/\*.*/, Comment::Doc
rule %r/\/\/.*/, Comment::Single
rule %r/\/\*\*/, Comment::Doc, :comment_doc
rule %r/\/\*/, Comment::Multiline, :comment
rule %r/[+~-]?0[0-7]+/, Num::Oct
rule %r/[+~-]?0x[0-9a-fA-F]+/, Num::Hex
mixin :common_literals
rule %r/(\[)(\s*)(')(?=.*?'\])/ do
groups Punctuation, Text::Whitespace, Str::Single, Punctuation
push :charlist
end
end
# nested commenting
state :comment_doc do
rule %r/\*\//, Comment::Doc, :pop!
rule %r/\/\/.*/, Comment::Doc # Singleline comments in multiline comments are skipped
rule %r/\/\*/, Comment::Doc, :comment
rule %r/[^*\/]+/, Comment::Doc
rule %r/[*\/]/, Comment::Doc
end
# This is the same as the above, but with Multiline instead of Doc
state :comment do
rule %r/\*\//, Comment::Multiline, :pop!
rule %r/\/\/.*/, Comment::Multiline # Singleline comments in multiline comments are skipped
rule %r/\/\*/, Comment::Multiline, :comment
rule %r/[^*\/]+/, Comment::Multiline
rule %r/[*\/]/, Comment::Multiline
end
state :root do
mixin :basic
rule %r/code(\s+inline)?\s*{/, Comment::Preproc, :abc
rule %r/_*[a-z][\w_`]*/ do |m|
if self.class.keywords.include?(m[0])
token Keyword
else
token Name
end
end
rule %r/_*[A-Z][\w_`]*/ do |m|
if m[0]=='True' || m[0]=='False'
token Keyword::Constant
else
token Keyword::Type
end
end
rule %r/[^\w_\s`]/, Punctuation
rule %r/_\b/, Punctuation
end
state :escapes do
rule %r/\\x[0-9a-fA-F]{1,2}/i, Str::Escape
rule %r/\\d\d{0,3}/i, Str::Escape
rule %r/\\0[0-7]{0,3}/, Str::Escape
rule %r/\\[0-7]{1,3}/, Str::Escape
rule %r/\\[nrfbtv\\"']/, Str::Escape
end
state :string do
rule %r/"/, Str::Double, :pop!
mixin :escapes
rule %r/[^\\"]+/, Str::Double
end
state :charlist do
rule %r/(')(\])/ do
groups Str::Single, Punctuation
pop!
end
mixin :escapes
rule %r/[^\\']/, Str::Single
end
state :abc_basic do
rule %r/\s+/, Text::Whitespace
rule %r/\|.*/, Comment::Single
mixin :common_literals
end
# The ABC intermediate language can be included, similar to C's inline
# assembly. For some information about ABC, see:
# https://en.wikipedia.org/wiki/Clean_(programming_language)#The_ABC-Machine
state :abc do
mixin :abc_basic
rule %r/}/, Comment::Preproc, :pop!
rule %r/\.\w*/, Keyword, :abc_rest_of_line
rule %r/[\w_]+/, Name::Builtin, :abc_rest_of_line
end
state :abc_rest_of_line do
rule %r/\n/, Text::Whitespace, :pop!
rule %r/}/ do
token Comment::Preproc
pop!
pop!
end
mixin :abc_basic
rule %r/\S+/, Name
end
end
end
end