class Dentaku::TokenScanner
def access
def access names = { lbracket: '[', rbracket: ']' }.invert new(:access, '\[|\]', lambda { |raw| names[raw] }) end
def array
def array names = { array_start: '{', array_end: '}', }.invert new(:array, '\{|\}|,', lambda { |raw| names[raw] }) end
def available_scanners
def available_scanners [ :null, :whitespace, :datetime, # before numeric so it can pick up timestamps :numeric, :hexadecimal, :double_quoted_string, :single_quoted_string, :negate, :combinator, :operator, :grouping, :array, :access, :case_statement, :comparator, :boolean, :function, :identifier, :quoted_identifier ] end
def boolean
def boolean new(:logical, '(true|false)\b', lambda { |raw| raw.strip.downcase == 'true' }) end
def case_statement
def case_statement names = { open: 'case', close: 'end', then: 'then', when: 'when', else: 'else' }.invert new(:case, '(case|end|then|when|else)\b', lambda { |raw| names[raw.downcase] }) end
def combinator
def combinator names = { and: '&&', or: '||' }.invert new(:combinator, '(and|or|&&|\|\|)\s', lambda { |raw| norm = raw.strip.downcase names.fetch(norm) { norm.to_sym } }) end
def comparator
def comparator names = { le: '<=', ge: '>=', ne: '!=', lt: '<', gt: '>', eq: '=' }.invert alternate = { ne: '<>', eq: '==' }.invert new(:comparator, '<=|>=|!=|<>|<|>|==|=', lambda { |raw| names[raw] || alternate[raw] }) end
def datetime
def datetime new(:datetime, DATE_TIME_REGEXP, lambda { |raw| Time.parse(raw).to_datetime }) end
def double_quoted_string
def double_quoted_string new(:string, '"[^"]*"', lambda { |raw| raw.gsub(/^"|"$/, '') }) end
def function
def function new(:function, '\w+!?\s*\(', lambda do |raw| function_name = raw.gsub('(', '') [ Token.new(:function, function_name.strip.downcase.to_sym, function_name), Token.new(:grouping, :open, '(') ] end) end
def grouping
def grouping names = { open: '(', close: ')', comma: ',' }.invert new(:grouping, '\(|\)|,', lambda { |raw| names[raw] }) end
def hexadecimal
def hexadecimal new(:numeric, '(0x[0-9a-f]+)\b', lambda { |raw| raw[2..-1].to_i(16) }) end
def identifier
def identifier new(:identifier, '[[[:word:]]\.]+\b', lambda { |raw| standardize_case(raw.strip) }) end
def initialize(category, regexp, converter = nil, condition = nil)
def initialize(category, regexp, converter = nil, condition = nil) @category = category @regexp = %r{\A(#{ regexp })}i @converter = converter @condition = condition || ->(*) { true } end
def negate
def negate new(:operator, '-', lambda { |raw| :negate }, lambda { |last_token| last_token.nil? || last_token.is?(:operator) || last_token.is?(:comparator) || last_token.is?(:combinator) || last_token.value == :open || last_token.value == :comma }) end
def null
def null new(:null, 'null\b') end
def numeric
def numeric new(:numeric, '((?:\d+(\.\d+)?|\.\d+)(?:(e|E)(\+|-)?\d+)?)\b', lambda { |raw| raw =~ /(\.|e|E)/ ? BigDecimal(raw) : raw.to_i }) end
def operator
def operator names = { pow: '^', add: '+', subtract: '-', multiply: '*', divide: '/', mod: '%', bitor: '|', bitand: '&', bitshiftleft: '<<', bitshiftright: '>>' }.invert new(:operator, '\^|\+|-|\*|\/|%|\||&|<<|>>', lambda { |raw| names[raw] }) end
def quoted_identifier
def quoted_identifier new(:identifier, '`[^`]*`', lambda { |raw| raw.gsub(/^`|`$/, '') }) end
def register_default_scanners
def register_default_scanners register_scanners(available_scanners) end
def register_scanner(id, scanner)
def register_scanner(id, scanner) @scanners[id] = scanner end
def register_scanners(scanner_ids)
def register_scanners(scanner_ids) @scanners = scanner_ids.each_with_object({}) do |id, scanners| scanners[id] = self.send(id) end end
def scan(string, last_token = nil)
def scan(string, last_token = nil) if (m = @regexp.match(string)) && @condition.call(last_token) value = raw = m.to_s value = @converter.call(raw) if @converter return Array(value).map do |v| Token === v ? v : Token.new(@category, v, raw) end end false end
def scanners(options = {})
def scanners(options = {}) @case_sensitive = options.fetch(:case_sensitive, false) raw_date_literals = options.fetch(:raw_date_literals, true) @scanners.select { |k, _| raw_date_literals || k != :datetime }.values end
def scanners=(scanner_ids)
def scanners=(scanner_ids) @scanners.select! { |k, v| scanner_ids.include?(k) } end
def single_quoted_string
def single_quoted_string new(:string, "'[^']*'", lambda { |raw| raw.gsub(/^'|'$/, '') }) end
def whitespace
def whitespace new(:whitespace, '\s+') end