diff options
| -rw-r--r-- | lexers/crystal.lua | 142 | ||||
| -rw-r--r-- | vis.lua | 1 |
2 files changed, 143 insertions, 0 deletions
diff --git a/lexers/crystal.lua b/lexers/crystal.lua new file mode 100644 index 0000000..4af2fef --- /dev/null +++ b/lexers/crystal.lua @@ -0,0 +1,142 @@ +-- Copyright 2006-2016 Mitchell mitchell.att.foicica.com. See LICENSE. +-- Copyright 2016 Michel Martens. +-- Crystal LPeg lexer (based on Ruby). + +local l = require('lexer') +local token, word_match = l.token, l.word_match +local P, R, S = lpeg.P, lpeg.R, lpeg.S + +local M = {_NAME = 'crystal'} + +-- Whitespace. +local ws = token(l.WHITESPACE, l.space^1) + +-- Comments. +local line_comment = '#' * l.nonnewline_esc^0 +local comment = token(l.COMMENT, line_comment) + +local delimiter_matches = {['('] = ')', ['['] = ']', ['{'] = '}'} +local literal_delimitted = P(function(input, index) + local delimiter = input:sub(index, index) + if not delimiter:find('[%w\r\n\f\t ]') then -- only non alpha-numerics + local match_pos, patt + if delimiter_matches[delimiter] then + -- Handle nested delimiter/matches in strings. + local s, e = delimiter, delimiter_matches[delimiter] + patt = l.delimited_range(s..e, false, false, true) + else + patt = l.delimited_range(delimiter) + end + match_pos = lpeg.match(patt, input, index) + return match_pos or #input + 1 + end +end) + +-- Strings. +local cmd_str = l.delimited_range('`') +local sq_str = l.delimited_range("'") +local dq_str = l.delimited_range('"') +local heredoc = '<<' * P(function(input, index) + local s, e, indented, _, delimiter = + input:find('(%-?)(["`]?)([%a_][%w_]*)%2[\n\r\f;]+', index) + if s == index and delimiter then + local end_heredoc = (#indented > 0 and '[\n\r\f]+ *' or '[\n\r\f]+') + local _, e = input:find(end_heredoc..delimiter, e) + return e and e + 1 or #input + 1 + end +end) +-- TODO: regex_str fails with `obj.method /patt/` syntax. +local regex_str = #P('/') * l.last_char_includes('!%^&*([{-=+|:;,?<>~') * + l.delimited_range('/', true, false) * S('iomx')^0 +local string = token(l.STRING, (sq_str + dq_str + heredoc + cmd_str) * S('f')^-1) + + token(l.REGEX, regex_str) + +local word_char = l.alnum + S('_!?') + +-- Numbers. +local dec = l.digit^1 * ('_' * l.digit^1)^0 * S('ri')^-1 +local bin = '0b' * S('01')^1 * ('_' * S('01')^1)^0 +local integer = S('+-')^-1 * (bin + l.hex_num + l.oct_num + dec) +-- TODO: meta, control, etc. for numeric_literal. +local numeric_literal = '?' * (l.any - l.space) * -word_char +local number = token(l.NUMBER, l.float * S('ri')^-1 + integer + numeric_literal) + +-- Keywords. +local keyword = token(l.KEYWORD, word_match({ + 'alias', 'begin', 'break', 'case', 'class', 'def', 'defined?', + 'do', 'else', 'elsif', 'end', 'ensure', 'false', 'for', 'if', + 'in', 'module', 'next', 'nil', 'not', 'redo', 'rescue', 'retry', + 'return', 'self', 'super', 'then', 'true', 'undef', 'unless', + 'until', 'when', 'while', 'yield', '__FILE__', '__LINE__' +}, '?!')) + +-- Functions. +local func = token(l.FUNCTION, word_match({ + 'abort', 'at_exit', 'caller', 'delay', 'exit', 'fork', 'future', + 'get_stack_top', 'gets', 'lazy', 'loop', 'main', 'p', 'print', + 'printf', 'puts', 'raise', 'rand', 'read_line', 'require', 'sleep', + 'spawn', 'sprintf', 'system', 'with_color', + -- Macros + 'assert_responds_to', 'debugger', 'parallel', 'pp', 'record', + 'redefine_main' +}, '?!')) * -S('.:|') + +-- Identifiers. +local word = (l.alpha + '_') * word_char^0 +local identifier = token(l.IDENTIFIER, word) + +-- Variables. +local global_var = '$' * (word + S('!@L+`\'=~/\\,.;<>_*"$?:') + l.digit + '-' * + S('0FadiIKlpvw')) +local class_var = '@@' * word +local inst_var = '@' * word +local variable = token(l.VARIABLE, global_var + class_var + inst_var) + +-- Symbols. +local symbol = token('symbol', ':' * P(function(input, index) + if input:sub(index - 2, index - 2) ~= ':' then return index end +end) * (word_char^1 + sq_str + dq_str)) + +-- Operators. +local operator = token(l.OPERATOR, S('!%^&*()[]{}-=+/|:;.,?<>~')) + +M._rules = { + {'whitespace', ws}, + {'keyword', keyword}, + {'function', func}, + {'identifier', identifier}, + {'comment', comment}, + {'string', string}, + {'number', number}, + {'variable', variable}, + {'symbol', symbol}, + {'operator', operator}, +} + +M._tokenstyles = { + symbol = l.STYLE_CONSTANT +} + +local function disambiguate(text, pos, line, s) + return line:sub(1, s - 1):match('^%s*$') and + not text:sub(1, pos - 1):match('\\[ \t]*\r?\n$') and 1 or 0 +end + +M._foldsymbols = { + _patterns = {'%l+', '[%(%)%[%]{}]', '#'}, + [l.KEYWORD] = { + begin = 1, class = 1, def = 1, ['do'] = 1, ['for'] = 1, ['module'] = 1, + case = 1, + ['if'] = disambiguate, ['while'] = disambiguate, + ['unless'] = disambiguate, ['until'] = disambiguate, + ['end'] = -1 + }, + [l.OPERATOR] = { + ['('] = 1, [')'] = -1, ['['] = 1, [']'] = -1, ['{'] = 1, ['}'] = -1 + }, + [l.COMMENT] = { + ['#'] = l.fold_line_comments('#') + } +} + +return M @@ -98,6 +98,7 @@ vis.filetypes = { [".cmake|.cmake.in|.ctest|.ctest.in"] = "cmake", [".coffee"] = "coffeescript", [".cpp|.cxx|.c++|.cc|.hh|.hpp|.hxx|.h++"] = "cpp", + [".cr"] = "crystal", [".cs"] = "csharp", [".css"] = "css", [".cu|.cuh"] = "cuda", |
