rust.lua (3399B)
- -- Copyright 2015-2024 Alejandro Baez (https://keybase.io/baez). See LICENSE.
- -- Rust LPeg lexer.
- local lexer = lexer
- local P, S = lpeg.P, lpeg.S
- local C, Cmt = lpeg.C, lpeg.Cmt
- local lex = lexer.new(...)
- -- Keywords.
- lex:add_rule('keyword', lex:tag(lexer.KEYWORD, lex:word_match(lexer.KEYWORD)))
- -- Library types.
- lex:add_rule('library', lex:tag(lexer.TYPE, lexer.upper * (lexer.lower + lexer.dec_num)^1))
- -- Types.
- lex:add_rule('type', lex:tag(lexer.TYPE, lex:word_match(lexer.TYPE)))
- -- Lifetime annotation.
- lex:add_rule('lifetime', lex:tag(lexer.OPERATOR, S('<&') * P("'")))
- -- Strings.
- local sq_str = P('b')^-1 * lexer.range("'", true)
- local dq_str = P('b')^-1 * lexer.range('"')
- local raw_str = Cmt(P('b')^-1 * P('r') * C(P('#')^0) * '"', function(input, index, hashes)
- local _, e = input:find('"' .. hashes, index, true)
- return (e or #input) + 1
- end)
- lex:add_rule('string', lex:tag(lexer.STRING, sq_str + dq_str + raw_str))
- -- Functions.
- local builtin_macros = lex:tag(lexer.FUNCTION_BUILTIN, lex:word_match(lexer.FUNCTION_BUILTIN) * '!')
- local macros = lex:tag(lexer.FUNCTION, lexer.word * '!')
- local func = lex:tag(lexer.FUNCTION, lexer.word)
- lex:add_rule('function', (builtin_macros + macros + func) * #(lexer.space^0 * '('))
- -- Identifiers.
- local identifier = P('r#')^-1 * lexer.word
- lex:add_rule('identifier', lex:tag(lexer.IDENTIFIER, identifier))
- -- Comments.
- local line_comment = lexer.to_eol('//', true)
- local block_comment = lexer.range('/*', '*/', false, false, true)
- lex:add_rule('comment', lex:tag(lexer.COMMENT, line_comment + block_comment))
- -- Numbers.
- lex:add_rule('number', lex:tag(lexer.NUMBER, lexer.number_('_')))
- -- Attributes.
- lex:add_rule('preprocessor', lex:tag(lexer.PREPROCESSOR, '#' * lexer.range('[', ']', true)))
- -- Operators.
- lex:add_rule('operator', lex:tag(lexer.OPERATOR, S('+-/*%<>!=`^~@&|?#~:;,.()[]{}')))
- -- Fold points.
- lex:add_fold_point(lexer.COMMENT, '/*', '*/')
- lex:add_fold_point(lexer.OPERATOR, '(', ')')
- lex:add_fold_point(lexer.OPERATOR, '{', '}')
- -- https://doc.rust-lang.org/std/#keywords
- lex:set_word_list(lexer.KEYWORD, {
- 'SelfTy', 'as', 'async', 'await', 'break', 'const', 'continue', 'crate', 'dyn', 'else', 'enum',
- 'extern', 'false', 'fn', 'for', 'if', 'impl', 'in', 'let', 'loop', 'match', 'mod', 'move', 'mut',
- 'pub', 'ref', 'return', 'self', 'static', 'struct', 'super', 'trait', 'true', 'type', 'union',
- 'unsafe', 'use', 'where', 'while'
- })
- -- https://doc.rust-lang.org/std/#primitives
- lex:set_word_list(lexer.TYPE, {
- 'never', 'array', 'bool', 'char', 'f32', 'f64', 'fn', 'i8', 'i16', 'i32', 'i64', 'i128', 'isize',
- 'pointer', 'reference', 'slice', 'str', 'tuple', 'u8', 'u16', 'u32', 'u64', 'u128', 'unit',
- 'usize'
- })
- lex:set_word_list(lexer.FUNCTION_BUILTIN, {
- 'assert', 'assert_eq', 'assert_ne', 'cfg', 'column', 'compile_error', 'concat', 'dbg',
- 'debug_assert', 'debug_assert_eq', 'debug_assert_ne', 'env', 'eprint', 'eprintln', 'file',
- 'format', 'format_args', 'include', 'include_bytes', 'include_str', 'line', 'matches',
- 'module_path', 'option_env', 'panic', 'print', 'println', 'stringify', 'thread_local', 'todo',
- 'unimplemented', 'unreachable', 'vec', 'write', 'writeln',
- -- Experimental
- 'concat_bytes', 'concat_idents', 'const_format_args', 'format_args_nl', 'log_syntax',
- 'trace_macros',
- -- Deprecated
- 'try'
- })
- lexer.property['scintillua.comment'] = '//'
- return lex