| """ |
| pygments.lexers.rust |
| ~~~~~~~~~~~~~~~~~~~~ |
| |
| Lexers for the Rust language. |
| |
| :copyright: Copyright 2006-2023 by the Pygments team, see AUTHORS. |
| :license: BSD, see LICENSE for details. |
| """ |
| |
| from pygments.lexer import RegexLexer, include, bygroups, words, default |
| from pygments.token import Text, Comment, Operator, Keyword, Name, String, \ |
| Number, Punctuation, Whitespace |
| |
| __all__ = ['RustLexer'] |
| |
| |
| class RustLexer(RegexLexer): |
| """ |
| Lexer for the Rust programming language (version 1.47). |
| |
| .. versionadded:: 1.6 |
| """ |
| name = 'Rust' |
| url = 'https://www.rust-lang.org/' |
| filenames = ['*.rs', '*.rs.in'] |
| aliases = ['rust', 'rs'] |
| mimetypes = ['text/rust', 'text/x-rust'] |
| |
| keyword_types = (words(( |
| 'u8', 'u16', 'u32', 'u64', 'u128', 'i8', 'i16', 'i32', 'i64', 'i128', |
| 'usize', 'isize', 'f32', 'f64', 'char', 'str', 'bool', |
| ), suffix=r'\b'), Keyword.Type) |
| |
| builtin_funcs_types = (words(( |
| 'Copy', 'Send', 'Sized', 'Sync', 'Unpin', |
| 'Drop', 'Fn', 'FnMut', 'FnOnce', 'drop', |
| 'Box', 'ToOwned', 'Clone', |
| 'PartialEq', 'PartialOrd', 'Eq', 'Ord', |
| 'AsRef', 'AsMut', 'Into', 'From', 'Default', |
| 'Iterator', 'Extend', 'IntoIterator', 'DoubleEndedIterator', |
| 'ExactSizeIterator', |
| 'Option', 'Some', 'None', |
| 'Result', 'Ok', 'Err', |
| 'String', 'ToString', 'Vec', |
| ), suffix=r'\b'), Name.Builtin) |
| |
| builtin_macros = (words(( |
| 'asm', 'assert', 'assert_eq', 'assert_ne', 'cfg', 'column', |
| 'compile_error', 'concat', 'concat_idents', 'dbg', 'debug_assert', |
| 'debug_assert_eq', 'debug_assert_ne', 'env', 'eprint', 'eprintln', |
| 'file', 'format', 'format_args', 'format_args_nl', 'global_asm', |
| 'include', 'include_bytes', 'include_str', |
| 'is_aarch64_feature_detected', |
| 'is_arm_feature_detected', |
| 'is_mips64_feature_detected', |
| 'is_mips_feature_detected', |
| 'is_powerpc64_feature_detected', |
| 'is_powerpc_feature_detected', |
| 'is_x86_feature_detected', |
| 'line', 'llvm_asm', 'log_syntax', 'macro_rules', 'matches', |
| 'module_path', 'option_env', 'panic', 'print', 'println', 'stringify', |
| 'thread_local', 'todo', 'trace_macros', 'unimplemented', 'unreachable', |
| 'vec', 'write', 'writeln', |
| ), suffix=r'!'), Name.Function.Magic) |
| |
| tokens = { |
| 'root': [ |
| # rust allows a file to start with a shebang, but if the first line |
| # starts with #![ then it's not a shebang but a crate attribute. |
| (r'#![^[\r\n].*$', Comment.Preproc), |
| default('base'), |
| ], |
| 'base': [ |
| # Whitespace and Comments |
| (r'\n', Whitespace), |
| (r'\s+', Whitespace), |
| (r'//!.*?\n', String.Doc), |
| (r'///(\n|[^/].*?\n)', String.Doc), |
| (r'//(.*?)\n', Comment.Single), |
| (r'/\*\*(\n|[^/*])', String.Doc, 'doccomment'), |
| (r'/\*!', String.Doc, 'doccomment'), |
| (r'/\*', Comment.Multiline, 'comment'), |
| |
| # Macro parameters |
| (r"""\$([a-zA-Z_]\w*|\(,?|\),?|,?)""", Comment.Preproc), |
| # Keywords |
| (words(('as', 'async', 'await', 'box', 'const', 'crate', 'dyn', |
| 'else', 'extern', 'for', 'if', 'impl', 'in', 'loop', |
| 'match', 'move', 'mut', 'pub', 'ref', 'return', 'static', |
| 'super', 'trait', 'unsafe', 'use', 'where', 'while'), |
| suffix=r'\b'), Keyword), |
| (words(('abstract', 'become', 'do', 'final', 'macro', 'override', |
| 'priv', 'typeof', 'try', 'unsized', 'virtual', 'yield'), |
| suffix=r'\b'), Keyword.Reserved), |
| (r'(true|false)\b', Keyword.Constant), |
| (r'self\b', Name.Builtin.Pseudo), |
| (r'mod\b', Keyword, 'modname'), |
| (r'let\b', Keyword.Declaration), |
| (r'fn\b', Keyword, 'funcname'), |
| (r'(struct|enum|type|union)\b', Keyword, 'typename'), |
| (r'(default)(\s+)(type|fn)\b', bygroups(Keyword, Text, Keyword)), |
| keyword_types, |
| (r'[sS]elf\b', Name.Builtin.Pseudo), |
| # Prelude (taken from Rust's src/libstd/prelude.rs) |
| builtin_funcs_types, |
| builtin_macros, |
| # Path separators, so types don't catch them. |
| (r'::\b', Text), |
| # Types in positions. |
| (r'(?::|->)', Text, 'typename'), |
| # Labels |
| (r'(break|continue)(\b\s*)(\'[A-Za-z_]\w*)?', |
| bygroups(Keyword, Text.Whitespace, Name.Label)), |
| |
| # Character literals |
| (r"""'(\\['"\\nrt]|\\x[0-7][0-9a-fA-F]|\\0""" |
| r"""|\\u\{[0-9a-fA-F]{1,6}\}|.)'""", |
| String.Char), |
| (r"""b'(\\['"\\nrt]|\\x[0-9a-fA-F]{2}|\\0""" |
| r"""|\\u\{[0-9a-fA-F]{1,6}\}|.)'""", |
| String.Char), |
| |
| # Binary literals |
| (r'0b[01_]+', Number.Bin, 'number_lit'), |
| # Octal literals |
| (r'0o[0-7_]+', Number.Oct, 'number_lit'), |
| # Hexadecimal literals |
| (r'0[xX][0-9a-fA-F_]+', Number.Hex, 'number_lit'), |
| # Decimal literals |
| (r'[0-9][0-9_]*(\.[0-9_]+[eE][+\-]?[0-9_]+|' |
| r'\.[0-9_]*(?!\.)|[eE][+\-]?[0-9_]+)', Number.Float, |
| 'number_lit'), |
| (r'[0-9][0-9_]*', Number.Integer, 'number_lit'), |
| |
| # String literals |
| (r'b"', String, 'bytestring'), |
| (r'"', String, 'string'), |
| (r'(?s)b?r(#*)".*?"\1', String), |
| |
| # Lifetime names |
| (r"'", Operator, 'lifetime'), |
| |
| # Operators and Punctuation |
| (r'\.\.=?', Operator), |
| (r'[{}()\[\],.;]', Punctuation), |
| (r'[+\-*/%&|<>^!~@=:?]', Operator), |
| |
| # Identifiers |
| (r'[a-zA-Z_]\w*', Name), |
| # Raw identifiers |
| (r'r#[a-zA-Z_]\w*', Name), |
| |
| # Attributes |
| (r'#!?\[', Comment.Preproc, 'attribute['), |
| |
| # Misc |
| # Lone hashes: not used in Rust syntax, but allowed in macro |
| # arguments, most famously for quote::quote!() |
| (r'#', Text), |
| ], |
| 'comment': [ |
| (r'[^*/]+', Comment.Multiline), |
| (r'/\*', Comment.Multiline, '#push'), |
| (r'\*/', Comment.Multiline, '#pop'), |
| (r'[*/]', Comment.Multiline), |
| ], |
| 'doccomment': [ |
| (r'[^*/]+', String.Doc), |
| (r'/\*', String.Doc, '#push'), |
| (r'\*/', String.Doc, '#pop'), |
| (r'[*/]', String.Doc), |
| ], |
| 'modname': [ |
| (r'\s+', Text), |
| (r'[a-zA-Z_]\w*', Name.Namespace, '#pop'), |
| default('#pop'), |
| ], |
| 'funcname': [ |
| (r'\s+', Text), |
| (r'[a-zA-Z_]\w*', Name.Function, '#pop'), |
| default('#pop'), |
| ], |
| 'typename': [ |
| (r'\s+', Text), |
| (r'&', Keyword.Pseudo), |
| (r"'", Operator, 'lifetime'), |
| builtin_funcs_types, |
| keyword_types, |
| (r'[a-zA-Z_]\w*', Name.Class, '#pop'), |
| default('#pop'), |
| ], |
| 'lifetime': [ |
| (r"(static|_)", Name.Builtin), |
| (r"[a-zA-Z_]+\w*", Name.Attribute), |
| default('#pop'), |
| ], |
| 'number_lit': [ |
| (r'[ui](8|16|32|64|size)', Keyword, '#pop'), |
| (r'f(32|64)', Keyword, '#pop'), |
| default('#pop'), |
| ], |
| 'string': [ |
| (r'"', String, '#pop'), |
| (r"""\\['"\\nrt]|\\x[0-7][0-9a-fA-F]|\\0""" |
| r"""|\\u\{[0-9a-fA-F]{1,6}\}""", String.Escape), |
| (r'[^\\"]+', String), |
| (r'\\', String), |
| ], |
| 'bytestring': [ |
| (r"""\\x[89a-fA-F][0-9a-fA-F]""", String.Escape), |
| include('string'), |
| ], |
| 'attribute_common': [ |
| (r'"', String, 'string'), |
| (r'\[', Comment.Preproc, 'attribute['), |
| ], |
| 'attribute[': [ |
| include('attribute_common'), |
| (r'\]', Comment.Preproc, '#pop'), |
| (r'[^"\]\[]+', Comment.Preproc), |
| ], |
| } |