from pygments.lexer import RegexLexer, bygroups from pygments.token import * class DataSpecLexer(RegexLexer): name = 'DataSpec' aliases = ['dataspec'] filenames = [] tokens = { 'root': [ (r'(\s*)(\+-)', bygroups(Text, Text), 'boundary'), (r'(\s+)([\+|])', bygroups(Text, Text), 'content'), (r'~', Generic.Strong, 'content'), (r'(\s*)([\w=;]+)(\s)(::)(\s)', bygroups(Text, Name.Tag, Text, Operator, Text), 'definition'), ], 'boundary': [ (r'---\+$', Text, '#pop'), (r'(//)(-\+)?$', bygroups(Generic.Strong, Text), '#pop'), (r'---\+-', Text), (r'---\+\s', Text, '#pop', 'content'), (r'(//)(-\+-)', bygroups(Generic.Strong, Text)), ], 'content': [ (r'(\s*)([\+|])$', bygroups(Text, Text), '#pop'), (r'(\s*)(\.\.\.)$', bygroups(Text, Generic.Strong), '#pop'), (r'(\s*)(~)$', bygroups(Text, Generic.Strong), '#pop'), (r'(\s*)([\w=;]+)$', bygroups(Text, Name.Tag), '#pop'), (r'(\s*)([\w=;]+)', bygroups(Text, Name.Tag)), (r'(\s*)(\|)', bygroups(Text, Text)), (r'(\s*)(\()', bygroups(Text, Punctuation), 'expression'), ], 'expression': [ (r'(\s*)(\))', bygroups(Text, Punctuation), '#pop'), (r'(\s*)([+-])', bygroups(Text, Operator)), (r'(\s*)(\$\w+)', bygroups(Text, Name.Tag)), (r'(\s*)(\w+)', bygroups(Text, Name)), ], 'definition': [ (r'(\s*)([\w=;]+)(\s)(::)(\s)', bygroups(Text, Name.Tag, Text, Operator, Text)), (r'(\s*)((?:[A-Z][a-z]+)+)', bygroups(Text, Name.Class)), (r'(\s*)([A-Z]{2,})', bygroups(Text, Name.Constant)), (r'(\s*)([\[\]])', bygroups(Text, Punctuation)), (r'(\s*)(\$\w+)', bygroups(Text, Name.Tag)), (r'(\s*)([0-9]+)(\+)?', bygroups(Text, Number, Punctuation)), (r'(-)([0-9]+)', bygroups(Punctuation, Number)), (r'(\s*)(->|<=|>=|\*)', bygroups(Text, Operator)), (r'(\s*)([\w()-=\'<>]+)', bygroups(Text, Comment)), ], }