This repository has been archived on 2024-06-20. You can view files and clone it, but you cannot make any changes to its state, such as pushing and creating new issues, pull requests or comments.
coffee.pygments/pygments/lexers/asn1.py
Jean Abou Samra 25f230191f Move versionadded data to a lexer attribute
That way, we can set it to "" for old lexers, and check that it's
present on new lexers. (In the future, we might also use it for better
presentation in the documentation.)
2023-11-26 14:51:52 +01:00

178 lines
4.2 KiB
Python

"""
pygments.lexers.asn1
~~~~~~~~~~~~~~~~~~~~
Pygments lexers for ASN.1.
:copyright: Copyright 2006-2023 by the Pygments team, see AUTHORS.
:license: BSD, see LICENSE for details.
"""
import re
from pygments.token import Comment, Operator, Keyword, Name, String, \
Number, Punctuation, Whitespace
from pygments.lexer import RegexLexer, words, bygroups
__all__ = ['Asn1Lexer']
# General single-word keywords.
SINGLE_WORD_KEYWORDS = [
    "ENCODED", "ABSTRACT-SYNTAX", "END", "APPLICATION",
    "EXPLICIT", "IMPLICIT", "AUTOMATIC", "TAGS",
    "BEGIN", "EXTENSIBILITY", "BY", "FROM",
    "COMPONENT", "UNIVERSAL", "COMPONENTS", "CONSTRAINED",
    "IMPLIED", "DEFINITIONS", "INCLUDES", "PRIVATE",
    "WITH", "OF",
]

# Set-arithmetic words, treated as word operators.
OPERATOR_WORDS = ["EXCEPT", "UNION", "INTERSECTION"]

# Keywords that introduce a module's export/import lists.
SINGLE_WORD_NAMESPACE_KEYWORDS = ["EXPORTS", "IMPORTS"]

# Declaration keywords made of two words; the separating space stands for
# any run of whitespace once passed through ``word_sequences``.
MULTI_WORDS_DECLARATIONS = [
    "SEQUENCE OF", "SET OF", "INSTANCE OF", "WITH SYNTAX",
]

# Declaration keywords made of a single word.
SINGLE_WORDS_DECLARATIONS = [
    "SIZE", "SEQUENCE", "SET", "CLASS", "UNIQUE",
    "DEFAULT", "CHOICE", "PATTERN", "OPTIONAL", "PRESENT",
    "ABSENT", "CONTAINING", "ENUMERATED", "ALL",
]

# Builtin type names made of two words.
TWO_WORDS_TYPES = [
    "OBJECT IDENTIFIER", "BIT STRING", "OCTET STRING",
    "CHARACTER STRING", "EMBEDDED PDV",
]

# Builtin type names made of a single word.
SINGLE_WORD_TYPES = [
    "RELATIVE-OID", "TYPE-IDENTIFIER", "ObjectDescriptor", "IA5String",
    "INTEGER", "ISO646String", "T61String", "BMPString",
    "NumericString", "TeletexString", "GeneralizedTime", "REAL",
    "BOOLEAN", "GeneralString", "GraphicString", "UniversalString",
    "UTCTime", "VisibleString", "UTF8String", "PrintableString",
    "VideotexString", "EXTERNAL",
]
def word_sequences(tokens):
    r"""Return a regex source string matching any phrase in *tokens*.

    Every space inside a phrase is replaced by ``\s+`` so the words may be
    separated by any run of whitespace.  The phrases are joined with ``|``
    inside one capturing group, and a trailing ``\b`` is appended.
    """
    alternatives = []
    for phrase in tokens:
        alternatives.append(phrase.replace(' ', r'\s+'))
    joined = '|'.join(alternatives)
    return f"({joined})" + r'\b'
class Asn1Lexer(RegexLexer):
    """
    Lexer for ASN.1 module definitions.

    The lexer uses three states:

    * ``root`` -- whitespace, comments, numbers, identifiers, keywords,
      operators, punctuation and the openers of strings and block comments.
    * ``comment`` -- the body of a ``/* ... */`` comment; a nested ``/*``
      pushes the state again, so block comments nest.
    * ``string`` -- the body of a double-quoted string; a doubled ``""``
      stays inside the string, a single ``"`` ends it.
    """

    # MULTILINE makes ``$`` in the line-comment rule match at each line end.
    flags = re.MULTILINE

    name = 'ASN.1'
    aliases = ['asn1']
    filenames = ["*.asn1"]
    url = "https://www.itu.int/ITU-T/studygroups/com17/languages/X.680-0207.pdf"
    version_added = '2.16'

    tokens = {
        'root': [
            # Whitespace:
            (r'\s+', Whitespace),
            # Comments:
            (r'--.*$', Comment.Single),
            (r'/\*', Comment.Multiline, 'comment'),
            # Numbers:
            # The lookahead keeps the float rule from swallowing the first
            # dot of a range such as ``1..10`` (which must lex as
            # Integer, ``..``, Integer), while still accepting ``1.``.
            (r'\d+\.(?!\.)\d*([eE][-+]?\d+)?', Number.Float),
            (r'\d+', Number.Integer),
            # Identifier:
            # The tail is optional so single-letter identifiers match too;
            # when present it must end on an alphanumeric, not a hyphen.
            (r"&?[a-z](?:[-a-zA-Z0-9]*[a-zA-Z0-9])?\b", Name.Variable),
            # Constants:
            (words(("TRUE", "FALSE", "NULL", "MINUS-INFINITY",
                    "PLUS-INFINITY", "MIN", "MAX"), suffix=r'\b'),
             Keyword.Constant),
            # Builtin types:
            # Two-word forms are tried before single words.
            (word_sequences(TWO_WORDS_TYPES), Keyword.Type),
            (words(SINGLE_WORD_TYPES, suffix=r'\b'), Keyword.Type),
            # Other keywords:
            (r"EXPORTS\s+ALL\b", Keyword.Namespace),
            # Same token type as ``EXPORTS ALL`` above.
            (words(SINGLE_WORD_NAMESPACE_KEYWORDS, suffix=r'\b'), Keyword.Namespace),
            (word_sequences(MULTI_WORDS_DECLARATIONS), Keyword.Declaration),
            (words(SINGLE_WORDS_DECLARATIONS, suffix=r'\b'), Keyword.Declaration),
            (words(OPERATOR_WORDS, suffix=r'\b'), Operator.Word),
            # The word-boundary suffix stops a keyword from matching as the
            # prefix of a longer name (e.g. ``END`` inside ``ENDPOINT``).
            (words(SINGLE_WORD_KEYWORDS, suffix=r'\b'), Keyword),
            # Type identifier:
            # Must come after the keyword rules, which are also upper-case.
            (r"&?[A-Z](?:[-a-zA-Z0-9]*[a-zA-Z0-9])?\b", Name.Type),
            # Operators:
            # Longer operators are listed first so ``...`` wins over ``..``.
            (r"(::=|\.\.\.|\.\.|\[\[|\]\]|\||\^)", Operator),
            # Punctuation:
            # ``::=`` is consumed by the operator rule above, so a lone
            # ``:`` reaching this rule is plain punctuation.
            (r"(\.|,|;|:|\{|\}|\(|\)|\[|\])", Punctuation),
            # String:
            (r'"', String, 'string'),
            # Binary string:
            (r"('[01 ]*')(B)\b", bygroups(String, String.Affix)),
            # Hexadecimal string:
            (r"('[0-9A-F ]*')(H)\b", bygroups(String, String.Affix)),
        ],
        'comment': [
            (r'[^*/]+', Comment.Multiline),
            # A nested opener pushes this state again.
            (r'/\*', Comment.Multiline, '#push'),
            (r'\*/', Comment.Multiline, '#pop'),
            # A lone ``*`` or ``/`` that is not part of a delimiter.
            (r'[*/]', Comment.Multiline),
        ],
        'string': [
            # A doubled quote stays inside the string.
            (r'""', String),
            (r'"', String, "#pop"),
            (r'[^"]', String),
        ],
    }