Python/libs/pygments-lexer-pseudocode2: pygments_lexer_pseudocode2/algpseudocode.py comparison

comparison pygments_lexer_pseudocode2/algpseudocode.py @ 84:3ac1c4502ad0

Implement "\tt-XXX" and "ttx-XXX" for explicit token types. Overwrite defaults or implement tokens that are not yet handled by default.

author	Franz Glasner <fzglas.hg@dom66.de>
date	Thu, 30 Apr 2026 19:37:24 +0200
parents	cd79d2c76347
children	ae5e741d2a9b

comparison

equal deleted inserted replaced

-:cd79d2c76347
+:3ac1c4502ad0
 import re
 import pygments.util
 from pygments.lexer import bygroups, include, words
 from pygments.token import (Comment, Keyword, Name, Operator, Punctuation,
-Text, Whitespace)
+Text, Whitespace,
+STANDARD_TYPES)
 #
 # Relative imports do not work with pygments.lexers.load_lexer_from_file()
 # in all of our supported Python releases.
 #
 yield match.start(), toktype, lexer.SYMBOLS.get(kw, kw)
 if ctx:
 ctx.pos = match.end()
 return _op_symbol
+def op_explicit_tokentype(lexer, match, ctx=None):
+needed_css = match.group("type")
+for ttype, css in STANDARD_TYPES.items():
+if css == needed_css:
+toktype = ttype
+break
+else:
+toktype = Text
+yield match.start(), toktype, match.group("character")
+if ctx:
+ctx.pos = match.end()
 tokens = {
 "root": [
 (r"\n", Whitespace),
 (r"/\*", Comment.Multiline, "multiline-nested-comment"),
 "expr": [
 include("punctuation"),
 include("py-strings"),
 include("py-numbers"),
 (r"(?i)\\text\s*\{", LexBase.op_ignore, "text-in-expr"),
+include("explicit-tokentype"),
 include("remark"),
 include("keyword-constants"),
 include("text-operators"),
 include("math-builtins"),
 include("py-name"),
 "expr-in-braces": [
 include("punctuation-in-braces"),
 include("py-strings"),
 include("py-numbers"),
 (r"(?i)\\text\s*\{", LexBase.op_ignore, "text-in-expr"),
+include("explicit-tokentype"),
 include("remark"),
 include("keyword-constants"),
 include("text-operators"),
 include("math-builtins"),
 include("py-name"),
 (r"\n", Whitespace),
 (r"\\\}", LexBase.op_fixed(Text, "}")),
 (r"(?i)\\expr(?:ession)?\s*\{",
 LexBase.op_ignore,
 "block-expr"),
+include("explicit-tokentype"),
 include("remark"),
 (r"\\\\", LexBase.op_fixed(Text, "\\")),
 (r"\\", LexBase.op_fixed(Text, "\\")),
 ],
 "text-in-expr": [
 (r"\n", Whitespace),
 (r"\\\}", LexBase.op_fixed(Text, "}")),
 (r"(?:i)\\(expr(?:ession)?)\s*(\{)",
 bygroups(LexBase.op_ignore, LexBase.op_ignore),
 "expr-in-braces"),
+include("explicit-tokentype"),
 (r"\\\\", LexBase.op_fixed(Text, "\\")),
 (r"\\", LexBase.op_fixed(Text, "\\")),
 ],
 "math-builtins": [
 (words(("sqrt", "pow", "cos", "sin", "tan", "arcos", "arcsin",
 ],
 "punctuation-in-braces": [
 # like "punctuation" but needs an escaped curly brace for }
 (r"\\\}", LexBase.op_fixed(Punctuation, "}")),
 (r"[{:(),;[\]]", Punctuation),
+],
+"explicit-tokentype": [
+# All these REs are CASE-SENSITIVE!
+# Multiple characters possible, but no escaping!
+(r"\\ttx\-(?P<type>[^/:|=*+!\$~]+)(?P<sep>[/:|=*+!\$~])"
+r"(?P<character>(.|\n)+?)(?P=sep)",
+op_explicit_tokentype),
+(r"\\ttx\-(?P<type>[^{]+)\{"
+r"(?P<character>[^}]+?)\}",
+op_explicit_tokentype),
+(r"\\ttx\-(?P<type>[^\(]+)\("
+r"(?P<character>[^\)]+?)\)",
+op_explicit_tokentype),
+(r"\\ttx\-(?P<type>[^<]+)<"
+r"(?P<character>[^>]+?)>",
+op_explicit_tokentype),
+# Every character is possible: no escaping needed!
+(r"\\tt-(?P<type>[^/]+)/(?P<character>(?:.|\n))",
+op_explicit_tokentype),
 ],
 }
 def __init__(self, **options):
 val = pygments.util.get_bool_opt(options, "no_end", default=False)

Mercurial > hgrepos > Python > libs > pygments-lexer-pseudocode2

comparison pygments_lexer_pseudocode2/algpseudocode.py @ 84:3ac1c4502ad0