# Abbreviation Extension for Python-Markdown # ========================================== # This extension adds abbreviation handling to Python-Markdown. # See https://Python-Markdown.github.io/extensions/abbreviations # for documentation. # Original code Copyright 2007-2008 [Waylan Limberg](http://achinghead.com/) # and [Seemant Kulleen](http://www.kulleen.org/) # All changes Copyright 2008-2014 The Python Markdown Project # License: [BSD](https://opensource.org/licenses/bsd-license.php) """ This extension adds abbreviation handling to Python-Markdown. See the [documentation](https://Python-Markdown.github.io/extensions/abbreviations) for details. """ from __future__ import annotations from . import Extension from ..blockprocessors import BlockProcessor from ..inlinepatterns import InlineProcessor from ..util import AtomicString import re import xml.etree.ElementTree as etree class AbbrExtension(Extension): """ Abbreviation Extension for Python-Markdown. """ def extendMarkdown(self, md): """ Insert `AbbrPreprocessor` before `ReferencePreprocessor`. """ md.parser.blockprocessors.register(AbbrPreprocessor(md.parser), 'abbr', 16) class AbbrPreprocessor(BlockProcessor): """ Abbreviation Preprocessor - parse text for abbr references. """ RE = re.compile(r'^[*]\[(?P[^\\]*?)\][ ]?:[ ]*\n?[ ]*(?P.*)$', re.MULTILINE) def test(self, parent: etree.Element, block: str) -> bool: return True def run(self, parent: etree.Element, blocks: list[str]) -> bool: """ Find and remove all Abbreviation references from the text. Each reference is set as a new `AbbrPattern` in the markdown instance. """ block = blocks.pop(0) m = self.RE.search(block) if m: abbr = m.group('abbr').strip() title = m.group('title').strip() self.parser.md.inlinePatterns.register( AbbrInlineProcessor(self._generate_pattern(abbr), title), 'abbr-%s' % abbr, 2 ) if block[m.end():].strip(): # Add any content after match back to blocks as separate block blocks.insert(0, block[m.end():].lstrip('\n')) if block[:m.start()].strip(): # Add any content before match back to blocks as separate block blocks.insert(0, block[:m.start()].rstrip('\n')) return True # No match. Restore block. blocks.insert(0, block) return False def _generate_pattern(self, text: str) -> str: """ Given a string, returns a regex pattern to match that string. """ return f"(?P<abbr>\\b{ re.escape(text) }\\b)" class AbbrInlineProcessor(InlineProcessor): """ Abbreviation inline pattern. """ def __init__(self, pattern: str, title: str): super().__init__(pattern) self.title = title def handleMatch(self, m: re.Match[str], data: str) -> tuple[etree.Element, int, int]: abbr = etree.Element('abbr') abbr.text = AtomicString(m.group('abbr')) abbr.set('title', self.title) return abbr, m.start(0), m.end(0) def makeExtension(**kwargs): # pragma: no cover return AbbrExtension(**kwargs)