handle links which use the <> construct to encode blank spaces

2024-07-30 22:12:33 -06:00 · 2024-07-30 22:12:33 -06:00 · 4facd16452
commit 4facd16452
parent b293684fb7
2 changed files with 56 additions and 1 deletions
--- a/src/dragonglass/dragonglass.py
+++ b/src/dragonglass/dragonglass.py
@ -31,7 +31,6 @@ def main() -> int:
        return 1
    context.load_config(args)
    tenv = create_template_environment(context)
    nodes = generate_list(context.source_dir)
    for node in nodes:
@ -57,6 +56,7 @@ def main() -> int:
    if not dest_dir.exists():
        dest_dir.mkdir()
    tenv = create_template_environment(context)
    for node in nodes:
        p = node.target_file(dest_dir)
--- a/src/dragonglass/mparse.py
+++ b/src/dragonglass/mparse.py
@ -4,6 +4,7 @@ import re
 import xml.etree.ElementTree as etree  # noqa: N813
 from typing import Any
 from urllib.parse import unquote as urlunquote
 from urllib.parse import quote as urlquote
 from urllib.parse import urlparse
 import markdown
@ -61,7 +62,17 @@ class MetaStripper(Extension):
    """
    class MetaStripperProc(Preprocessor):
        """The actual metadata stripper."""
        def run(self, lines: list[str]) -> list[str]:
            """
            Removes the metadata lines from the front of the array of lines.
            Args:
                lines (list[str]): The Markdown lines read in.
            Returns:
                list[str]: The Markdown lines after the metadata has been removed.
            """
            if lines[0] == '---':
                lines.pop(0)
                while lines[0] != '---':
@ -70,6 +81,12 @@ class MetaStripper(Extension):
            return lines
    def extendMarkdown(self, md: markdown.Markdown) -> None:  # noqa: N802
        """
        Hook the metadata-stripping preprocessor into a Markdown parser.

        Args:
            md (markdown.Markdown): The parser whose preprocessor registry receives the stripper.
        """
        # Build the preprocessor first so the registration call reads as (item, name, priority).
        stripper = MetaStripper.MetaStripperProc(md)
        md.preprocessors.register(stripper, 'metastripper', PRIO_BASE)
@ -78,14 +95,35 @@ class ObsidianImages(Extension):
    DIMS = re.compile(r'(.*)\|(\d+)(?:x(\d+))?')
    def __init__(self, context: Context, **kwargs: dict[str, Any]) -> None:
        """
        Set up the image extension and remember the dragonglass context.

        Args:
            context (Context): The dragonglass context, containing the configuration; kept on the instance.
            **kwargs (dict): Remaining keyword arguments, handed unchanged to the base class initializer.
        """
        # Base class goes first, exactly as before; it consumes the keyword arguments.
        super().__init__(**kwargs)
        self._context = context
    @property
    def invalid_reference_classname(self) -> str:
        """
        The CSS class name for an invalid reference in the text.

        Returns:
            str: The fixed class name 'invalid-reference'.
        """
        css_class = 'invalid-reference'
        return css_class
    def _parse_dimensions(self, s: str) -> tuple[str, int, int]:
        """
        Parses an image reference looking for image dimensions.
        Args:
            s (str): The image reference to be parsed.
        Returns:
            str: The actual image reference.
            int: The image width in pixels, or -1 if not specified.
            int: The image height in pixels, or -1 if not specified.
        """
        m = self.DIMS.match(s)
        if m:
            width = int(m.group(2))
@ -222,6 +260,8 @@ class ObsidianLinks(Extension):
        def handleMatch(self, m: re.Match[str], data: str) -> tuple[etree.Element, int, int]:  # noqa: N802
            text = m.group(1)
            link = m.group(2)
            if link.startswith('<') and link.endswith('>'):  # handle whitespace encoding
                link = urlquote(link[1:-1].strip(), safe=':/')
            if is_proper_url(link):
                el = etree.Element('a')
                el.set('href', link)
@ -249,11 +289,26 @@ class ObsidianLinks(Extension):
 class ObsidianInlines(Extension):
    """An extension that handles the special Obsidian markdown format sequences."""
    def extendMarkdown(self, md: markdown.Markdown) -> None:  # noqa: N802
        """
        Add the Obsidian-specific inline patterns to a Markdown parser.

        Two SimpleTagInlineProcessor patterns are registered: the ``~~...~~`` pattern with the
        'del' tag under the name 'strikeout', and the ``==...==`` pattern with the 'ins' tag
        under the name 'highlight'.

        Args:
            md (markdown.Markdown): The parser whose inline-pattern registry receives the patterns.
        """
        # (regex, tag, registry name) in registration order; priorities count up from PRIO_BASE.
        inline_specs = (
            (r'()~~(.*?)~~', 'del', 'strikeout'),
            (r'()\=\=(.*?)\=\=', 'ins', 'highlight'),
        )
        for offset, (regex, tag, name) in enumerate(inline_specs):
            md.inlinePatterns.register(SimpleTagInlineProcessor(regex, tag), name, PRIO_BASE + offset)
 def create_markdown_parser(context: Context) -> markdown.Markdown:
    """
    Creates a Markdown parser with all our extensions loaded.
    Args:
        context (Context): The dragonglass context, that contains the configuration.
    Returns:
        markdown.Markdown: The new Markdown parser.
    """
    return markdown.Markdown(extensions=[MetaStripper(),
                                         ObsidianImages(context),
                                         ObsidianLinks(context),