feat: Add inclusion syntax for extracted content

Also updated the documentation, using the extraction syntax. Resolves #2.
2021-01-08 11:36:03 -08:00 · 2021-01-08 11:36:03 -08:00 · ea8e65ae64
parent cf4d538fd0
commit ea8e65ae64
2 changed files with 129 additions and 12 deletions
--- a/mkdocs_semiliterate/plugin.py
+++ b/mkdocs_semiliterate/plugin.py
@ -8,15 +8,88 @@ you will have immediate access to all of the following extensions. (Note that th
 documentation assumes a familiarity with the
 [usage](https://athackst.github.io/mkdocs-simple-plugin/mkdocs_simple_plugin/plugin/)
 of the `simple` plugin.)
+"""
+
+from mkdocs import utils
+from mkdocs.config import config_options
+from mkdocs_simple_plugin.plugin import SimplePlugin, StreamExtract, LazyFile
+
+import re
+import yaml
+
+
+class StreamInclusion(StreamExtract):
+    """ md  An extension of the StreamExtract class which adds

 ### Inclusion syntax

-To be documented when implemented.
-"""
+While extracting content from a file (because it matches one of the
+`semiliterate` patterns, rather than just one of the `include_extensions`),
+an unescaped expression of the form
+
+`{! FILENAME YAML !}`
+
+(which may span multiple lines) will trigger file inclusion. The FILENAME may
+be a bare word, in which case it cannot contain whitespace, or it may be
+enclosed in single or double quotes. Note that FILENAME is interpreted relative
+to the directory in which the file containing the `{! .. !}` expression
+resides. The YAML is interpreted exactly as the extraction options to a
+`semiliterate` item as
+[documented](https://athackst.github.io/mkdocs-simple-plugin/mkdocs_simple_plugin/plugin/index.html#plugin_usage)
+for the `simple` extension. The text extracted from FILENAME
+is interpolated at the current location in the file currently being written.
+Recursive inclusion is supported.
+
+Note that the `{! ... !}` directive must be in lines that semiliterate would
+normally copy. That is, it does not examine lines before the `start` regexp
+is encountered, or after the `terminate` regexp, or between instances of
+`stop` and `start`. It also doesn't check any text written from lines that
+match these special expressions. Moreover, on such normally-transcribed lines,
+it's the text **after** the application of any semiliterate replacements that
+is checked for `{! ... !}`.
+     """
+
+    include_open = re.compile(r'''(?<![`\\])(\{\!\s*)([\s'"])''')
+    include_quoted_file = re.compile(
+        r'''(['"])(?P<fn>.*?)\1\s+(?P<yml>[\s\S]*?)\s\!\}''')
+    include_bare_file = re.compile(r'\s(?P<fn>.*?)\s+(?P<yml>[\s\S]*?)\s\!\}')
+
+    def extract_line(self, line):
+        """Copy line to the output stream, applying all specified replacements
+           and handling inclusion syntax.
+        """
+        line = self.replace_line(line)
+        include_match = StreamInclusion.include_open.search(line)
+        if not include_match:
+            self.transcribe(line)
+            return
+        # OK, we have found (the start of) an inclusion and must process it
+        preamble = line[:include_match.start()]
+        remainder = line[include_match.end(1):]
+        body_pattern = StreamInclusion.include_quoted_file
+        if include_match[2].isspace():
+            body_pattern = StreamInclusion.include_bare_file
+        body_match = body_pattern.search(remainder)
+        if not body_match:
+            for extra_line in self.input_stream:
+                remainder += self.replace_line(extra_line)
+                body_match = body_pattern.search(remainder)
+                if body_match:
+                    break
+        if not body_match:
+            raise EOFError("semiliterate: End of file while scanning for `!}`")
+        include_path = self.include_root + '/' + body_match['fn']
+        new_root = re.match(r'(.*)/', include_path)[1]
+        include_parameters = yaml.safe_load(body_match['yml'])
+        with open(include_path) as include_file:
+            self.transcribe(preamble)
+            inclusion = StreamInclusion(
+                include_file, self.output_stream, include_root=new_root,
+                **include_parameters)
+            if inclusion.productive():
+                self.wrote_something = True
+        self.transcribe(remainder[body_match.end():])

-import mkdocs
-from mkdocs.config import config_options
-from mkdocs_simple_plugin.plugin import SimplePlugin

 class SemiliteratePlugin(SimplePlugin):
    """ md   An extension of the mkdocs-simple-plugin
@ -26,12 +99,13 @@ class SemiliteratePlugin(SimplePlugin):
 behavior as compared to `simple`. They are described in this section, with their
 default values in parentheses at the beginning of each entry.

-copy_standard_markdown
-:   (false) Whether to add MkDocs' list of standard Markdown extensions to the
-    `include_extensions` parameter so that Markdown files will be directly copied
-    to the docsite. Note that the `simple` behavior corresponds to a _true_ value
-    for `copy_standard_markdown`, but `semiliterate` still incorporates all
-    standard Markdown files because of the `extract_standard_markdown` default.
+{! plugin.py ---
+  start: '[*]SimplePlugin.config_scheme'
+  terminate: '^\s*\)'
+  replace:
+  - ['\(.(.*)., config_options.Type\(.*, default=(.*)\)\)', '\1\n:  (\2)']
+  - '^\s*#(.*\s*)$'
+!}

 extract_standard_markdown
 :   (true) To be implemented and documented
@ -40,9 +114,52 @@ extract_standard_markdown
    config_scheme = (
        *SimplePlugin.config_scheme,
        ('copy_standard_markdown', config_options.Type(bool, default=False))
+        # Whether to add MkDocs' list of standard Markdown extensions to the
+        #    `include_extensions` parameter so that Markdown files will be
+        #    directly copied to the docsite. Note that the `simple` behavior
+        #    corresponds to a _true_ value for `copy_standard_markdown`, but
+        #    `semiliterate` still incorporates all standard Markdown files
+        #    because of the `extract_standard_markdown` default.
    )

    def copy_doc_files(self, destination_directory):
        if not self.config['copy_standard_markdown']:
            self.include_extensions = self.config['include_extensions']
        return super().copy_doc_files(destination_directory)
+
+    ## FIXME: This method is copied from simple, just to insert a control
+    ## over what class is used to do the extraction. Try to get this inserted as
+    ## the method of the same name in simple.
+    def extract_from(self, from_directory, name, destination_directory):
+        """Extract content from the file in _from_directory_ named _name_
+           to a file or files in _destination_directory_, as specified by
+           the semiliterate parameters.
+        """
+        new_paths = []
+        original = "{}/{}".format(from_directory, name)
+        for item in self.semiliterate:
+            name_match = item['pattern'].search(name)
+            if name_match:
+                new_name = (name[:name_match.start(name_match.lastindex)]
+                            + '.md'
+                            + name[name_match.end(name_match.lastindex):])
+                if 'destination' in item:
+                    new_name = name_match.expand(item['destination'])
+                new_file = LazyFile(destination_directory, new_name)
+                with open(original) as original_file:
+                    utils.log.debug(
+                        "mkdocs-simple-plugin: Scanning {} ...".format(original))
+                    productive = self.try_extraction(
+                        original_file, from_directory, new_file, **item)
+                    new_file.close()
+                    if productive:
+                        new_path = "{}/{}".format(destination_directory,
+                                                  new_name)
+                        utils.log.debug(
+                            "        ... extracted {}".format(new_path))
+                        new_paths.append((original, new_path))
+        return new_paths
+
+    def try_extraction(self, original_file, root, new_file, **kwargs):
+        return StreamInclusion(
+            original_file, new_file, include_root=root, **kwargs).productive()
--- a/setup.cfg
+++ b/setup.cfg
@ -1,6 +1,6 @@
 [metadata]
 name = mkdocs-semiliterate
-version = 0.0.3
+version = 0.0.4

 [options]
 packages = mkdocs_semiliterate