intern sphinx_exec_directive with HS backend

doyougnu · doyougnu · commit f9e6563ac0ea · 2023-01-16T08:08:04.000-05:00
diff --git a/.gitignore b/.gitignore
@@ -2,11 +2,13 @@ book
 _build
 *.el
 
+
 # profiling outputs
 *.eventlog
 *.eventlog.*
 *.hp
 *.prof
+*/__pycache__
 
 # nix stuff
 .direnv/
diff --git a/.gitmodules b/.gitmodules
@@ -0,0 +1,3 @@
+[submodule "extensions/sphinx_exec_directive"]
+	path = extensions/sphinx_exec_directive
+	url = https://github.com/doyougnu/sphinx_exec_directive.git
diff --git a/conf.py b/conf.py
@@ -13,7 +13,8 @@
 import os
 import sys
 import time
-sys.path.insert(0, os.path.abspath('.'))
+
+sys.path.insert(0, os.path.abspath('extensions'))
 
 # -- Project information -----------------------------------------------------
 
@@ -42,7 +43,8 @@
                                          ## underscore
              , 'sphinxcontrib.bibtex'
              , 'sphinx_copybutton'
-             , 'sphinxcontrib.execHS.ext'
+             # , 'sphinxcontrib.execHS.ext'
+             , 'sphinx_exec_directive'
              ]
 
 # flags
diff --git a/extensions/sphinx_exec_directive b/extensions/sphinx_exec_directive
@@ -0,0 +1 @@
+Subproject commit 8a93684a1b41fce2a21825dce2bff5262a059115
diff --git a/extensions/sphinx_exec_directive.py b/extensions/sphinx_exec_directive.py
@@ -0,0 +1,289 @@
+import os
+import io
+import re
+import subprocess
+from hashlib import md5
+from contextlib import redirect_stdout
+from pathlib import Path
+from tempfile import NamedTemporaryFile
+
+from docutils import nodes
+from docutils.parsers.rst import directives, Directive, Parser
+from docutils.utils import new_document
+
+# Namespace shared between successive python exec blocks; it is handed to
+# execute_code() as the globals dictionary and cleared by Exec.run().
+context = {}
+# Path of the source document handled by the most recent Exec.run() call.
+previous_rst = None
+
+
+class cd:
+    """
+    Switch the working directory for the duration of a ``with`` block and
+    switch back on exit. Taken from
+    https://stackoverflow.com/a/13197763/7115316.
+    """
+    def __init__(self, newPath):
+        # A leading "~" is expanded once, at construction time.
+        target = os.path.expanduser(newPath)
+        self.newPath = target
+
+    def __enter__(self):
+        # Remember where we were before moving so __exit__ can go back.
+        here = os.getcwd()
+        self.savedPath = here
+        os.chdir(self.newPath)
+
+    def __exit__(self, etype, value, traceback):
+        # Runs whether or not the body raised; the exception is not suppressed.
+        os.chdir(self.savedPath)
+
+
+def execute_code(runner, globals_dict=None):
+    """
+    Run the code described by ``runner`` and return what it wrote to stdout.
+
+    ``runner`` is a dictionary. The keys read here are:
+
+    * ``'process'``: ``'python'``, ``'haskell'``, ``'matlab'`` or ``'shell'``.
+    * ``'code_in'``: the source text to execute (not used for cabal/stack).
+    * ``'with'`` (haskell only): the tool to launch. An empty value is
+      replaced by ``'runghc'``. Output of ``'ghci'`` is post-processed to
+      strip GHCi-specific text.
+    * ``'project_dir'`` and ``'args'`` (haskell with ``'cabal'``/``'stack'``
+      only): the directory to run the tool in and its argument list.
+
+    ``globals_dict`` is the namespace passed to ``exec`` for python code; a
+    fresh dictionary is used when it is ``None``.
+
+    Anything the external tools write to stderr is printed, not returned.
+
+    Raises ``ValueError`` when the process type is not recognised, or when
+    cabal/stack is requested without a ``'project_dir'``.
+    """
+
+    def log_stderr(err):
+        # Only report stderr when there is something in it.
+        if err is not None and err.strip() != "":
+            print(err)  # should use sphinx logger
+
+    def execute_code_with_pipe(command, code_in, post_process=None):
+        # Feed the code to the command on stdin and collect its stdout.
+        proc = subprocess.Popen(command,
+                                stdin=subprocess.PIPE,
+                                stdout=subprocess.PIPE,
+                                stderr=subprocess.PIPE)
+        out, err = proc.communicate(input=code_in.encode("utf-8"))
+
+        # apply all post processing functions now that we have output
+        out = out.decode('utf-8')
+        for f in post_process or ():
+            out = f(out)
+
+        # The pipes are binary, so decode before testing for emptiness;
+        # comparing bytes against "" would always report a difference.
+        log_stderr(err.decode('utf-8', errors='replace'))
+
+        return out
+
+    process = runner['process']
+
+    if process == 'python':
+        if globals_dict is None:
+            globals_dict = {}
+
+        # NOTE: exec() runs the block with full interpreter privileges; only
+        # build documentation whose sources you trust.
+        output_object = io.StringIO()
+        with redirect_stdout(output_object):
+            exec(runner['code_in'], globals_dict)
+        code_out = output_object.getvalue()
+
+    elif process == 'haskell':
+        post_process = []
+
+        # check that the runner with field is set
+        # and set post-process hooks
+        if not runner.get('with'):
+            runner['with'] = 'runghc' # default is runghc, no hooks
+        tool = runner['with']
+
+        if tool == 'ghci':
+            # if running with ghci then we post process the output to remove
+            # ghci specific text
+            post_process += [lambda s: s.replace("ghci>",""),
+                             lambda s: re.sub("^.*?\n", "", s),
+                             lambda s: s.replace("Leaving GHCi.\n", "").rstrip()
+                            ]
+
+        # do the business
+        if tool in ('cabal', 'stack'):
+            # Build tools operate on a project, not on piped code, so a
+            # project directory is mandatory.
+            if not runner.get('project_dir'):
+                raise ValueError(
+                    f"running with '{tool}' requires the 'project_dir' option.")
+            payload = [tool] + list(runner.get('args') or [])
+            with cd(Path(runner['project_dir'])):
+                comp_proc = subprocess.run(payload, capture_output=True, text=True)
+            log_stderr(comp_proc.stderr)
+            code_out = comp_proc.stdout
+        else:
+            code_out = execute_code_with_pipe(tool, runner['code_in'], post_process)
+
+    elif process == 'matlab':
+        # MATLAB can't pipe, so we need to dump to a tempfile.
+        with NamedTemporaryFile(suffix=".m") as script:
+            script.write(runner['code_in'].encode('utf-8'))
+            script.flush()   # mandatory, or else it will be empty
+            filepath = Path(script.name)
+            # Then execute MATLAB from the directory holding the script.
+            with cd(filepath.parent):
+                comp_proc = subprocess.run(['matlab', '-batch', filepath.stem],
+                                           capture_output=True, text=True)
+        # text=True means stdout/stderr are already str; no decoding needed.
+        log_stderr(comp_proc.stderr)
+        code_out = comp_proc.stdout
+
+    elif process == 'shell':
+        code_out = execute_code_with_pipe(['sh'], runner['code_in'])
+
+    else:
+        raise ValueError(f"process type '{process}' not recognised.")
+
+    return code_out
+
+
+def _option_boolean(arg):
+    """
+    Convert a directive option value to a bool (copied from the matplotlib
+    plot_directive).
+
+    A missing or blank value counts as a bare flag and yields True. Otherwise
+    the value is matched case-insensitively, ignoring surrounding whitespace,
+    against yes/1/true and no/0/false. Anything else raises ValueError.
+    """
+    normalised = arg.strip().lower() if arg else ""
+    if not normalised:
+        # no argument given, assume used as a flag
+        return True
+    if normalised in ('yes', '1', 'true'):
+        return True
+    if normalised in ('no', '0', 'false'):
+        return False
+    raise ValueError('"%s" unknown boolean' % arg)
+
+
+def _option_str(arg):
+    """Option converter: return the option value converted with ``str``."""
+    text = str(arg)
+    return text
+
+def _option_process(arg):
+    """
+    Option converter for ``process``: lower-case the given name, or fall back
+    to ``'python'`` when no value was supplied.
+    """
+    return 'python' if arg is None else arg.lower()
+
+
+class Exec(Directive):
+    """
+    The ``exec`` directive: execute code and emit it, followed by its output,
+    as literal blocks.
+
+    The code comes either from the directive's content or, when an argument
+    is given, from the file at that path (relative to the Sphinx
+    configuration directory).
+
+    Options: ``context`` (keep the python namespace for later blocks),
+    ``cache`` (reuse stored output, on by default), ``process`` (language,
+    default ``python``), ``intertext`` (reST placed between code and output),
+    and ``with``/``project_dir``/``args``, which are forwarded to
+    ``execute_code`` in the runner dictionary.
+    """
+    has_content = True
+    required_arguments = 0
+    optional_arguments = 1
+    option_spec = {
+        'context':   _option_boolean,
+        'cache':     _option_boolean,
+        'process':   _option_process,
+        'intertext': _option_str,
+        'project_dir': _option_str,
+        'with':      _option_str,
+        'args':      _option_str
+    }
+
+    def run(self):
+        """
+        Execute the block (or fetch its cached output) and return the nodes
+        to insert: the code, optional intertext, and the output if non-blank.
+        """
+        global previous_rst
+
+        # Get the source file and if it has changed, then reset the context.
+        current_rst = Path(self.state_machine.document.attributes['source'])
+        if previous_rst is None or previous_rst != current_rst:
+            previous_rst = current_rst
+            context.clear()
+
+        # Parse options
+        save_context = self.options.get('context', False)
+        # Don't cache if the user requests saving context, or if the context is
+        # nonempty. The reason is because the global_dict can't be updated just
+        # by reading in code from a file (as opposed to executing it). There is
+        # no easy fix short of serialising the entire contents of `context`.
+        cache = (not save_context
+                 and len(context) == 0
+                 and self.options.get('cache', True))
+        process = self.options.get('process', 'python')
+        project_dir = self.options.get('project_dir', '')
+        opt_with = self.options.get('with', '')
+        args = self.options.get('args', '').split()
+
+        # A runner is "that which runs the code", i.e., a dictionary that
+        # defines the entire external process. The 'code_in' entry (the code
+        # to run) is filled in below, from the file or the block's content.
+        runner = {'process': process,          # the language
+                  'with':    opt_with,         # to run with what tool/binary
+                  'project_dir': project_dir,  # project directory, if any
+                  'args':    args}             # args to run the tool with
+
+        # Determine whether input is to be read from a file, or directly from
+        # the exec block's contents.
+        from_file = len(self.arguments) > 0
+
+        # Get some important paths.
+        # NOTE ABOUT PATHS:
+        # Any variable ending in _pAD is an absolute path to a directory.
+        #                        _pRD is a  relative path to a directory.
+        #                        _pAF is an absolute path to a file.
+        #                        _pRF is a  relative path to a file.
+        top_level_sphinx_pAD = Path(setup.confdir)
+
+        # Determine where to get source code from.
+        if from_file:
+            # Set the 'source file' to be the specified file. The argument to
+            # the exec block is given as a relative path, so has to be made
+            # absolute with respect to the top-level Sphinx directory.
+            source_pAF = top_level_sphinx_pAD.joinpath(Path(self.arguments[0]))
+            runner['code_in'] = source_pAF.read_text()
+            runner['source_file'] = source_pAF
+        else:
+            # Set the 'source file' to be the rst file which the code is in.
+            # This path is already absolute.
+            source_pAF = current_rst
+            runner['code_in'] = "\n".join(self.content)
+
+        # Look up the output in the cache, or execute the code.
+        if cache:
+            source_pRF = source_pAF.relative_to(top_level_sphinx_pAD)
+
+            # Figure out where to dump the output. Both flavours share the
+            # flattened source path as a prefix.
+            source_identifier = str(source_pRF.with_suffix('')).replace('/', '-')
+            if from_file:
+                identifier = f"{source_identifier}-{process}-file.out"
+                # ^ folder-yymmdd-filename-python-file.out
+            else:
+                # Inline blocks are told apart by a hash of their code.
+                md5_hash = md5(runner['code_in'].encode('utf-8')).hexdigest()
+                identifier = (f"{source_identifier}-{process}-"
+                              f"inline-{md5_hash}.out")
+                # ^ folder-yymmdd-python-inline-<HASH>.out
+            build_pAD = Path(setup.app.doctreedir).parent
+            output_pAF = build_pAD / "exec_directive" / identifier
+
+            # Look for the cached output. It only counts when it is newer
+            # than the source it was produced from.
+            cache_found = (
+                output_pAF.exists()
+                and source_pAF.stat().st_mtime < output_pAF.stat().st_mtime
+            )
+            if cache_found:
+                with open(output_pAF, "r") as out_f:
+                    code_out = out_f.read()
+            else:
+                code_out = execute_code(runner, context)
+                # parents/exist_ok: the build directory may not exist yet, and
+                # another reader process may create the folder concurrently.
+                output_pAF.parent.mkdir(parents=True, exist_ok=True)
+                with open(output_pAF, "w") as out_f:
+                    print(code_out, file=out_f, end="")
+        else:  # caching was disabled, execute it
+            code_out = execute_code(runner, context)
+
+        # Reset the context if it's not meant to be preserved
+        if not save_context:
+            context.clear()
+
+        node_in = nodes.literal_block(runner['code_in'], runner['code_in'])
+        node_out = nodes.literal_block(code_out, code_out)
+        node_in['language'] = process
+        node_out['language'] = 'none'
+
+        # Blank output: show only the code.
+        if code_out.strip() == "":
+            return [node_in]
+
+        intertext = self.options.get('intertext', None)
+        if intertext:
+            # Parse the intertext as reST into a scratch document and splice
+            # its children between the code and the output.
+            internodes = new_document('intertext', self.state.document.settings)
+            Parser().parse(intertext, internodes)
+            return [node_in, *internodes.document.children, node_out]
+        return [node_in, node_out]
+
+
+def setup(app):
+    """
+    Sphinx extension entry point: register the ``exec`` directive.
+
+    The application object and its configuration directory are stashed as
+    attributes on this function so that ``Exec.run`` can read them later.
+    Returns the extension metadata dictionary.
+    """
+    setup.app = app
+    setup.confdir = app.confdir
+    app.add_directive("exec", Exec)
+
+    metadata = {
+        'version': '0.5',
+        'parallel_read_safe': True,
+        'parallel_write_safe': True,
+    }
+    return metadata
diff --git a/hoh.nix b/hoh.nix
@@ -15,17 +15,20 @@ let
    nonPythonInputs = with pkgs; [ sphinx-press-theme # this comes from the overlay
                                   sphinx-copybutton  # this comes from the overlay
                                   pandoc
-                                  sphinx-exec-directive
+                                  # change once extension fixes are upstreamed
+                                  # sphinx-exec-directive
                                   rst2html5
                                   sphinx-autobuild
                                   sphinx-exec-haskell
+                                  ghc
+                                  cabal-install
                                 ];
 in
 pkgs.stdenv.mkDerivation {
    pname   = "hoh";
    version = "0.0.1";
    src     = ./.;
-   buildInputs = pythonInputs ++ nonPythonInputs;
+   propagatedBuildInputs = pythonInputs ++ nonPythonInputs;
 
    preBuild = ''
    unset SOURCE_DATE_EPOCH
diff --git a/src/Optimizations/GHC_opt/lambda_lifting.rst b/src/Optimizations/GHC_opt/lambda_lifting.rst

Original file line number	Diff line number	Diff line change
`@@ -0,0 +1,3 @@`
	`1`	`+[submodule "extensions/sphinx_exec_directive"]`
	`2`	`+ path = extensions/sphinx_exec_directive`
	`3`	`+ url = https://github.com/doyougnu/sphinx_exec_directive.git`