Skip to content

Commit

Permalink
Merge pull request #202 from NeuroML/feat/issue-201
Browse files Browse the repository at this point in the history
feat: update lems scripts to include version and commit information
  • Loading branch information
sanjayankur31 authored Jun 18, 2024
2 parents 88aca25 + 301f066 commit 36300c2
Show file tree
Hide file tree
Showing 12 changed files with 1,845 additions and 74 deletions.
27 changes: 26 additions & 1 deletion scripts/lems/asttemplates.py
Original file line number Diff line number Diff line change
Expand Up @@ -25,7 +25,8 @@
---
{%- endif %}
Generated on {{ todays_date }}.
Schema against which LEMS based on these should be valid: [LEMS_v{{ lems_version }}.xsd](https://github.com/LEMS/LEMS/tree/{{ lems_branch }}/Schemas/LEMS/LEMS_v{{ lems_version }}.xsd).
Generated on {{ lems_date }} from [this](https://github.com/LEMS/LEMS/commit/{{ lems_commit }}) commit.
Please file any issues or questions at the [issue tracker here](https://github.com/LEMS/LEMS/issues).
---
Expand Down Expand Up @@ -78,3 +79,27 @@
"""

))

# Jinja2 template: renders an element's XSD schema snippet as a
# sphinx-design "Schema" tab holding an XML code block.
# Context variables: `schemadoc` (pretty-printed schema XML string).
schema_quote = env.from_string(textwrap.dedent(
"""
````{tab-item} Schema
```{code-block} xml
{{ schemadoc }}
```
````
"""
))

# Jinja2 template: renders a tab of XML usage examples for an element.
# Context variables: `title` (tab label prefix) and `lemsexamples`
# (list of XML snippet strings); emits nothing when the list is empty.
examples = env.from_string(textwrap.dedent(
"""
{% if lemsexamples|length > 0 %}
````{tab-item} {{ title }}: XML
{% for e in lemsexamples -%}
```{code-block} xml
{{ e|trim }}
```
{% endfor -%}
````
{%- endif -%}
"""
))
3 changes: 3 additions & 0 deletions scripts/lems/requirements.txt
Original file line number Diff line number Diff line change
@@ -0,0 +1,3 @@
lxml
xmltodict
jinja2
318 changes: 254 additions & 64 deletions scripts/lems/xml2md.py
Original file line number Diff line number Diff line change
Expand Up @@ -7,12 +7,23 @@
Copyright 2023 NeuroML contributors
"""

import os
import logging
import tempfile
import subprocess
import re
import lxml
import lxml.etree as ET
import xmltodict
from datetime import date
import asttemplates
from collections import OrderedDict


logger = logging.getLogger(__name__)
logging.basicConfig(level=logging.WARNING)


# pages to which different sections should belong
# key is the name in the annotated source, list entries are [heading,
# description]
Expand All @@ -28,83 +39,262 @@
"components": ["Defining Components", ""]
}

# NOTE(review): appears to be pre-merge residue superseded by lems_date
# below — verify before removing.
todays_date = date.today().strftime("%d/%m/%y")
# Branch of the LEMS repository to clone and to link to in generated pages.
lems_branch = "master"
# LEMS schema version; used to locate the LEMS_v<version>.xsd file.
lems_version = "0.7.6"
# Upstream repository cloned when no local source directory is supplied.
GitHubRepo = "https://github.com/LEMS/LEMS.git"
# Generation date stamped into the rendered pages (dd/mm/yy).
lems_date = date.today().strftime("%d/%m/%y")
# Placeholder for the LEMS commit hash; main() computes the real value
# from the checkout with `git log`.
lems_commit = ""

# Parsed ElementType entries keyed by section name; populated in main().
parsed_data = {}

# Annotated LEMS source file that is parsed for element documentation.
srcfile = "sourceannotations.xml"
# Default output directory for the generated markdown pages.
destdir = "../../source/Userdocs/LEMS_elements/"

# Schema snippets keyed by lower-cased type name; filled by get_schema_doc().
lems_element_schema = {}
# XML usage snippets keyed by element name; filled by get_lems_examples().
lems_element_examples = {}

def get_lems_examples(srcdirs, examples_max=5):
    """Collect XML usage examples for LEMS component types.

    Scans the ``.nml``/``.xml`` files under each directory in `srcdirs` and
    stores up to `examples_max` pretty-printed snippets per element in the
    module-level ``lems_element_examples`` dict.

    :param srcdirs: directories where example files are
    :type srcdirs: list(str)
    :param examples_max: maximum number of examples to store per element
    :type examples_max: int
    :returns: None
    """
    # initialise an (empty) example list for every known element so that
    # lookups below never KeyError
    for pg, pginfo in sections_pages.items():
        for et in parsed_data[pg]:
            lems_element_examples[et['@name']] = []

    for srcdir in srcdirs:
        example_files = os.listdir(srcdir)
        for f in sorted(example_files):
            if ".nml" in f or ".xml" in f:
                srcfile = srcdir + "/" + f
                print("Processing example file: {}".format(srcfile))

                # Replace xmlns bits, we can't do it using lxml
                # So we need to read the file, do some regular expression
                # substitutions, and then start the XML bits
                # (with-block fixes the previously leaked file handle)
                with open(srcfile, 'r') as fh:
                    data = fh.read()
                data = re.sub('xmlns=".*"', '', data)
                data = re.sub('xmlns:xsi=".*"', '', data)
                data = re.sub('xsi:schemaLocation=".*"', '', data)
                # Remove comment lines
                data = re.sub('<!--.*-->', '', data)
                # Strip empty lines
                data = os.linesep.join([s for s in data.splitlines() if s])

                try:
                    root = ET.fromstring(bytes(data, 'utf-8'))
                except ET.XMLSyntaxError as e:
                    print(f"Could not parse file {srcfile}: {e}")
                    continue
                namespaces = root.nsmap

                for lems_element in lems_element_examples.keys():
                    # To find recursively, we have to use the XPath system:
                    # https://stackoverflow.com/a/2723968/375067
                    # Gotta use namespaces:
                    # https://stackoverflow.com/a/28700661/375067
                    examples = root.findall(".//" + lems_element, namespaces=namespaces)
                    # Sort by length so that we take the longest examples.
                    # Also sort so that the order remains the same when using
                    # different Python versions etc.
                    examples.sort(key=len, reverse=True)
                    # Only keep the first `examples_max` examples
                    for example in examples:
                        if len(lems_element_examples[lems_element]) < examples_max:
                            lems_element_examples[lems_element].append(
                                # NOTE(review): with_comments="False" is a
                                # truthy string, not False; lxml only accepts
                                # with_comments=False for C14N output, and
                                # comments were already stripped above.
                                ET.tostring(example, pretty_print=True,
                                            encoding="unicode", with_comments="False"
                                            )
                            )


def get_schema_doc(schemafile):
    """Extract per-type schema snippets from the LEMS XSD file.

    Populates the module-level ``lems_element_schema`` dict, mapping a
    lower-cased type name to a pretty-printed XML string of its
    ``xs:simpleType`` / ``xs:complexType`` definition (annotation and
    documentation children are stripped from complex types).

    :param schemafile: path to the XSD schema file
    :type schemafile: str
    :returns: None
    """
    print(ET.__file__)
    parser = lxml.etree.XMLParser(remove_comments=True,
                                  remove_blank_text=True, ns_clean=True)
    try:
        tree = ET.parse(schemafile, parser=parser)
        root = tree.getroot()
    except ET.XMLSyntaxError as e:
        print(f"Could not parse file {schemafile}: {e}")
        # Bail out: without a parsed root there is nothing to extract.
        # (Previously execution fell through and hit a NameError on `root`.)
        return
    namespaces = root.nsmap

    # currently unused
    for simple_type in root.findall("xs:simpleType", namespaces=namespaces):
        simple_type_str = ET.tostring(simple_type, pretty_print=True,
                                      encoding="unicode",
                                      xml_declaration=False)

        # needs to be lowerCamelCase to match XML core types
        type_name = simple_type.attrib['name'].lower().replace("nml2quantity_", "")
        lems_element_schema[type_name] = re.sub(r"Type.*name=", r"Type name=", simple_type_str)

    for complex_type in root.findall("xs:complexType", namespaces=namespaces):
        # drop documentation nodes so only the structural schema remains
        for node in complex_type:
            if "annotation" in str(node.tag) or "documentation" in str(node.tag):
                complex_type.remove(node)

        complex_type_str = ET.tostring(complex_type, pretty_print=True,
                                       encoding="unicode",
                                       xml_declaration=False)
        # needs to be lowerCamelCase to match XML core types
        type_name = complex_type.attrib['name'].lower()
        lems_element_schema[type_name] = re.sub(r"Type.*name=", r"Type name=", complex_type_str)


def main(srcdir, destdir):
    """Generate markdown documentation pages for LEMS elements.

    Clones the LEMS repository when no source directory is given, extracts
    schema snippets and usage examples, then renders one markdown page per
    section of ``sections_pages`` into `destdir`.

    :param srcdir: path to a local LEMS checkout, or None/"" to clone one
    :type srcdir: str or None
    :param destdir: directory to write the generated markdown files into
    :type destdir: str
    :returns: None
    """
    # If not defined or empty, download a new copy to a temporary directory.
    # (Fixed: previously compared the unrelated module global `src` instead
    # of the `srcdir` parameter.)
    if not srcdir or srcdir == "":
        print("No src directory specified. Cloning NeuroML2 repo")
        tempdir = tempfile.TemporaryDirectory()
        tmpsrcdir = tempdir.name
        print("Temporary directory: {}".format(tmpsrcdir))
        clone_command = ["git", "clone", "--depth", "1", "--branch", lems_branch, GitHubRepo, tmpsrcdir]
        subprocess.run(clone_command)
    else:
        tmpsrcdir = srcdir

    # TODO: add LEMS examples
    # exampledirs = [tmpsrcdir + "/examples/", tmpsrcdir + "/LEMSexamples/"]
    exampledirs = [tmpsrcdir + "/examples/"]
    xsdsrc = tmpsrcdir + f"/Schemas/LEMS/LEMS_v{lems_version}.xsd"

    # Get current commit of the checkout; shadows the module-level default
    # and is passed to the page header template below.
    commit_command = ["git", "log", "-1", "--pretty=format:%H"]
    output = subprocess.run(commit_command, capture_output=True,
                            cwd=tmpsrcdir, text=True)
    lems_commit = output.stdout

    # populate our page info
    with open(srcfile, 'r') as ast_doc:
        elementtypes = xmltodict.parse(ast_doc.read())['ElementTypes']['ElementType']
        for et in elementtypes:
            try:
                parsed_data[et['@section']].append(et)
            except KeyError:
                # first element seen for this section
                parsed_data[et['@section']] = []
                parsed_data[et['@section']].append(et)

    # add Include, which is not part of the annotated sources
    parsed_data['root'].append(
        OrderedDict(
            {
                '@name': 'Include',
                'Info': 'Include LEMS files in other LEMS files. Files are included where the Include declaration occurs. The enclosing Lems block is stripped off and the rest of the content included as is',
                'Property': OrderedDict(
                    {
                        '@name': 'file',
                        '@type': 'String',
                        '#text': 'the name or relative path of a file to be included'
                    }
                )
            }
        )
    )

    logger.debug(parsed_data)

    # start
    get_schema_doc(xsdsrc)

    # examples
    get_lems_examples(exampledirs)

    logger.debug("EXAMPLES")
    logger.debug(lems_element_examples)

    # render templates
    for pg, pginfo in sections_pages.items():
        outputfile = "{}/{}.md".format(destdir, pginfo[0].replace(" ", ""))
        with open(outputfile, 'w') as ast_doc:
            print(
                asttemplates.page_header.render(section_data=pginfo,
                                                lems_date=lems_date,
                                                lems_commit=lems_commit,
                                                lems_version=lems_version,
                                                lems_branch=lems_branch),
                file=ast_doc)
            for et in parsed_data[pg]:
                print(f"Rendering {et['@name']}")
                print(
                    asttemplates.elementtype.render(et=et),
                    file=ast_doc)

                # if the component has schema documentation, add that,
                # otherwise skip
                lems_element_schemadoc = None
                try:
                    lems_element_schemadoc = lems_element_schema[et['@name'].lower()]
                    logger.debug(f"Schema doc for {et['@name']}")
                    logger.debug(lems_element_schemadoc)
                except KeyError:
                    logger.warning(f"No schema doc found for {et['@name']}")

                # open a tab-set only when there is something to show in it
                if 'Property' in et or 'ListProperty' in et or lems_element_schemadoc is not None or len(lems_element_examples[et['@name']]) > 0:
                    print("""`````{tab-set}""", end="", file=ast_doc)

                try:
                    if isinstance(et['Property'], list):
                        props = et['Property']
                    else:
                        props = [et['Property']]
                    print(f" - {len(props)} properties: {props}")
                    print(
                        asttemplates.prop.render(props=props),
                        file=ast_doc)
                except KeyError:
                    # element has no properties
                    pass

                try:
                    if isinstance(et['ListProperty'], list):
                        lprops = et['ListProperty']
                    else:
                        lprops = [et['ListProperty']]
                    print(f" - {len(lprops)} properties: {lprops}")
                    print(
                        asttemplates.listprop.render(lprops=lprops),
                        file=ast_doc)
                except KeyError:
                    # element has no list properties
                    pass

                if lems_element_schemadoc is not None:
                    print(asttemplates.schema_quote.render(schemadoc=lems_element_schemadoc), file=ast_doc)

                if len(lems_element_examples[et['@name']]) > 0:
                    print(asttemplates.examples.render(
                        title="Usage", lemsexamples=lems_element_examples[et['@name']]),
                        file=ast_doc)

                # process them, close tab-set
                if 'Property' in et or 'ListProperty' in et or lems_element_schemadoc is not None or len(lems_element_examples[et['@name']]) > 0:
                    print("""`````""", end="", file=ast_doc)

if __name__ == "__main__":
    # Local LEMS checkout to use; None makes main() clone a fresh copy
    # into a temporary directory.
    # src = "/home/asinha/Documents/02_Code/00_mine/NeuroML/software/NeuroML2/"
    src = None
    # Output directory for the generated markdown pages.
    destdir = "../../source/Userdocs/LEMS_elements/"
    main(src, destdir)
Loading

0 comments on commit 36300c2

Please sign in to comment.