Browse Source

Basic Keras documentation generator (#90)

Lutz Roeder 8 years ago
parent
commit
6b58777bfa
2 changed files with 544 additions and 20 deletions
  1. 330 18
      src/keras-operator.json
  2. 214 2
      tools/keras-operator-json.py

File diff suppressed because it is too large
+ 330 - 18
src/keras-operator.json


+ 214 - 2
tools/keras-operator-json.py

@@ -1,7 +1,219 @@
 #!/usr/bin/env python
 #!/usr/bin/env python
 
 
-import json
+from __future__ import unicode_literals
+from __future__ import print_function
+
 import io
 import io
+import json
+import pydoc
+import re
 import sys
 import sys
 
 
-print('TODO')
def count_leading_spaces(s):
    """Return the index of the first non-whitespace character in *s*.

    Returns 0 when *s* is empty or contains only whitespace.
    """
    # Raw string: '\S' in a plain literal is an invalid escape and warns
    # (eventually errors) on modern Python 3.
    match = re.search(r'\S', s)
    return match.start() if match else 0
+
def process_docstring(docstring):
    """Convert a Keras-style docstring to markdown-ish text.

    Extracts fenced ``` code blocks and normalizes their indentation,
    rewrites '# Title' section markers to '__Title__', turns indented
    'name: text' lines into '- __name__: text' list items, strips all
    leading spaces, then reinjects the code blocks unchanged.
    """
    # First, extract code blocks and process them.
    code_blocks = []
    if '```' in docstring:
        tmp = docstring[:]
        while '```' in tmp:
            tmp = tmp[tmp.find('```'):]
            # End index just past the closing fence: 3 chars skipped for the
            # opening fence plus 3 for the closing fence itself.
            index = tmp[3:].find('```') + 6
            snippet = tmp[:index]
            # Place marker in docstring for later reinjection.
            docstring = docstring.replace(
                snippet, '$CODE_BLOCK_%d' % len(code_blocks))
            snippet_lines = snippet.split('\n')
            # Remove leading spaces.
            # NOTE(review): uses the closing fence's indent as the base —
            # assumes the snippet's last line is the closing ``` fence.
            num_leading_spaces = snippet_lines[-1].find('`')
            snippet_lines = ([snippet_lines[0]] +
                             [line[num_leading_spaces:]
                             for line in snippet_lines[1:]])
            # Most code snippets have 3 or 4 more leading spaces
            # on inner lines, but not all. Remove them.
            inner_lines = snippet_lines[1:-1]
            leading_spaces = None
            for line in inner_lines:
                if not line or line[0] == '\n':
                    continue
                # Track the minimum indent across non-empty inner lines.
                spaces = count_leading_spaces(line)
                if leading_spaces is None:
                    leading_spaces = spaces
                if spaces < leading_spaces:
                    leading_spaces = spaces
            if leading_spaces:
                snippet_lines = ([snippet_lines[0]] +
                                 [line[leading_spaces:]
                                  for line in snippet_lines[1:-1]] +
                                 [snippet_lines[-1]])
            snippet = '\n'.join(snippet_lines)
            code_blocks.append(snippet)
            tmp = tmp[index:]

    # Format docstring section titles.
    docstring = re.sub(r'\n(\s+)# (.*)\n',
                       r'\n\1__\2__\n\n',
                       docstring)
    # Format docstring lists.
    docstring = re.sub(r'    ([^\s\\\(]+):(.*)\n',
                       r'    - __\1__:\2\n',
                       docstring)

    # Strip all leading spaces.
    lines = docstring.split('\n')
    docstring = '\n'.join([line.lstrip(' ') for line in lines])

    # Reinject code blocks.
    for i, code_block in enumerate(code_blocks):
        docstring = docstring.replace(
            '$CODE_BLOCK_%d' % i, code_block)
    return docstring
+
def split_docstring(docstring):
    """Split a processed docstring into sections keyed by header name.

    The leading description is stored under the '' key. '__Masking__'
    and '__Note ...__' pseudo-headers are folded back into the
    description as bold '**...**' lines rather than kept as sections.
    """
    headers = {}
    current_header = ''
    current_lines = []
    lines = docstring.split('\n')
    for line in lines:
        if line.startswith('__') and line.endswith('__'):
            headers[current_header] = current_lines
            current_lines = []
            current_header = line[2:-2]
            if current_header == 'Masking' or current_header.startswith('Note '):
                headline = '**' + current_header + '**'
                # setdefault avoids a KeyError when such a header appears
                # before any description text has been stored.
                current_lines = headers.setdefault('', [])
                current_header = ''
                current_lines.append(headline)
        else:
            current_lines.append(line)
    if len(current_lines) > 0:
        headers[current_header] = current_lines
    return headers
+
def update_argument(schema, name, lines):
    """Create or refresh the attribute entry called *name*.

    Joins *lines* into the attribute's description, appending a new
    entry to schema['attributes'] when none with that name exists.
    """
    attributes = schema.setdefault('attributes', [])
    attribute = next(
        (item for item in attributes if item.get('name') == name), None)
    if attribute is None:
        attribute = {'name': name}
        attributes.append(attribute)
    attribute['description'] = '\n'.join(lines)
+
def update_arguments(schema, lines):
    """Parse '- __name__: text' list lines into schema attributes.

    Lines between two argument items are appended to the preceding
    argument's description; each finished argument is flushed through
    update_argument().
    """
    argument_name = None
    argument_lines = []
    for line in lines:
        if line.startswith('- __'):
            line = line.lstrip('- ')
            # find() instead of index(): a malformed item with no colon is
            # treated as continuation text rather than raising ValueError.
            colon = line.find(':')
            if colon > 0:
                name = line[0:colon]
                line = line[colon+1:].lstrip(' ')
                if name.startswith('__') and name.endswith('__'):
                    # Flush the previous argument before starting a new one.
                    if argument_name:
                        update_argument(schema, argument_name, argument_lines)
                    argument_name = name[2:-2]
                    argument_lines = []
        if argument_name:
            argument_lines.append(line)
    if argument_name:
        update_argument(schema, argument_name, argument_lines)
    return
+
def update_examples(schema, lines):
    """Rebuild schema['examples'] from summary text and fenced code.

    Any existing examples are discarded. Text before an opening ```
    fence becomes the example's summary; lines between fences become
    its code.
    """
    schema.pop('examples', None)
    summary_lines = []
    code_lines = None
    for line in lines:
        if not line.startswith('```'):
            if code_lines is not None:
                code_lines.append(line)
            elif line:
                summary_lines.append(line)
            continue
        if code_lines is None:
            # Opening fence: start collecting code lines.
            code_lines = []
        else:
            # Closing fence: emit one example entry.
            example = {'code': '\n'.join(code_lines)}
            if summary_lines:
                example['summary'] = '\n'.join(summary_lines)
            schema.setdefault('examples', []).append(example)
            summary_lines = []
            code_lines = None
+
def update_references(schema, lines):
    """Replace schema['references'] with entries parsed from *lines*.

    Existing references are discarded; blank lines are skipped and
    leading '- ' list markers are stripped from each description.
    """
    schema.pop('references', None)
    for line in lines:
        if not line:
            continue
        entry = {'description': line.lstrip('- ')}
        schema.setdefault('references', []).append(entry)
+        
# Load the operator metadata that will be enriched with Keras docstrings.
json_file = '../src/keras-operator.json'
json_data = open(json_file).read()
json_root = json.loads(json_data)

for entry in json_root:
    name = entry['name']
    schema = entry['schema']
    if 'package' in schema:
        # Resolve the class (e.g. 'keras.layers' + '.' + name) at runtime;
        # presumably requires Keras to be importable here — verify.
        class_name = schema['package'] + '.' + name
        class_definition = pydoc.locate(class_name)
        if not class_definition:
            raise Exception('\'' + class_name + '\' not found.')
        docstring = class_definition.__doc__
        if not docstring:
            raise Exception('\'' + class_name + '\' missing __doc__.')
        docstring = process_docstring(docstring)
        headers = split_docstring(docstring)
        # Map each recognized docstring section onto the schema; each
        # handled section is removed from 'headers'.
        if '' in headers:
            schema['description'] = '\n'.join(headers[''])
            del headers['']
        if 'Arguments' in headers:
            update_arguments(schema, headers['Arguments'])
            del headers['Arguments']
        if 'Input shape' in headers:
            # TODO
            del headers['Input shape']
        if 'Output shape' in headers:
            # TODO
            del headers['Output shape']
        if 'Examples' in headers:
            update_examples(schema, headers['Examples'])
            del headers['Examples']
        if 'Example' in headers:
            update_examples(schema, headers['Example'])
            del headers['Example']
        if 'References' in headers:
            update_references(schema, headers['References'])
            del headers['References']
        if 'Raises' in headers:
            del headers['Raises']
        # Fail loudly on any section this script does not yet understand.
        if len(headers) > 0:
            raise Exception('\'' + class_name + '.__doc__\' contains unprocessed headers.')

# Write the updated JSON back with trailing whitespace stripped and
# '\n' line endings forced (newline='').
with io.open(json_file, 'w', newline='') as fout:
    json_data = json.dumps(json_root, sort_keys=True, indent=2)
    for line in json_data.splitlines():
        line = line.rstrip()
        if sys.version_info[0] < 3:
            # Python 2: io.open's text mode requires unicode, not str.
            line = unicode(line)
        fout.write(line)
        fout.write('\n')
+

Some files were not shown because too many files changed in this diff