") if g.title_prefix: output_with_translations(g, g.title_prefix) output_raw(g, ": ") output_with_translations(g, title) output

#! /usr/bin/env python # MMD by David A. Moon is licensed under a # Creative Commons Attribution-ShareAlike 4.0 International License # http://creativecommons.org/licenses/by-sa/4.0/ # # Please inform me if you find this useful, or any of the ideas embedded in it. # Comments and criticisms to dave underscore moon atsign alum dot mit dot edu. # Incorporates details_shim by Tyler Uebele licensed as follows: # # Copyright (c) 2013 Tyler Uebele # # Permission is hereby granted, free of charge, to any person obtaining a copy # of this software and associated documentation files (the "Software"), to # deal in the Software without restriction, including without limitation the # rights to use, copy, modify, merge, publish, distribute, sublicense, and/or # sell copies of the Software, and to permit persons to whom the Software is # furnished to do so, subject to the following conditions: # # The above copyright notice and this permission notice shall be included in # all copies or substantial portions of the Software. # # THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR # IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY, # FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE # AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER # LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, # OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN # THE SOFTWARE. 
# Convert MMD to HTML

import codecs
import math
import os
import re
import sys
import time

# Inline CSS that MMD() installs as the initial g.code_style
default_code_style = "display:table; border:1px solid black; background-color:whitesmoke; padding-left:5px; padding-right:5px; padding-top:5px; padding-bottom:5px"

# Global state
# g is bound to it in most functions
class MMD_globals:
  pass

# Build the global state object for one conversion run.
#   input_stream      open text stream the MMD source is read from
#   output_directory  directory the generated .html files are written to
# Returns a freshly initialized MMD_globals instance.
def MMD(input_stream, output_directory):
  self = MMD_globals()
  self.input_stream = input_stream
  self.output_stream = False          # False until a page file is opened
  self.output_directory = output_directory
  self.line_number = 0
  self.title_prefix = False
  self.page_number = 0
  self.current_chapter_name = False
  self.page_titles = []               #[[chapter [section subsection...]...]...]
  self.all_references = []            #[[see_arg href]...]
  self.all_anchors = []               #{"chapter#anchor"...}
  self.pre_html = []
  self.post_html = []
  self.this_page_file = False
  self.previous_page_file = False
  self.current_mode = 'normal'
  self.nesting_level = 0
  self.code_style = default_code_style
  return self

dot_handlers = dict()   # maps a string to a list of before, main, after function

# Define the handler(s) with def first, then call this
# Handler arguments are (g, line, directive_name)
def defdot(directive_name, handler, before=None, after=None):
  dot_handlers[directive_name] = [before, handler, after]

# Create the output directory, tolerating only the case where it already
# exists.  Any other failure (permission denied, the path is a regular file,
# a missing parent) is re-raised so it is reported where it happens instead
# of surfacing later as an unrelated error while opening a page file.
def _make_output_directory(path):
  try:
    os.mkdir(path)
  except OSError:
    if not os.path.isdir(path):
      raise

# Main Program
#   argv  [program_name, input_pathname] or
#         [program_name, input_pathname, output_directory]
# Returns 1 after printing a usage message when the argument count is wrong,
# 0 once process_lines has finished.  When no output directory is given,
# "HTML" next to the input file is used.
def main(argv):
  if len(argv) < 2 or len(argv) > 3:
    print("Usage: mmd input_pathname [output_directory]")
    return 1
  input_pathname = argv[1]
  if len(argv) == 3:
    output_directory = argv[2]
  else:
    output_directory = os.path.join(os.path.dirname(input_pathname), "HTML")
  g = MMD(codecs.open(input_pathname, mode='r', encoding='utf-8'), output_directory)
  try:
    # Inside the try so the input stream is closed even if this raises
    _make_output_directory(g.output_directory)
    process_lines(g)
    return 0
  finally:
    g.input_stream.close()
    if g.output_stream:
      g.output_stream.close()

# NOTE(review): extraction damage -- what follows on this line is the head of
# process_lines, whose body continues on the following lines; it is kept
# verbatim here rather than reformatted.
# Process lines until end of input file def process_lines(g): while True: line = next_line(g) if line == False: break line2 = line.lstrip() # Remove leading whitespace if len(line2) == 0: # 
Blank line separates paragraphs if g.output_stream: change_mode(g, 'normal') output_raw(g, "

") elif line2[0] == '.': directive_line(g, line2) elif line2[0] == '*': list_line(g, line2, 'UL') elif line2[0] == '#': list_line(g, line2, 'OL') elif line2[0] == '|': table_line(g, line2) else: change_mode(g, 'normal') output_with_flags_and_translations(g, line) # Input file exhausted end_page(g, False) # Check for broken links for x in g.all_references: see_arg = x[0] href = x[1] if not (href in g.all_anchors): error_output("Broken link: .see " + see_arg + "\n") # Generate index.html file index_path = os.path.join(g.output_directory, "index.html") g.output_stream = open(index_path, "w") output_index(g) index_path # Line Handlers def undefined_handler(g, line, directive_name): error("Unrecognized directive ." + directive_name + " on line " + str(g.line_number)) undefined_handlers = [undefined_handler, undefined_handler, undefined_handler] def directive_line(g, line): change_mode(g, 'normal') space = line.find(" ") directive_end = len(line) if space >= 0: directive_end = space directive_name = line[1 : directive_end] # 1 skips initial period dot_name = directive_name.lower() handler = undefined_handlers if dot_name in dot_handlers: handler = dot_handlers[dot_name] before = handler[0] main_handler = handler[1] after = handler[2] if before: before(g, line, directive_name) if space >= 0: main_handler(g, line[space+1 : len(line)], directive_name) else: end_line = ".end " + directive_name while True: this_line = next_line(g) if this_line == False: break if this_line == end_line: break main_handler(g, this_line, directive_name) if after: after(g, line, directive_name) def list_line(g, line, mode): change_mode(g, mode) # number of leading stars or splats level = 0 while level < len(line) and line[level] == line[0]: level = level + 1 while g.nesting_level > level: output_raw(g, "") g.nesting_level = g.nesting_level - 1 while g.nesting_level < level: type = '1' if g.nesting_level < 3: type = "1ai"[g.nesting_level] if mode == 'UL': output_raw(g, "

", newline=False) output_with_flags_and_translations(g, line[level : len(line)], newline=False) output_raw(g, "

") def leave_UL_mode(g): output_raw(g, "

") def leave_OL_mode(g): output_raw(g, "

" + line + "

") defdot("anchor", anchor) def set_anchor(g, line): g.all_anchors.append(g.current_chapter_name + ".html#" + anchor_name(line)) # Remove all but letters and numbers, change spaces to underscores def anchor_name(title): result = [] for char in title: # This iterates over UTF-8 bytes if ord(char) < 128 and (char.isalpha() or char.isdigit()): result.append(char.lower()) elif char == ' ': result.append('_') return "".join(result) # Remove all but letters and numbers, change spaces to underscores, can't be "index" def chapter_name(title): anchor = anchor_name(title) if anchor == "index": return "index_" else: return anchor # chapter # #anchor # chapter#anchor # Returns [chapter, anchor] where chapter can be false def decode_see(line): sharp = line.find('#') first = line[0 : (sharp if sharp >= 0 else len(line))] second = line[sharp + 1 : len(line)] if sharp >= 0 else False chapter = line if sharp < 0 else first if sharp > 0 else False anchor = second if sharp >= 0 else "" return [chapter, anchor] def make_href(g, line): x = decode_see(line) chapter = x[0] anchor = x[1] file = chapter_name(chapter) if chapter else g.current_chapter_name return file + ".html#" + anchor_name(anchor) # .see chapter#anchor # or .See, output preserves the alphabetic case of the directive def see(g, line, directive): x = decode_see(line) chapter = x[0] anchor = x[1] href = make_href(g, line) text = chapter if anchor == "" else anchor g.all_references.append([line, href]) output_raw(g, directive + "

" + text + "

")

def after_code(g, line, _):
  output_raw(g, "

' % (x, width, y, height, color)) output_raw(g, '' % (x + width/2, y + height/2, font_size), newline=False) output_with_translations(g, text, newline=False) output_raw(g, '') def renderArrow(g, parameters, labels, from_row, from_col, to_row, to_col, text): # Resolve symbolic rows if type(from_row) == str: from_row = labels[from_row] if type(to_row) == str: to_row = labels[to_row] # Convert row,column to x,y col_width = parameters['column width'] row_height = parameters['row height'] title_height = parameters['title size'] * 3 from_x = from_col * col_width + col_width/2 + left_margin to_x = to_col * col_width + col_width/2 + left_margin from_y = title_height + from_row * row_height + row_height/2 to_y = title_height + to_row * row_height + row_height/2 if from_x < to_x: text_x = from_x + 5 from_x = from_x + 2 to_x = to_x - 10 else: text_x = to_x + 15 from_x = from_x - 2 to_x = to_x + 10 # Render font_size = parameters['text size'] if from_row == to_row: # Horizontal arrow output_raw(g, '' % (from_x, from_y, to_x, to_y, parameters['arrow color'])) if text: output_raw(g, '' % (text_x, from_y - 5, font_size), newline=False) output_with_translations(g, text, newline=False) output_raw(g, '') else: # Slanted arrow to_y = to_y - 10 output_raw(g, '' % (from_x, from_y, to_x, to_y, parameters['arrow color'])) if text: if from_x < to_x: angle_radians = math.atan2(to_y - from_y, to_x - from_x) else: angle_radians = math.atan2(from_y - to_y, from_x - to_x) angle_degrees = angle_radians * 360 / (2 * math.pi) if from_x < to_x: text_x = from_x + 40 * math.cos(angle_radians) + 5 * math.sin(angle_radians) text_y = from_y + 40 * math.sin(angle_radians) - 5 * math.cos(angle_radians) else: text_x = to_x + 15 * math.cos(angle_radians) + 5 * math.sin(angle_radians) text_y = to_y + 15 * math.sin(angle_radians) - 5 * math.cos(angle_radians) output_raw(g, '' % (text_x, text_y, font_size, angle_degrees, text_x, text_y), newline=False) output_with_translations(g, text, newline=False) 
# NOTE(review): extraction damage -- the fragment below is the tail of the
# sequence-diagram renderer, which starts on an earlier line; kept verbatim,
# not reformatted.
# output_raw(g, '') # Use those subroutines to do the rendering # Initial boilerplate col_width = parameters['column width'] row_height = parameters['row height'] title_height = parameters['title size'] * 3 output_raw(g, '') # Clean up g.sequence_lines = [] defdot("sequence", sequence, before=before_sequence, after=after_sequence)

# Subroutines

# Begin or end a table or list
# Does nothing when new_mode is already the current mode.  Otherwise the old
# mode's leave function runs, g.current_mode is updated, g.nesting_level is
# reset to 1, and the new mode's enter function runs.  Modes other than
# 'TABLE', 'UL' and 'OL' have no enter/leave function.
def change_mode(g, new_mode):
  if new_mode == g.current_mode:
    return
  if g.current_mode == 'TABLE':
    leave_table_mode(g)
  elif g.current_mode == 'UL':
    leave_UL_mode(g)
  elif g.current_mode == 'OL':
    leave_OL_mode(g)
  g.current_mode = new_mode
  g.nesting_level = 1
  if new_mode == 'TABLE':
    enter_table_mode(g)
  elif new_mode == 'UL':
    enter_UL_mode(g)
  elif new_mode == 'OL':
    enter_OL_mode(g)

# Read line, strip trailing spaces, convert tabs, false at EOF
# Increments g.line_number for every line read.  A blank line is returned
# as "" (not False), so callers must compare against False explicitly.
def next_line(g):
  line = g.input_stream.readline()
  if len(line) == 0:
    return False
  # "\r" is stripped as well so files with CRLF line endings do not leave a
  # carriage return at the end of every line
  line = line.rstrip(" \t\r\n")
  g.line_number = g.line_number + 1
  while True:
    column = line.find("\t")
    if column < 0:
      return line
    # Pad to the next multiple of 8 columns.  The pad string in the damaged
    # source was a single space, which cannot reach a tab stop.
    line = line[0 : column] + " " * (8 - column % 8) + line[column + 1 : ]

# Start a non-index page
# Opens <output_directory>/<chapter_name(title)>.html for writing, remembers
# the previous page file, and writes the page header followed by g.pre_html.
# NOTE(review): the empty strings passed to output_raw below look like HTML
# markup that was lost when this source was extracted -- restore them from
# the original file before relying on the page header.
def start_page(g, title):
  g.page_number = g.page_number + 1
  g.previous_page_file = g.this_page_file
  g.this_page_file = chapter_name(title)
  page_path = os.path.join(g.output_directory, g.this_page_file + ".html")
  g.output_stream = open(page_path, "w")
  output_raw(g, "")
  output_raw(g, "")
  output_raw(g, "")
  if g.title_prefix:
    output_with_translations(g, g.title_prefix)
    output_raw(g, ": ")
  output_with_translations(g, title)
  output_raw(g, "")
  for html in g.pre_html:
    output_raw(g, html)

# NOTE(review): extraction damage -- the fragment below is the head of
# end_page, whose string literals were lost; kept verbatim, not reformatted.
# End a non-index page def end_page(g, next_chapter_name): if g.output_stream: change_mode(g, 'normal') # Navigation first = g.page_number == 1 prev_page = "index.html" if first else g.previous_page_file + ".html" next_page = next_chapter_name + ".html" if next_chapter_name else None output_raw(g, "

") output_raw(g, "", newline=False) output_raw(g, "Previous page", newline=False) output_raw(g, "", newline=False) output_raw(g, " Table of Contents ", newline=False) if next_chapter_name: output_raw(g, "", newline=False) output_raw(g, "Next page", newline=False) output_raw(g, "", newline=False) output_raw(g, "

") # Bottom of page material for html in g.post_html: output_raw(g, html) output_raw(g, "") g.output_stream.close() g.output_stream = False # Generate the table of contents def output_index(g): prefix = g.title_prefix + ": " if g.title_prefix else "" output_raw(g, "") output_raw(g, "" + prefix + "Table of Contents") # Special code to make

work in old browsers that don't support it # Thank you Tyler Uebele !! details_shim_min_js = "/* Copyright (c) 2006-2013 Tyler Uebele * Released under the MIT license. * latest at https://github.com/tyleruebele/details-shim * minified by Google Closure Compiler */\nfunction details_shim(a){if(!(a&&\"nodeType\"in a&&\"tagName\"in a))return details_shim.init();var b;if(\"details\"==a.tagName.toLowerCase())b=a.getElementsByTagName(\"summary\")[0];else if(a.parentNode&&\"summary\"==a.tagName.toLowerCase())b=a,a=b.parentNode;else return!1;if(\"boolean\"==typeof a.open)return a.getAttribute(\"data-open\")||(a.className=a.className.replace(/\\bdetails_shim_open\\b|\\bdetails_shim_closed\\b/g,\" \")),!1;var c=a.outerHTML||(new XMLSerializer).serializeToString(a),c=c.substring(0,c.indexOf(\">\")),\nc=-1!=c.indexOf(\"open\")&&-1==c.indexOf('open=\"\"')?\"open\":\"closed\";a.setAttribute(\"data-open\",c);a.className+=\" details_shim_\"+c;b.addEventListener?b.addEventListener(\"click\",function(){details_shim.toggle(a)}):b.attachEvent&&b.attachEvent(\"onclick\",function(){details_shim.toggle(a)});Object.defineProperty(a,\"open\",{get:function(){return\"open\"==this.getAttribute(\"data-open\")},set:function(a){details_shim.toggle(this,a)}});for(b=0;bsummary:before{display:inline-block;content:\"\\25bc\";padding:0;margin-right:.35em}\n" output_raw(g, "") output_raw(g, "") js = open(os.path.join(g.output_directory, "details-shim.min.js"), "w") js.write(details_shim_min_js) js.close() css = open(os.path.join(g.output_directory, "details-shim.min.css"), "w") css.write(details_shim_min_css) css.close() output_raw(g, "") for html in g.pre_html: output_raw(g, html) now = time.localtime() output_raw(g, "Last updated " + str(now.tm_mon) + "/" + str(now.tm_mday) + "/" + str(now.tm_year) + ".
") output_raw(g, "

") page_no = 1 for x in g.page_titles: title = x[0] sections = x[1] if len(sections) == 0: output_raw(g, "

", newline=False) else: output_raw(g, "

") page_name = chapter_name(title) output_raw(g, str(page_no) + ". " + title + "
", newline=False) if len(sections) == 0: output_raw(g, "

") else: output_raw(g, "") section_no = 1 for x in sections: title = x[0] subsections = x[1] anchor = anchor_name(title) output_raw(g, "

" + str(page_no) + "." + str(section_no) + " " + title + "

") subsection_no = 1 for title in subsections: anchor = anchor_name(title) output_raw(g, "

" + str(page_no) + "." + str(section_no) + "." + str(subsection_no) + " " + title + "

") subsection_no = subsection_no + 1 section_no = section_no + 1 if len(sections) > 0: output_raw(g, "

") page_no = page_no + 1 output_raw(g, "
") for html in g.post_html: output_raw(g, html) output_raw(g, "") # Output HTML directly def output_raw(g, line, newline = True): for char in line: if ord(char) < 32 or ord(char) > 126: error("Invalid character code " + str(ord(char)) + " on line " + str(g.line_number)) g.output_stream.write(line) if newline: g.output_stream.write('\n') # Output with character translations def output_with_translations(g, line, start=None, end=None, newline=True): for char in line[(start if start else 0) : (end if end else len(line))]: if ord(char) < 32: error("Invalid character code " + str(ord(char)) + " on line " + str(g.line_number)) elif char == '<': output_raw(g, "<", newline=False) elif char == '>': output_raw(g, ">", newline=False) elif char == '&': output_raw(g, "&", newline=False) elif ord(char) > 126: output_raw(g, "&#x", newline=False) for i in xrange(0, 4): shift = 12 - 4 * i higit = 15 & (ord(char) >> shift) g.output_stream.write(chr(higit + (ord('0') if higit < 10 else ord('A') - 10))) g.output_stream.write(';') else: g.output_stream.write(char) if newline: g.output_stream.write('\n') # Output with style flags and character translations # Depends on ` and \ being encoded in one UTF-8 byte def output_with_flags_and_translations(g, line, start=0, end=None, newline=True): if not end: end = len(line) pos = start while pos < end: next = line.find('\\', pos, end) next2 = line.find('`', pos, end) if next < 0 or (next2 >= 0 and next2 < next): next = next2 if next < 0: return output_with_translations(g, line, start=pos, end=end, newline=newline) else: if next > pos: output_with_translations(g, line, start=pos, end=next, newline=False) pos = next nextnext = line.find(line[pos], pos + 2, end) if pos + 2 <= end else -1 # +2 to allow ``` if nextnext < 0: error("Mismatched " + line[pos] + " in " + line + " on line " + str(g.line_number)) if line[pos] == '`': output_raw(g, "", newline=False) output_with_translations(g, line, start=pos + 1, end=nextnext, newline=False) output_raw(g, 
"", newline=False) pos = nextnext + 1 elif line[pos + 1] == '\\': if not (nextnext < end and line[nextnext + 1] == '\\'): error("Mismatched \\\\ in " + line + " on line " + str(g.line_number)) output_raw(g, "", newline=False) output_with_flags_and_translations(g, line, start=pos + 2, end=nextnext, newline=False) output_raw(g, "", newline=False) pos = nextnext + 2 else: output_raw(g, "", newline=False) output_with_flags_and_translations(g, line, start=pos + 1, end=nextnext, newline=False) output_raw(g, "", newline=False) pos = nextnext + 1 if newline: g.output_stream.write('\n') # Error reporting def error(message): sys.stderr.write("ERROR: " + message + "\n") sys.exit(1) def error_output(message): sys.stderr.write("ERROR: " + message + "\n") # Invoke the main program main(sys.argv)