$TITLE$

# ..." wrapper, but HtmlFormatter now
# handles this.)
class I7HtmlFormatter(HtmlFormatter):
    """HtmlFormatter that emits every source line as its own indented block.

    Each line of highlighted code is right-stripped, passed through the
    space-run and non-ASCII substitutions, optionally anchorified (when
    opts.toc is set), stripped of its leading spaces, and wrapped in an
    element whose inline style carries the indentation as a left margin
    with a hanging indent.

    NOTE(review): the copy of this file that was reviewed had lost the HTML
    markup inside its string literals. The '<div style="%s">' wrapper and
    the '<span class="hll">' highlight wrapper below are reconstructed from
    the surrounding comments and from the CSS declarations held in `margin`;
    confirm the exact tags and class name against a pristine copy.
    """

    def wrap(self, source):
        """Replace the inherited wrapping step with _wrap_code()."""
        return self._wrap_code(source)

    def _wrap_code(self, source):
        """Yield (ix, text) pairs, rewriting each pair whose ix is 1.

        Pairs with ix == 1 are counted as source lines (1-based, to match
        self.hl_lines) and rewritten; all other pairs pass through unchanged.
        """
        # yield 0, '...\n'   (opening wrapper tag; no longer emitted here)
        linenum = 0
        for ix, ln in source:
            if ix == 1:
                linenum += 1
                ln = ln.rstrip()
                # Convert tabs to spaces.
                ln = spacerun_pat.sub(spacerun_func, ln)
                # HTML-escape non-ASCII characters.
                ln = nonascii_pat.sub(nonascii_func, ln)
                # Change section-header spans to anchors.
                if opts.toc:
                    ln = anchorify(ln)
                # Trim initial whitespace.
                ln, indent = remove_initial_spaces(ln)
                if not ln:
                    # A completely blank line would collapse, so we add a
                    # space. It has to be a non-breaking space: an ordinary
                    # space inside an otherwise empty block is collapsible
                    # whitespace and would leave the block with no height.
                    ln = '&nbsp;'
                # Add the <div> wrapper. The left margin is two characters
                # wider than the indent and the first line is pulled back by
                # two, so wrapped continuation lines hang under the first.
                margin = 'margin-left: %dch; text-indent: -2ch;' % (indent+2,)
                ln = '<div style="%s">' % (margin,) + ln + '</div>'
                # If this line should be highlighted, wrap the whole thing
                # (<div> and all) in a <span class="hll">...</span>.
                if linenum in self.hl_lines:
                    ln = '<span class="hll">' + ln + '</span>'
                ln = ln + '\n'
            yield ix, ln
        # yield 0, '...\n'   (closing wrapper tag; no longer emitted here)

    # Suppress the default hl_lines highlighter wrapper, since we've already
    # handled that.
    def _highlight_lines(self, tokensource):
        """Return tokensource untouched; _wrap_code() does the highlighting."""
        return tokensource

# Subclass of HtmlFormatter which converts tabs to spaces, escapes non-ASCII
# characters, and adds the "

# ..." wrapper.
# This does *not* do all the clever left-margin/text-indent stuff. The result
# doesn't wrap as nicely, and it looks terrible without CSS. Simpler though.
class I7HtmlFormatterOld(HtmlFormatter):
    """Simpler formatter: per-line cleanup only, no per-line indent blocks."""

    def wrap(self, source):
        """Replace the inherited wrapping step with _wrap_code()."""
        return self._wrap_code(source)

    def _wrap_code(self, source):
        """Yield (ix, text) pairs, cleaning up each pair whose ix is 1.

        Lines are right-stripped, passed through the space-run and non-ASCII
        substitutions, and re-terminated with a newline.
        """
        # NOTE(review): in the reviewed copy the first and last yields had
        # lost the wrapper tag that preceded the newline; only the surviving
        # text is reproduced here. Restore the opening/closing tags from a
        # pristine copy of the script.
        yield 0, '\n'
        for ix, ln in source:
            if ix == 1:
                ln = ln.rstrip()
                ln = spacerun_pat.sub(spacerun_func, ln)
                ln = nonascii_pat.sub(nonascii_func, ln)
                ln = ln + '\n'
            yield ix, ln
        yield 0, '\n'


# Custom lexer for Inform 7.
# Pygments has a built-in I7 lexer, but it insists on syntax-coloring
# any I6 inclusions within the I7 code. I think that looks terrible.
# This one restricts itself to coloring I6 strings and comments, and it
# uses different classes from the I7 ones.
class ZarfI7Lexer(Lexer):
    """Hand-written single-pass lexer for Inform 7 source text."""

    name = 'ZarfI7Lexer'
    aliases = ['inform7', 'i7']
    filenames = ['*.ni', '*.i7x']

    # First words (compared case-insensitively) that mark a heading line.
    i7sectionlist = ['volume', 'book', 'part', 'chapter', 'section']
    i7sectionnames = set(i7sectionlist)
    # Straight and curly double quotes all delimit I7 strings.
    doublequotes = '"\u201C\u201D'

    def get_tokens_unprocessed(self, text):
        """Yield (start_index, token_type, value) triples covering `text`.

        The scanner walks `text` one character at a time. `last` marks the
        start of the run that has not been emitted yet and `pos` is the
        current position; whenever a construct begins, the pending run is
        flushed with the current line style and the construct is consumed
        by its own inner loop.

        Token types produced:
          Token.Generic.Heading    -- heading lines and a first-line title
          Token.Text               -- ordinary I7 text
          Token.Comment.Multiline  -- [bracketed] I7 comments (nestable)
          Token.String.Double      -- I7 string content
          Token.String.Interpol    -- [substitutions] inside I7 strings
          Token.Other              -- I6 code inside (- ... -)
          Token.String.Other       -- I6 double- and single-quoted strings
          Token.Comment.Single     -- I6 "!" comments, to end of line
        """
        linestyle = Token.Text
        pos = 0
        last = 0
        lentext = len(text)
        lastch = ''
        linestart = True
        linecount = 0

        while True:
            if linestart:
                linecount += 1
                # Check to see if this is a special (header) line. If so,
                # flush the output and set the style for the rest of the line.
                if pos > last:
                    yield (last, linestyle, text[last:pos])
                    last = pos
                val = text.find(' ', pos)
                # Technically the game title or section name can be indented,
                # but we don't handle that.
                # We should recognize the "---- DOCUMENTATION ----" heading
                # here, and switch into a mode where all text is comments
                # except indented text. Currently we don't.
                if val >= pos and text[pos:val].lower() in self.i7sectionnames:
                    # Section header line.
                    linestyle = Token.Generic.Heading
                elif linecount == 1 and pos < lentext and text[pos] in self.doublequotes:
                    # Game title line.
                    linestyle = Token.Generic.Heading
                else:
                    # Regular line.
                    linestyle = Token.Text

            if pos >= lentext:
                # End of document.
                if pos > last:
                    yield (last, linestyle, text[last:pos])
                    last = pos
                break

            ch = text[pos]

            if ch == '-' and lastch == '(':
                # Begin an I6 inclusion section. Step back so the "(" belongs
                # to the inclusion, flush whatever came before it, then skip
                # past the "(-" opener.
                pos -= 1
                if pos > last:
                    yield (last, linestyle, text[last:pos])
                last = pos
                pos += 2
                lastch = ''
                while pos < lentext:
                    ch = text[pos]
                    if ch == ')' and lastch == '-':
                        break
                    if ch == '"':
                        # Begin an I6 string
                        if pos > last:
                            yield (last, Token.Other, text[last:pos])
                            last = pos
                        pos += 1
                        while pos < lentext:
                            if text[pos] == '"':
                                break
                            pos += 1
                        pos += 1
                        yield (last, Token.String.Other, text[last:pos])
                        last = pos
                        lastch = ''
                        continue
                    if ch == '\'':
                        # Begin a single-quoted I6 string (dict word)
                        if pos > last:
                            yield (last, Token.Other, text[last:pos])
                            last = pos
                        pos += 1
                        while pos < lentext:
                            if text[pos] == '\'':
                                break
                            pos += 1
                        pos += 1
                        yield (last, Token.String.Other, text[last:pos])
                        last = pos
                        lastch = ''
                        continue
                    if ch == '!':
                        # Begin an I6 comment line
                        if pos > last:
                            yield (last, Token.Other, text[last:pos])
                            last = pos
                        pos += 1
                        while pos < lentext:
                            if text[pos] == '\n':
                                break
                            pos += 1
                        pos += 1
                        yield (last, Token.Comment.Single, text[last:pos])
                        last = pos
                        lastch = ''
                        continue
                    pos += 1
                    lastch = ch
                # Step past the closing ")".
                pos += 1
                # I6 code content
                yield (last, Token.Other, text[last:pos])
                last = pos
                lastch = ''
                continue

            if ch == '[' and linestyle != Token.Generic.Heading:
                # Begin an I7 comment. These can be recursive, so we need to
                # count bracket depth.
                if pos > last:
                    yield (last, linestyle, text[last:pos])
                    last = pos
                pos += 1
                depth = 1
                while pos < lentext:
                    if text[pos] == '[':
                        depth += 1
                    if text[pos] == ']':
                        depth -= 1
                        if depth == 0:
                            break
                    pos += 1
                pos += 1
                yield (last, Token.Comment.Multiline, text[last:pos])
                last = pos
                lastch = ''
                continue

            if ch in self.doublequotes and linestyle != Token.Generic.Heading:
                # Begin an I7 string.
                if pos > last:
                    yield (last, linestyle, text[last:pos])
                    last = pos
                pos += 1
                while pos < lentext:
                    if text[pos] in self.doublequotes:
                        break
                    if text[pos] == '[':
                        # Begin an I7 string interpolation.
                        if pos > last:
                            yield (last, Token.String.Double, text[last:pos])
                            last = pos
                        pos += 1
                        while pos < lentext:
                            if text[pos] == ']':
                                break
                            pos += 1
                        pos += 1
                        yield (last, Token.String.Interpol, text[last:pos])
                        last = pos
                        continue
                    pos += 1
                pos += 1
                # I7 string content
                yield (last, Token.String.Double, text[last:pos])
                last = pos
                lastch = ''
                continue

            # Ordinary character: keep accumulating the pending run.
            pos += 1
            lastch = ch
            linestart = (ch == '\n' or ch == '\r')

        return


if opts.stockmode:
    i7lexer = get_lexer_by_name('inform7')
else:
    i7lexer = ZarfI7Lexer()

# Structure of HTML document, including the stylesheet.
# NOTE(review): only the two placeholders survive in the reviewed copy; the
# surrounding HTML and stylesheet were lost and must be restored from a
# pristine copy of the script.
template = ''' $TITLE$ $BODY$ '''

if len(args) != 1:
    print('usage: i7-to-html.py story.ni [ -t title ] [ -o out.html ]')
    sys.exit()

# Read the whole story file; the context manager closes it even if the read
# raises.
with open(args[0]) as fl:
    code = fl.read()

# The (stock) I7 formatter is slightly buggy about lines that contain only
# whitespace. We'll strip those down to empty lines.
ls = code.split('\n')
ls = [ val.rstrip() for val in ls ]
code = '\n'.join(ls) + '\n'

# Create a list of lines to highlight, if the --highlight option was given.
# Currently this has to be a string like "10" or "30-39".
highlightlist = None
if opts.highlight:
    histart, _, hiend = opts.highlight.partition('-')
    if hiend:
        highlightlist = list(range(int(histart), int(hiend)+1))
    else:
        highlightlist = [ int(histart) ]

# Check which formatter to use.
formatter = I7HtmlFormatter
if opts.oldmode:
    formatter = I7HtmlFormatterOld

# We always use an empty lineseparator option. (The highlight option adds
# extra lineseparators into the output, and we don't want that. We add
# our own line breaks in the _wrap_code() method.)
# The cssclass option gives the class of the

wrapper around the whole # code block. if highlightlist is not None: htmlformat = formatter(lineseparator='', cssclass='i7', hl_lines=highlightlist) else: htmlformat = formatter(lineseparator='', cssclass='i7') dat = highlight(code, i7lexer, htmlformat) result = template titlestr = None if opts.title: val = opts.title val = html.escape(val) titlestr = nonascii_pat.sub(nonascii_func, val) result = result.replace('$TITLE$', titlestr) if opts.toc: toclines = [] toclines.append('

%s' % (2*depth, anchor, val,) toclines.append(ln) toclines.append('

') dat = '\n'.join(toclines) + '\n

\n' + dat if opts.headfile: fl = open(opts.headfile) headdat = fl.read() fl.close() if titlestr is not None: headdat = headdat.replace('$TITLE$', titlestr) dat = headdat + dat if opts.footfile: fl = open(opts.footfile) footdat = fl.read() fl.close() if titlestr is not None: footdat = footdat.replace('$TITLE$', titlestr) dat = footdat + dat result = result.replace('$BODY$', dat) if not opts.outfile: print(result) else: fl = open(opts.outfile, 'w') fl.write(result) fl.close() print('Generated ' + opts.outfile)