cabinet/generate.py

211 lines
6.3 KiB
Python
Executable File

#!/bin/python3.9
import os
import re
import shutil
import subprocess
from html.parser import HTMLParser
from pygments import highlight
from pygments.lexers import get_lexer_by_name
from pygments.formatters import HtmlFormatter
import sys
if len(sys.argv) > 1 and 'clean' not in sys.argv:
print('usage: %s [clean]' % sys.argv[0])
exit(1)
class CodeHighlighter(HTMLParser):
data = ''
reading_code = False
code = ''
lang = ''
def output(self):
data = self.data
self.data = ''
return data
def handle_starttag(self, tag, attrs):
if tag == 'pre':
self.reading_code = True
if tag == 'code':
for attr in attrs:
if attr[0] == 'class':
self.lang = attr[1].split(' ')[1]
if not self.reading_code:
self.attrs = attrs
self.data += '<' + tag
for attr in attrs:
self.data += ' %s="%s"' % (attr[0], attr[1])
self.data += '>'
def handle_data(self, data):
if self.reading_code:
self.code += data
else:
self.data += data
def handle_endtag(self, tag):
if not self.reading_code:
self.data += '</%s>' % tag
if tag == 'pre':
self.reading_code = False
self.data += highlight(self.code,
get_lexer_by_name(self.lang),
HtmlFormatter(linenos=True))
self.code = ''
self.lang = ''
highlighter = CodeHighlighter()
input_ = 'input'
outroot = 'out'
output = 'Files'
templates = 'templates'
if 'clean' in sys.argv:
shutil.rmtree(outroot, ignore_errors=True)
try:
os.mkdir(outroot)
shutil.copy(templates + '/stylesheet.css', outroot + '/stylesheet.css')
shutil.copy(templates + '/highlight.css', outroot + '/highlight.css')
shutil.copy(templates + '/cabinet.png', outroot + '/cabinet.png')
shutil.copy(templates + '/jquery.js', outroot + '/jquery.js')
shutil.copytree(templates + '/mathjax', outroot + '/mathjax')
shutil.copytree(templates + '/bootstrap', outroot + '/bootstrap')
except:
pass
with open(templates + '/file.html', 'r') as template:
file_template = template.read()
with open(templates + '/index.html', 'r') as template:
index_template = template.read()
def render_template(template, **kwargs):
for var, val in kwargs.items():
template = template.replace('${%s}' % var, val)
return template
class File:
def __init__(self, root, outdir, name):
self.outdir = outdir
self.basename = name[:-4]
self.pdf = self.basename + '.pdf'
self.html = self.basename + '.html'
self.path = self.outdir.removeprefix(outroot + '/') + '/' + self.html
self.pretty_path = self.path.replace('_', ' ').removesuffix('.html')
self.input_path = root + '/' + name
self.root_reference = re.sub(r'.+?/', '../', outdir)
self.root_reference = re.sub(r'/[^\.]+$', '/', self.root_reference)
path = '%s/%s' % (root, name)
with open(path, 'r') as f:
content = f.read()
m = re.findall(r'\\selectlanguage\{(.*?)\}', content)
if not m:
m = re.findall(r'\\usepackage\[(.*?)\]\{babel\}', content)
if not m:
m = re.findall(r'\\documentclass\[(.*?)\]\{.*\}', content)
lang = m[0] if len(m) > 0 else 'english'
m = re.findall(r'\\documentclass\{(.*?)\}', content)
doc_class = m[0] if len(m) > 0 else 'article'
options = [
'pandoc',
'--mathjax=templates/mathjax/es5/tex-mml-chtml.js',
'-f', 'latex',
'-t', 'html',
path
]
if doc_class == 'bookreport':
options.append('-s')
options.append('--template')
options.append('templates/default.html')
self.content = subprocess.check_output(options).decode()
if doc_class == 'bookreport':
if lang == 'portuguese':
self.content = re.sub(r'!\*\*title\*\*!', 'Título', self.content)
self.content = re.sub(r'!\*\*author\*\*!', 'Autor', self.content)
self.content = re.sub(r'!\*\*date\*\*!', 'Data da Ficha', self.content)
else:
self.content = re.sub(r'!\*\*title\*\*!', 'Title', self.content)
self.content = re.sub(r'!\*\*author\*\*!', 'Author', self.content)
self.content = re.sub(r'!\*\*date\*\*!', 'Report Date', self.content)
def expand_html(self):
title = self.basename.replace('_', ' ')
expanded = render_template(file_template,
title=title,
path=self.pretty_path,
root=self.root_reference,
pdf=self.pdf,
content=self.content)
highlighter.feed(expanded)
return highlighter.output()
def write_html(self):
html_content = self.expand_html()
with open(self.outdir + '/' + self.html, 'w') as f:
f.write(html_content)
def write_pdf(self):
subprocess.run(['latexmk', '-shell-escape', '-pdf', '-outdir=%s' % self.outdir, self.input_path])
subprocess.run(['latexmk', '-c', '-outdir=%s' % self.outdir, self.input_path])
def write(self):
html = self.outdir + '/' + self.html
pdf = self.outdir + '/' + self.pdf
input_time = os.path.getmtime(self.input_path)
if not os.path.isfile(html) or input_time > os.path.getmtime(html):
self.write_html()
if not os.path.isfile(pdf) or input_time > os.path.getmtime(pdf):
self.write_pdf()
toc = '<ul>'
for root, dirs, files in os.walk(input_, topdown=True):
outdir = outroot + '/' + output + root[len(input_):]
os.makedirs(outdir, exist_ok=True)
outfiles = []
if len(files) or len(dirs):
for file in files:
if file.endswith('.tex'):
f = File(root, outdir, file)
f.write()
toc += '<li><a href="%s">%s</a></li>' % (f.path, f.pretty_path)
toc += '</ul>'
with open(outroot + '/index.html', 'w') as f:
f.write(render_template(index_template,
toc=toc))