#!/usr/bin/env python
"""Print the divN headings of a ThML document as '#'-prefixed lines.

The script parses the XML file named on the command line, looks up the
``ThML.body`` child of the root element and walks it, printing one heading
line for every ``div<digit>`` element that carries a ``title`` attribute.

Origin: commit a56329ccd6c7476281ced948ea143d04647bca88 by Zach DeCook,
Wed, 2 Dec 2020, "Parse div1 div2 div3 as headings" (new file thml2gmi.py).
"""
import sys
import xml.etree.ElementTree as ET

# ASCII digits only: int() is applied to the tag suffix, so the check must
# not admit characters that str.isdigit() accepts but int() rejects.
_DIGITS = '0123456789'


def main(argv):
    """Parse the ThML file named by ``argv[1]`` and print its headings.

    ``argv`` is the full argument vector, program name first.

    Returns a process exit status: 0 on success, 2 when no input file was
    given, 1 when the document has no ``ThML.body`` element.  Errors raised
    by ``ET.parse`` (unreadable file, malformed XML) are not caught here.
    """
    if len(argv) < 2:
        prog = argv[0] if argv else 'thml2gmi.py'
        sys.stderr.write('usage: {} FILE.xml\n'.format(prog))
        return 2

    root = ET.parse(argv[1]).getroot()
    body = root.find('ThML.body')
    if body is None:
        # find() yields None for a missing child; iterating it would raise.
        sys.stderr.write('{}: no ThML.body element found\n'.format(argv[1]))
        return 1

    for thing in body:
        parseSomething(thing)
    return 0


def parseSomething(thing):
    """Dispatch one element; only ``div<digit>`` elements are handled.

    Any other element is ignored, and its children are not visited.
    """
    tag = thing.tag
    # Exactly 'div' plus one ASCII digit, so parseDiv can safely int() it.
    if len(tag) == 4 and tag[:3] == 'div' and tag[3] in _DIGITS:
        parseDiv(thing)


def parseDiv(div):
    """Print a heading for ``div`` and then process its child elements.

    The heading is ``'#'`` repeated N times (N being the digit in the tag
    name), a space, and the ``title`` attribute.  A div without a ``title``
    prints nothing itself, but its children are still processed so nested
    headings are not lost.
    """
    # NOTE(review): N is used as-is, so div0 yields no '#' at all and
    # div4+ yield more than three -- confirm that suits the output format.
    indentLevel = int(div.tag[3:])
    title = div.get('title')
    if title is not None:
        print('#' * indentLevel + ' ' + title)
    for child in div:
        parseSomething(child)


if __name__ == '__main__':
    sys.exit(main(sys.argv))