src/cm/converters/pandoc_converters.py
changeset 393 8806f683d0be
parent 358 3e58bf6b3f3e
child 418 8e3c6d8c39f8
--- a/src/cm/converters/pandoc_converters.py	Wed Nov 23 21:25:19 2011 +0100
+++ b/src/cm/converters/pandoc_converters.py	Sun Nov 27 00:31:12 2011 +0100
@@ -209,6 +209,8 @@
     if from_format==to_format=='html':
       # get body content
       stdoutdata = (content.encode('utf8'))
+      #stdoutdata = re.sub(r".*<body[^>]*>", '', stdoutdata)
+      #stdoutdata = re.sub(r"</body>.*", '', stdoutdata)
       # if, for some reason, tidy has not guessed the doctype, keep xml.dom.minidom happy by replacing the HTML entity &nbsp; with its UTF-8 bytes (\xc2\xa0) before parsing
       stdoutdata = re.sub(r"&nbsp;", '\xc2\xa0', stdoutdata)
       dom = parseString(stdoutdata)