diff --git a/ebook_converter/ebooks/__init__.py b/ebook_converter/ebooks/__init__.py index 66c1756..b4dfce0 100644 --- a/ebook_converter/ebooks/__init__.py +++ b/ebook_converter/ebooks/__init__.py @@ -1,12 +1,14 @@ -__license__ = 'GPL v3' -__copyright__ = '2008, Kovid Goyal ' - -''' +""" Code for the conversion of ebook formats and the reading of metadata from various formats. -''' +""" +import numbers +import os +import re +import sys + +from lxml import etree -import os, re, numbers, sys from ebook_converter import prints from ebook_converter.ebooks.chardet import xml_to_unicode @@ -30,12 +32,15 @@ class ParserError(ValueError): pass -BOOK_EXTENSIONS = ['lrf', 'rar', 'zip', 'rtf', 'lit', 'txt', 'txtz', 'text', 'htm', 'xhtm', - 'html', 'htmlz', 'xhtml', 'pdf', 'pdb', 'updb', 'pdr', 'prc', 'mobi', 'azw', 'doc', - 'epub', 'fb2', 'fbz', 'djv', 'djvu', 'lrx', 'cbr', 'cbz', 'cbc', 'oebzip', - 'rb', 'imp', 'odt', 'chm', 'tpz', 'azw1', 'pml', 'pmlz', 'mbp', 'tan', 'snb', - 'xps', 'oxps', 'azw4', 'book', 'zbf', 'pobi', 'docx', 'docm', 'md', - 'textile', 'markdown', 'ibook', 'ibooks', 'iba', 'azw3', 'ps', 'kepub', 'kfx', 'kpf'] +BOOK_EXTENSIONS = ['lrf', 'rar', 'zip', 'rtf', 'lit', 'txt', 'txtz', 'text', + 'htm', 'xhtm', 'html', 'htmlz', 'xhtml', 'pdf', 'pdb', + 'updb', 'pdr', 'prc', 'mobi', 'azw', 'doc', 'epub', 'fb2', + 'fbz', 'djv', 'djvu', 'lrx', 'cbr', 'cbz', 'cbc', 'oebzip', + 'rb', 'imp', 'odt', 'chm', 'tpz', 'azw1', 'pml', 'pmlz', + 'mbp', 'tan', 'snb', 'xps', 'oxps', 'azw4', 'book', 'zbf', + 'pobi', 'docx', 'docm', 'md', 'textile', 'markdown', + 'ibook', 'ibooks', 'iba', 'azw3', 'ps', 'kepub', 'kfx', + 'kpf'] def return_raster_image(path): @@ -49,8 +54,7 @@ def return_raster_image(path): def extract_cover_from_embedded_svg(html, base, log): from ebook_converter.ebooks.oeb.base import XPath, SVG, XLINK - from ebook_converter.utils.xml_parse import safe_xml_fromstring - root = safe_xml_fromstring(html) + root = etree.fromstring(html) svg = XPath('//svg:svg')(root) 
if len(svg) == 1 and len(svg[0]) == 1 and svg[0][0].tag == SVG('image'): @@ -65,10 +69,10 @@ def extract_calibre_cover(raw, base, log): from ebook_converter.ebooks.BeautifulSoup import BeautifulSoup soup = BeautifulSoup(raw) matches = soup.find(name=['h1', 'h2', 'h3', 'h4', 'h5', 'h6', 'p', 'span', - 'font', 'br']) + 'font', 'br']) images = soup.findAll('img', src=True) - if matches is None and len(images) == 1 and \ - images[0].get('alt', '').lower()=='cover': + if (matches is None and len(images) == 1 and + images[0].get('alt', '').lower() == 'cover'): img = images[0] img = os.path.join(base, *img['src'].split('/')) q = return_raster_image(img) @@ -97,13 +101,14 @@ def render_html_svg_workaround(path_to_html, log, width=590, height=750): data = None if SVG_NS in raw: try: - data = extract_cover_from_embedded_svg(raw, - os.path.dirname(path_to_html), log) + data = extract_cover_from_embedded_svg( + raw, os.path.dirname(path_to_html), log) except Exception: pass if data is None: try: - data = extract_calibre_cover(raw, os.path.dirname(path_to_html), log) + data = extract_calibre_cover(raw, os.path.dirname(path_to_html), + log) except Exception: pass @@ -118,7 +123,8 @@ def render_html_data(path_to_html, width, height): result = {} def report_error(text=''): - prints('Failed to render', path_to_html, 'with errors:', file=sys.stderr) + prints('Failed to render', path_to_html, 'with errors:', + file=sys.stderr) if text: prints(text, file=sys.stderr) if result and result['stdout_stderr']: @@ -127,7 +133,8 @@ def render_html_data(path_to_html, width, height): with TemporaryDirectory('-render-html') as tdir: try: - result = fork_job('ebook_converter.ebooks.render_html', 'main', args=(path_to_html, tdir, 'jpeg')) + result = fork_job('ebook_converter.ebooks.render_html', 'main', + args=(path_to_html, tdir, 'jpeg')) except WorkerError as e: report_error(e.orig_tb) else: @@ -156,17 +163,20 @@ def normalize(x): def calibre_cover(title, author_string, series_string=None, - 
output_format='jpg', title_size=46, author_size=36, logo_path=None): + output_format='jpg', title_size=46, author_size=36, + logo_path=None): title = normalize(title) author_string = normalize(author_string) series_string = normalize(series_string) from ebook_converter.ebooks.covers import calibre_cover2 from ebook_converter.utils.img import image_to_data - ans = calibre_cover2(title, author_string or '', series_string or '', logo_path=logo_path, as_qimage=True) + ans = calibre_cover2(title, author_string or '', series_string or '', + logo_path=logo_path, as_qimage=True) return image_to_data(ans, fmt=output_format) -UNIT_RE = re.compile(r'^(-*[0-9]*[.]?[0-9]*)\s*(%|em|ex|en|px|mm|cm|in|pt|pc|rem|q)$') +UNIT_RE = re.compile(r'^(-*[0-9]*[.]?[0-9]*)\s*(%|em|ex|en|px|mm|cm|in|pt|pc' + r'|rem|q)$') def unit_convert(value, base, font, dpi, body_font_size=12): @@ -175,7 +185,7 @@ def unit_convert(value, base, font, dpi, body_font_size=12): return value try: return float(value) * 72.0 / dpi - except: + except Exception: pass result = value m = UNIT_RE.match(value) @@ -227,7 +237,8 @@ def generate_masthead(title, output_path=None, width=600, height=60): recs = load_defaults('mobi_output') masthead_font_family = recs.get('masthead_font', None) from ebook_converter.ebooks.covers import generate_masthead - return generate_masthead(title, output_path=output_path, width=width, height=height, font_family=masthead_font_family) + return generate_masthead(title, output_path=output_path, width=width, + height=height, font_family=masthead_font_family) def escape_xpath_attr(value): diff --git a/ebook_converter/ebooks/conversion/plugins/comic_input.py b/ebook_converter/ebooks/conversion/plugins/comic_input.py index c95e02d..5a81305 100644 --- a/ebook_converter/ebooks/conversion/plugins/comic_input.py +++ b/ebook_converter/ebooks/conversion/plugins/comic_input.py @@ -3,6 +3,7 @@ Based on ideas from comiclrf created by FangornUK. 
""" import shutil, textwrap, codecs, os +from ebook_converter import constants as const from ebook_converter.customize.conversion import InputFormatPlugin, OptionRecommendation from ebook_converter import CurrentDir from ebook_converter.ptempfile import PersistentTemporaryDirectory @@ -245,7 +246,6 @@ class ComicInput(InputFormatPlugin): return os.path.abspath('metadata.opf') def create_wrappers(self, pages): - from ebook_converter.ebooks.oeb.base import XHTML_NS wrappers = [] WRAPPER = textwrap.dedent('''\ @@ -267,7 +267,8 @@ class ComicInput(InputFormatPlugin): ''') dir = os.path.dirname(pages[0]) for i, page in enumerate(pages): - wrapper = WRAPPER%(XHTML_NS, i+1, os.path.basename(page), i+1) + wrapper = WRAPPER%(const.XHTML_NS, i+1, os.path.basename(page), + i+1) page = os.path.join(dir, 'page_%d.xhtml'%(i+1)) with open(page, 'wb') as f: f.write(wrapper.encode('utf-8')) @@ -275,8 +276,6 @@ class ComicInput(InputFormatPlugin): return wrappers def create_viewer_wrapper(self, pages): - from ebook_converter.ebooks.oeb.base import XHTML_NS - def page(src): return ''.format(os.path.basename(src)) @@ -303,7 +302,7 @@ class ComicInput(InputFormatPlugin): %s - ''' % (XHTML_NS, pages) + ''' % (const.XHTML_NS, pages) path = os.path.join(base, 'wrapper.xhtml') with open(path, 'wb') as f: f.write(wrapper.encode('utf-8')) diff --git a/ebook_converter/ebooks/conversion/plugins/docx_output.py b/ebook_converter/ebooks/conversion/plugins/docx_output.py index f1ea4eb..cf9e51f 100644 --- a/ebook_converter/ebooks/conversion/plugins/docx_output.py +++ b/ebook_converter/ebooks/conversion/plugins/docx_output.py @@ -1,14 +1,22 @@ -from ebook_converter.customize.conversion import OutputFormatPlugin, OptionRecommendation +import io +from lxml import etree + +from ebook_converter import constants as const +from ebook_converter.customize import conversion +from ebook_converter.ebooks.docx.dump import do_dump +from ebook_converter.ebooks.docx.writer.container import DOCX +from 
ebook_converter.ebooks.docx.writer.from_html import Convert +from ebook_converter.ebooks.metadata import opf2 as opf_meta +from ebook_converter.ebooks.oeb import base -__license__ = 'GPL v3' -__copyright__ = '2013, Kovid Goyal ' PAGE_SIZES = ['a0', 'a1', 'a2', 'a3', 'a4', 'a5', 'a6', 'b0', 'b1', 'b2', 'b3', 'b4', 'b5', 'b6', 'legal', 'letter'] +_OPT = conversion.OptionRecommendation -class DOCXOutput(OutputFormatPlugin): +class DOCXOutput(conversion.OutputFormatPlugin): name = 'DOCX Output' author = 'Kovid Goyal' @@ -16,75 +24,63 @@ class DOCXOutput(OutputFormatPlugin): commit_name = 'docx_output' ui_data = {'page_sizes': PAGE_SIZES} - options = { - OptionRecommendation(name='docx_page_size', recommended_value='letter', - level=OptionRecommendation.LOW, choices=PAGE_SIZES, - help='The size of the page. Default is letter. Choices ' - 'are %s' % PAGE_SIZES), - - OptionRecommendation(name='docx_custom_page_size', recommended_value=None, - help='Custom size of the document. Use the form widthxheight ' - 'EG. `123x321` to specify the width and height (in pts). ' - 'This overrides any specified page-size.'), - - OptionRecommendation(name='docx_no_cover', recommended_value=False, - help='Do not insert the book cover as an image at the start of the document.' - ' If you use this option, the book cover will be discarded.'), - - OptionRecommendation(name='preserve_cover_aspect_ratio', recommended_value=False, - help='Preserve the aspect ratio of the cover image instead of stretching' - ' it out to cover the entire page.'), - - OptionRecommendation(name='docx_no_toc', recommended_value=False, - help='Do not insert the table of contents as a page at the start of the document.'), - - OptionRecommendation(name='extract_to', - help='Extract the contents of the generated %s file to the ' - 'specified directory. The contents of the directory are first ' - 'deleted, so be careful.' 
% 'DOCX'), - - OptionRecommendation(name='docx_page_margin_left', recommended_value=72.0, - level=OptionRecommendation.LOW, - help='The size of the left page margin, in pts. Default is 72pt.' - ' Overrides the common left page margin setting.' - ), - - OptionRecommendation(name='docx_page_margin_top', recommended_value=72.0, - level=OptionRecommendation.LOW, - help='The size of the top page margin, in pts. Default is 72pt.' - ' Overrides the common top page margin setting, unless set to zero.' - ), - - OptionRecommendation(name='docx_page_margin_right', recommended_value=72.0, - level=OptionRecommendation.LOW, - help='The size of the right page margin, in pts. Default is 72pt.' - ' Overrides the common right page margin setting, unless set to zero.' - ), - - OptionRecommendation(name='docx_page_margin_bottom', recommended_value=72.0, - level=OptionRecommendation.LOW, - help='The size of the bottom page margin, in pts. Default is 72pt.' - ' Overrides the common bottom page margin setting, unless set to zero.' - ), - - } + options = {_OPT(name='docx_page_size', recommended_value='letter', + level=_OPT.LOW, choices=PAGE_SIZES, + help='The size of the page. Default is letter. Choices ' + 'are %s' % PAGE_SIZES), + _OPT(name='docx_custom_page_size', recommended_value=None, + help='Custom size of the document. Use the form ' + 'widthxheight EG. `123x321` to specify the width and ' + 'height (in pts). This overrides any specified ' + 'page-size.'), + _OPT(name='docx_no_cover', recommended_value=False, + help='Do not insert the book cover as an image at the ' + 'start of the document. 
If you use this option, the book ' + 'cover will be discarded.'), + _OPT(name='preserve_cover_aspect_ratio', + recommended_value=False, help='Preserve the aspect ratio ' + 'of the cover image instead of stretching it out to cover ' + 'the entire page.'), + _OPT(name='docx_no_toc', recommended_value=False, + help='Do not insert the table of contents as a page at ' + 'the start of the document.'), + _OPT(name='extract_to', help='Extract the contents of the ' + 'generated DOCX file to the specified directory. The ' + 'contents of the directory are first deleted, so be ' + 'careful.'), + _OPT(name='docx_page_margin_left', recommended_value=72.0, + level=_OPT.LOW, help='The size of the left page margin, ' + 'in pts. Default is 72pt. Overrides the common left page ' + 'margin setting.'), + _OPT(name='docx_page_margin_top', recommended_value=72.0, + level=_OPT.LOW, help='The size of the top page margin, ' + 'in pts. Default is 72pt. Overrides the common top page ' + 'margin setting, unless set to zero.'), + _OPT(name='docx_page_margin_right', recommended_value=72.0, + level=_OPT.LOW, help='The size of the right page margin, ' + 'in pts. Default is 72pt. Overrides the common right page ' + 'margin setting, unless set to zero.'), + _OPT(name='docx_page_margin_bottom', recommended_value=72.0, + level=_OPT.LOW, help='The size of the bottom page margin, ' + 'in pts. Default is 72pt. 
Overrides the common bottom ' + 'page margin setting, unless set to zero.')} def convert_metadata(self, oeb): - from lxml import etree - from ebook_converter.ebooks.oeb.base import OPF, OPF2_NS - from ebook_converter.ebooks.metadata.opf2 import OPF as ReadOPF - from io import BytesIO - package = etree.Element(OPF('package'), attrib={'version': '2.0'}, nsmap={None: OPF2_NS}) + + package = etree.Element(base.tag('opf', 'package'), + attrib={'version': '2.0'}, + nsmap={None: const.OPF2_NS}) oeb.metadata.to_opf2(package) - self.mi = ReadOPF(BytesIO(etree.tostring(package, encoding='utf-8')), populate_spine=False, try_to_guess_cover=False).to_book_metadata() + self.mi = opf_meta.OPF(io.BytesIO(etree.tostring(package, + encoding='utf-8')), + populate_spine=False, + try_to_guess_cover=False).to_book_metadata() def convert(self, oeb, output_path, input_plugin, opts, log): - from ebook_converter.ebooks.docx.writer.container import DOCX - from ebook_converter.ebooks.docx.writer.from_html import Convert docx = DOCX(opts, log) self.convert_metadata(oeb) - Convert(oeb, docx, self.mi, not opts.docx_no_cover, not opts.docx_no_toc)() + Convert(oeb, docx, self.mi, not opts.docx_no_cover, + not opts.docx_no_toc)() docx.write(output_path, self.mi) if opts.extract_to: - from ebook_converter.ebooks.docx.dump import do_dump do_dump(output_path, opts.extract_to) diff --git a/ebook_converter/ebooks/conversion/plugins/epub_input.py b/ebook_converter/ebooks/conversion/plugins/epub_input.py index 4316aa0..9056465 100644 --- a/ebook_converter/ebooks/conversion/plugins/epub_input.py +++ b/ebook_converter/ebooks/conversion/plugins/epub_input.py @@ -1,14 +1,19 @@ -import os, re, posixpath -from itertools import cycle +import hashlib +import itertools +import os +import re +import traceback +import uuid -from ebook_converter.customize.conversion import InputFormatPlugin, OptionRecommendation +from lxml import etree + +from ebook_converter.ebooks.metadata import opf2 as opf_meta +from 
ebook_converter.ebooks.oeb import base +from ebook_converter.customize.conversion import InputFormatPlugin +from ebook_converter.customize.conversion import OptionRecommendation -__license__ = 'GPL 3' -__copyright__ = '2009, Kovid Goyal ' -__docformat__ = 'restructuredtext en' - -ADOBE_OBFUSCATION = 'http://ns.adobe.com/pdf/enc#RC' +ADOBE_OBFUSCATION = 'http://ns.adobe.com/pdf/enc#RC' IDPF_OBFUSCATION = 'http://www.idpf.org/2008/embedding' @@ -16,8 +21,8 @@ def decrypt_font_data(key, data, algorithm): is_adobe = algorithm == ADOBE_OBFUSCATION crypt_len = 1024 if is_adobe else 1040 crypt = bytearray(data[:crypt_len]) - key = cycle(iter(bytearray(key))) - decrypt = bytes(bytearray(x^next(key) for x in crypt)) + key = itertools.cycle(iter(bytearray(key))) + decrypt = bytes(bytearray(x ^ next(key) for x in crypt)) return decrypt + data[crypt_len:] @@ -29,18 +34,16 @@ def decrypt_font(key, path, algorithm): class EPUBInput(InputFormatPlugin): - name = 'EPUB Input' - author = 'Kovid Goyal' + name = 'EPUB Input' + author = 'Kovid Goyal' description = 'Convert EPUB files (.epub) to HTML' - file_types = {'epub'} + file_types = {'epub'} output_encoding = None commit_name = 'epub_input' recommendations = {('page_breaks_before', '/', OptionRecommendation.MED)} def process_encryption(self, encfile, opf, log): - from lxml import etree - import uuid, hashlib idpf_key = opf.raw_unique_identifier if idpf_key: idpf_key = re.sub('[\u0020\u0009\u000d\u000a]', '', idpf_key) @@ -56,27 +59,28 @@ class EPUBInput(InputFormatPlugin): try: key = item.text.rpartition(':')[-1] key = uuid.UUID(key).bytes - except: - import traceback + except Exception: traceback.print_exc() key = None try: root = etree.parse(encfile) - for em in root.xpath('descendant::*[contains(name(), "EncryptionMethod")]'): + for em in root.xpath('descendant::*[contains(name(), ' + '"EncryptionMethod")]'): algorithm = em.get('Algorithm', '') if algorithm not in {ADOBE_OBFUSCATION, IDPF_OBFUSCATION}: return False - cr = 
em.getparent().xpath('descendant::*[contains(name(), "CipherReference")]')[0] + cr = em.getparent().xpath('descendant::*[contains(name(), ' + '"CipherReference")]')[0] uri = cr.get('URI') - path = os.path.abspath(os.path.join(os.path.dirname(encfile), '..', *uri.split('/'))) + path = os.path.abspath(os.path.join(os.path.dirname(encfile), + '..', *uri.split('/'))) tkey = (key if algorithm == ADOBE_OBFUSCATION else idpf_key) if (tkey and os.path.exists(path)): self._encrypted_font_uris.append(uri) decrypt_font(tkey, path, algorithm) return True - except: - import traceback + except Exception: traceback.print_exc() return False @@ -97,8 +101,11 @@ class EPUBInput(InputFormatPlugin): return t def rationalize_cover3(self, opf, log): - ''' If there is a reference to the cover/titlepage via manifest properties, convert to - entries in the so that the rest of the pipeline picks it up. ''' + """ + If there is a reference to the cover/titlepage via manifest + properties, convert to entries in the so that the rest of the + pipeline picks it up. + """ from ebook_converter.ebooks.metadata.opf3 import items_with_property removed = guide_titlepage_href = guide_titlepage_id = None @@ -128,7 +135,8 @@ class EPUBInput(InputFormatPlugin): titlepage_id, titlepage_href = tid, href.partition('#')[0] break if titlepage_href is None: - titlepage_href, titlepage_id = guide_titlepage_href, guide_titlepage_id + titlepage_href = guide_titlepage_href + titlepage_id = guide_titlepage_id if titlepage_href is not None: self.set_guide_type(opf, 'titlepage', titlepage_href, 'Title Page') spine = list(opf.iterspine()) @@ -148,7 +156,6 @@ class EPUBInput(InputFormatPlugin): means, at most one entry with type="cover" that points to a raster cover and at most one entry with type="titlepage" that points to an HTML titlepage. 
''' - from ebook_converter.ebooks.oeb.base import OPF removed = None from lxml import etree guide_cover, guide_elem = None, None @@ -160,12 +167,14 @@ class EPUBInput(InputFormatPlugin): raster_cover = opf.raster_cover if raster_cover: if guide_elem is None: - g = opf.root.makeelement(OPF('guide')) + g = opf.root.makeelement(base.tag('opf', 'guide')) opf.root.append(g) else: g = guide_elem.getparent() guide_cover = raster_cover - guide_elem = g.makeelement(OPF('reference'), attrib={'href':raster_cover, 'type':'cover'}) + guide_elem = g.makeelement(base.tag('opf', 'reference'), + attrib={'href': raster_cover, + 'type': 'cover'}) g.append(guide_elem) return spine = list(opf.iterspine()) @@ -186,7 +195,8 @@ class EPUBInput(InputFormatPlugin): # specially if not self.for_viewer: if len(spine) == 1: - log.warn('There is only a single spine item and it is marked as the cover. Removing cover marking.') + log.warn('There is only a single spine item and it is marked ' + 'as the cover. Removing cover marking.') for guide_elem in tuple(opf.iterguide()): if guide_elem.get('type', '').lower() == 'cover': guide_elem.getparent().remove(guide_elem) @@ -215,8 +225,9 @@ class EPUBInput(InputFormatPlugin): # Render the titlepage to create a raster cover from ebook_converter.ebooks import render_html_svg_workaround guide_elem.set('href', 'calibre_raster_cover.jpg') - t = etree.SubElement( - elem[0].getparent(), OPF('item'), href=guide_elem.get('href'), id='calibre_raster_cover') + t = etree.SubElement(elem[0].getparent(), base.tag('opf', 'item'), + href=guide_elem.get('href'), + id='calibre_raster_cover') t.set('media-type', 'image/jpeg') if os.path.exists(guide_cover): renderer = render_html_svg_workaround(guide_cover, log) @@ -229,17 +240,16 @@ class EPUBInput(InputFormatPlugin): return removed def find_opf(self): - from ebook_converter.utils.xml_parse import safe_xml_fromstring - def attr(n, attr): for k, v in n.attrib.items(): if k.endswith(attr): return v try: with 
open('META-INF/container.xml', 'rb') as f: - root = safe_xml_fromstring(f.read()) + root = etree.fromstring(f.read()) for r in root.xpath('//*[local-name()="rootfile"]'): - if attr(r, 'media-type') != "application/oebps-package+xml": + if (attr(r, 'media-type') != + "application/oebps-package+xml"): continue path = attr(r, 'full-path') if not path: @@ -248,20 +258,18 @@ class EPUBInput(InputFormatPlugin): if os.path.exists(path): return path except Exception: - import traceback traceback.print_exc() def convert(self, stream, options, file_ext, log, accelerators): from ebook_converter.utils.zipfile import ZipFile from ebook_converter import walk from ebook_converter.ebooks import DRMError - from ebook_converter.ebooks.metadata.opf2 import OPF try: zf = ZipFile(stream) zf.extractall(os.getcwd()) - except: + except Exception: log.exception('EPUB appears to be invalid ZIP file, trying a' - ' more forgiving ZIP parser') + ' more forgiving ZIP parser') from ebook_converter.utils.localunzip import extractall stream.seek(0) extractall(stream) @@ -276,11 +284,12 @@ class EPUBInput(InputFormatPlugin): path = getattr(stream, 'name', 'stream') if opf is None: - raise ValueError('%s is not a valid EPUB file (could not find opf)'%path) + raise ValueError('%s is not a valid EPUB file (could not find ' + 'opf)' % path) opf = os.path.relpath(opf, os.getcwd()) - parts = os.path.split(opf) - opf = OPF(opf, os.path.dirname(os.path.abspath(opf))) + # parts = os.path.split(opf) + opf = opf_meta.OPF(opf, os.path.dirname(os.path.abspath(opf))) self._encrypted_font_uris = [] if os.path.exists(encfile): @@ -288,18 +297,23 @@ class EPUBInput(InputFormatPlugin): raise DRMError(os.path.basename(path)) self.encrypted_fonts = self._encrypted_font_uris - if len(parts) > 1 and parts[0]: - delta = '/'.join(parts[:-1])+'/' + # XXX(gryf): this code would fail pretty ugly, thus, this part was + # never used. 
+ # if len(parts) > 1 and parts[0]: + # delta = '/'.join(parts[:-1])+'/' - def normpath(x): - return posixpath.normpath(delta + elem.get('href')) + # def normpath(x): + # return posixpath.normpath(delta + elem.get('href')) - for elem in opf.itermanifest(): - elem.set('href', normpath(elem.get('href'))) - for elem in opf.iterguide(): - elem.set('href', normpath(elem.get('href'))) + # for elem in opf.itermanifest(): + # elem.set('href', normpath(elem.get('href'))) + # for elem in opf.iterguide(): + # elem.set('href', normpath(elem.get('href'))) - f = self.rationalize_cover3 if opf.package_version >= 3.0 else self.rationalize_cover2 + if opf.package_version >= 3.0: + f = self.rationalize_cover3 + else: + f = self.rationalize_cover2 self.removed_cover = f(opf, log) if self.removed_cover: self.removed_items_to_ignore = (self.removed_cover,) @@ -352,15 +366,18 @@ class EPUBInput(InputFormatPlugin): from lxml import etree from ebook_converter.ebooks.chardet import xml_to_unicode from ebook_converter.ebooks.oeb.polish.parsing import parse - from ebook_converter.ebooks.oeb.base import EPUB_NS, XHTML, NCX_MIME, NCX, urlnormalize, urlunquote, serialize + from ebook_converter.ebooks.oeb.base import EPUB_NS, XHTML, NCX_MIME, \ + NCX, urlnormalize, urlunquote, serialize from ebook_converter.ebooks.oeb.polish.toc import first_child - from ebook_converter.utils.xml_parse import safe_xml_fromstring from tempfile import NamedTemporaryFile with open(nav_path, 'rb') as f: raw = f.read() - raw = xml_to_unicode(raw, strip_encoding_pats=True, assume_utf8=True)[0] + raw = xml_to_unicode(raw, strip_encoding_pats=True, + assume_utf8=True)[0] root = parse(raw, log=log) - ncx = safe_xml_fromstring('') + ncx = etree.fromstring('' + '') navmap = ncx[0] et = '{%s}type' % EPUB_NS bn = os.path.basename(nav_path) @@ -368,8 +385,8 @@ class EPUBInput(InputFormatPlugin): def add_from_li(li, parent): href = text = None for x in li.iterchildren(XHTML('a'), XHTML('span')): - text = etree.tostring( - x, 
method='text', encoding='unicode', with_tail=False).strip() or ' '.join( + text = etree.tostring(x, method='text', encoding='unicode', + with_tail=False).strip() or ' '.join( x.xpath('descendant-or-self::*/@title')).strip() href = x.get('href') if href: @@ -382,7 +399,7 @@ class EPUBInput(InputFormatPlugin): np[0].append(np.makeelement(NCX('text'))) np[0][0].text = text if href: - np.append(np.makeelement(NCX('content'), attrib={'src':href})) + np.append(np.makeelement(NCX('content'), attrib={'src': href})) return np def process_nav_node(node, toc_parent): @@ -401,20 +418,25 @@ class EPUBInput(InputFormatPlugin): else: return - with NamedTemporaryFile(suffix='.ncx', dir=os.path.dirname(nav_path), delete=False) as f: + with NamedTemporaryFile(suffix='.ncx', dir=os.path.dirname(nav_path), + delete=False) as f: f.write(etree.tostring(ncx, encoding='utf-8')) ncx_href = os.path.relpath(f.name, os.getcwd()).replace(os.sep, '/') - ncx_id = opf.create_manifest_item(ncx_href, NCX_MIME, append=True).get('id') + ncx_id = opf.create_manifest_item(ncx_href, NCX_MIME, + append=True).get('id') for spine in opf.root.xpath('//*[local-name()="spine"]'): spine.set('toc', ncx_id) - opts.epub3_nav_href = urlnormalize(os.path.relpath(nav_path).replace(os.sep, '/')) + url = os.path.relpath(nav_path).replace(os.sep, '/') + opts.epub3_nav_href = urlnormalize(url) opts.epub3_nav_parsed = root if getattr(self, 'removed_cover', None): changed = False base_path = os.path.dirname(nav_path) for elem in root.xpath('//*[@href]'): href, frag = elem.get('href').partition('#')[::2] - link_path = os.path.relpath(os.path.join(base_path, urlunquote(href)), base_path) + link_path = os.path.relpath(os.path.join(base_path, + urlunquote(href)), + base_path) abs_href = urlnormalize(link_path) if abs_href == self.removed_cover: changed = True diff --git a/ebook_converter/ebooks/conversion/plugins/epub_output.py b/ebook_converter/ebooks/conversion/plugins/epub_output.py index 9f522d7..df7c917 100644 --- 
a/ebook_converter/ebooks/conversion/plugins/epub_output.py +++ b/ebook_converter/ebooks/conversion/plugins/epub_output.py @@ -2,7 +2,11 @@ import os import re import shutil import urllib.parse +import uuid +from ebook_converter import constants as const +from ebook_converter.ebooks.oeb import base +from ebook_converter.ebooks.oeb import parse_utils from ebook_converter.customize.conversion import OutputFormatPlugin from ebook_converter.customize.conversion import OptionRecommendation @@ -132,39 +136,37 @@ class EPUBOutput(OutputFormatPlugin): recommendations = {('pretty_print', True, OptionRecommendation.HIGH)} def workaround_webkit_quirks(self): # {{{ - from ebook_converter.ebooks.oeb.base import XPath for x in self.oeb.spine: root = x.data - body = XPath('//h:body')(root) + body = base.XPath('//h:body')(root) if body: body = body[0] if not hasattr(body, 'xpath'): continue - for pre in XPath('//h:pre')(body): + for pre in base.XPath('//h:pre')(body): if not pre.text and len(pre) == 0: pre.tag = 'div' # }}} def upshift_markup(self): # {{{ 'Upgrade markup to comply with XHTML 1.1 where possible' - from ebook_converter.ebooks.oeb.base import XPath, XML for x in self.oeb.spine: root = x.data - if (not root.get(XML('lang'))) and (root.get('lang')): - root.set(XML('lang'), root.get('lang')) - body = XPath('//h:body')(root) + if (not root.get(base.tag('xml', 'lang'))) and (root.get('lang')): + root.set(base.tag('xml', 'lang'), root.get('lang')) + body = base.XPath('//h:body')(root) if body: body = body[0] if not hasattr(body, 'xpath'): continue - for u in XPath('//h:u')(root): + for u in base.XPath('//h:u')(root): u.tag = 'span' seen_ids, seen_names = set(), set() - for x in XPath('//*[@id or @name]')(root): + for x in base.XPath('//*[@id or @name]')(root): eid, name = x.get('id', None), x.get('name', None) if eid: if eid in seen_ids: @@ -223,28 +225,27 @@ class EPUBOutput(OutputFormatPlugin): first = next(iter(self.oeb.spine)) self.oeb.toc.add('Start', first.href) - 
from ebook_converter.ebooks.oeb.base import OPF identifiers = oeb.metadata['identifier'] - uuid = None + _uuid = None for x in identifiers: - if x.get(OPF('scheme'), None).lower() == 'uuid' or str(x).startswith('urn:uuid:'): - uuid = str(x).split(':')[-1] + if (x.get(base.tag('opf', 'scheme'), None).lower() == 'uuid' or + str(x).startswith('urn:uuid:')): + _uuid = str(x).split(':')[-1] break encrypted_fonts = getattr(input_plugin, 'encrypted_fonts', []) - if uuid is None: + if _uuid is None: self.log.warn('No UUID identifier found') - from uuid import uuid4 - uuid = str(uuid4()) - oeb.metadata.add('identifier', uuid, scheme='uuid', id=uuid) + _uuid = str(uuid.uuid4()) + oeb.metadata.add('identifier', _uuid, scheme='uuid', id=_uuid) - if encrypted_fonts and not uuid.startswith('urn:uuid:'): + if encrypted_fonts and not _uuid.startswith('urn:uuid:'): # Apparently ADE requires this value to start with urn:uuid: # for some absurd reason, or it will throw a hissy fit and refuse # to use the obfuscated fonts. 
for x in identifiers: - if str(x) == uuid: - x.content = 'urn:uuid:'+uuid + if str(x) == _uuid: + x.content = 'urn:uuid:' + _uuid with TemporaryDirectory('_epub_output') as tdir: from ebook_converter.customize.ui import plugin_for_output_format @@ -264,7 +265,7 @@ class EPUBOutput(OutputFormatPlugin): self.upgrade_to_epub3(tdir, opf) encryption = None if encrypted_fonts: - encryption = self.encrypt_fonts(encrypted_fonts, tdir, uuid) + encryption = self.encrypt_fonts(encrypted_fonts, tdir, _uuid) from ebook_converter.ebooks.epub import initialize_container with initialize_container(output_path, os.path.basename(opf), @@ -312,12 +313,12 @@ class EPUBOutput(OutputFormatPlugin): except EnvironmentError: pass - def encrypt_fonts(self, uris, tdir, uuid): # {{{ + def encrypt_fonts(self, uris, tdir, _uuid): # {{{ from ebook_converter.polyglot.binary import from_hex_bytes - key = re.sub(r'[^a-fA-F0-9]', '', uuid) + key = re.sub(r'[^a-fA-F0-9]', '', _uuid) if len(key) < 16: - raise ValueError('UUID identifier %r is invalid'%uuid) + raise ValueError('UUID identifier %r is invalid'% _uuid) key = bytearray(from_hex_bytes((key + key)[:32])) paths = [] with CurrentDir(tdir): @@ -335,7 +336,8 @@ class EPUBOutput(OutputFormatPlugin): if len(data) >= 1024: data = bytearray(data) f.seek(0) - f.write(bytes(bytearray(data[i] ^ key[i%16] for i in range(1024)))) + f.write(bytes(bytearray(data[i] ^ key[i%16] + for i in range(1024)))) else: self.log.warn('Font', path, 'is invalid, ignoring') if not isinstance(uri, str): @@ -374,11 +376,10 @@ class EPUBOutput(OutputFormatPlugin): # }}} def workaround_ade_quirks(self): # {{{ - ''' + """ Perform various markup transforms to get the output to render correctly in the quirky ADE. 
- ''' - from ebook_converter.ebooks.oeb.base import XPath, XHTML, barename, urlunquote + """ stylesheet = self.oeb.manifest.main_stylesheet @@ -388,23 +389,23 @@ class EPUBOutput(OutputFormatPlugin): for node in self.oeb.toc.iter(): href = getattr(node, 'href', None) if hasattr(href, 'partition'): - base, _, frag = href.partition('#') - frag = urlunquote(frag) + _base, _, frag = href.partition('#') + frag = base.urlunquote(frag) if frag and frag_pat.match(frag) is None: self.log.warn( 'Removing fragment identifier %r from TOC as Adobe Digital Editions cannot handle it'%frag) - node.href = base + node.href = _base for x in self.oeb.spine: root = x.data - body = XPath('//h:body')(root) + body = base.XPath('//h:body')(root) if body: body = body[0] if hasattr(body, 'xpath'): # remove tags with empty src elements bad = [] - for x in XPath('//h:img')(body): + for x in base.XPath('//h:img')(body): src = x.get('src', '').strip() if src in ('', '#') or src.startswith('http:'): bad.append(x) @@ -412,7 +413,7 @@ class EPUBOutput(OutputFormatPlugin): img.getparent().remove(img) # Add id attribute to tags that have name - for x in XPath('//h:a[@name]')(body): + for x in base.XPath('//h:a[@name]')(body): if not x.get('id', False): x.set('id', x.get('name')) # The delightful epubcheck has started complaining about tags that @@ -420,19 +421,19 @@ class EPUBOutput(OutputFormatPlugin): x.attrib.pop('name') # Replace
that are children of as ADE doesn't handle them - for br in XPath('./h:br')(body): + for br in base.XPath('./h:br')(body): if br.getparent() is None: continue try: prior = next(br.itersiblings(preceding=True)) - priortag = barename(prior.tag) + priortag = parse_utils.barename(prior.tag) priortext = prior.tail except: priortag = 'body' priortext = body.text if priortext: priortext = priortext.strip() - br.tag = XHTML('p') + br.tag = base.tag('xhtml', 'p') br.text = '\u00a0' style = br.get('style', '').split(';') style = list(filter(None, map(lambda x: x.strip(), style))) @@ -446,44 +447,44 @@ class EPUBOutput(OutputFormatPlugin): style.append('height:0pt') br.set('style', '; '.join(style)) - for tag in XPath('//h:embed')(root): + for tag in base.XPath('//h:embed')(root): tag.getparent().remove(tag) - for tag in XPath('//h:object')(root): + for tag in base.XPath('//h:object')(root): if tag.get('type', '').lower().strip() in {'image/svg+xml', 'application/svg+xml'}: continue tag.getparent().remove(tag) - for tag in XPath('//h:title|//h:style')(root): + for tag in base.XPath('//h:title|//h:style')(root): if not tag.text: tag.getparent().remove(tag) - for tag in XPath('//h:script')(root): + for tag in base.XPath('//h:script')(root): if (not tag.text and not tag.get('src', False) and tag.get('type', None) != 'text/x-mathjax-config'): tag.getparent().remove(tag) - for tag in XPath('//h:body/descendant::h:script')(root): + for tag in base.XPath('//h:body/descendant::h:script')(root): tag.getparent().remove(tag) - formchildren = XPath('./h:input|./h:button|./h:textarea|' + formchildren = base.XPath('./h:input|./h:button|./h:textarea|' './h:label|./h:fieldset|./h:legend') - for tag in XPath('//h:form')(root): + for tag in base.XPath('//h:form')(root): if formchildren(tag): tag.getparent().remove(tag) else: # Not a real form - tag.tag = XHTML('div') + tag.tag = base.tag('xhtml', 'div') - for tag in XPath('//h:center')(root): - tag.tag = XHTML('div') + for tag in 
base.XPath('//h:center')(root): + tag.tag = base.tag('xhtml', 'div') tag.set('style', 'text-align:center') # ADE can't handle & in an img url - for tag in XPath('//h:img[@src]')(root): + for tag in base.XPath('//h:img[@src]')(root): tag.set('src', tag.get('src', '').replace('&', '')) # ADE whimpers in fright when it encounters a outside a # - in_table = XPath('ancestor::h:table') - for tag in XPath('//h:td|//h:tr|//h:th')(root): + in_table = base.XPath('ancestor::h:table') + for tag in base.XPath('//h:td|//h:tr|//h:th')(root): if not in_table(tag): - tag.tag = XHTML('div') + tag.tag = base.tag('xhtml', 'div') # ADE fails to render non breaking hyphens/soft hyphens/zero width spaces special_chars = re.compile('[\u200b\u00ad]') @@ -498,7 +499,7 @@ class EPUBOutput(OutputFormatPlugin): if stylesheet is not None: # ADE doesn't render lists correctly if they have left margins from css_parser.css import CSSRule - for lb in XPath('//h:ul[@class]|//h:ol[@class]')(root): + for lb in base.XPath('//h:ul[@class]|//h:ol[@class]')(root): sel = '.'+lb.get('class') for rule in stylesheet.data.cssRules.rulesOfType(CSSRule.STYLE_RULE): if sel == rule.selectorList.selectorText: @@ -519,11 +520,10 @@ class EPUBOutput(OutputFormatPlugin): ''' Perform toc link transforms to alleviate slow loading. 
''' - from ebook_converter.ebooks.oeb.base import XPath from ebook_converter.ebooks.oeb.polish.toc import item_at_top def frag_is_at_top(root, frag): - elem = XPath('//*[@id="%s" or @name="%s"]'%(frag, frag))(root) + elem = base.XPath('//*[@id="%s" or @name="%s"]'%(frag, frag))(root) if elem: elem = elem[0] else: diff --git a/ebook_converter/ebooks/conversion/plugins/fb2_input.py b/ebook_converter/ebooks/conversion/plugins/fb2_input.py index c84ea79..62f7b86 100644 --- a/ebook_converter/ebooks/conversion/plugins/fb2_input.py +++ b/ebook_converter/ebooks/conversion/plugins/fb2_input.py @@ -1,59 +1,57 @@ """ Convert .fb2 files to .lrf """ -import os, re +import os import pkg_resources +import re -from ebook_converter.customize.conversion import InputFormatPlugin, OptionRecommendation +from lxml import etree + +from ebook_converter import constants as const +from ebook_converter.customize.conversion import InputFormatPlugin +from ebook_converter.customize.conversion import OptionRecommendation from ebook_converter import guess_type -__license__ = 'GPL v3' -__copyright__ = '2008, Anatoly Shipitsin ' - -FB2NS = 'http://www.gribuser.ru/xml/fictionbook/2.0' +FB2NS = 'http://www.gribuser.ru/xml/fictionbook/2.0' FB21NS = 'http://www.gribuser.ru/xml/fictionbook/2.1' class FB2Input(InputFormatPlugin): - name = 'FB2 Input' - author = 'Anatoly Shipitsin' + name = 'FB2 Input' + author = 'Anatoly Shipitsin' description = 'Convert FB2 and FBZ files to HTML' - file_types = {'fb2', 'fbz'} + file_types = {'fb2', 'fbz'} commit_name = 'fb2_input' - recommendations = { - ('level1_toc', '//h:h1', OptionRecommendation.MED), - ('level2_toc', '//h:h2', OptionRecommendation.MED), - ('level3_toc', '//h:h3', OptionRecommendation.MED), - } + recommendations = {('level1_toc', '//h:h1', OptionRecommendation.MED), + ('level2_toc', '//h:h2', OptionRecommendation.MED), + ('level3_toc', '//h:h3', OptionRecommendation.MED)} - options = { - OptionRecommendation(name='no_inline_fb2_toc', - 
recommended_value=False, level=OptionRecommendation.LOW, - help='Do not insert a Table of Contents at the beginning of the book.' - )} + options = {OptionRecommendation(name='no_inline_fb2_toc', + recommended_value=False, + level=OptionRecommendation.LOW, + help='Do not insert a Table of Contents ' + 'at the beginning of the book.')} def convert(self, stream, options, file_ext, log, accelerators): - from lxml import etree - from ebook_converter.utils.xml_parse import safe_xml_fromstring - from ebook_converter.ebooks.metadata.fb2 import ensure_namespace, get_fb2_data + from ebook_converter.ebooks.metadata.fb2 import ensure_namespace + from ebook_converter.ebooks.metadata.fb2 import get_fb2_data from ebook_converter.ebooks.metadata.opf2 import OPFCreator from ebook_converter.ebooks.metadata.meta import get_metadata - from ebook_converter.ebooks.oeb.base import XLINK_NS, XHTML_NS from ebook_converter.ebooks.chardet import xml_to_unicode self.log = log log.debug('Parsing XML...') raw = get_fb2_data(stream)[0] raw = raw.replace(b'\0', b'') raw = xml_to_unicode(raw, strip_encoding_pats=True, - assume_utf8=True, resolve_entities=True)[0] + assume_utf8=True, resolve_entities=True)[0] try: - doc = safe_xml_fromstring(raw) + doc = etree.fromstring(raw) except etree.XMLSyntaxError: - doc = safe_xml_fromstring(raw.replace('& ', '&')) + doc = etree.fromstring(raw.replace('& ', '&')) if doc is None: raise ValueError('The FB2 file is not valid XML') doc = ensure_namespace(doc) @@ -62,22 +60,24 @@ class FB2Input(InputFormatPlugin): except Exception: fb_ns = FB2NS - NAMESPACES = {'f':fb_ns, 'l':XLINK_NS} - stylesheets = doc.xpath('//*[local-name() = "stylesheet" and @type="text/css"]') + NAMESPACES = {'f': fb_ns, 'l': const.XLINK_NS} + stylesheets = doc.xpath('//*[local-name() = "stylesheet" and ' + '@type="text/css"]') css = '' for s in stylesheets: css += etree.tostring(s, encoding='unicode', method='text', - with_tail=False) + '\n\n' + with_tail=False) + '\n\n' if css: - import 
css_parser, logging + import css_parser + import logging parser = css_parser.CSSParser(fetcher=None, - log=logging.getLogger('calibre.css')) + log=logging.getLogger('calibre.css')) - XHTML_CSS_NAMESPACE = '@namespace "%s";\n' % XHTML_NS + XHTML_CSS_NAMESPACE = '@namespace "%s";\n' % const.XHTML_NS text = XHTML_CSS_NAMESPACE + css log.debug('Parsing stylesheet...') stylesheet = parser.parseString(text) - stylesheet.namespaces['h'] = XHTML_NS + stylesheet.namespaces['h'] = const.XHTML_NS css = stylesheet.cssText if isinstance(css, bytes): css = css.decode('utf-8', 'replace') @@ -92,16 +92,20 @@ class FB2Input(InputFormatPlugin): if options.no_inline_fb2_toc: log('Disabling generation of inline FB2 TOC') ss = re.compile(r'.*', - re.DOTALL).sub('', ss) + re.DOTALL).sub('', ss) - styledoc = safe_xml_fromstring(ss) + styledoc = etree.fromstring(ss) transform = etree.XSLT(styledoc) result = transform(doc) # Handle links of type note and cite - notes = {a.get('href')[1:]: a for a in result.xpath('//a[@link_note and @href]') if a.get('href').startswith('#')} - cites = {a.get('link_cite'): a for a in result.xpath('//a[@link_cite]') if not a.get('href', '')} + notes = {a.get('href')[1:]: a + for a in result.xpath('//a[@link_note and @href]') + if a.get('href').startswith('#')} + cites = {a.get('link_cite'): a + for a in result.xpath('//a[@link_cite]') + if not a.get('href', '')} all_ids = {x for x in result.xpath('//*/@id')} for cite, a in cites.items(): note = notes.get(cite, None) @@ -137,8 +141,10 @@ class FB2Input(InputFormatPlugin): f.write(mi.cover_data[1]) cpath = os.path.abspath('fb2_cover_calibre_mi.jpg') else: - for img in doc.xpath('//f:coverpage/f:image', namespaces=NAMESPACES): - href = img.get('{%s}href'%XLINK_NS, img.get('href', None)) + for img in doc.xpath('//f:coverpage/f:image', + namespaces=NAMESPACES): + href = img.get('{%s}href' % const.XLINK_NS, + img.get('href', None)) if href is not None: if href.startswith('#'): href = href[1:] @@ -165,15 +171,15 @@ 
class FB2Input(InputFormatPlugin): ext = ct.rpartition('/')[-1].lower() if ext in ('png', 'jpeg', 'jpg'): if fname.lower().rpartition('.')[-1] not in {'jpg', 'jpeg', - 'png'}: + 'png'}: fname += '.' + ext self.binary_map[elem.get('id')] = fname raw = elem.text.strip() try: data = base64_decode(raw) except TypeError: - self.log.exception('Binary data with id=%s is corrupted, ignoring'%( - elem.get('id'))) + self.log.exception('Binary data with id=%s is corrupted, ' + 'ignoring' % elem.get('id')) else: with open(fname, 'wb') as f: f.write(data) diff --git a/ebook_converter/ebooks/conversion/plugins/lit_input.py b/ebook_converter/ebooks/conversion/plugins/lit_input.py index 8fbe8ce..446af67 100644 --- a/ebook_converter/ebooks/conversion/plugins/lit_input.py +++ b/ebook_converter/ebooks/conversion/plugins/lit_input.py @@ -1,17 +1,17 @@ +import copy + +from lxml import etree + +from ebook_converter import constants as const from ebook_converter.customize.conversion import InputFormatPlugin -__license__ = 'GPL v3' -__copyright__ = '2009, Kovid Goyal ' -__docformat__ = 'restructuredtext en' - - class LITInput(InputFormatPlugin): - name = 'LIT Input' - author = 'Marshall T. Vandegrift' + name = 'LIT Input' + author = 'Marshall T. 
Vandegrift' description = 'Convert LIT files to HTML' - file_types = {'lit'} + file_types = {'lit'} commit_name = 'lit_input' def convert(self, stream, options, file_ext, log, @@ -22,7 +22,7 @@ class LITInput(InputFormatPlugin): return create_oebbook(log, stream, options, reader=LitReader) def postprocess_book(self, oeb, opts, log): - from ebook_converter.ebooks.oeb.base import XHTML_NS, XPath, XHTML + from ebook_converter.ebooks.oeb.base import XPath, XHTML for item in oeb.spine: root = item.data if not hasattr(root, 'xpath'): @@ -37,22 +37,23 @@ class LITInput(InputFormatPlugin): body = body[0] if len(body) == 1 and body[0].tag == XHTML('pre'): pre = body[0] - from ebook_converter.ebooks.txt.processor import convert_basic, \ - separate_paragraphs_single_line + from ebook_converter.ebooks.txt.processor import \ + convert_basic, separate_paragraphs_single_line from ebook_converter.ebooks.chardet import xml_to_unicode - from ebook_converter.utils.xml_parse import safe_xml_fromstring - import copy - self.log('LIT file with all text in singe
 tag detected')
+                    self.log('LIT file with all text in singe 
 tag '
+                             'detected')
                     html = separate_paragraphs_single_line(pre.text)
                     html = convert_basic(html).replace('',
-                            ''%XHTML_NS)
+                                                       '' %
+                                                       const.XHTML_NS)
                     html = xml_to_unicode(html, strip_encoding_pats=True,
-                            resolve_entities=True)[0]
+                                          resolve_entities=True)[0]
                     if opts.smarten_punctuation:
                         # SmartyPants skips text inside 
 tags
-                        from ebook_converter.ebooks.conversion.preprocess import smarten_punctuation
-                        html = smarten_punctuation(html, self.log)
-                    root = safe_xml_fromstring(html)
+                        from ebook_converter.ebooks.conversion import \
+                                preprocess
+                        html = preprocess.smarten_punctuation(html, self.log)
+                    root = etree.fromstring(html)
                     body = XPath('//h:body')(root)
                     pre.tag = XHTML('div')
                     pre.text = ''
diff --git a/ebook_converter/ebooks/conversion/plugins/lrf_input.py b/ebook_converter/ebooks/conversion/plugins/lrf_input.py
index 729c3b8..6f51f98 100644
--- a/ebook_converter/ebooks/conversion/plugins/lrf_input.py
+++ b/ebook_converter/ebooks/conversion/plugins/lrf_input.py
@@ -1,54 +1,52 @@
-import os, sys
+import os
+import sys
 import pkg_resources
 
+from lxml import etree
+
 from ebook_converter.customize.conversion import InputFormatPlugin
 
 
-__license__ = 'GPL v3'
-__copyright__ = '2009, Kovid Goyal '
-__docformat__ = 'restructuredtext en'
-
-
 class LRFInput(InputFormatPlugin):
 
-    name        = 'LRF Input'
-    author      = 'Kovid Goyal'
+    name = 'LRF Input'
+    author = 'Kovid Goyal'
     description = 'Convert LRF files to HTML'
-    file_types  = {'lrf'}
+    file_types = {'lrf'}
     commit_name = 'lrf_input'
 
     def convert(self, stream, options, file_ext, log,
                 accelerators):
-        from ebook_converter.ebooks.lrf.input import (MediaType, Styles, TextBlock,
-                Canvas, ImageBlock, RuledLine)
+        from ebook_converter.ebooks.lrf.input import MediaType, Styles, \
+                TextBlock, Canvas, ImageBlock, RuledLine
         self.log = log
         self.log('Generating XML')
         from ebook_converter.ebooks.lrf.lrfparser import LRFDocument
-        from ebook_converter.utils.xml_parse import safe_xml_fromstring
-        from lxml import etree
         d = LRFDocument(stream)
         d.parse()
         xml = d.to_xml(write_files=True)
         if options.verbose > 2:
             open(u'lrs.xml', 'wb').write(xml.encode('utf-8'))
-        doc = safe_xml_fromstring(xml)
+        doc = etree.fromstring(xml)
 
         char_button_map = {}
         for x in doc.xpath('//CharButton[@refobj]'):
             ro = x.get('refobj')
-            jump_button = doc.xpath('//*[@objid="%s"]'%ro)
+            jump_button = doc.xpath('//*[@objid="%s"]' % ro)
             if jump_button:
-                jump_to = jump_button[0].xpath('descendant::JumpTo[@refpage and @refobj]')
+                jump_to = jump_button[0].xpath('descendant::JumpTo[@refpage '
+                                               'and @refobj]')
                 if jump_to:
-                    char_button_map[ro] = '%s.xhtml#%s'%(jump_to[0].get('refpage'),
-                            jump_to[0].get('refobj'))
+                    char_button_map[ro] = ('%s.xhtml#%s' %
+                                           (jump_to[0].get('refpage'),
+                                            jump_to[0].get('refobj')))
         plot_map = {}
         for x in doc.xpath('//Plot[@refobj]'):
             ro = x.get('refobj')
-            image = doc.xpath('//Image[@objid="%s" and @refstream]'%ro)
+            image = doc.xpath('//Image[@objid="%s" and @refstream]' % ro)
             if image:
-                imgstr = doc.xpath('//ImageStream[@objid="%s" and @file]'%
-                    image[0].get('refstream'))
+                imgstr = doc.xpath('//ImageStream[@objid="%s" and @file]' %
+                                   image[0].get('refstream'))
                 if imgstr:
                     plot_map[ro] = imgstr[0].get('file')
 
@@ -58,21 +56,19 @@ class LRFInput(InputFormatPlugin):
                   resource_filename('ebook_converter',
                                     'data/lrf.xsl')) as fobj:
             # TODO(gryf): change this nonsense to etree.parse() instead.
-            styledoc = safe_xml_fromstring(fobj.read())
+            styledoc = etree.fromstring(fobj.read())
         media_type = MediaType()
         styles = Styles()
         text_block = TextBlock(styles, char_button_map, plot_map, log)
         canvas = Canvas(doc, styles, text_block, log)
         image_block = ImageBlock(canvas)
         ruled_line = RuledLine()
-        extensions = {
-                ('calibre', 'media-type') : media_type,
-                ('calibre', 'text-block') : text_block,
-                ('calibre', 'ruled-line') : ruled_line,
-                ('calibre', 'styles')     : styles,
-                ('calibre', 'canvas')     : canvas,
-                ('calibre', 'image-block'): image_block,
-                }
+        extensions = {('calibre', 'media-type'): media_type,
+                      ('calibre', 'text-block'): text_block,
+                      ('calibre', 'ruled-line'): ruled_line,
+                      ('calibre', 'styles'): styles,
+                      ('calibre', 'canvas'): canvas,
+                      ('calibre', 'image-block'): image_block}
         transform = etree.XSLT(styledoc, extensions=extensions)
         try:
             result = transform(doc)
diff --git a/ebook_converter/ebooks/conversion/plugins/rtf_input.py b/ebook_converter/ebooks/conversion/plugins/rtf_input.py
index 3c4192d..5d36fee 100644
--- a/ebook_converter/ebooks/conversion/plugins/rtf_input.py
+++ b/ebook_converter/ebooks/conversion/plugins/rtf_input.py
@@ -1,57 +1,58 @@
-import os, glob, re, textwrap
+import glob
+import os
 import pkg_resources
+import re
+import textwrap
 
-from ebook_converter.customize.conversion import InputFormatPlugin, OptionRecommendation
+from lxml import etree
+
+from ebook_converter.customize.conversion import InputFormatPlugin
+from ebook_converter.customize.conversion import OptionRecommendation
 from ebook_converter.polyglot.builtins import as_bytes
 
-__license__ = 'GPL v3'
-__copyright__ = '2008, Kovid Goyal '
 
-border_style_map = {
-        'single' : 'solid',
-        'double-thickness-border' : 'double',
-        'shadowed-border': 'outset',
-        'double-border': 'double',
-        'dotted-border': 'dotted',
-        'dashed': 'dashed',
-        'hairline': 'solid',
-        'inset': 'inset',
-        'dash-small': 'dashed',
-        'dot-dash': 'dotted',
-        'dot-dot-dash': 'dotted',
-        'outset': 'outset',
-        'tripple': 'double',
-        'triple': 'double',
-        'thick-thin-small': 'solid',
-        'thin-thick-small': 'solid',
-        'thin-thick-thin-small': 'solid',
-        'thick-thin-medium': 'solid',
-        'thin-thick-medium': 'solid',
-        'thin-thick-thin-medium': 'solid',
-        'thick-thin-large': 'solid',
-        'thin-thick-thin-large': 'solid',
-        'wavy': 'ridge',
-        'double-wavy': 'ridge',
-        'striped': 'ridge',
-        'emboss': 'inset',
-        'engrave': 'inset',
-        'frame': 'ridge',
-}
+border_style_map = {'single': 'solid',
+                    'double-thickness-border': 'double',
+                    'shadowed-border': 'outset',
+                    'double-border': 'double',
+                    'dotted-border': 'dotted',
+                    'dashed': 'dashed',
+                    'hairline': 'solid',
+                    'inset': 'inset',
+                    'dash-small': 'dashed',
+                    'dot-dash': 'dotted',
+                    'dot-dot-dash': 'dotted',
+                    'outset': 'outset',
+                    'tripple': 'double',
+                    'triple': 'double',
+                    'thick-thin-small': 'solid',
+                    'thin-thick-small': 'solid',
+                    'thin-thick-thin-small': 'solid',
+                    'thick-thin-medium': 'solid',
+                    'thin-thick-medium': 'solid',
+                    'thin-thick-thin-medium': 'solid',
+                    'thick-thin-large': 'solid',
+                    'thin-thick-thin-large': 'solid',
+                    'wavy': 'ridge',
+                    'double-wavy': 'ridge',
+                    'striped': 'ridge',
+                    'emboss': 'inset',
+                    'engrave': 'inset',
+                    'frame': 'ridge'}
 
 
 class RTFInput(InputFormatPlugin):
 
-    name        = 'RTF Input'
-    author      = 'Kovid Goyal'
+    name = 'RTF Input'
+    author = 'Kovid Goyal'
     description = 'Convert RTF files to HTML'
-    file_types  = {'rtf'}
+    file_types = {'rtf'}
     commit_name = 'rtf_input'
 
-    options = {
-        OptionRecommendation(name='ignore_wmf', recommended_value=False,
-            help='Ignore WMF images instead of replacing them with a '
-                 'placeholder image.'),
-    }
+    options = {OptionRecommendation(name='ignore_wmf', recommended_value=False,
+                                    help='Ignore WMF images instead of '
+                                    'replacing them with a placeholder '
+                                    'image.')}
 
     def generate_xml(self, stream):
         from ebook_converter.ebooks.rtf2xml.ParseRtf import ParseRtf
@@ -64,7 +65,7 @@ class RTFInput(InputFormatPlugin):
                 run_lev = 4
                 indent_out = 1
                 self.log('Running RTFParser in debug mode')
-            except:
+            except Exception:
                 self.log.warn('Impossible to run RTFParser in debug mode')
         parser = ParseRtf(
             in_file=stream,
@@ -108,7 +109,8 @@ class RTFInput(InputFormatPlugin):
             deb_dir=debug_dir,
 
             # Default encoding
-            default_encoding=getattr(self.opts, 'input_encoding', 'cp1252') or 'cp1252',
+            default_encoding=getattr(self.opts, 'input_encoding',
+                                     'cp1252') or 'cp1252',
 
             # Run level
             run_level=run_lev,
@@ -151,7 +153,7 @@ class RTFInput(InputFormatPlugin):
         for count, val in imap.items():
             try:
                 imap[count] = self.convert_image(val)
-            except:
+            except Exception:
                 self.log.exception('Failed to convert', val)
         return imap
 
@@ -161,7 +163,7 @@ class RTFInput(InputFormatPlugin):
         try:
             return self.rasterize_wmf(name)
         except Exception:
-            self.log.exception('Failed to convert WMF image %r'%name)
+            self.log.exception('Failed to convert WMF image %r' % name)
         return self.replace_wmf(name)
 
     def replace_wmf(self, name):
@@ -170,9 +172,11 @@ class RTFInput(InputFormatPlugin):
             return '__REMOVE_ME__'
         from ebook_converter.ebooks.covers import message_image
         if self.default_img is None:
-            self.default_img = message_image('Conversion of WMF images is not supported.'
-            ' Use Microsoft Word or OpenOffice to save this RTF file'
-            ' as HTML and convert that in calibre.')
+            self.default_img = message_image('Conversion of WMF images is not '
+                                             'supported. Use Microsoft Word '
+                                             'or OpenOffice to save this RTF '
+                                             'file as HTML and convert that '
+                                             'in calibre.')
         name = name.replace('.wmf', '.jpg')
         with open(name, 'wb') as f:
             f.write(self.default_img)
@@ -189,10 +193,10 @@ class RTFInput(InputFormatPlugin):
         return name
 
     def write_inline_css(self, ic, border_styles):
-        font_size_classes = ['span.fs%d { font-size: %spt }'%(i, x) for i, x in
-                enumerate(ic.font_sizes)]
-        color_classes = ['span.col%d { color: %s }'%(i, x) for i, x in
-                enumerate(ic.colors) if x != 'false']
+        font_size_classes = ['span.fs%d { font-size: %spt }' % (i, x)
+                             for i, x in enumerate(ic.font_sizes)]
+        color_classes = ['span.col%d { color: %s }' % (i, x)
+                         for i, x in enumerate(ic.colors) if x != 'false']
         css = textwrap.dedent('''
         span.none {
             text-decoration: none; font-weight: normal;
@@ -210,11 +214,11 @@ class RTFInput(InputFormatPlugin):
         span.strike-through { text-decoration: line-through }
 
         ''')
-        css += '\n'+'\n'.join(font_size_classes)
-        css += '\n' +'\n'.join(color_classes)
+        css += '\n' + '\n'.join(font_size_classes)
+        css += '\n' + '\n'.join(color_classes)
 
         for cls, val in border_styles.items():
-            css += '\n\n.%s {\n%s\n}'%(cls, val)
+            css += '\n\n.%s {\n%s\n}' % (cls, val)
 
         with open(u'styles.css', 'ab') as f:
             f.write(css.encode('utf-8'))
@@ -224,35 +228,34 @@ class RTFInput(InputFormatPlugin):
         style_map = {}
         for elem in doc.xpath(r'//*[local-name()="cell"]'):
             style = ['border-style: hidden', 'border-width: 1px',
-                    'border-color: black']
+                     'border-color: black']
             for x in ('bottom', 'top', 'left', 'right'):
-                bs = elem.get('border-cell-%s-style'%x, None)
+                bs = elem.get('border-cell-%s-style' % x, None)
                 if bs:
                     cbs = border_style_map.get(bs, 'solid')
-                    style.append('border-%s-style: %s'%(x, cbs))
-                bw = elem.get('border-cell-%s-line-width'%x, None)
+                    style.append('border-%s-style: %s' % (x, cbs))
+                bw = elem.get('border-cell-%s-line-width' % x, None)
                 if bw:
-                    style.append('border-%s-width: %spt'%(x, bw))
-                bc = elem.get('border-cell-%s-color'%x, None)
+                    style.append('border-%s-width: %spt' % (x, bw))
+                bc = elem.get('border-cell-%s-color' % x, None)
                 if bc:
-                    style.append('border-%s-color: %s'%(x, bc))
+                    style.append('border-%s-color: %s' % (x, bc))
             style = ';\n'.join(style)
             if style not in border_styles:
                 border_styles.append(style)
             idx = border_styles.index(style)
-            cls = 'border_style%d'%idx
+            cls = 'border_style%d' % idx
             style_map[cls] = style
             elem.set('class', cls)
         return style_map
 
     def convert(self, stream, options, file_ext, log,
                 accelerators):
-        from lxml import etree
         from ebook_converter.ebooks.metadata.meta import get_metadata
         from ebook_converter.ebooks.metadata.opf2 import OPFCreator
-        from ebook_converter.ebooks.rtf2xml.ParseRtf import RtfInvalidCodeException
+        from ebook_converter.ebooks.rtf2xml.ParseRtf import \
+            RtfInvalidCodeException
         from ebook_converter.ebooks.rtf.input import InlineClass
-        from ebook_converter.utils.xml_parse import safe_xml_fromstring
         self.opts = options
         self.log = log
         self.log('Converting RTF to XML...')
@@ -269,14 +272,15 @@ class RTFInput(InputFormatPlugin):
             imap = {}
             try:
                 imap = self.extract_images(d[0])
-            except:
+            except Exception:
                 self.log.exception('Failed to extract images...')
 
         self.log('Parsing XML...')
-        doc = safe_xml_fromstring(xml)
+        doc = etree.fromstring(xml)
         border_styles = self.convert_borders(doc)
         for pict in doc.xpath('//rtf:pict[@num]',
-                namespaces={'rtf':'http://rtf2xml.sourceforge.net/'}):
+                              namespaces={'rtf':
+                                          'http://rtf2xml.sourceforge.net/'}):
             num = int(pict.get('num'))
             name = imap.get(num, None)
             if name is not None:
@@ -286,8 +290,8 @@ class RTFInput(InputFormatPlugin):
         inline_class = InlineClass(self.log)
         with open(pkg_resources.resource_filename('ebook_converter',
                                                   'data/rtf.xsl')) as fobj:
-            styledoc = safe_xml_fromstring(fobj.read())
-        extensions = {('calibre', 'inline-class') : inline_class}
+            styledoc = etree.fromstring(fobj.read())
+        extensions = {('calibre', 'inline-class'): inline_class}
         transform = etree.XSLT(styledoc, extensions=extensions)
         result = transform(doc)
         html = u'index.xhtml'
@@ -296,7 +300,8 @@ class RTFInput(InputFormatPlugin):
             # res = res[:100].replace('xmlns:html', 'xmlns') + res[100:]
             # clean multiple \n
             res = re.sub(b'\n+', b'\n', res)
-            # Replace newlines inserted by the 'empty_paragraphs' option in rtf2xml with html blank lines
+            # Replace newlines inserted by the 'empty_paragraphs' option in
+            # rtf2xml with html blank lines
             # res = re.sub('\s*', '', res)
             # res = re.sub('(?<=\n)\n{2}',
             # u'

\u00a0

\n'.encode('utf-8'), res) @@ -316,7 +321,8 @@ class RTFInput(InputFormatPlugin): def postprocess_book(self, oeb, opts, log): for item in oeb.spine: - for img in item.data.xpath('//*[local-name()="img" and @src="__REMOVE_ME__"]'): + for img in item.data.xpath('//*[local-name()="img" and ' + '@src="__REMOVE_ME__"]'): p = img.getparent() idx = p.index(img) p.remove(img) diff --git a/ebook_converter/ebooks/conversion/plugins/snb_input.py b/ebook_converter/ebooks/conversion/plugins/snb_input.py index 51c7d7e..fb16039 100644 --- a/ebook_converter/ebooks/conversion/plugins/snb_input.py +++ b/ebook_converter/ebooks/conversion/plugins/snb_input.py @@ -1,27 +1,33 @@ import os +from lxml import etree + from ebook_converter.customize.conversion import InputFormatPlugin from ebook_converter.ptempfile import TemporaryDirectory from ebook_converter.utils.filenames import ascii_filename -__license__ = 'GPL 3' -__copyright__ = '2010, Li Fanxi ' -__docformat__ = 'restructuredtext en' - -HTML_TEMPLATE = '%s\n%s\n' +HTML_TEMPLATE = ('%s' + '\n%s\n') def html_encode(s): - return s.replace('&', '&').replace('<', '<').replace('>', '>').replace('"', '"').replace("'", ''').replace('\n', '
').replace(' ', ' ') # noqa + return (s.replace('&', '&') + .replace('<', '<') + .replace('>', '>') + .replace('"', '"') + .replace("'", ''') + .replace('\n', '
') + .replace(' ', ' ')) class SNBInput(InputFormatPlugin): - name = 'SNB Input' - author = 'Li Fanxi' + name = 'SNB Input' + author = 'Li Fanxi' description = 'Convert SNB files to OEB' - file_types = {'snb'} + file_types = {'snb'} commit_name = 'snb_input' options = set() @@ -32,13 +38,12 @@ class SNBInput(InputFormatPlugin): from ebook_converter.ebooks.oeb.base import DirContainer from ebook_converter.ebooks.snb.snbfile import SNBFile - from ebook_converter.utils.xml_parse import safe_xml_fromstring log.debug("Parsing SNB file...") snbFile = SNBFile() try: snbFile.Parse(stream) - except: + except Exception: raise ValueError("Invalid SNB file") if not snbFile.IsValid(): log.debug("Invalid SNB file") @@ -46,27 +51,28 @@ class SNBInput(InputFormatPlugin): log.debug("Handle meta data ...") from ebook_converter.ebooks.conversion.plumber import create_oebbook oeb = create_oebbook(log, None, options, - encoding=options.input_encoding, populate=False) + encoding=options.input_encoding, populate=False) meta = snbFile.GetFileStream('snbf/book.snbf') if meta is not None: - meta = safe_xml_fromstring(meta) - l = {'title' : './/head/name', - 'creator' : './/head/author', - 'language' : './/head/language', - 'generator': './/head/generator', - 'publisher': './/head/publisher', - 'cover' : './/head/cover', } + meta = etree.fromstring(meta) + item_map = {'title': './/head/name', + 'creator': './/head/author', + 'language': './/head/language', + 'generator': './/head/generator', + 'publisher': './/head/publisher', + 'cover': './/head/cover'} d = {} - for item in l: - node = meta.find(l[item]) + for key, item in item_map.items(): + node = meta.find(item) if node is not None: - d[item] = node.text if node.text is not None else '' + d[key] = node.text if node.text is not None else '' else: - d[item] = '' + d[key] = '' oeb.metadata.add('title', d['title']) - oeb.metadata.add('creator', d['creator'], attrib={'role':'aut'}) - oeb.metadata.add('language', 
d['language'].lower().replace('_', '-')) + oeb.metadata.add('creator', d['creator'], attrib={'role': 'aut'}) + oeb.metadata.add('language', + d['language'].lower().replace('_', '-')) oeb.metadata.add('generator', d['generator']) oeb.metadata.add('publisher', d['publisher']) if d['cover'] != '': @@ -84,7 +90,7 @@ class SNBInput(InputFormatPlugin): toc = snbFile.GetFileStream('snbf/toc.snbf') oeb.container = DirContainer(tdir, log) if toc is not None: - toc = safe_xml_fromstring(toc) + toc = etree.fromstring(toc) i = 1 for ch in toc.find('.//body'): chapterName = ch.text @@ -93,18 +99,22 @@ class SNBInput(InputFormatPlugin): data = snbFile.GetFileStream('snbc/' + chapterSrc) if data is None: continue - snbc = safe_xml_fromstring(data) + snbc = etree.fromstring(data) lines = [] for line in snbc.find('.//body'): if line.tag == 'text': lines.append('

%s

' % html_encode(line.text)) elif line.tag == 'img': - lines.append('

' % html_encode(line.text)) + lines.append('

' % + html_encode(line.text)) with open(os.path.join(tdir, fname), 'wb') as f: - f.write((HTML_TEMPLATE % (chapterName, '\n'.join(lines))).encode('utf-8', 'replace')) + f.write((HTML_TEMPLATE % + (chapterName, + '\n'.join(lines))).encode('utf-8', + 'replace')) oeb.toc.add(ch.text, fname) - id, href = oeb.manifest.generate(id='html', - href=ascii_filename(fname)) + id, href = oeb.manifest.generate( + id='html', href=ascii_filename(fname)) item = oeb.manifest.add(id, href, 'text/html') item.html_input_href = fname oeb.spine.add(item, True) @@ -112,7 +122,7 @@ class SNBInput(InputFormatPlugin): imageFiles = snbFile.OutputImageFiles(tdir) for f, m in imageFiles: id, href = oeb.manifest.generate(id='image', - href=ascii_filename(f)) + href=ascii_filename(f)) item = oeb.manifest.add(id, href, m) item.html_input_href = f diff --git a/ebook_converter/ebooks/docx/container.py b/ebook_converter/ebooks/docx/container.py index e9768f4..db11f3d 100644 --- a/ebook_converter/ebooks/docx/container.py +++ b/ebook_converter/ebooks/docx/container.py @@ -1,9 +1,12 @@ -import os, sys, shutil +import os +import shutil +import sys from lxml import etree from ebook_converter import walk, guess_type -from ebook_converter.ebooks.metadata import string_to_authors, authors_to_sort_string +from ebook_converter.ebooks.metadata import authors_to_sort_string +from ebook_converter.ebooks.metadata import string_to_authors from ebook_converter.ebooks.metadata.book.base import Metadata from ebook_converter.ebooks.docx import InvalidDOCX from ebook_converter.ebooks.docx.names import DOCXNamespace @@ -11,21 +14,11 @@ from ebook_converter.ptempfile import PersistentTemporaryDirectory from ebook_converter.utils.localization import canonicalize_lang from ebook_converter.utils.logging import default_log from ebook_converter.utils.zipfile import ZipFile -from ebook_converter.utils.xml_parse import safe_xml_fromstring -__license__ = 'GPL v3' -__copyright__ = '2013, Kovid Goyal ' - - -def fromstring(raw, 
parser=None): - return safe_xml_fromstring(raw) - # Read metadata {{{ - - def read_doc_props(raw, mi, XPath): - root = fromstring(raw) + root = etree.fromstring(raw) titles = XPath('//dc:title')(root) if titles: title = titles[0].text @@ -53,29 +46,31 @@ def read_doc_props(raw, mi, XPath): desc = XPath('//dc:description')(root) if desc: raw = etree.tostring(desc[0], method='text', encoding='unicode') - raw = raw.replace('_x000d_', '') # Word 2007 mangles newlines in the summary + # Word 2007 mangles newlines in the summary + raw = raw.replace('_x000d_', '') mi.comments = raw.strip() langs = [] for lang in XPath('//dc:language')(root): if lang.text and lang.text.strip(): - l = canonicalize_lang(lang.text) - if l: - langs.append(l) + canonic_lang = canonicalize_lang(lang.text) + if canonic_lang: + langs.append(canonic_lang) if langs: mi.languages = langs def read_app_props(raw, mi): - root = fromstring(raw) + root = etree.fromstring(raw) company = root.xpath('//*[local-name()="Company"]') if company and company[0].text and company[0].text.strip(): mi.publisher = company[0].text.strip() def read_default_style_language(raw, mi, XPath): - root = fromstring(raw) - for lang in XPath('/w:styles/w:docDefaults/w:rPrDefault/w:rPr/w:lang/@w:val')(root): + root = etree.fromstring(raw) + for lang in XPath('/w:styles/w:docDefaults/w:rPrDefault/w:rPr/w:lang/' + '@w:val')(root): lang = canonicalize_lang(lang) if lang: mi.languages = [lang] @@ -87,7 +82,9 @@ class DOCX(object): def __init__(self, path_or_stream, log=None, extract=True): self.docx_is_transitional = True - stream = path_or_stream if hasattr(path_or_stream, 'read') else open(path_or_stream, 'rb') + stream = path_or_stream + if not hasattr(path_or_stream, 'read'): + stream = open(path_or_stream, 'rb') self.name = getattr(stream, 'name', None) or '' self.log = log or default_log if extract: @@ -107,9 +104,9 @@ class DOCX(object): try: zf = ZipFile(stream) zf.extractall(self.tdir) - except: + except Exception: 
self.log.exception('DOCX appears to be invalid ZIP file, trying a' - ' more forgiving ZIP parser') + ' more forgiving ZIP parser') from ebook_converter.utils.localunzip import extractall stream.seek(0) extractall(stream, self.tdir) @@ -133,13 +130,17 @@ class DOCX(object): try: raw = self.read('[Content_Types].xml') except KeyError: - raise InvalidDOCX('The file %s docx file has no [Content_Types].xml' % self.name) - root = fromstring(raw) + raise InvalidDOCX('The file %s docx file has no ' + '[Content_Types].xml' % self.name) + root = etree.fromstring(raw) self.content_types = {} self.default_content_types = {} - for item in root.xpath('//*[local-name()="Types"]/*[local-name()="Default" and @Extension and @ContentType]'): - self.default_content_types[item.get('Extension').lower()] = item.get('ContentType') - for item in root.xpath('//*[local-name()="Types"]/*[local-name()="Override" and @PartName and @ContentType]'): + for item in root.xpath('//*[local-name()="Types"]/*[local-name()=' + '"Default" and @Extension and @ContentType]'): + self.default_content_types[item.get('Extension').lower()] = \ + item.get('ContentType') + for item in root.xpath('//*[local-name()="Types"]/*[local-name()=' + '"Override" and @PartName and @ContentType]'): name = item.get('PartName').lstrip('/') self.content_types[name] = item.get('ContentType') @@ -155,15 +156,19 @@ class DOCX(object): try: raw = self.read('_rels/.rels') except KeyError: - raise InvalidDOCX('The file %s docx file has no _rels/.rels' % self.name) - root = fromstring(raw) + raise InvalidDOCX('The file %s docx file has no _rels/.rels' % + self.name) + root = etree.fromstring(raw) self.relationships = {} self.relationships_rmap = {} - for item in root.xpath('//*[local-name()="Relationships"]/*[local-name()="Relationship" and @Type and @Target]'): + for item in root.xpath('//*[local-name()="Relationships"]/*[local-name' + '()="Relationship" and @Type and @Target]'): target = item.get('Target').lstrip('/') typ = 
item.get('Type') if target == 'word/document.xml': - self.docx_is_transitional = typ != 'http://purl.oclc.org/ooxml/officeDocument/relationships/officeDocument' + self.docx_is_transitional = (typ != 'http://purl.oclc.org/' + 'ooxml/officeDocument/' + 'relationships/officeDocument') self.relationships[typ] = target self.relationships_rmap[target] = typ @@ -171,15 +176,17 @@ class DOCX(object): def document_name(self): name = self.relationships.get(self.namespace.names['DOCUMENT'], None) if name is None: - names = tuple(n for n in self.names if n == 'document.xml' or n.endswith('/document.xml')) + names = tuple(n for n in self.names if n == 'document.xml' or + n.endswith('/document.xml')) if not names: - raise InvalidDOCX('The file %s docx file has no main document' % self.name) + raise InvalidDOCX('The file %s docx file has no main ' + 'document' % self.name) name = names[0] return name @property def document(self): - return fromstring(self.read(self.document_name)) + return etree.fromstring(self.read(self.document_name)) @property def document_relationships(self): @@ -195,10 +202,13 @@ class DOCX(object): except KeyError: pass else: - root = fromstring(raw) - for item in root.xpath('//*[local-name()="Relationships"]/*[local-name()="Relationship" and @Type and @Target]'): + root = etree.fromstring(raw) + for item in root.xpath('//*[local-name()="Relationships"]/*' + '[local-name()="Relationship" and @Type ' + 'and @Target]'): target = item.get('Target') - if item.get('TargetMode', None) != 'External' and not target.startswith('#'): + if (item.get('TargetMode', None) != 'External' and not + target.startswith('#')): target = '/'.join((base, target.lstrip('/'))) typ = item.get('Type') Id = item.get('Id') @@ -209,13 +219,15 @@ class DOCX(object): def get_document_properties_names(self): name = self.relationships.get(self.namespace.names['DOCPROPS'], None) if name is None: - names = tuple(n for n in self.names if n.lower() == 'docprops/core.xml') + names = tuple(n for n 
in self.names + if n.lower() == 'docprops/core.xml') if names: name = names[0] yield name name = self.relationships.get(self.namespace.names['APPPROPS'], None) if name is None: - names = tuple(n for n in self.names if n.lower() == 'docprops/app.xml') + names = tuple(n for n in self.names + if n.lower() == 'docprops/app.xml') if names: name = names[0] yield name @@ -239,7 +251,8 @@ class DOCX(object): else: read_default_style_language(raw, mi, self.namespace.XPath) - ap_name = self.relationships.get(self.namespace.names['APPPROPS'], None) + ap_name = self.relationships.get(self.namespace.names['APPPROPS'], + None) if ap_name: try: raw = self.read(ap_name) diff --git a/ebook_converter/ebooks/docx/to_html.py b/ebook_converter/ebooks/docx/to_html.py index 11ce9e2..30c2a64 100644 --- a/ebook_converter/ebooks/docx/to_html.py +++ b/ebook_converter/ebooks/docx/to_html.py @@ -1,12 +1,13 @@ import sys, os, re, math, errno, uuid, numbers from collections import OrderedDict, defaultdict +from lxml import etree from lxml import html from lxml.html.builder import ( HTML, HEAD, TITLE, BODY, LINK, META, P, SPAN, BR, DIV, A, DT, DL, DD, H1) from ebook_converter import guess_type -from ebook_converter.ebooks.docx.container import DOCX, fromstring +from ebook_converter.ebooks.docx.container import DOCX from ebook_converter.ebooks.docx.names import XML, generate_anchor from ebook_converter.ebooks.docx.styles import Styles, inherit, PageProperties from ebook_converter.ebooks.docx.numbering import Numbering @@ -311,7 +312,7 @@ class Convert(object): raise self.log.warn('Settings %s file missing' % sename) else: - self.settings(fromstring(seraw)) + self.settings(etree.fromstring(seraw)) if foname is not None: try: @@ -327,7 +328,7 @@ class Convert(object): self.log.warn('Endnotes %s do not exist' % enname) else: enrel = self.docx.get_relationships(enname) - footnotes(fromstring(foraw) if foraw else None, forel, fromstring(enraw) if enraw else None, enrel) + 
footnotes(etree.fromstring(foraw) if foraw else None, forel, etree.fromstring(enraw) if enraw else None, enrel) if fname is not None: embed_relationships = self.docx.get_relationships(fname)[0] @@ -336,7 +337,7 @@ class Convert(object): except KeyError: self.log.warn('Fonts table %s does not exist' % fname) else: - fonts(fromstring(raw), embed_relationships, self.docx, self.dest_dir) + fonts(etree.fromstring(raw), embed_relationships, self.docx, self.dest_dir) if tname is not None: try: @@ -344,7 +345,7 @@ class Convert(object): except KeyError: self.log.warn('Styles %s do not exist' % sname) else: - self.theme(fromstring(raw)) + self.theme(etree.fromstring(raw)) styles_loaded = False if sname is not None: @@ -353,7 +354,7 @@ class Convert(object): except KeyError: self.log.warn('Styles %s do not exist' % sname) else: - self.styles(fromstring(raw), fonts, self.theme) + self.styles(etree.fromstring(raw), fonts, self.theme) styles_loaded = True if not styles_loaded: self.styles(None, fonts, self.theme) @@ -364,7 +365,7 @@ class Convert(object): except KeyError: self.log.warn('Numbering styles %s do not exist' % nname) else: - numbering(fromstring(raw), self.styles, self.docx.get_relationships(nname)[0]) + numbering(etree.fromstring(raw), self.styles, self.docx.get_relationships(nname)[0]) self.styles.resolve_numbering(numbering) diff --git a/ebook_converter/ebooks/docx/writer/from_html.py b/ebook_converter/ebooks/docx/writer/from_html.py index c9894a5..b13a0bb 100644 --- a/ebook_converter/ebooks/docx/writer/from_html.py +++ b/ebook_converter/ebooks/docx/writer/from_html.py @@ -1,22 +1,19 @@ +import collections import re -from collections import Counter from ebook_converter.ebooks.docx.writer.container import create_skeleton, page_size, page_effective_area -from ebook_converter.ebooks.docx.writer.styles import StylesManager, FloatSpec -from ebook_converter.ebooks.docx.writer.links import LinksManager -from ebook_converter.ebooks.docx.writer.images import ImagesManager 
from ebook_converter.ebooks.docx.writer.fonts import FontsManager -from ebook_converter.ebooks.docx.writer.tables import Table +from ebook_converter.ebooks.docx.writer.images import ImagesManager +from ebook_converter.ebooks.docx.writer.links import LinksManager from ebook_converter.ebooks.docx.writer.lists import ListsManager +from ebook_converter.ebooks.docx.writer.styles import StylesManager, FloatSpec +from ebook_converter.ebooks.docx.writer.tables import Table +from ebook_converter.ebooks.oeb import base +from ebook_converter.ebooks.oeb import parse_utils from ebook_converter.ebooks.oeb.stylizer import Stylizer as Sz, Style as St -from ebook_converter.ebooks.oeb.base import XPath, barename from ebook_converter.utils.localization import lang_as_iso639_1 -__license__ = 'GPL v3' -__copyright__ = '2013, Kovid Goyal ' - - def lang_for_tag(tag): for attr in ('lang', '{http://www.w3.org/XML/1998/namespace}lang'): val = lang_as_iso639_1(tag.get(attr)) @@ -140,7 +137,7 @@ class Block(object): self.numbering_id = None self.parent_items = None self.html_block = html_block - self.html_tag = barename(html_block.tag) + self.html_tag = parse_utils.barename(html_block.tag) self.float_spec = float_spec if float_spec is not None: float_spec.blocks.append(self) @@ -387,7 +384,7 @@ class Blocks(object): def resolve_language(self): default_lang = self.styles_manager.document_lang for block in self.all_blocks: - count = Counter() + count = collections.Counter() for run in block.runs: count[run.lang] += 1 if count: @@ -473,13 +470,13 @@ class Convert(object): self.abshref = self.images_manager.abshref = item.abshref self.current_lang = lang_for_tag(item.data) or self.styles_manager.document_lang - for i, body in enumerate(XPath('//h:body')(item.data)): + for i, body in enumerate(base.XPath('//h:body')(item.data)): with self.blocks: self.blocks.top_bookmark = self.links_manager.bookmark_for_anchor(self.links_manager.top_anchor, self.current_item, body) self.process_tag(body, 
stylizer, is_first_tag=i == 0) def process_tag(self, html_tag, stylizer, is_first_tag=False, float_spec=None): - tagname = barename(html_tag.tag) + tagname = parse_utils.barename(html_tag.tag) tag_style = stylizer.style(html_tag) ignore_tag_contents = tagname in {'script', 'style', 'title', 'meta'} or tag_style.is_hidden display = tag_style._get('display') @@ -573,7 +570,7 @@ class Convert(object): text = html_tag.text if text: block.add_text(text, tag_style, ignore_leading_whitespace=True, is_parent_style=True, link=self.current_link, lang=self.current_lang) - elif tagname == 'li' and len(html_tag) and barename(html_tag[0].tag) in ('ul', 'ol') and len(html_tag[0]): + elif tagname == 'li' and len(html_tag) and parse_utils.barename(html_tag[0].tag) in ('ul', 'ol') and len(html_tag[0]): block.force_not_empty = True def add_inline_tag(self, tagname, html_tag, tag_style, stylizer): diff --git a/ebook_converter/ebooks/fb2/fb2ml.py b/ebook_converter/ebooks/fb2/fb2ml.py index 9db7965..0749be2 100644 --- a/ebook_converter/ebooks/fb2/fb2ml.py +++ b/ebook_converter/ebooks/fb2/fb2ml.py @@ -9,10 +9,10 @@ import uuid from lxml import etree +from ebook_converter import constants as const from ebook_converter import prepare_string_for_xml from ebook_converter.constants_old import __appname__, __version__ from ebook_converter.utils.localization import lang_as_iso639_1 -from ebook_converter.utils.xml_parse import safe_xml_fromstring from ebook_converter.utils.img import save_cover_data_to from ebook_converter.ebooks.oeb.base import urlnormalize from ebook_converter.polyglot.binary import as_base64_unicode @@ -36,9 +36,10 @@ class FB2MLizer(object): def reset_state(self): # Used to ensure text and tags are always within

and

self.in_p = False - # Mapping of image names. OEB allows for images to have the same name but be stored - # in different directories. FB2 images are all in a flat layout so we rename all images - # into a sequential numbering system to ensure there are no collisions between image names. + # Mapping of image names. OEB allows for images to have the same name + # but be stored in different directories. FB2 images are all in a flat + # layout so we rename all images into a sequential numbering system to + # ensure there are no collisions between image names. self.image_hrefs = {} # Mapping of toc items and their self.toc = {} @@ -68,13 +69,15 @@ class FB2MLizer(object): output = self.clean_text('\n'.join(output)) if self.opts.pretty_print: - output = etree.tostring(safe_xml_fromstring(output), encoding='unicode', pretty_print=True) + output = etree.tostring(etree.fromstring(output), + encoding='unicode', pretty_print=True) return '\n' + output def clean_text(self, text): # Remove pointless tags, but keep their contents. - text = re.sub(r'(?mu)<(strong|emphasis|strikethrough|sub|sup)>(\s*)', r'\2', text) + text = re.sub(r'(?mu)<(strong|emphasis|strikethrough|sub|sup)>' + r'(\s*)', r'\2', text) # Clean up paragraphs endings. text = re.sub(r'(?mu)\s+

', '

', text) @@ -96,7 +99,8 @@ class FB2MLizer(object): text = re.sub(r'(?mu)\s*

', '\n

', text) # Put line breaks between paragraphs on a separate line. - text = re.sub(r'(?mu)\s*', r'\n', text) + text = re.sub(r'(?mu)\s*', + r'\n', text) text = re.sub(r'(?mu)\s*

', '\n

', text) # Remove empty sections. @@ -115,7 +119,9 @@ class FB2MLizer(object): metadata['title'] = self.oeb_book.metadata.title[0].value metadata['appname'] = __appname__ metadata['version'] = __version__ - metadata['date'] = '%i.%i.%i' % (datetime.now().day, datetime.now().month, datetime.now().year) + metadata['date'] = '%i.%i.%i' % (datetime.now().day, + datetime.now().month, + datetime.now().year) if self.oeb_book.metadata.language: lc = lang_as_iso639_1(self.oeb_book.metadata.language[0].value) if not lc: @@ -143,31 +149,38 @@ class FB2MLizer(object): author_middle = ' '.join(author_parts[1:-1]) author_last = author_parts[-1] metadata['author'] += '' - metadata['author'] += '%s' % prepare_string_for_xml(author_first) + metadata['author'] += ('%s' % + prepare_string_for_xml(author_first)) if author_middle: - metadata['author'] += '%s' % prepare_string_for_xml(author_middle) - metadata['author'] += '%s' % prepare_string_for_xml(author_last) + metadata['author'] += ('%s' % + prepare_string_for_xml(author_middle)) + metadata['author'] += ('%s' % + prepare_string_for_xml(author_last)) metadata['author'] += '' if not metadata['author']: - metadata['author'] = '' + metadata['author'] = ('' + '') metadata['keywords'] = '' tags = list(map(str, self.oeb_book.metadata.subject)) if tags: tags = ', '.join(prepare_string_for_xml(x) for x in tags) - metadata['keywords'] = '%s'%tags + metadata['keywords'] = '%s' % tags metadata['sequence'] = '' if self.oeb_book.metadata.series: index = '1' if self.oeb_book.metadata.series_index: index = self.oeb_book.metadata.series_index[0] - metadata['sequence'] = '' % (prepare_string_for_xml('%s' % self.oeb_book.metadata.series[0]), index) + seq = prepare_string_for_xml(str(self.oeb_book.metadata.series[0])) + metadata['sequence'] = ('' % + (seq, index)) year = publisher = isbn = '' identifiers = self.oeb_book.metadata['identifier'] for x in identifiers: - if x.get(OPF('scheme'), None).lower() == 'uuid' or str(x).startswith('urn:uuid:'): + 
if (x.get(OPF('scheme'), None).lower() == 'uuid' or + str(x).startswith('urn:uuid:')): metadata['id'] = str(x).split(':')[-1] break if metadata['id'] is None: @@ -179,22 +192,27 @@ class FB2MLizer(object): except IndexError: pass else: - year = '%s' % prepare_string_for_xml(date.value.partition('-')[0]) + year = ('%s' % + prepare_string_for_xml(date.value.partition('-')[0])) try: publisher = self.oeb_book.metadata['publisher'][0] except IndexError: pass else: - publisher = '%s' % prepare_string_for_xml(publisher.value) + publisher = ('%s' % + prepare_string_for_xml(publisher.value)) for x in identifiers: if x.get(OPF('scheme'), None).lower() == 'isbn': isbn = '%s' % prepare_string_for_xml(x.value) - metadata['year'], metadata['isbn'], metadata['publisher'] = year, isbn, publisher + metadata['year'] = year + metadata['isbn'] = isbn + metadata['publisher'] = publisher for key, value in metadata.items(): - if key not in ('author', 'cover', 'sequence', 'keywords', 'year', 'publisher', 'isbn'): + if key not in ('author', 'cover', 'sequence', 'keywords', 'year', + 'publisher', 'isbn'): metadata[key] = prepare_string_for_xml(value) try: @@ -203,7 +221,8 @@ class FB2MLizer(object): metadata['comments'] = '' else: from ebook_converter.utils.html2text import html2text - metadata['comments'] = '

{}

'.format(prepare_string_for_xml(html2text(comments.value).strip())) + annot = prepare_string_for_xml(html2text(comments.value).strip()) + metadata['comments'] = f'

{annot}

' # Keep the indentation level of the description the same as the body. header = textwrap.dedent('''\ @@ -245,7 +264,9 @@ class FB2MLizer(object): cover_href = None # Get the raster cover if it's available. - if self.oeb_book.metadata.cover and str(self.oeb_book.metadata.cover[0]) in self.oeb_book.manifest.ids: + if (self.oeb_book.metadata.cover and + str(self.oeb_book.metadata.cover[0]) in + self.oeb_book.manifest.ids): id = str(self.oeb_book.metadata.cover[0]) cover_item = self.oeb_book.manifest.ids[id] if cover_item.media_type in OEB_RASTER_IMAGES: @@ -259,7 +280,8 @@ class FB2MLizer(object): page_name = 'cover' if page_name: - cover_item = self.oeb_book.manifest.hrefs[self.oeb_book.guide[page_name].href] + key = self.oeb_book.guide[page_name].href + cover_item = self.oeb_book.manifest.hrefs[key] # Get the first image in the page for img in cover_item.xpath('//img'): cover_href = cover_item.abshref(img.get('src')) @@ -267,10 +289,11 @@ class FB2MLizer(object): if cover_href: # Only write the image tag if it is in the manifest. - if cover_href in self.oeb_book.manifest.hrefs and cover_href not in self.image_hrefs: + if (cover_href in self.oeb_book.manifest.hrefs and + cover_href not in self.image_hrefs): self.image_hrefs[cover_href] = 'img_%s' % len(self.image_hrefs) - return '' % self.image_hrefs[cover_href] - + return ('' % + self.image_hrefs[cover_href]) return '' def get_text(self): @@ -285,16 +308,20 @@ class FB2MLizer(object): for item in self.oeb_book.spine: self.log.debug('Converting %s to FictionBook2 XML' % item.href) - stylizer = Stylizer(item.data, item.href, self.oeb_book, self.opts, self.opts.output_profile) + stylizer = Stylizer(item.data, item.href, self.oeb_book, self.opts, + self.opts.output_profile) - # Start a
if we must sectionize each file or if the TOC references this page + # Start a
if we must sectionize each file or if the TOC + # references this page page_section_open = False - if self.opts.sectionize == 'files' or None in self.toc.get(item.href, ()): + if (self.opts.sectionize == 'files' or + None in self.toc.get(item.href, ())): text.append('
') page_section_open = True self.section_level += 1 - text += self.dump_text(item.data.find(XHTML('body')), stylizer, item) + text += self.dump_text(item.data.find(XHTML('body')), stylizer, + item) if page_section_open: text.append('
') @@ -309,20 +336,23 @@ class FB2MLizer(object): return ''.join(text) def fb2mlize_images(self): - ''' - This function uses the self.image_hrefs dictionary mapping. It is populated by the dump_text function. - ''' + """ + This function uses the self.image_hrefs dictionary mapping. It is + populated by the dump_text function. + """ from ebook_converter.ebooks.oeb.base import OEB_RASTER_IMAGES images = [] for item in self.oeb_book.manifest: - # Don't write the image if it's not referenced in the document's text. + # Don't write the image if it's not referenced in the document's + # text. if item.href not in self.image_hrefs: continue if item.media_type in OEB_RASTER_IMAGES: try: if item.media_type not in ('image/jpeg', 'image/png'): - imdata = save_cover_data_to(item.data, compression_quality=70) + imdata = save_cover_data_to(item.data, + compression_quality=70) raw_data = as_base64_unicode(imdata) content_type = 'image/jpeg' else: @@ -330,11 +360,14 @@ class FB2MLizer(object): content_type = item.media_type # Don't put the encoded image on a single line. step = 72 - data = '\n'.join(raw_data[i:i+step] for i in range(0, len(raw_data), step)) - images.append('%s' % (self.image_hrefs[item.href], content_type, data)) + data = '\n'.join(raw_data[i:i+step] + for i in range(0, len(raw_data), step)) + images.append('%s' + '' % (self.image_hrefs[item.href], + content_type, data)) except Exception as e: self.log.error('Error: Could not include file %s because ' - '%s.' % (item.href, e)) + '%s.' % (item.href, e)) return '\n'.join(images) def create_flat_toc(self, nodes, level): @@ -391,26 +424,31 @@ class FB2MLizer(object): def dump_text(self, elem_tree, stylizer, page, tag_stack=[]): ''' - This function is intended to be used in a recursive manner. dump_text will - run though all elements in the elem_tree and call itself on each element. + This function is intended to be used in a recursive manner. 
dump_text + will run though all elements in the elem_tree and call itself on each + element. self.image_hrefs will be populated by calling this function. - @param elem_tree: etree representation of XHTML content to be transformed. + @param elem_tree: etree representation of XHTML content to be + transformed. @param stylizer: Used to track the style of elements within the tree. @param page: OEB page used to determine absolute urls. @param tag_stack: List of open FB2 tags to take into account. @return: List of string representing the XHTML converted to FB2 markup. ''' - from ebook_converter.ebooks.oeb.base import XHTML_NS, barename, namespace + from ebook_converter.ebooks.oeb.base import barename + from ebook_converter.ebooks.oeb.base import namespace elem = elem_tree - # Ensure what we are converting is not a string and that the fist tag is part of the XHTML namespace. - if not isinstance(elem_tree.tag, (str, bytes)) or namespace(elem_tree.tag) != XHTML_NS: + # Ensure what we are converting is not a string and that the fist tag + # is part of the XHTML namespace. + if (not isinstance(elem_tree.tag, (str, bytes)) or + namespace(elem_tree.tag) != const.XHTML_NS): p = elem.getparent() - if p is not None and isinstance(p.tag, (str, bytes)) and namespace(p.tag) == XHTML_NS \ - and elem.tail: + if (p is not None and isinstance(p.tag, (str, bytes)) and + namespace(p.tag) == const.XHTML_NS and elem.tail): return [elem.tail] return [] @@ -423,7 +461,8 @@ class FB2MLizer(object): # FB2 generated output. fb2_out = [] - # FB2 tags in the order they are opened. This will be used to close the tags. + # FB2 tags in the order they are opened. This will be used to close + # the tags. 
tags = [] # First tag in tree tag = barename(elem_tree.tag) @@ -432,26 +471,31 @@ class FB2MLizer(object): ems = int(round((float(style.marginTop) / style.fontSize) - 1)) if ems < 0: ems = 0 - except: + except Exception: ems = 0 # Convert TOC entries to s and add <section>s if self.opts.sectionize == 'toc': - # A section cannot be a child of any other element than another section, - # so leave the tag alone if there are parents + # A section cannot be a child of any other element than another + # section, so leave the tag alone if there are parents if not tag_stack: - # There are two reasons to start a new section here: the TOC pointed to - # this page (then we use the first non-<body> on the page as a <title>), or - # the TOC pointed to a specific element + # There are two reasons to start a new section here: the TOC + # pointed to this page (then we use the first non-<body> on + # the page as a <title>), or the TOC pointed to a specific + # element newlevel = 0 toc_entry = self.toc.get(page.href, None) if toc_entry is not None: if None in toc_entry: - if tag != 'body' and hasattr(elem_tree, 'text') and elem_tree.text: + if (tag != 'body' and hasattr(elem_tree, 'text') and + elem_tree.text): newlevel = 1 self.toc[page.href] = None - if not newlevel and elem_tree.attrib.get('id', None) is not None: - newlevel = toc_entry.get(elem_tree.attrib.get('id', None), None) + if (not newlevel and + elem_tree.attrib.get('id', None) is not None): + newlevel = toc_entry.get(elem_tree.attrib.get('id', + None), + None) # Start a new section if necessary if newlevel: @@ -463,13 +507,14 @@ class FB2MLizer(object): fb2_out.append('<title>') tags.append('title') if self.section_level == 0: - # If none of the prior processing made a section, make one now to be FB2 spec compliant + # If none of the prior processing made a section, make one now + # to be FB2 spec compliant fb2_out.append('<section>') self.section_level += 1 # Process the XHTML tag and styles. Converted to an FB2 tag. 
- # Use individual if statement not if else. There can be - # only one XHTML tag but it can have multiple styles. + # Use individual if statement not if else. There can be only one XHTML + # tag but it can have multiple styles. if tag == 'img' and elem_tree.attrib.get('src', None): # Only write the image tag if it is in the manifest. ihref = urlnormalize(page.abshref(elem_tree.attrib['src'])) @@ -479,7 +524,8 @@ class FB2MLizer(object): p_txt, p_tag = self.ensure_p() fb2_out += p_txt tags += p_tag - fb2_out.append('<image l:href="#%s"/>' % self.image_hrefs[ihref]) + fb2_out.append('<image l:href="#%s"/>' % + self.image_hrefs[ihref]) else: self.log.warn(u'Ignoring image not in manifest: %s' % ihref) if tag in ('br', 'hr') or ems >= 1: @@ -513,7 +559,8 @@ class FB2MLizer(object): p_txt, p_tag = self.ensure_p() fb2_out += p_txt tags += p_tag - fb2_out.append('<a l:href="%s">' % urlnormalize(elem_tree.attrib['href'])) + fb2_out.append('<a l:href="%s">' % + urlnormalize(elem_tree.attrib['href'])) tags.append('a') if tag == 'b' or style['font-weight'] in ('bold', 'bolder'): s_out, s_tags = self.handle_simple_tag('strong', tag_stack+tags) @@ -523,8 +570,10 @@ class FB2MLizer(object): s_out, s_tags = self.handle_simple_tag('emphasis', tag_stack+tags) fb2_out += s_out tags += s_tags - if tag in ('del', 'strike') or style['text-decoration'] == 'line-through': - s_out, s_tags = self.handle_simple_tag('strikethrough', tag_stack+tags) + if (tag in ('del', 'strike') or + style['text-decoration'] == 'line-through'): + s_out, s_tags = self.handle_simple_tag('strikethrough', + tag_stack+tags) fb2_out += s_out tags += s_tags if tag == 'sub': @@ -552,7 +601,8 @@ class FB2MLizer(object): tags.reverse() fb2_out += self.close_tags(tags) - # Process element text that comes after the close of the XHTML tag but before the next XHTML tag. + # Process element text that comes after the close of the XHTML tag but + # before the next XHTML tag. 
if hasattr(elem_tree, 'tail') and elem_tree.tail: if not self.in_p: fb2_out.append('<p>') diff --git a/ebook_converter/ebooks/htmlz/oeb2html.py b/ebook_converter/ebooks/htmlz/oeb2html.py index f0c5640..42b0742 100644 --- a/ebook_converter/ebooks/htmlz/oeb2html.py +++ b/ebook_converter/ebooks/htmlz/oeb2html.py @@ -9,8 +9,9 @@ from functools import partial from lxml import html from ebook_converter import prepare_string_for_xml -from ebook_converter.ebooks.oeb.base import ( - XHTML, XHTML_NS, SVG_NS, barename, namespace, OEB_IMAGES, XLINK, rewrite_links, urlnormalize) +from ebook_converter import constants as const +from ebook_converter.ebooks.oeb import base +from ebook_converter.ebooks.oeb import parse_utils from ebook_converter.ebooks.oeb.stylizer import Stylizer from ebook_converter.utils.logging import default_log from ebook_converter.polyglot.builtins import as_bytes @@ -61,9 +62,9 @@ class OEB2HTML(object): for item in oeb_book.spine: self.log.debug('Converting %s to HTML...' % item.href) self.rewrite_ids(item.data, item) - rewrite_links(item.data, partial(self.rewrite_link, page=item)) + base.rewrite_links(item.data, partial(self.rewrite_link, page=item)) stylizer = Stylizer(item.data, item.href, oeb_book, self.opts) - output += self.dump_text(item.data.find(XHTML('body')), stylizer, item) + output += self.dump_text(item.data.find(base.tag('xhtml', 'body')), stylizer, item) output.append('\n\n') output.append('</body></html>') return ''.join(output) @@ -80,7 +81,7 @@ class OEB2HTML(object): def map_resources(self, oeb_book): for item in oeb_book.manifest: - if item.media_type in OEB_IMAGES: + if item.media_type in base.OEB_IMAGES: if item.href not in self.images: ext = os.path.splitext(item.href)[1] fname = '%s%s' % (len(self.images), ext) @@ -88,9 +89,9 @@ class OEB2HTML(object): self.images[item.href] = fname if item in oeb_book.spine: self.get_link_id(item.href) - root = item.data.find(XHTML('body')) + root = item.data.find(base.tag('xhtml', 'body')) 
link_attrs = set(html.defs.link_attrs) - link_attrs.add(XLINK('href')) + link_attrs.add(base.tag('xlink', 'href')) for el in root.iter(): attribs = el.attrib try: @@ -108,7 +109,7 @@ class OEB2HTML(object): def rewrite_link(self, url, page=None): if not page: return url - abs_url = page.abshref(urlnormalize(url)) + abs_url = page.abshref(base.urlnormalize(url)) if abs_url in self.images: return 'images/%s' % self.images[abs_url] if abs_url in self.links: @@ -121,7 +122,7 @@ class OEB2HTML(object): tag = el.tag except UnicodeDecodeError: continue - if tag == XHTML('body'): + if tag == base.tag('xhtml', 'body'): el.attrib['id'] = self.get_link_id(page.href)[1:] continue if 'id' in el.attrib: @@ -156,9 +157,9 @@ class OEB2HTMLNoCSSizer(OEB2HTML): # We can only processes tags. If there isn't a tag return any text. if not isinstance(elem.tag, (str, bytes)) \ - or namespace(elem.tag) not in (XHTML_NS, SVG_NS): + or parse_utils.namespace(elem.tag) not in (const.XHTML_NS, const.SVG_NS): p = elem.getparent() - if p is not None and isinstance(p.tag, (str, bytes)) and namespace(p.tag) in (XHTML_NS, SVG_NS) \ + if p is not None and isinstance(p.tag, (str, bytes)) and parse_utils.namespace(p.tag) in (const.XHTML_NS, const.SVG_NS) \ and elem.tail: return [elem.tail] return [''] @@ -167,7 +168,7 @@ class OEB2HTMLNoCSSizer(OEB2HTML): text = [''] style = stylizer.style(elem) tags = [] - tag = barename(elem.tag) + tag = parse_utils.barename(elem.tag) attribs = elem.attrib if tag == 'body': @@ -245,9 +246,9 @@ class OEB2HTMLInlineCSSizer(OEB2HTML): # We can only processes tags. If there isn't a tag return any text. 
if not isinstance(elem.tag, (str, bytes)) \ - or namespace(elem.tag) not in (XHTML_NS, SVG_NS): + or parse_utils.namespace(elem.tag) not in (const.XHTML_NS, const.SVG_NS): p = elem.getparent() - if p is not None and isinstance(p.tag, (str, bytes)) and namespace(p.tag) in (XHTML_NS, SVG_NS) \ + if p is not None and isinstance(p.tag, (str, bytes)) and parse_utils.namespace(p.tag) in (const.XHTML_NS, const.SVG_NS) \ and elem.tail: return [elem.tail] return [''] @@ -256,7 +257,7 @@ class OEB2HTMLInlineCSSizer(OEB2HTML): text = [''] style = stylizer.style(elem) tags = [] - tag = barename(elem.tag) + tag = parse_utils.barename(elem.tag) attribs = elem.attrib style_a = '%s' % style @@ -327,9 +328,9 @@ class OEB2HTMLClassCSSizer(OEB2HTML): for item in oeb_book.spine: self.log.debug('Converting %s to HTML...' % item.href) self.rewrite_ids(item.data, item) - rewrite_links(item.data, partial(self.rewrite_link, page=item)) + base.rewrite_links(item.data, partial(self.rewrite_link, page=item)) stylizer = Stylizer(item.data, item.href, oeb_book, self.opts) - output += self.dump_text(item.data.find(XHTML('body')), stylizer, item) + output += self.dump_text(item.data.find(base.tag('xhtml', 'body')), stylizer, item) output.append('\n\n') if self.opts.htmlz_class_style == 'external': css = u'<link href="style.css" rel="stylesheet" type="text/css" />' @@ -348,9 +349,9 @@ class OEB2HTMLClassCSSizer(OEB2HTML): # We can only processes tags. If there isn't a tag return any text. 
if not isinstance(elem.tag, (str, bytes)) \ - or namespace(elem.tag) not in (XHTML_NS, SVG_NS): + or parse_utils.namespace(elem.tag) not in (const.XHTML_NS, const.SVG_NS): p = elem.getparent() - if p is not None and isinstance(p.tag, (str, bytes)) and namespace(p.tag) in (XHTML_NS, SVG_NS) \ + if p is not None and isinstance(p.tag, (str, bytes)) and parse_utils.namespace(p.tag) in (const.XHTML_NS, const.SVG_NS) \ and elem.tail: return [elem.tail] return [''] @@ -358,7 +359,7 @@ class OEB2HTMLClassCSSizer(OEB2HTML): # Setup our variables. text = [''] tags = [] - tag = barename(elem.tag) + tag = parse_utils.barename(elem.tag) attribs = elem.attrib if tag == 'body': diff --git a/ebook_converter/ebooks/metadata/fb2.py b/ebook_converter/ebooks/metadata/fb2.py index f38c8e0..43bc493 100644 --- a/ebook_converter/ebooks/metadata/fb2.py +++ b/ebook_converter/ebooks/metadata/fb2.py @@ -1,38 +1,32 @@ """ Read meta information from fb2 files """ -import os, random -from functools import partial -from string import ascii_letters, digits +import functools +import os +import random +import string from lxml import etree from ebook_converter.utils.date import parse_only_date from ebook_converter.utils.img import save_cover_data_to -from ebook_converter.utils.xml_parse import safe_xml_fromstring from ebook_converter.utils.imghdr import identify -from ebook_converter import guess_type, guess_all_extensions, prints, force_unicode +from ebook_converter import guess_type, guess_all_extensions, prints, \ + force_unicode from ebook_converter.ebooks.metadata import MetaInformation, check_isbn from ebook_converter.ebooks.chardet import xml_to_unicode from ebook_converter.polyglot.binary import as_base64_unicode -__license__ = 'GPL v3' -__copyright__ = ('2011, Roman Mukhin <ramses_ru at hotmail.com>, ' - '2008, Anatoly Shipitsin <norguhtar at gmail.com>') +NAMESPACES = {'fb2': 'http://www.gribuser.ru/xml/fictionbook/2.0', + 'fb21': 'http://www.gribuser.ru/xml/fictionbook/2.1', + 'xlink': 
'http://www.w3.org/1999/xlink'} - -NAMESPACES = { - 'fb2' : 'http://www.gribuser.ru/xml/fictionbook/2.0', - 'fb21' : 'http://www.gribuser.ru/xml/fictionbook/2.1', - 'xlink' : 'http://www.w3.org/1999/xlink' -} - -tostring = partial(etree.tostring, method='text', encoding='unicode') +tostring = functools.partial(etree.tostring, method='text', encoding='unicode') def XLINK(tag): - return '{%s}%s'%(NAMESPACES['xlink'], tag) + return '{%s}%s' % (NAMESPACES['xlink'], tag) class Context(object): @@ -52,7 +46,7 @@ class Context(object): return etree.XPath(*args, namespaces=self.namespaces) def get_or_create(self, parent, tag, attribs={}, at_start=True): - xpathstr='./fb:'+tag + xpathstr = './fb:'+tag for n, v in attribs.items(): xpathstr += '[@%s="%s"]' % (n, v) ans = self.XPath(xpathstr)(parent) @@ -73,7 +67,7 @@ class Context(object): def clear_meta_tags(self, doc, tag): for parent in ('title-info', 'src-title-info', 'publish-info'): - for x in self.XPath('//fb:%s/fb:%s'%(parent, tag))(doc): + for x in self.XPath('//fb:%s/fb:%s' % (parent, tag))(doc): x.getparent().remove(x) def text2fb2(self, parent, text): @@ -117,42 +111,41 @@ def get_metadata(stream): book_title = str(book_title) else: book_title = force_unicode(os.path.splitext( - os.path.basename(getattr(stream, 'name', - 'Unknown')))[0]) + os.path.basename(getattr(stream, 'name', 'Unknown')))[0]) mi = MetaInformation(book_title, authors) try: _parse_cover(root, mi, ctx) - except: + except Exception: pass try: _parse_comments(root, mi, ctx) - except: + except Exception: pass try: _parse_tags(root, mi, ctx) - except: + except Exception: pass try: _parse_series(root, mi, ctx) - except: + except Exception: pass try: _parse_isbn(root, mi, ctx) - except: + except Exception: pass try: _parse_publisher(root, mi, ctx) - except: + except Exception: pass try: _parse_pubdate(root, mi, ctx) - except: + except Exception: pass try: _parse_language(root, mi, ctx) - except: + except Exception: pass return mi @@ -160,11 +153,11 @@ 
def get_metadata(stream): def _parse_authors(root, ctx): authors = [] - # pick up authors but only from 1 secrion <title-info>; otherwise it is not consistent! - # Those are fallbacks: <src-title-info>, <document-info> + # pick up authors but only from 1 secrion <title-info>; otherwise it is + # not consistent! Those are fallbacks: <src-title-info>, <document-info> author = None for author_sec in ['title-info', 'src-title-info', 'document-info']: - for au in ctx.XPath('//fb:%s/fb:author'%author_sec)(root): + for au in ctx.XPath('//fb:%s/fb:author' % author_sec)(root): author = _parse_author(au, ctx) if author: authors.append(author) @@ -207,24 +200,26 @@ def _parse_book_title(root, ctx): xp_ti = '//fb:title-info/fb:book-title/text()' xp_pi = '//fb:publish-info/fb:book-title/text()' xp_si = '//fb:src-title-info/fb:book-title/text()' - book_title = ctx.XPath('normalize-space(%s|%s|%s)' % (xp_ti, xp_pi, xp_si))(root) + book_title = ctx.XPath('normalize-space(%s|%s|%s)' % + (xp_ti, xp_pi, xp_si))(root) return book_title def _parse_cover(root, mi, ctx): # pickup from <title-info>, if not exists it fallbacks to <src-title-info> - imgid = ctx.XPath('substring-after(string(//fb:coverpage/fb:image/@xlink:href), "#")')(root) + imgid = ctx.XPath('substring-after(string(//fb:coverpage/fb:image/' + '@xlink:href), "#")')(root) if imgid: try: _parse_cover_data(root, imgid, mi, ctx) - except: + except Exception: pass def _parse_cover_data(root, imgid, mi, ctx): from ebook_converter.ebooks.fb2 import base64_decode - elm_binary = ctx.XPath('//fb:binary[@id="%s"]'%imgid)(root) + elm_binary = ctx.XPath('//fb:binary[@id="%s"]' % imgid)(root) if elm_binary: mimetype = elm_binary[0].get('content-type', 'image/jpeg') mime_extensions = guess_all_extensions(mimetype) @@ -241,12 +236,13 @@ def _parse_cover_data(root, imgid, mi, ctx): fmt = identify(cdata)[0] mi.cover_data = (fmt, cdata) else: - prints("WARNING: Unsupported coverpage mime-type '%s' (id=#%s)" % (mimetype, imgid)) + 
prints("WARNING: Unsupported coverpage mime-type '%s' (id=#%s)" % + (mimetype, imgid)) def _parse_tags(root, mi, ctx): - # pick up genre but only from 1 secrion <title-info>; otherwise it is not consistent! - # Those are fallbacks: <src-title-info> + # pick up genre but only from 1 secrion <title-info>; otherwise it is not + # consistent! Those are fallbacks: <src-title-info> for genre_sec in ['title-info', 'src-title-info']: # -- i18n Translations-- ? tags = ctx.XPath('//fb:%s/fb:genre/text()' % genre_sec)(root) @@ -267,16 +263,20 @@ def _parse_series(root, mi, ctx): mi.series = elms_sequence[0].get('name', None) if mi.series: try: - mi.series_index = float('.'.join(elms_sequence[0].get('number', None).split()[:2])) + i = float('.'.join(elms_sequence[0].get('number', + None).split()[:2])) + mi.series_index = i except Exception: pass def _parse_isbn(root, mi, ctx): - # some people try to put several isbn in this field, but it is not allowed. try to stick to the 1-st one in this case + # some people try to put several isbn in this field, but it is not + # allowed. try to stick to the 1-st one in this case isbn = ctx.XPath('normalize-space(//fb:publish-info/fb:isbn/text())')(root) if isbn: - # some people try to put several isbn in this field, but it is not allowed. try to stick to the 1-st one in this case + # some people try to put several isbn in this field, but it is not + # allowed. 
try to stick to the 1-st one in this case if ',' in isbn: isbn = isbn[:isbn.index(',')] if check_isbn(isbn): @@ -284,9 +284,11 @@ def _parse_isbn(root, mi, ctx): def _parse_comments(root, mi, ctx): - # pick up annotation but only from 1 section <title-info>; fallback: <src-title-info> + # pick up annotation but only from 1 section <title-info>; + # fallback: <src-title-info> for annotation_sec in ['title-info', 'src-title-info']: - elms_annotation = ctx.XPath('//fb:%s/fb:annotation' % annotation_sec)(root) + elms_annotation = ctx.XPath('//fb:%s/fb:annotation' % + annotation_sec)(root) if elms_annotation: mi.comments = tostring(elms_annotation[0]) # TODO: tags i18n, xslt? @@ -294,7 +296,8 @@ def _parse_comments(root, mi, ctx): def _parse_publisher(root, mi, ctx): - publisher = ctx.XPath('string(//fb:publish-info/fb:publisher/text())')(root) + publisher = ctx.XPath('string(//fb:publish-info/fb:publisher/' + 'text())')(root) if publisher: mi.publisher = publisher @@ -315,7 +318,7 @@ def _parse_language(root, mi, ctx): def _get_fbroot(raw): raw = xml_to_unicode(raw, strip_encoding_pats=True)[0] - root = safe_xml_fromstring(raw) + root = etree.fromstring(raw) return ensure_namespace(root) @@ -348,10 +351,12 @@ def _set_authors(title_info, mi, ctx): ctx.create_tag(atag, 'first-name').text = author_parts[0] author_parts = author_parts[1:] if len(author_parts) > 1: - ctx.create_tag(atag, 'middle-name', at_start=False).text = author_parts[0] + ctx.create_tag(atag, 'middle-name', + at_start=False).text = author_parts[0] author_parts = author_parts[1:] if author_parts: - ctx.create_tag(atag, 'last-name', at_start=False).text = ' '.join(author_parts) + a = ' '.join(author_parts) + ctx.create_tag(atag, 'last-name', at_start=False).text = a def _set_tags(title_info, mi, ctx): @@ -368,12 +373,12 @@ def _set_series(title_info, mi, ctx): seq = ctx.get_or_create(title_info, 'sequence') seq.set('name', mi.series) try: - seq.set('number', '%g'%mi.series_index) - except: + 
seq.set('number', '%g' % mi.series_index) + except Exception: seq.set('number', '1') -def _rnd_name(size=8, chars=ascii_letters + digits): +def _rnd_name(size=8, chars=string.ascii_letters + string.digits): return ''.join(random.choice(chars) for x in range(size)) @@ -396,7 +401,9 @@ def _set_cover(title_info, mi, ctx): cim_filename = _rnd_pic_file_name('cover') cim_tag.attrib[XLINK('href')] = '#' + cim_filename fb2_root = cim_tag.getroottree().getroot() - cim_binary = ctx.get_or_create(fb2_root, 'binary', attribs={'id': cim_filename}, at_start=False) + cim_binary = ctx.get_or_create(fb2_root, 'binary', + attribs={'id': cim_filename}, + at_start=False) cim_binary.attrib['content-type'] = 'image/jpeg' cim_binary.text = _encode_into_jpeg(mi.cover_data[1]) @@ -425,7 +432,8 @@ def set_metadata(stream, mi, apply_null=False, update_timestamp=False): # single quotes in xml declaration. Sigh. See # https://www.mobileread.com/forums/showthread.php?p=2273184#post2273184 raw = b'<?xml version="1.0" encoding="UTF-8"?>\n' - raw += etree.tostring(root, method='xml', encoding='utf-8', xml_declaration=False) + raw += etree.tostring(root, method='xml', encoding='utf-8', + xml_declaration=False) stream.seek(0) stream.truncate() @@ -449,6 +457,7 @@ def ensure_namespace(doc): if bare_tags: import re raw = etree.tostring(doc, encoding='unicode') - raw = re.sub(r'''<(description|body)\s+xmlns=['"]['"]>''', r'<\1>', raw) - doc = safe_xml_fromstring(raw) + raw = re.sub(r'''<(description|body)\s+xmlns=['"]['"]>''', r'<\1>', + raw) + doc = etree.fromstring(raw) return doc diff --git a/ebook_converter/ebooks/metadata/opf2.py b/ebook_converter/ebooks/metadata/opf2.py index 586164b..9c85d23 100644 --- a/ebook_converter/ebooks/metadata/opf2.py +++ b/ebook_converter/ebooks/metadata/opf2.py @@ -12,29 +12,31 @@ import sys import unittest import urllib.parse import uuid +import traceback +import textwrap from lxml import etree +from lxml.builder import ElementMaker +from ebook_converter.ebooks.oeb 
import base +from ebook_converter import constants as const from ebook_converter.ebooks import escape_xpath_attr from ebook_converter.constants_old import __appname__, __version__, \ filesystem_encoding from ebook_converter.ebooks.metadata.toc import TOC -from ebook_converter.ebooks.metadata.utils import parse_opf, pretty_print_opf as _pretty_print -from ebook_converter.ebooks.metadata import string_to_authors, MetaInformation, check_isbn +from ebook_converter.ebooks.metadata.utils import parse_opf, \ + pretty_print_opf as _pretty_print +from ebook_converter.ebooks.metadata import string_to_authors, \ + MetaInformation, check_isbn from ebook_converter.ebooks.metadata.book.base import Metadata from ebook_converter.utils.date import parse_date, isoformat from ebook_converter.utils.localization import get_lang, canonicalize_lang from ebook_converter import prints, guess_type from ebook_converter.utils.cleantext import clean_ascii_chars, clean_xml_chars from ebook_converter.utils.config import tweaks -from ebook_converter.utils.xml_parse import safe_xml_fromstring from ebook_converter.polyglot.urllib import unquote -__license__ = 'GPL v3' -__copyright__ = '2008, Kovid Goyal kovid@kovidgoyal.net' -__docformat__ = 'restructuredtext en' - pretty_print_opf = False @@ -73,7 +75,7 @@ class Resource(object): # {{{ self.fragment = '' try: self.mime_type = guess_type(href_or_path)[0] - except: + except Exception: self.mime_type = None if self.mime_type is None: self.mime_type = 'application/octet-stream' @@ -94,17 +96,21 @@ class Resource(object): # {{{ if isinstance(pc, str): pc = pc.encode('utf-8') pc = pc.decode('utf-8') - self.path = os.path.abspath(os.path.join(basedir, pc.replace('/', os.sep))) + self.path = os.path.abspath(os.path.join(basedir, + pc.replace('/', + os.sep))) self.fragment = url[-1] def href(self, basedir=None): - ''' - Return a URL pointing to this resource. If it is a file on the filesystem - the URL is relative to `basedir`. 
+ """ + Return a URL pointing to this resource. If it is a file on the + filesystem the URL is relative to `basedir`. - `basedir`: If None, the basedir of this resource is used (see :method:`set_basedir`). - If this resource has no basedir, then the current working directory is used as the basedir. - ''' + `basedir`: If None, the basedir of this resource is used (see + :method:`set_basedir`). + If this resource has no basedir, then the current working directory is + used as the basedir. + """ if basedir is None: if self._basedir: basedir = self._basedir @@ -117,7 +123,8 @@ class Resource(object): # {{{ return frag try: rpath = os.path.relpath(self.path, basedir) - except ValueError: # On windows path and basedir could be on different drives + except ValueError: + # On windows path and basedir could be on different drives rpath = self.path if isinstance(rpath, bytes): rpath = rpath.decode(filesystem_encoding) @@ -130,7 +137,7 @@ class Resource(object): # {{{ return self._basedir def __repr__(self): - return 'Resource(%s, %s)'%(repr(self.path), repr(self.href())) + return 'Resource(%s, %s)' % (repr(self.path), repr(self.href())) # }}} @@ -155,7 +162,7 @@ class ResourceCollection(object): # {{{ def __str__(self): resources = map(repr, self) - return '[%s]'%', '.join(resources) + return '[%s]' % ', '.join(resources) __unicode__ = __str__ def __repr__(self): @@ -211,7 +218,8 @@ class ManifestItem(Resource): # {{{ self.mime_type = val def __unicode__representation__(self): - return u'<item id="%s" href="%s" media-type="%s" />'%(self.id, self.href(), self.media_type) + return (u'<item id="%s" href="%s" media-type="%s" />' % + (self.id, self.href(), self.media_type)) __str__ = __unicode__representation__ @@ -223,7 +231,7 @@ class ManifestItem(Resource): # {{{ return self.href() if index == 1: return self.media_type - raise IndexError('%d out of bounds.'%index) + raise IndexError('%d out of bounds.' 
% index) # }}} @@ -234,7 +242,7 @@ class Manifest(ResourceCollection): # {{{ self.append(ManifestItem.from_opf_manifest_item(item, dir)) id = item.get('id', '') if not id: - id = 'id%d'%self.next_id + id = 'id%d' % self.next_id self[-1].id = id self.next_id += 1 @@ -250,15 +258,16 @@ class Manifest(ResourceCollection): # {{{ @staticmethod def from_paths(entries): - ''' - `entries`: List of (path, mime-type) If mime-type is None it is autodetected - ''' + """ + `entries`: List of (path, mime-type) If mime-type is None it is + autodetected + """ m = Manifest() for path, mt in entries: mi = ManifestItem(path, is_path=True) if mt: mi.mime_type = mt - mi.id = 'id%d'%m.next_id + mi.id = 'id%d' % m.next_id m.next_id += 1 m.append(mi) return m @@ -267,7 +276,7 @@ class Manifest(ResourceCollection): # {{{ mi = ManifestItem(path, is_path=True) if mime_type: mi.mime_type = mime_type - mi.id = 'id%d'%self.next_id + mi.id = 'id%d' % self.next_id self.next_id += 1 self.append(mi) return mi.id @@ -318,13 +327,13 @@ class Spine(ResourceCollection): # {{{ def from_opf_spine_element(itemrefs, manifest): s = Spine(manifest) seen = set() - path_map = {i.id:i.path for i in s.manifest} + path_map = {i.id: i.path for i in s.manifest} for itemref in itemrefs: idref = itemref.get('idref', None) if idref is not None: path = path_map.get(idref) if path and path not in seen: - r = Spine.Item(lambda x:idref, path, is_path=True) + r = Spine.Item(lambda x: idref, path, is_path=True) r.is_linear = itemref.get('linear', 'yes') == 'yes' r.idref = idref s.append(r) @@ -336,8 +345,9 @@ class Spine(ResourceCollection): # {{{ s = Spine(manifest) for path in paths: try: - s.append(Spine.Item(s.manifest.id_for_path, path, is_path=True)) - except: + s.append(Spine.Item(s.manifest.id_for_path, path, + is_path=True)) + except Exception: continue return s @@ -346,10 +356,10 @@ class Spine(ResourceCollection): # {{{ self.manifest = manifest def replace(self, start, end, ids): - ''' - Replace the items between 
start (inclusive) and end (not inclusive) with + """ + Replace the items between start (inclusive) and end (not inclusive) with the items identified by ids. ids can be a list of any length. - ''' + """ items = [] for id in ids: path = self.manifest.path_for_id(id) @@ -381,16 +391,18 @@ class Guide(ResourceCollection): # {{{ @staticmethod def from_opf_resource_item(ref, basedir): - title, href, type = ref.get('title', ''), ref.get('href'), ref.get('type') + title = ref.get('title', '') + href = ref.get('href') + type = ref.get('type') res = Guide.Reference(href, basedir, is_path=True) res.title = title res.type = type return res def __repr__(self): - ans = '<reference type="%s" href="%s" '%(self.type, self.href()) + ans = '<reference type="%s" href="%s" ' % (self.type, self.href()) if self.title: - ans += 'title="%s" '%self.title + ans += 'title="%s" ' % self.title return ans + '/>' @staticmethod @@ -400,7 +412,7 @@ class Guide(ResourceCollection): # {{{ try: ref = Guide.Reference.from_opf_resource_item(ref, base_dir) coll.append(ref) - except: + except Exception: continue return coll @@ -408,7 +420,8 @@ class Guide(ResourceCollection): # {{{ for i in tuple(self): if 'cover' in i.type.lower(): self.remove(i) - for typ in ('cover', 'other.ms-coverimage-standard', 'other.ms-coverimage'): + for typ in ('cover', 'other.ms-coverimage-standard', + 'other.ms-coverimage'): self.append(Guide.Reference(path, is_path=True)) self[-1].type = typ self[-1].title = '' @@ -419,12 +432,12 @@ class Guide(ResourceCollection): # {{{ class MetadataField(object): def __init__(self, name, is_dc=True, formatter=None, none_is=None, - renderer=lambda x: str(x)): - self.name = name - self.is_dc = is_dc + renderer=lambda x: str(x)): + self.name = name + self.is_dc = is_dc self.formatter = formatter - self.none_is = none_is - self.renderer = renderer + self.none_is = none_is + self.renderer = renderer def __real_get__(self, obj, type=None): ans = obj.get_metadata_element(self.name) @@ -436,7 
+449,7 @@ class MetadataField(object): if self.formatter is not None: try: ans = self.formatter(ans) - except: + except Exception: return None if hasattr(ans, 'strip'): ans = ans.strip() @@ -467,7 +480,8 @@ class TitleSortField(MetadataField): matches = obj.title_path(obj.metadata) if matches: for match in matches: - ans = match.get('{%s}file-as'%obj.NAMESPACES['opf'], None) + ans = match.get('{%s}file-as' % + obj.NAMESPACES['opf'], None) if not ans: ans = match.get('file-as', None) if ans: @@ -488,10 +502,11 @@ class TitleSortField(MetadataField): del match.attrib[attr] -def serialize_user_metadata(metadata_elem, all_user_metadata, tail='\n'+(' '*8)): +def serialize_user_metadata(metadata_elem, all_user_metadata, + tail='\n'+(' '*8)): from ebook_converter.utils.config import to_json - from ebook_converter.ebooks.metadata.book.json_codec import (object_to_unicode, - encode_is_multiple) + from ebook_converter.ebooks.metadata.book.json_codec import \ + object_to_unicode, encode_is_multiple for name, fm in all_user_metadata.items(): try: @@ -499,9 +514,8 @@ def serialize_user_metadata(metadata_elem, all_user_metadata, tail='\n'+(' '*8)) encode_is_multiple(fm) fm = object_to_unicode(fm) fm = json.dumps(fm, default=to_json, ensure_ascii=False) - except: + except Exception: prints('Failed to write user metadata:', name) - import traceback traceback.print_exc() continue meta = metadata_elem.makeelement('meta') @@ -514,91 +528,109 @@ def serialize_user_metadata(metadata_elem, all_user_metadata, tail='\n'+(' '*8)) def dump_dict(cats): if not cats: cats = {} - from ebook_converter.ebooks.metadata.book.json_codec import object_to_unicode + from ebook_converter.ebooks.metadata.book.json_codec import \ + object_to_unicode return json.dumps(object_to_unicode(cats), ensure_ascii=False, - skipkeys=True) + skipkeys=True) class OPF(object): # {{{ - MIMETYPE = 'application/oebps-package+xml' - NAMESPACES = { - None: "http://www.idpf.org/2007/opf", - 'dc': 
"http://purl.org/dc/elements/1.1/", - 'opf': "http://www.idpf.org/2007/opf", - } - META = '{%s}meta' % NAMESPACES['opf'] + MIMETYPE = 'application/oebps-package+xml' + NAMESPACES = {None: "http://www.idpf.org/2007/opf", + 'dc': "http://purl.org/dc/elements/1.1/", + 'opf': "http://www.idpf.org/2007/opf"} + META = '{%s}meta' % NAMESPACES['opf'] xpn = NAMESPACES.copy() xpn.pop(None) xpn['re'] = 'http://exslt.org/regular-expressions' XPath = functools.partial(etree.XPath, namespaces=xpn) - CONTENT = XPath('self::*[re:match(name(), "meta$", "i")]/@content') - TEXT = XPath('string()') + CONTENT = XPath('self::*[re:match(name(), "meta$", "i")]/@content') + TEXT = XPath('string()') - metadata_path = XPath('descendant::*[re:match(name(), "metadata", "i")]') - metadata_elem_path = XPath( - 'descendant::*[re:match(name(), concat($name, "$"), "i") or (re:match(name(), "meta$", "i") ' - 'and re:match(@name, concat("^calibre:", $name, "$"), "i"))]') - title_path = XPath('descendant::*[re:match(name(), "title", "i")]') - authors_path = XPath('descendant::*[re:match(name(), "creator", "i") and (@role="aut" or @opf:role="aut" or (not(@role) and not(@opf:role)))]') - bkp_path = XPath('descendant::*[re:match(name(), "contributor", "i") and (@role="bkp" or @opf:role="bkp")]') - tags_path = XPath('descendant::*[re:match(name(), "subject", "i")]') - isbn_path = XPath('descendant::*[re:match(name(), "identifier", "i") and ' - '(re:match(@scheme, "isbn", "i") or re:match(@opf:scheme, "isbn", "i"))]') - pubdate_path = XPath('descendant::*[re:match(name(), "date", "i")]') - raster_cover_path = XPath('descendant::*[re:match(name(), "meta", "i") and ' - 're:match(@name, "cover", "i") and @content]') - guide_cover_path = XPath('descendant::*[local-name()="guide"]/*[local-name()="reference" and re:match(@type, "cover", "i")]/@href') - identifier_path = XPath('descendant::*[re:match(name(), "identifier", "i")]') - application_id_path = XPath('descendant::*[re:match(name(), "identifier", "i") and 
' - '(re:match(@opf:scheme, "calibre|libprs500", "i") or re:match(@scheme, "calibre|libprs500", "i"))]') - uuid_id_path = XPath('descendant::*[re:match(name(), "identifier", "i") and ' - '(re:match(@opf:scheme, "uuid", "i") or re:match(@scheme, "uuid", "i"))]') - languages_path = XPath('descendant::*[local-name()="language"]') + metadata_path = XPath('descendant::*[re:match(name(), "metadata", "i")]') + metadata_elem_path = XPath('descendant::*[re:match(name(), ' + 'concat($name, "$"), "i") or (re:match(name(), ' + '"meta$", "i") and re:match(@name, ' + 'concat("^calibre:", $name, "$"), "i"))]') + title_path = XPath('descendant::*[re:match(name(), "title", "i")]') + authors_path = XPath('descendant::*[re:match(name(), "creator", "i") ' + 'and (@role="aut" or @opf:role="aut" or (not(@role) ' + 'and not(@opf:role)))]') + bkp_path = XPath('descendant::*[re:match(name(), "contributor", "i") and ' + '(@role="bkp" or @opf:role="bkp")]') + tags_path = XPath('descendant::*[re:match(name(), "subject", "i")]') + isbn_path = XPath('descendant::*[re:match(name(), "identifier", "i") and ' + '(re:match(@scheme, "isbn", "i") or re:match(@opf:' + 'scheme, "isbn", "i"))]') + pubdate_path = XPath('descendant::*[re:match(name(), "date", "i")]') + raster_cover_path = XPath('descendant::*[re:match(name(), "meta", "i") ' + 'and re:match(@name, "cover", "i") and ' + '@content]') + guide_cover_path = XPath('descendant::*[local-name()="guide"]/*[local-' + 'name()="reference" and re:match(@type, "cover", ' + '"i")]/@href') + identifier_path = XPath('descendant::*[re:match(name(), "identifier", ' + '"i")]') + application_id_path = XPath('descendant::*[re:match(name(), "identifier",' + ' "i") and (re:match(@opf:scheme, ' + '"calibre|libprs500", "i") or re:match(@' + 'scheme, "calibre|libprs500", "i"))]') + uuid_id_path = XPath('descendant::*[re:match(name(), "identifier", "i") ' + 'and (re:match(@opf:scheme, "uuid", "i") or re:match' + '(@scheme, "uuid", "i"))]') + languages_path = 
XPath('descendant::*[local-name()="language"]') - manifest_path = XPath('descendant::*[re:match(name(), "manifest", "i")]/*[re:match(name(), "item", "i")]') - manifest_ppath = XPath('descendant::*[re:match(name(), "manifest", "i")]') - spine_path = XPath('descendant::*[re:match(name(), "spine", "i")]/*[re:match(name(), "itemref", "i")]') - guide_path = XPath('descendant::*[re:match(name(), "guide", "i")]/*[re:match(name(), "reference", "i")]') + manifest_path = XPath('descendant::*[re:match(name(), "manifest", "i")]/' + '*[re:match(name(), "item", "i")]') + manifest_ppath = XPath('descendant::*[re:match(name(), "manifest", "i")]') + spine_path = XPath('descendant::*[re:match(name(), "spine", "i")]/*[re:' + 'match(name(), "itemref", "i")]') + guide_path = XPath('descendant::*[re:match(name(), "guide", "i")]/*[re:' + 'match(name(), "reference", "i")]') - publisher = MetadataField('publisher') - comments = MetadataField('description') - category = MetadataField('type') - rights = MetadataField('rights') - series = MetadataField('series', is_dc=False) + publisher = MetadataField('publisher') + comments = MetadataField('description') + category = MetadataField('type') + rights = MetadataField('rights') + series = MetadataField('series', is_dc=False) if tweaks['use_series_auto_increment_tweak_when_importing']: - series_index = MetadataField('series_index', is_dc=False, - formatter=float, none_is=None) + series_index = MetadataField('series_index', is_dc=False, + formatter=float, none_is=None) else: - series_index = MetadataField('series_index', is_dc=False, - formatter=float, none_is=1) - title_sort = TitleSortField('title_sort', is_dc=False) - rating = MetadataField('rating', is_dc=False, formatter=float) + series_index = MetadataField('series_index', is_dc=False, + formatter=float, none_is=1) + title_sort = TitleSortField('title_sort', is_dc=False) + rating = MetadataField('rating', is_dc=False, formatter=float) publication_type = MetadataField('publication_type', 
is_dc=False) - timestamp = MetadataField('timestamp', is_dc=False, - formatter=parse_date, renderer=isoformat) + timestamp = MetadataField('timestamp', is_dc=False, + formatter=parse_date, renderer=isoformat) user_categories = MetadataField('user_categories', is_dc=False, formatter=json.loads, renderer=dump_dict) author_link_map = MetadataField('author_link_map', is_dc=False, - formatter=json.loads, renderer=dump_dict) + formatter=json.loads, renderer=dump_dict) def __init__(self, stream, basedir=os.getcwd(), unquote_urls=True, - populate_spine=True, try_to_guess_cover=True, preparsed_opf=None, read_toc=True): + populate_spine=True, try_to_guess_cover=True, + preparsed_opf=None, read_toc=True): self.try_to_guess_cover = try_to_guess_cover - self.basedir = self.base_dir = basedir + self.basedir = self.base_dir = basedir self.path_to_html_toc = self.html_toc_fragment = None - self.root = parse_opf(stream) if preparsed_opf is None else preparsed_opf + self.root = preparsed_opf + if preparsed_opf is None: + self.root = parse_opf(stream) try: self.package_version = float(self.root.get('version', None)) except (AttributeError, TypeError, ValueError): self.package_version = 0 self.metadata = self.metadata_path(self.root) if not self.metadata: - self.metadata = [self.root.makeelement('{http://www.idpf.org/2007/opf}metadata')] + self.metadata = [self.root.makeelement('{http://www.idpf.org/2007' + '/opf}metadata')] self.root.insert(0, self.metadata[0]) self.metadata[0].tail = '\n' - self.metadata = self.metadata[0] + self.metadata = self.metadata[0] if unquote_urls: self.unquote_urls() self.manifest = Manifest() @@ -623,9 +655,10 @@ class OPF(object): # {{{ self._user_metadata_ = {} temp = Metadata('x', ['x']) from ebook_converter.utils.config import from_json - from ebook_converter.ebooks.metadata.book.json_codec import decode_is_multiple + from ebook_converter.ebooks.metadata.book.json_codec import \ + decode_is_multiple elems = self.root.xpath('//*[name() = "meta" and 
starts-with(@name,' - '"calibre:user_metadata:") and @content]') + '"calibre:user_metadata:") and @content]') for elem in elems: name = elem.get('name') name = ':'.join(name.split(':')[2:]) @@ -636,9 +669,8 @@ class OPF(object): # {{{ fm = json.loads(fm, object_hook=from_json) decode_is_multiple(fm) temp.set_user_metadata(name, fm) - except: + except Exception: prints('Failed to read user metadata:', name) - import traceback traceback.print_exc() continue self._user_metadata_ = temp.get_all_user_metadata(True) @@ -657,16 +689,16 @@ class OPF(object): # {{{ def write_user_metadata(self): elems = self.root.xpath('//*[name() = "meta" and starts-with(@name,' - '"calibre:user_metadata:") and @content]') + '"calibre:user_metadata:") and @content]') for elem in elems: elem.getparent().remove(elem) - serialize_user_metadata(self.metadata, - self._user_metadata_) + serialize_user_metadata(self.metadata, self._user_metadata_) def find_toc(self): self.toc = None try: - spine = self.XPath('descendant::*[re:match(name(), "spine", "i")]')(self.root) + spine = self.XPath('descendant::*[re:match(name(), "spine", ' + '"i")]')(self.root) toc = None if spine: spine = spine[0] @@ -682,9 +714,9 @@ class OPF(object): # {{{ if toc is None: return self.toc = TOC(base_path=self.base_dir) - is_ncx = getattr(self, 'manifest', None) is not None and \ - self.manifest.type_for_id(toc) is not None and \ - 'dtbncx' in self.manifest.type_for_id(toc) + is_ncx = (getattr(self, 'manifest', None) is not None and + self.manifest.type_for_id(toc) is not None and + 'dtbncx' in self.manifest.type_for_id(toc)) if is_ncx or toc.lower() in ('ncx', 'ncxtoc'): path = self.manifest.path_for_id(toc) if path: @@ -700,7 +732,7 @@ class OPF(object): # {{{ not os.path.isfile(self.path_to_html_toc): self.path_to_html_toc = None self.toc.read_html_toc(toc) - except: + except Exception: pass def get_text(self, elem): @@ -721,11 +753,12 @@ class OPF(object): # {{{ c = 1 while manifest_id in ids: c += 1 - manifest_id = 
'id%d'%c + manifest_id = 'id%d' % c if not media_type: media_type = 'application/xhtml+xml' - ans = etree.Element('{%s}item'%self.NAMESPACES['opf'], - attrib={'id':manifest_id, 'href':href, 'media-type':media_type}) + ans = etree.Element('{%s}item' % self.NAMESPACES['opf'], + attrib={'id': manifest_id, + 'href': href, 'media-type': media_type}) ans.tail = '\n\t\t' if append: manifest = self.manifest_ppath(self.root)[0] @@ -735,7 +768,7 @@ class OPF(object): # {{{ def replace_manifest_item(self, item, items): items = [self.create_manifest_item(*i) for i in items] for i, item2 in enumerate(items): - item2.set('id', item.get('id')+'.%d'%(i+1)) + item2.set('id', item.get('id')+'.%d' % (i+1)) manifest = item.getparent() index = manifest.index(item) manifest[index:index+1] = items @@ -761,37 +794,43 @@ class OPF(object): # {{{ return x.get('href', None) def create_spine_item(self, idref): - ans = etree.Element('{%s}itemref'%self.NAMESPACES['opf'], idref=idref) + ans = etree.Element('{%s}itemref' % self.NAMESPACES['opf'], + idref=idref) ans.tail = '\n\t\t' return ans def replace_spine_items_by_idref(self, idref, new_idrefs): items = list(map(self.create_spine_item, new_idrefs)) - spine = self.XPath('/opf:package/*[re:match(name(), "spine", "i")]')(self.root)[0] + spine = self.XPath('/opf:package/*[re:match(name(), "spine", ' + '"i")]')(self.root)[0] old = [i for i in self.iterspine() if i.get('idref', None) == idref] for x in old: i = spine.index(x) spine[i:i+1] = items def create_guide_element(self): - e = etree.SubElement(self.root, '{%s}guide'%self.NAMESPACES['opf']) + e = etree.SubElement(self.root, '{%s}guide' % self.NAMESPACES['opf']) e.text = '\n ' - e.tail = '\n' + e.tail = '\n' return e def remove_guide(self): self.guide = None - for g in self.root.xpath('./*[re:match(name(), "guide", "i")]', namespaces={'re':'http://exslt.org/regular-expressions'}): + for g in self.root.xpath('./*[re:match(name(), "guide", "i")]', + namespaces={'re': 'http://exslt.org/regular-' 
+ 'expressions'}): self.root.remove(g) def create_guide_item(self, type, title, href): - e = etree.Element('{%s}reference'%self.NAMESPACES['opf'], - type=type, title=title, href=href) - e.tail='\n' + e = etree.Element('{%s}reference' % self.NAMESPACES['opf'], type=type, + title=title, href=href) + e.tail = '\n' return e def add_guide_item(self, type, title, href): - g = self.root.xpath('./*[re:match(name(), "guide", "i")]', namespaces={'re':'http://exslt.org/regular-expressions'})[0] + g = self.root.xpath('./*[re:match(name(), "guide", "i")]', + namespaces={'re': 'http://exslt.org/regular-' + 'expressions'})[0] g.append(self.create_guide_item(type, title, href)) def iterguide(self): @@ -828,7 +867,10 @@ class OPF(object): # {{{ title.getparent().remove(title) titles = () if val: - title = titles[0] if titles else self.create_metadata_element('title') + if titles: + title = titles[0] + else: + title = self.create_metadata_element('title') title.text = re.sub(r'\s+', ' ', str(val)) @property @@ -847,11 +889,12 @@ class OPF(object): # {{{ # for broken implementations that always use the first # <dc:creator> element with no attention to the role for author in reversed(val): - elem = self.metadata.makeelement('{%s}creator'% - self.NAMESPACES['dc'], nsmap=self.NAMESPACES) + elem = self.metadata.makeelement('{%s}creator' % + self.NAMESPACES['dc'], + nsmap=self.NAMESPACES) elem.tail = '\n' self.metadata.insert(0, elem) - elem.set('{%s}role'%self.NAMESPACES['opf'], 'aut') + elem.set('{%s}role' % self.NAMESPACES['opf'], 'aut') self.set_text(elem, author.strip()) @property @@ -859,7 +902,7 @@ class OPF(object): # {{{ matches = self.authors_path(self.metadata) if matches: for match in matches: - ans = match.get('{%s}file-as'%self.NAMESPACES['opf'], None) + ans = match.get('{%s}file-as' % self.NAMESPACES['opf'], None) if not ans: ans = match.get('file-as', None) if ans: @@ -872,7 +915,7 @@ class OPF(object): # {{{ for key in matches[0].attrib: if key.endswith('file-as'): 
matches[0].attrib.pop(key) - matches[0].set('{%s}file-as'%self.NAMESPACES['opf'], str(val)) + matches[0].set('{%s}file-as' % self.NAMESPACES['opf'], str(val)) @property def tags(self): @@ -897,8 +940,9 @@ class OPF(object): # {{{ for match in self.pubdate_path(self.metadata): try: val = parse_date(etree.tostring(match, encoding='unicode', - method='text', with_tail=False).strip()) - except: + method='text', + with_tail=False).strip()) + except Exception: continue if ans is None or val < ans: ans = val @@ -910,8 +954,9 @@ class OPF(object): # {{{ for match in self.pubdate_path(self.metadata): try: cval = parse_date(etree.tostring(match, encoding='unicode', - method='text', with_tail=False).strip()) - except: + method='text', + with_tail=False).strip()) + except Exception: match.getparent().remove(match) else: if not val: @@ -953,7 +998,7 @@ class OPF(object): # {{{ x.getparent().remove(x) return if not matches: - attrib = {'{%s}scheme'%self.NAMESPACES['opf']: 'ISBN'} + attrib = {'{%s}scheme' % self.NAMESPACES['opf']: 'ISBN'} matches = [self.create_metadata_element('identifier', attrib=attrib)] self.set_text(matches[0], str(val)) @@ -967,17 +1012,19 @@ class OPF(object): # {{{ for attr, val in x.attrib.items(): if attr.endswith('scheme'): typ = val.lower() - val = etree.tostring(x, with_tail=False, encoding='unicode', - method='text').strip() + val = etree.tostring(x, with_tail=False, + encoding='unicode', + method='text').strip() if val and typ not in ('calibre', 'uuid'): - if typ == 'isbn' and val.lower().startswith('urn:isbn:'): + if (typ == 'isbn' and + val.lower().startswith('urn:isbn:')): val = val[len('urn:isbn:'):] identifiers[typ] = val found_scheme = True break if not found_scheme: val = etree.tostring(x, with_tail=False, encoding='unicode', - method='text').strip() + method='text').strip() if val.lower().startswith('urn:isbn:'): val = check_isbn(val.split(':')[-1]) if val is not None: @@ -997,7 +1044,8 @@ class OPF(object): # {{{ self.metadata): xid = 
x.get('id', None) is_package_identifier = uuid_id is not None and uuid_id == xid - typ = {val.lower() for attr, val in x.attrib.items() if attr.endswith('scheme')} + typ = {val.lower() for attr, val in x.attrib.items() + if attr.endswith('scheme')} if is_package_identifier: typ = tuple(typ) if typ and typ[0] in identifiers: @@ -1007,7 +1055,7 @@ class OPF(object): # {{{ x.getparent().remove(x) for typ, val in identifiers.items(): - attrib = {'{%s}scheme'%self.NAMESPACES['opf']: typ.upper()} + attrib = {'{%s}scheme' % self.NAMESPACES['opf']: typ.upper()} self.set_text(self.create_metadata_element( 'identifier', attrib=attrib), str(val)) @@ -1028,7 +1076,7 @@ class OPF(object): # {{{ if attr.endswith('unique-identifier'): uuid_id = self.root.attrib[attr] break - attrib = {'{%s}scheme'%self.NAMESPACES['opf']: 'calibre'} + attrib = {'{%s}scheme' % self.NAMESPACES['opf']: 'calibre'} if uuid_id and uuid_id in removed_ids: attrib['id'] = uuid_id self.set_text(self.create_metadata_element( @@ -1043,7 +1091,7 @@ class OPF(object): # {{{ def uuid(self, val): matches = self.uuid_id_path(self.metadata) if not matches: - attrib = {'{%s}scheme'%self.NAMESPACES['opf']: 'uuid'} + attrib = {'{%s}scheme' % self.NAMESPACES['opf']: 'uuid'} matches = [self.create_metadata_element('identifier', attrib=attrib)] self.set_text(matches[0], str(val)) @@ -1064,9 +1112,9 @@ class OPF(object): # {{{ for match in self.languages_path(self.metadata): t = self.get_text(match) if t and t.strip(): - l = canonicalize_lang(t.strip()) - if l: - ans.append(l) + cl = canonicalize_lang(t.strip()) + if cl: + ans.append(cl) return ans @languages.setter @@ -1076,8 +1124,8 @@ class OPF(object): # {{{ x.getparent().remove(x) for lang in val: - l = self.create_metadata_element('language') - self.set_text(l, str(lang)) + cl = self.create_metadata_element('language') + self.set_text(cl, str(lang)) @property def raw_languages(self): @@ -1096,7 +1144,7 @@ class OPF(object): # {{{ matches = 
self.bkp_path(self.metadata) if not matches: matches = [self.create_metadata_element('contributor')] - matches[0].set('{%s}role'%self.NAMESPACES['opf'], 'bkp') + matches[0].set('{%s}role' % self.NAMESPACES['opf'], 'bkp') self.set_text(matches[0], str(val)) def identifier_iter(self): @@ -1111,7 +1159,8 @@ class OPF(object): # {{{ uuid_elem = self.root.attrib[attr] break if uuid_elem: - matches = self.root.xpath('//*[@id=%s]'%escape_xpath_attr(uuid_elem)) + matches = self.root.xpath('//*[@id=%s]' % + escape_xpath_attr(uuid_elem)) if matches: for m in matches: raw = m.text @@ -1126,15 +1175,18 @@ class OPF(object): # {{{ @property def page_progression_direction(self): - spine = self.XPath('descendant::*[re:match(name(), "spine", "i")][1]')(self.root) + spine = self.XPath('descendant::*[re:match(name(), "spine", ' + '"i")][1]')(self.root) if spine: for k, v in spine[0].attrib.items(): - if k == 'page-progression-direction' or k.endswith('}page-progression-direction'): + if (k == 'page-progression-direction' or + k.endswith('}page-progression-direction')): return v @property def primary_writing_mode(self): - for m in self.XPath('//*[local-name()="meta" and @name="primary-writing-mode" and @content]')(self.root): + for m in self.XPath('//*[local-name()="meta" and @name="primary-' + 'writing-mode" and @content]')(self.root): return m.get('content') def guess_cover(self): @@ -1153,8 +1205,11 @@ class OPF(object): # {{{ if item.text: prefix = item.text.replace('-', '') for suffix in ['.jpg', '.jpeg', '.gif', '.png', '.bmp']: - cpath = os.access(os.path.join(self.base_dir, prefix+suffix), os.R_OK) - if os.access(os.path.join(self.base_dir, prefix+suffix), os.R_OK): + cpath = os.access(os.path.join(self.base_dir, + prefix + suffix), + os.R_OK) + if os.access(os.path.join(self.base_dir, + prefix+suffix), os.R_OK): return cpath @property @@ -1188,13 +1243,16 @@ class OPF(object): # {{{ def guide_raster_cover(self): covers = self.guide_cover_path(self.root) if covers: - mt_map = 
{i.get('href'):i for i in self.itermanifest()} + mt_map = {i.get('href'): i for i in self.itermanifest()} for href in covers: if href: i = mt_map.get(href) if i is not None: iid, mt = i.get('id'), i.get('media-type') - if iid and mt and mt.lower() in {'image/png', 'image/jpeg', 'image/jpg', 'image/gif'}: + if iid and mt and mt.lower() in {'image/png', + 'image/jpeg', + 'image/jpg', + 'image/gif'}: return i @property @@ -1214,14 +1272,15 @@ class OPF(object): # {{{ @property def cover(self): if self.guide is not None: - for t in ('cover', 'other.ms-coverimage-standard', 'other.ms-coverimage'): + for t in ('cover', 'other.ms-coverimage-standard', + 'other.ms-coverimage'): for item in self.guide: if item.type and item.type.lower() == t: return item.path try: if self.try_to_guess_cover: return self.guess_cover() - except: + except Exception: pass @cover.setter @@ -1237,13 +1296,16 @@ class OPF(object): # {{{ self.guide = Guide() self.guide.set_cover(path) etree.SubElement(g, 'opf:reference', nsmap=self.NAMESPACES, - attrib={'type':'cover', 'href':self.guide[-1].href()}) + attrib={'type': 'cover', + 'href': self.guide[-1].href()}) id = self.manifest.id_for_path(self.cover) if id is None: - for t in ('cover', 'other.ms-coverimage-standard', 'other.ms-coverimage'): + for t in ('cover', 'other.ms-coverimage-standard', + 'other.ms-coverimage'): for item in self.guide: if item.type.lower() == t: - self.create_manifest_item(item.href(), guess_type(path)[0]) + self.create_manifest_item(item.href(), + guess_type(path)[0]) def get_metadata_element(self, name): matches = self.metadata_elem_path(self.metadata, name=name) @@ -1278,9 +1340,11 @@ class OPF(object): # {{{ # We swap attributes instead of elements, as that avoids namespace # re-declarations smap = {} - for child in self.metadata.xpath('./*[@name="calibre:series" or @name="calibre:series_index"]'): + for child in self.metadata.xpath('./*[@name="calibre:series" or @name' + '="calibre:series_index"]'): 
smap[child.get('name')] = (child, self.metadata.index(child)) - if len(smap) == 2 and smap['calibre:series'][1] > smap['calibre:series_index'][1]: + if (len(smap) == 2 and + smap['calibre:series'][1] > smap['calibre:series_index'][1]): s, si = smap['calibre:series'][0], smap['calibre:series_index'][0] def swap(attr): @@ -1293,7 +1357,8 @@ class OPF(object): # {{{ _pretty_print(self.root) raw = etree.tostring(self.root, encoding=encoding, pretty_print=True) if not raw.lstrip().startswith(b'<?xml '): - raw = ('<?xml version="1.0" encoding="%s"?>\n'%encoding.upper()).encode('ascii') + raw + raw = ('<?xml version="1.0" encoding="%s"?>\n' % + encoding.upper()).encode('ascii') + raw return raw def smart_update(self, mi, replace_metadata=False, apply_null=False): @@ -1302,9 +1367,12 @@ class OPF(object): # {{{ 'isbn', 'tags', 'category', 'comments', 'book_producer', 'pubdate', 'user_categories', 'author_link_map'): val = getattr(mi, attr, None) - is_null = val is None or val in ((), [], (None, None), {}) or (attr == 'rating' and val < 0.1) + is_null = val is None or val in ((), [], (None, None), + {}) or (attr == 'rating' and + val < 0.1) if is_null: - if apply_null and attr in {'series', 'tags', 'isbn', 'comments', 'publisher', 'rating'}: + if apply_null and attr in {'series', 'tags', 'isbn', + 'comments', 'publisher', 'rating'}: setattr(self, attr, ([] if attr == 'tags' else None)) else: setattr(self, attr, val) @@ -1315,7 +1383,9 @@ class OPF(object): # {{{ self.languages = langs or [] temp = self.to_book_metadata() temp.smart_update(mi, replace_metadata=replace_metadata) - if not replace_metadata and callable(getattr(temp, 'custom_field_keys', None)): + if not replace_metadata and callable(getattr(temp, + 'custom_field_keys', + None)): # We have to replace non-null fields regardless of the value of # replace_metadata to match the behavior of the builtin fields # above. 
@@ -1346,12 +1416,12 @@ class OPF(object): # {{{ class OPFCreator(Metadata): def __init__(self, base_path, other): - ''' + """ Initialize. - @param base_path: An absolute path to the directory in which this OPF file - will eventually be. This is used by the L{create_manifest} method + @param base_path: An absolute path to the directory in which this OPF + file will eventually be. This is used by the L{create_manifest} method to convert paths to files into relative paths. - ''' + """ Metadata.__init__(self, title='', other=other) self.base_path = os.path.abspath(base_path) self.page_progression_direction = None @@ -1368,19 +1438,21 @@ class OPFCreator(Metadata): self.guide.set_cover(self.cover) def create_manifest(self, entries): - ''' + """ Create <manifest> - `entries`: List of (path, mime-type) If mime-type is None it is autodetected - ''' + `entries`: List of (path, mime-type) If mime-type is None it is + autodetected + """ entries = list(map(lambda x: x if os.path.isabs(x[0]) else - (os.path.abspath(os.path.join(self.base_path, x[0])), x[1]), - entries)) + (os.path.abspath(os.path.join(self.base_path, + x[0])), x[1]), + entries)) self.manifest = Manifest.from_paths(entries) self.manifest.set_basedir(self.base_path) def create_manifest_from_files_in(self, files_and_dirs, - exclude=lambda x:False): + exclude=lambda x: False): entries = [] def dodir(dir): @@ -1406,7 +1478,8 @@ class OPFCreator(Metadata): `entries`: List of paths ''' entries = list(map(lambda x: x if os.path.isabs(x) else - os.path.abspath(os.path.join(self.base_path, x)), entries)) + os.path.abspath(os.path.join(self.base_path, x)), + entries)) self.spine = Spine.from_paths(entries, self.manifest) def set_toc(self, toc): @@ -1431,11 +1504,13 @@ class OPFCreator(Metadata): self.manifest.set_basedir(self.base_path) if ncx_manifest_entry is not None and toc is not None: if not os.path.isabs(ncx_manifest_entry): - ncx_manifest_entry = os.path.join(self.base_path, ncx_manifest_entry) + 
ncx_manifest_entry = os.path.join(self.base_path, + ncx_manifest_entry) remove = [i for i in self.manifest if i.id == 'ncx'] for item in remove: self.manifest.remove(item) - self.manifest.append(ManifestItem(ncx_manifest_entry, self.base_path)) + self.manifest.append(ManifestItem(ncx_manifest_entry, + self.base_path)) self.manifest[-1].id = 'ncx' self.manifest[-1].mime_type = 'application/x-dtbncx+xml' if self.guide is None: @@ -1448,13 +1523,13 @@ class OPFCreator(Metadata): self.guide.set_basedir(self.base_path) # Actual rendering - from lxml.builder import ElementMaker - from ebook_converter.ebooks.oeb.base import OPF2_NS, DC11_NS, CALIBRE_NS - DNS = OPF2_NS+'___xx___' - E = ElementMaker(namespace=DNS, nsmap={None:DNS}) + DNS = const.OPF2_NS + '___xx___' + E = ElementMaker(namespace=DNS, nsmap={None: DNS}) M = ElementMaker(namespace=DNS, - nsmap={'dc':DC11_NS, 'calibre':CALIBRE_NS, 'opf':OPF2_NS}) - DC = ElementMaker(namespace=DC11_NS) + nsmap={'dc': const.DC11_NS, + 'calibre': const.CALIBRE_NS, + 'opf': const.OPF2_NS}) + DC = ElementMaker(namespace=const.DC11_NS) def DC_ELEM(tag, text, dc_attrs={}, opf_attrs={}): if text: @@ -1462,7 +1537,7 @@ class OPFCreator(Metadata): else: elem = getattr(DC, tag)(**dc_attrs) for k, v in opf_attrs.items(): - elem.set('{%s}%s'%(OPF2_NS, k), v) + elem.set('{%s}%s' % (const.OPF2_NS, k), v) return elem def CAL_ELEM(name, content): @@ -1472,18 +1547,18 @@ class OPFCreator(Metadata): a = metadata.append role = {} a(DC_ELEM('title', self.title if self.title else 'Unknown', - opf_attrs=role)) + opf_attrs=role)) for i, author in enumerate(self.authors): - fa = {'role':'aut'} + fa = {'role': 'aut'} if i == 0 and self.author_sort: fa['file-as'] = self.author_sort a(DC_ELEM('creator', author, opf_attrs=fa)) - a(DC_ELEM('contributor', '%s (%s) [%s]'%(__appname__, __version__, - 'https://calibre-ebook.com'), opf_attrs={'role':'bkp', - 'file-as':__appname__})) + a(DC_ELEM('contributor', '%s (%s) [%s]' % + (__appname__, __version__, 
'https://calibre-ebook.com'), + opf_attrs={'role': 'bkp', 'file-as': __appname__})) a(DC_ELEM('identifier', str(self.application_id), - opf_attrs={'scheme':__appname__}, - dc_attrs={'id':__appname__+'_id'})) + opf_attrs={'scheme': __appname__}, + dc_attrs={'id': __appname__+'_id'})) if getattr(self, 'pubdate', None) is not None: a(DC_ELEM('date', self.pubdate.isoformat())) langs = self.languages @@ -1496,7 +1571,7 @@ class OPFCreator(Metadata): if self.publisher: a(DC_ELEM('publisher', self.publisher)) for key, val in self.get_identifiers().items(): - a(DC_ELEM('identifier', val, opf_attrs={'scheme':key.upper()})) + a(DC_ELEM('identifier', val, opf_attrs={'scheme': key.upper()})) if self.rights: a(DC_ELEM('rights', self.rights)) if self.tags: @@ -1515,11 +1590,13 @@ class OPFCreator(Metadata): if self.publication_type is not None: a(CAL_ELEM('calibre:publication_type', self.publication_type)) if self.user_categories: - from ebook_converter.ebooks.metadata.book.json_codec import object_to_unicode + from ebook_converter.ebooks.metadata.book.json_codec import \ + object_to_unicode a(CAL_ELEM('calibre:user_categories', json.dumps(object_to_unicode(self.user_categories)))) if self.primary_writing_mode: - a(M.meta(name='primary-writing-mode', content=self.primary_writing_mode)) + a(M.meta(name='primary-writing-mode', + content=self.primary_writing_mode)) manifest = E.manifest() if self.manifest is not None: for ref in self.manifest: @@ -1533,7 +1610,8 @@ class OPFCreator(Metadata): if self.toc is not None: spine.set('toc', 'ncx') if self.page_progression_direction is not None: - spine.set('page-progression-direction', self.page_progression_direction) + spine.set('page-progression-direction', + self.page_progression_direction) if self.spine is not None: for ref in self.spine: if ref.id is not None: @@ -1562,8 +1640,8 @@ class OPFCreator(Metadata): root.set('unique-identifier', __appname__+'_id') root.set('version', '2.0') raw = etree.tostring(root, pretty_print=True, 
xml_declaration=True, - encoding=encoding) - raw = raw.replace(DNS.encode('utf-8'), OPF2_NS.encode('utf-8')) + encoding=encoding) + raw = raw.replace(DNS.encode('utf-8'), const.OPF2_NS.encode('utf-8')) opf_stream.write(raw) opf_stream.flush() if toc is not None and ncx_stream is not None: @@ -1572,9 +1650,6 @@ class OPFCreator(Metadata): def metadata_to_opf(mi, as_string=True, default_lang=None): - from lxml import etree - import textwrap - from ebook_converter.ebooks.oeb.base import OPF, DC if not mi.application_id: mi.application_id = str(uuid.uuid4()) @@ -1583,15 +1658,15 @@ def metadata_to_opf(mi, as_string=True, default_lang=None): mi.uuid = str(uuid.uuid4()) if not mi.book_producer: - mi.book_producer = __appname__ + ' (%s) '%__version__ + \ - '[https://calibre-ebook.com]' + mi.book_producer = (__appname__ + ' (%s) ' % + __version__ + '[https://calibre-ebook.com]') if not mi.languages: lang = (get_lang().replace('_', '-').partition('-')[0] if default_lang is None else default_lang) mi.languages = [lang] - root = safe_xml_fromstring(textwrap.dedent( + root = etree.fromstring(textwrap.dedent( ''' <package xmlns="http://www.idpf.org/2007/opf" unique-identifier="uuid_id" version="2.0"> <metadata xmlns:dc="http://purl.org/dc/elements/1.1/" xmlns:opf="http://www.idpf.org/2007/opf"> @@ -1600,20 +1675,20 @@ def metadata_to_opf(mi, as_string=True, default_lang=None): </metadata> <guide/> </package> - '''%dict(a=__appname__, id=mi.application_id, uuid=mi.uuid))) + ''' % dict(a=__appname__, id=mi.application_id, uuid=mi.uuid))) metadata = root[0] guide = root[1] metadata[0].tail = '\n'+(' '*8) def factory(tag, text=None, sort=None, role=None, scheme=None, name=None, - content=None): + content=None): attrib = {} if sort: - attrib[OPF('file-as')] = sort + attrib[base.tag('opf', 'file-as')] = sort if role: - attrib[OPF('role')] = role + attrib[base.tag('opf', 'role')] = role if scheme: - attrib[OPF('scheme')] = scheme + attrib[base.tag('opf', 'scheme')] = scheme if name: 
attrib['name'] = name if content: @@ -1621,7 +1696,9 @@ def metadata_to_opf(mi, as_string=True, default_lang=None): try: elem = metadata.makeelement(tag, attrib=attrib) except ValueError: - elem = metadata.makeelement(tag, attrib={k:clean_xml_chars(v) for k, v in attrib.items()}) + elem = metadata.makeelement(tag, attrib={k: clean_xml_chars(v) + for k, v in + attrib.items()}) elem.tail = '\n'+(' '*8) if text: try: @@ -1630,29 +1707,29 @@ def metadata_to_opf(mi, as_string=True, default_lang=None): elem.text = clean_ascii_chars(text.strip()) metadata.append(elem) - factory(DC('title'), mi.title) + factory(base.tag('dc', 'title'), mi.title) for au in mi.authors: - factory(DC('creator'), au, mi.author_sort, 'aut') - factory(DC('contributor'), mi.book_producer, __appname__, 'bkp') + factory(base.tag('dc', 'creator'), au, mi.author_sort, 'aut') + factory(base.tag('dc', 'contributor'), mi.book_producer, __appname__, 'bkp') if hasattr(mi.pubdate, 'isoformat'): - factory(DC('date'), isoformat(mi.pubdate)) + factory(base.tag('dc', 'date'), isoformat(mi.pubdate)) if hasattr(mi, 'category') and mi.category: - factory(DC('type'), mi.category) + factory(base.tag('dc', 'type'), mi.category) if mi.comments: - factory(DC('description'), clean_ascii_chars(mi.comments)) + factory(base.tag('dc', 'description'), clean_ascii_chars(mi.comments)) if mi.publisher: - factory(DC('publisher'), mi.publisher) + factory(base.tag('dc', 'publisher'), mi.publisher) for key, val in mi.get_identifiers().items(): - factory(DC('identifier'), val, scheme=key.upper()) + factory(base.tag('dc', 'identifier'), val, scheme=key.upper()) if mi.rights: - factory(DC('rights'), mi.rights) + factory(base.tag('dc', 'rights'), mi.rights) for lang in mi.languages: if not lang or lang.lower() == 'und': continue - factory(DC('language'), lang) + factory(base.tag('dc', 'language'), lang) if mi.tags: for tag in mi.tags: - factory(DC('subject'), tag) + factory(base.tag('dc', 'subject'), tag) meta = lambda n, c: 
factory('meta', name='calibre:'+n, content=c) if getattr(mi, 'author_link_map', None) is not None: meta('author_link_map', dump_dict(mi.author_link_map)) @@ -1673,21 +1750,22 @@ def metadata_to_opf(mi, as_string=True, default_lang=None): serialize_user_metadata(metadata, mi.get_all_user_metadata(False)) - metadata[-1].tail = '\n' +(' '*4) + metadata[-1].tail = '\n' + (' '*4) if mi.cover: if not isinstance(mi.cover, str): mi.cover = mi.cover.decode(filesystem_encoding) guide.text = '\n'+(' '*8) - r = guide.makeelement(OPF('reference'), - attrib={'type': 'cover', 'title': 'Cover', 'href': mi.cover}) - r.tail = '\n' +(' '*4) + r = guide.makeelement(base.tag('opf', 'reference'), + attrib={'type': 'cover', 'title': 'Cover', + 'href': mi.cover}) + r.tail = '\n' + (' '*4) guide.append(r) if pretty_print_opf: _pretty_print(root) return etree.tostring(root, pretty_print=True, encoding='utf-8', - xml_declaration=True) if as_string else root + xml_declaration=True) if as_string else root def test_m2o(): @@ -1699,7 +1777,7 @@ def test_m2o(): mi.language = 'en' mi.comments = 'what a fun book\n\n' mi.publisher = 'publisher' - mi.set_identifiers({'isbn':'booo', 'dummy':'dummy'}) + mi.set_identifiers({'isbn': 'booo', 'dummy': 'dummy'}) mi.tags = ['a', 'b'] mi.series = 's"c\'l&<>' mi.series_index = 3.34 @@ -1711,15 +1789,15 @@ def test_m2o(): opf = metadata_to_opf(mi) print(opf) newmi = MetaInformation(OPF(io.BytesIO(opf))) - for attr in ('author_sort', 'title_sort', 'comments', - 'publisher', 'series', 'series_index', 'rating', - 'isbn', 'tags', 'cover_data', 'application_id', - 'language', 'cover', - 'book_producer', 'timestamp', - 'pubdate', 'rights', 'publication_type'): + for attr in ('author_sort', 'title_sort', 'comments', 'publisher', + 'series', 'series_index', 'rating', 'isbn', 'tags', + 'cover_data', 'application_id', 'language', 'cover', + 'book_producer', 'timestamp', 'pubdate', 'rights', + 'publication_type'): o, n = getattr(mi, attr), getattr(newmi, attr) if o != n 
and o.strip() != n.strip(): - print('FAILED:', attr, getattr(mi, attr), '!=', getattr(newmi, attr)) + print('FAILED:', attr, getattr(mi, attr), '!=', + getattr(newmi, attr)) if mi.get_identifiers() != newmi.get_identifiers(): print('FAILED:', 'identifiers', mi.get_identifiers(), end=' ') print('!=', newmi.get_identifiers()) @@ -1766,8 +1844,8 @@ b'''\ self.assertEqual(opf.rating, 4) self.assertEqual(opf.publication_type, 'test') self.assertEqual(list(opf.itermanifest())[0].get('href'), 'a ~ b') - self.assertEqual(opf.get_identifiers(), {'isbn':'123456789', - 'dummy':'dummy'}) + self.assertEqual(opf.get_identifiers(), {'isbn': '123456789', + 'dummy': 'dummy'}) def testWriting(self): for test in [('title', 'New & Title'), ('authors', ['One', 'Two']), @@ -1802,14 +1880,12 @@ def test(): def test_user_metadata(): mi = Metadata('Test title', ['test author1', 'test author2']) - um = { - '#myseries': {'#value#': u'test series\xe4', 'datatype':'text', - 'is_multiple': None, 'name': u'My Series'}, - '#myseries_index': {'#value#': 2.45, 'datatype': 'float', - 'is_multiple': None}, - '#mytags': {'#value#':['t1','t2','t3'], 'datatype':'text', - 'is_multiple': '|', 'name': u'My Tags'} - } + um = {'#myseries': {'#value#': u'test series\xe4', 'datatype': 'text', + 'is_multiple': None, 'name': u'My Series'}, + '#myseries_index': {'#value#': 2.45, 'datatype': 'float', + 'is_multiple': None}, + '#mytags': {'#value#': ['t1', 't2', 't3'], 'datatype': 'text', + 'is_multiple': '|', 'name': u'My Tags'}} mi.set_all_user_metadata(um) raw = metadata_to_opf(mi) opfc = OPFCreator(os.getcwd(), other=mi) diff --git a/ebook_converter/ebooks/metadata/opf3.py b/ebook_converter/ebooks/metadata/opf3.py index f12a79d..dd146a6 100644 --- a/ebook_converter/ebooks/metadata/opf3.py +++ b/ebook_converter/ebooks/metadata/opf3.py @@ -5,6 +5,7 @@ from functools import wraps from lxml import etree +from ebook_converter import constants as const from ebook_converter import prints from 
ebook_converter.ebooks.metadata import authors_to_string, check_isbn, string_to_authors from ebook_converter.ebooks.metadata.book.base import Metadata @@ -15,7 +16,6 @@ from ebook_converter.ebooks.metadata.utils import ( create_manifest_item, ensure_unique, normalize_languages, parse_opf, pretty_print_opf ) -from ebook_converter.ebooks.oeb.base import DC, OPF, OPF2_NSMAP from ebook_converter.utils.config import from_json, to_json from ebook_converter.utils.date import ( fix_only_date, is_date_undefined, isoformat, parse_date as parse_date_, utcnow, @@ -46,7 +46,7 @@ def XPath(x): try: return _xpath_cache[x] except KeyError: - _xpath_cache[x] = ans = etree.XPath(x, namespaces=OPF2_NSMAP) + _xpath_cache[x] = ans = etree.XPath(x, namespaces=const.OPF2_NSMAP) return ans @@ -213,7 +213,7 @@ def set_refines(elem, existing_refines, *new_refines): remove_refines(elem, existing_refines) for ref in reversed(new_refines): prop, val, scheme = ref - r = elem.makeelement(OPF('meta')) + r = elem.makeelement(const.OPF_META) r.set('refines', '#' + eid), r.set('property', prop) r.text = val.strip() if scheme: @@ -249,7 +249,7 @@ def parse_identifier(ident, val, refines): # Try the OPF 2 style opf:scheme attribute, which will be present, for # example, in EPUB 3 files that have had their metadata set by an # application that only understands EPUB 2. 
- scheme = ident.get(OPF('scheme')) + scheme = ident.get(const.OPF_SCHEME) if scheme and not lval.startswith('urn:'): return finalize(scheme, val) @@ -294,7 +294,7 @@ def set_identifiers(root, prefixes, refines, new_identifiers, force_identifiers= continue metadata = XPath('./opf:metadata')(root)[0] for scheme, val in new_identifiers.items(): - ident = metadata.makeelement(DC('identifier')) + ident = metadata.makeelement(const.DC_IDENT) ident.text = '%s:%s' % (scheme, val) if package_identifier is None: metadata.append(ident) @@ -312,11 +312,11 @@ def identifier_writer(name): if is_package_id: package_identifier = ident val = (ident.text or '').strip() - if (val.startswith(name + ':') or ident.get(OPF('scheme')) == name) and not is_package_id: + if (val.startswith(name + ':') or ident.get(const.OPF_SCHEME) == name) and not is_package_id: remove_element(ident, refines) metadata = XPath('./opf:metadata')(root)[0] if ival: - ident = metadata.makeelement(DC('identifier')) + ident = metadata.makeelement(const.DC_IDENT) ident.text = '%s:%s' % (name, ival) if package_identifier is None: metadata.append(ident) @@ -376,7 +376,7 @@ def set_title(root, prefixes, refines, title, title_sort=None): main_title = find_main_title(root, refines, remove_blanks=True) if main_title is None: m = XPath('./opf:metadata')(root)[0] - main_title = m.makeelement(DC('title')) + main_title = m.makeelement(const.DC_TITLE) m.insert(0, main_title) main_title.text = title or None ts = [refdef('file-as', title_sort)] if title_sort else () @@ -411,7 +411,7 @@ def set_languages(root, prefixes, refines, languages): languages = ['und'] metadata = XPath('./opf:metadata')(root)[0] for lang in uniq(languages): - l = metadata.makeelement(DC('language')) + l = metadata.makeelement(const.DC_LANG) l.text = lang metadata.append(l) # }}} @@ -440,7 +440,7 @@ def read_authors(root, prefixes, refines): if file_as: aus = file_as[0][-1] else: - aus = item.get(OPF('file-as')) or None + aus = 
item.get(const.OPF_FILE_AS) or None return Author(normalize_whitespace(val), normalize_whitespace(aus)) for item in XPath('./opf:metadata/dc:creator')(root): @@ -448,7 +448,7 @@ def read_authors(root, prefixes, refines): if val: props = properties_for_id_with_scheme(item.get('id'), prefixes, refines) role = props.get('role') - opf_role = item.get(OPF('role')) + opf_role = item.get(const.OPF_ROLE) if role: if is_relators_role(props, 'aut'): roled_authors.append(author(item, props, val)) @@ -465,22 +465,22 @@ def set_authors(root, prefixes, refines, authors): ensure_prefix(root, prefixes, 'marc') for item in XPath('./opf:metadata/dc:creator')(root): props = properties_for_id_with_scheme(item.get('id'), prefixes, refines) - opf_role = item.get(OPF('role')) + opf_role = item.get(const.OPF_ROLE) if (opf_role and opf_role.lower() != 'aut') or (props.get('role') and not is_relators_role(props, 'aut')): continue remove_element(item, refines) metadata = XPath('./opf:metadata')(root)[0] for author in authors: if author.name: - a = metadata.makeelement(DC('creator')) + a = metadata.makeelement(const.DC_CREATOR) aid = ensure_id(a) a.text = author.name metadata.append(a) - m = metadata.makeelement(OPF('meta'), attrib={'refines':'#'+aid, 'property':'role', 'scheme':'marc:relators'}) + m = metadata.makeelement(const.OPF_META, attrib={'refines':'#'+aid, 'property':'role', 'scheme':'marc:relators'}) m.text = 'aut' metadata.append(m) if author.sort: - m = metadata.makeelement(OPF('meta'), attrib={'refines':'#'+aid, 'property':'file-as'}) + m = metadata.makeelement(const.OPF_META, attrib={'refines':'#'+aid, 'property':'file-as'}) m.text = author.sort metadata.append(m) @@ -492,7 +492,7 @@ def read_book_producers(root, prefixes, refines): if val: props = properties_for_id_with_scheme(item.get('id'), prefixes, refines) role = props.get('role') - opf_role = item.get(OPF('role')) + opf_role = item.get(const.OPF_ROLE) if role: if is_relators_role(props, 'bkp'): 
ans.append(normalize_whitespace(val)) @@ -504,18 +504,18 @@ def read_book_producers(root, prefixes, refines): def set_book_producers(root, prefixes, refines, producers): for item in XPath('./opf:metadata/dc:contributor')(root): props = properties_for_id_with_scheme(item.get('id'), prefixes, refines) - opf_role = item.get(OPF('role')) + opf_role = item.get(const.OPF_ROLE) if (opf_role and opf_role.lower() != 'bkp') or (props.get('role') and not is_relators_role(props, 'bkp')): continue remove_element(item, refines) metadata = XPath('./opf:metadata')(root)[0] for bkp in producers: if bkp: - a = metadata.makeelement(DC('contributor')) + a = metadata.makeelement(const.DC_CONTRIBUTOR) aid = ensure_id(a) a.text = bkp metadata.append(a) - m = metadata.makeelement(OPF('meta'), attrib={'refines':'#'+aid, 'property':'role', 'scheme':'marc:relators'}) + m = metadata.makeelement(const.OPF_META, attrib={'refines':'#'+aid, 'property':'role', 'scheme':'marc:relators'}) m.text = 'bkp' metadata.append(m) # }}} @@ -552,7 +552,7 @@ def set_pubdate(root, prefixes, refines, val): if not is_date_undefined(val): val = isoformat(val) m = XPath('./opf:metadata')(root)[0] - d = m.makeelement(DC('date')) + d = m.makeelement(const.DC_DATE) d.text = val m.append(d) @@ -584,7 +584,7 @@ def create_timestamp(root, prefixes, m, val): ensure_prefix(root, prefixes, 'calibre', CALIBRE_PREFIX) ensure_prefix(root, prefixes, 'dcterms') val = w3cdtf(val) - d = m.makeelement(OPF('meta'), attrib={'property':'calibre:timestamp', 'scheme':'dcterms:W3CDTF'}) + d = m.makeelement(const.OPF_META, attrib={'property':'calibre:timestamp', 'scheme':'dcterms:W3CDTF'}) d.text = val m.append(d) @@ -625,7 +625,7 @@ def set_last_modified(root, prefixes, refines, val=None): else: ensure_prefix(root, prefixes, 'dcterms') m = XPath('./opf:metadata')(root)[0] - meta = m.makeelement(OPF('meta'), attrib={'property':'dcterms:modified', 'scheme':'dcterms:W3CDTF'}) + meta = m.makeelement(const.OPF_META, 
attrib={'property':'dcterms:modified', 'scheme':'dcterms:W3CDTF'}) m.append(meta) meta.text = val # }}} @@ -648,7 +648,7 @@ def set_comments(root, prefixes, refines, val): if val: val = val.strip() if val: - c = m.makeelement(DC('description')) + c = m.makeelement(const.DC_DESC) c.text = val m.append(c) # }}} @@ -670,7 +670,7 @@ def set_publisher(root, prefixes, refines, val): if val: val = val.strip() if val: - c = m.makeelement(DC('publisher')) + c = m.makeelement(const.DC_PUBLISHER('publisher')) c.text = normalize_whitespace(val) m.append(c) # }}} @@ -693,7 +693,7 @@ def set_tags(root, prefixes, refines, val): if val: val = uniq(list(filter(None, val))) for x in val: - c = m.makeelement(DC('subject')) + c = m.makeelement(const.DC_SUBJ) c.text = normalize_whitespace(x) if c.text: m.append(c) @@ -725,7 +725,7 @@ def read_rating(root, prefixes, refines): def create_rating(root, prefixes, val): ensure_prefix(root, prefixes, 'calibre', CALIBRE_PREFIX) m = XPath('./opf:metadata')(root)[0] - d = m.makeelement(OPF('meta'), attrib={'property':'calibre:rating'}) + d = m.makeelement(const.OPF_META, attrib={'property':'calibre:rating'}) d.text = val m.append(d) @@ -772,7 +772,7 @@ def read_series(root, prefixes, refines): def create_series(root, refines, series, series_index): m = XPath('./opf:metadata')(root)[0] - d = m.makeelement(OPF('meta'), attrib={'property':'belongs-to-collection'}) + d = m.makeelement(const.OPF_META, attrib={'property':'belongs-to-collection'}) d.text = series m.append(d) set_refines(d, refines, refdef('collection-type', 'series'), refdef('group-position', series_index)) @@ -836,7 +836,7 @@ def dict_writer(name, serialize=dump_dict, remove2=True): if val: ensure_prefix(root, prefixes, 'calibre', CALIBRE_PREFIX) m = XPath('./opf:metadata')(root)[0] - d = m.makeelement(OPF('meta'), attrib={'property':'calibre:%s' % name}) + d = m.makeelement(const.OPF_META, attrib={'property':'calibre:%s' % name}) d.text = serialize(val) m.append(d) return writer diff 
--git a/ebook_converter/ebooks/metadata/toc.py b/ebook_converter/ebooks/metadata/toc.py index a9330a4..02f04d5 100644 --- a/ebook_converter/ebooks/metadata/toc.py +++ b/ebook_converter/ebooks/metadata/toc.py @@ -10,17 +10,13 @@ from lxml.builder import ElementMaker from ebook_converter.constants_old import __appname__, __version__ from ebook_converter.ebooks.chardet import xml_to_unicode -from ebook_converter.utils.xml_parse import safe_xml_fromstring from ebook_converter.utils.cleantext import clean_xml_chars from ebook_converter.polyglot.urllib import unquote -__license__ = 'GPL v3' -__copyright__ = '2010, Kovid Goyal <kovid at kovidgoyal.net>' - NCX_NS = "http://www.daisy.org/z3986/2005/ncx/" CALIBRE_NS = "http://calibre.kovidgoyal.net/2009/metadata" -NSMAP = {None: NCX_NS, 'calibre':CALIBRE_NS} +NSMAP = {None: NCX_NS, 'calibre': CALIBRE_NS} E = ElementMaker(namespace=NCX_NS, nsmap=NSMAP) C = ElementMaker(namespace=CALIBRE_NS, nsmap=NSMAP) @@ -30,8 +26,10 @@ def parse_html_toc(data): from ebook_converter.utils.cleantext import clean_xml_chars from lxml import etree if isinstance(data, bytes): - data = xml_to_unicode(data, strip_encoding_pats=True, resolve_entities=True)[0] - root = parse(clean_xml_chars(data), maybe_xhtml=True, keep_doctype=False, sanitize_names=True) + data = xml_to_unicode(data, strip_encoding_pats=True, + resolve_entities=True)[0] + root = parse(clean_xml_chars(data), maybe_xhtml=True, keep_doctype=False, + sanitize_names=True) for a in root.xpath('//*[@href and local-name()="a"]'): purl = urllib.parse.urlparse(unquote(a.get('href'))) href, fragment = purl[2], purl[5] @@ -48,8 +46,8 @@ def parse_html_toc(data): class TOC(list): def __init__(self, href=None, fragment=None, text=None, parent=None, - play_order=0, base_path=os.getcwd(), type='unknown', author=None, - description=None, toc_thumbnail=None): + play_order=0, base_path=os.getcwd(), type='unknown', + author=None, description=None, toc_thumbnail=None): self.href = href self.fragment = 
fragment if not self.fragment: @@ -64,7 +62,7 @@ class TOC(list): self.toc_thumbnail = toc_thumbnail def __str__(self): - lines = ['TOC: %s#%s %s'%(self.href, self.fragment, self.text)] + lines = ['TOC: %s#%s %s' % (self.href, self.fragment, self.text)] for child in self: c = str(child).splitlines() for l in c: @@ -91,12 +89,14 @@ class TOC(list): entry.parent = None def add_item(self, href, fragment, text, play_order=None, type='unknown', - author=None, description=None, toc_thumbnail=None): + author=None, description=None, toc_thumbnail=None): if play_order is None: - play_order = (self[-1].play_order if len(self) else self.play_order) + 1 + play_order = (self[-1].play_order + if len(self) else self.play_order) + 1 self.append(TOC(href=href, fragment=fragment, text=text, parent=self, base_path=self.base_path, play_order=play_order, - type=type, author=author, description=description, toc_thumbnail=toc_thumbnail)) + type=type, author=author, description=description, + toc_thumbnail=toc_thumbnail)) return self[-1] def top_level_items(self): @@ -121,7 +121,10 @@ class TOC(list): @property def abspath(self): - 'Return the file this toc entry points to as a absolute path to a file on the system.' + """ + Return the file this toc entry points to as a absolute path to a file + on the system. 
+ """ if self.href is None: return None @@ -136,8 +139,9 @@ class TOC(list): toc = toc['toc'] if toc is None: try: - toc = opfreader.soup.find('guide').find('reference', attrs={'type':'toc'})['href'] - except: + toc = (opfreader.soup.find('guide') + .find('reference', attrs={'type': 'toc'})['href']) + except Exception: for item in opfreader.manifest: if 'toc' in item.href().lower(): toc = item.href() @@ -151,13 +155,15 @@ class TOC(list): toc = os.path.join(self.base_path, toc) try: if not os.path.exists(toc): - bn = os.path.basename(toc) - bn = bn.replace('_top.htm', '_toc.htm') # Bug in BAEN OPF files + bn = os.path.basename(toc) + # Bug in BAEN OPF files + bn = bn.replace('_top.htm', '_toc.htm') toc = os.path.join(os.path.dirname(toc), bn) self.read_html_toc(toc) - except: - print('WARNING: Could not read Table of Contents. Continuing anyway.') + except Exception: + print('WARNING: Could not read Table of Contents. ' + 'Continuing anyway.') else: path = opfreader.manifest.item(toc.lower()) path = getattr(path, 'path', path) @@ -177,9 +183,9 @@ class TOC(list): self.base_path = os.path.dirname(toc) if root is None: with open(toc, 'rb') as f: - raw = xml_to_unicode(f.read(), assume_utf8=True, - strip_encoding_pats=True)[0] - root = safe_xml_fromstring(raw) + raw = xml_to_unicode(f.read(), assume_utf8=True, + strip_encoding_pats=True)[0] + root = etree.fromstring(raw) xpn = {'re': 'http://exslt.org/regular-expressions'} XPath = functools.partial(etree.XPath, namespaces=xpn) @@ -197,7 +203,7 @@ class TOC(list): def process_navpoint(np, dest): try: play_order = int(get_attr(np, 1)) - except: + except Exception: play_order = 1 href = fragment = text = None nd = dest @@ -207,7 +213,7 @@ class TOC(list): text = '' for txt in txt_path(nl): text += etree.tostring(txt, method='text', - encoding='unicode', with_tail=False) + encoding='unicode', with_tail=False) content = content_path(np) if content and text: content = content[0] @@ -242,17 +248,14 @@ class TOC(list): 
self.add_item(href, fragment, txt) def render(self, stream, uid): - root = E.ncx( - E.head( - E.meta(name='dtb:uid', content=str(uid)), - E.meta(name='dtb:depth', content=str(self.depth())), - E.meta(name='dtb:generator', content='%s (%s)'%(__appname__, - __version__)), - E.meta(name='dtb:totalPageCount', content='0'), - E.meta(name='dtb:maxPageNumber', content='0'), - ), - E.docTitle(E.text('Table of Contents')), - ) + root = E.ncx(E.head(E.meta(name='dtb:uid', content=str(uid)), + E.meta(name='dtb:depth', + content=str(self.depth())), + E.meta(name='dtb:generator', content='%s (%s)' % + (__appname__, __version__)), + E.meta(name='dtb:totalPageCount', content='0'), + E.meta(name='dtb:maxPageNumber', content='0')), + E.docTitle(E.text('Table of Contents'))) navmap = E.navMap() root.append(navmap) root.set('{http://www.w3.org/XML/1998/namespace}lang', 'en') @@ -263,12 +266,12 @@ class TOC(list): if not text: text = '' c[1] += 1 - item_id = 'num_%d'%c[1] + item_id = 'num_%d' % c[1] text = clean_xml_chars(text) elem = E.navPoint( E.navLabel(E.text(re.sub(r'\s+', ' ', text))), E.content(src=str(np.href)+(('#' + str(np.fragment)) - if np.fragment else '')), + if np.fragment else '')), id=item_id, playOrder=str(np.play_order) ) @@ -282,7 +285,8 @@ class TOC(list): try: elem.append(C.meta(desc, name='description')) except ValueError: - elem.append(C.meta(clean_xml_chars(desc), name='description')) + elem.append(C.meta(clean_xml_chars(desc), + name='description')) idx = getattr(np, 'toc_thumbnail', None) if idx: elem.append(C.meta(idx, name='toc_thumbnail')) @@ -293,5 +297,5 @@ class TOC(list): for np in self: navpoint(navmap, np) raw = etree.tostring(root, encoding='utf-8', xml_declaration=True, - pretty_print=True) + pretty_print=True) stream.write(raw) diff --git a/ebook_converter/ebooks/metadata/utils.py b/ebook_converter/ebooks/metadata/utils.py index 0fbce09..031c917 100644 --- a/ebook_converter/ebooks/metadata/utils.py +++ b/ebook_converter/ebooks/metadata/utils.py 
@@ -1,12 +1,13 @@ from collections import namedtuple +from lxml import etree + from ebook_converter.ebooks.chardet import xml_to_unicode -from ebook_converter.ebooks.oeb.base import OPF +from ebook_converter.ebooks.oeb import base from ebook_converter.ebooks.oeb.polish.utils import guess_type from ebook_converter.spell import parse_lang_code from ebook_converter.utils.cleantext import clean_xml_chars from ebook_converter.utils.localization import lang_as_iso639_1 -from ebook_converter.utils.xml_parse import safe_xml_fromstring OPFVersion = namedtuple('OPFVersion', 'major minor patch') @@ -35,23 +36,26 @@ def parse_opf(stream_or_path): raw = stream.read() if not raw: raise ValueError('Empty file: '+getattr(stream, 'name', 'stream')) - raw, encoding = xml_to_unicode(raw, strip_encoding_pats=True, resolve_entities=True, assume_utf8=True) + raw, encoding = xml_to_unicode(raw, strip_encoding_pats=True, + resolve_entities=True, assume_utf8=True) raw = raw[raw.find('<'):] - root = safe_xml_fromstring(clean_xml_chars(raw)) + root = etree.fromstring(clean_xml_chars(raw)) if root is None: raise ValueError('Not an OPF file') return root def normalize_languages(opf_languages, mi_languages): - ' Preserve original country codes and use 2-letter lang codes where possible ' + """ + Preserve original country codes and use 2-letter lang codes where possible + """ def parse(x): try: return parse_lang_code(x) except ValueError: return None opf_languages = filter(None, map(parse, opf_languages)) - cc_map = {c.langcode:c.countrycode for c in opf_languages} + cc_map = {c.langcode: c.countrycode for c in opf_languages} mi_languages = filter(None, map(parse, mi_languages)) def norm(x): @@ -83,9 +87,9 @@ def create_manifest_item(root, href_template, id_template, media_type=None): all_hrefs = frozenset(root.xpath('//*/@href')) href = ensure_unique(href_template, all_hrefs) item_id = ensure_unique(id_template, all_ids) - manifest = root.find(OPF('manifest')) + manifest = 
root.find(base.tag('opf', 'manifest')) if manifest is not None: - i = manifest.makeelement(OPF('item')) + i = manifest.makeelement(base.tag('opf', 'item')) i.set('href', href), i.set('id', item_id) i.set('media-type', media_type or guess_type(href_template)) manifest.append(i) @@ -93,6 +97,7 @@ def create_manifest_item(root, href_template, id_template, media_type=None): def pretty_print_opf(root): - from ebook_converter.ebooks.oeb.polish.pretty import pretty_opf, pretty_xml_tree + from ebook_converter.ebooks.oeb.polish.pretty import pretty_opf, \ + pretty_xml_tree pretty_opf(root) pretty_xml_tree(root) diff --git a/ebook_converter/ebooks/metadata/xmp.py b/ebook_converter/ebooks/metadata/xmp.py index fc6e154..e9a7faf 100644 --- a/ebook_converter/ebooks/metadata/xmp.py +++ b/ebook_converter/ebooks/metadata/xmp.py @@ -1,44 +1,43 @@ -import re, sys, copy, json -from itertools import repeat -from collections import defaultdict +import collections +import copy +import itertools +import json +import re +import sys from lxml import etree from lxml.builder import ElementMaker from ebook_converter import prints from ebook_converter.ebooks.metadata import check_isbn, check_doi -from ebook_converter.utils.xml_parse import safe_xml_fromstring from ebook_converter.ebooks.metadata.book.base import Metadata from ebook_converter.ebooks.metadata.opf2 import dump_dict from ebook_converter.utils.date import parse_date, isoformat, now -from ebook_converter.utils.localization import canonicalize_lang, lang_as_iso639_1 +from ebook_converter.utils.localization import canonicalize_lang, \ + lang_as_iso639_1 -__license__ = 'GPL v3' -__copyright__ = '2014, Kovid Goyal <kovid at kovidgoyal.net>' +_xml_declaration = re.compile(r'<\?xml[^<>]+encoding\s*=\s*[\'"](.*?)' + r'[\'"][^<>]*>', re.IGNORECASE) -_xml_declaration = re.compile(r'<\?xml[^<>]+encoding\s*=\s*[\'"](.*?)[\'"][^<>]*>', re.IGNORECASE) - -NS_MAP = { - 'rdf': 'http://www.w3.org/1999/02/22-rdf-syntax-ns#', - 'dc': 
'http://purl.org/dc/elements/1.1/', - 'pdf': 'http://ns.adobe.com/pdf/1.3/', - 'pdfx': 'http://ns.adobe.com/pdfx/1.3/', - 'xmp': 'http://ns.adobe.com/xap/1.0/', - 'xmpidq': 'http://ns.adobe.com/xmp/Identifier/qual/1.0/', - 'xmpMM': 'http://ns.adobe.com/xap/1.0/mm/', - 'xmpRights': 'http://ns.adobe.com/xap/1.0/rights/', - 'xmpBJ': 'http://ns.adobe.com/xap/1.0/bj/', - 'xmpTPg': 'http://ns.adobe.com/xap/1.0/t/pg/', - 'xmpDM': 'http://ns.adobe.com/xmp/1.0/DynamicMedia/', - 'prism': 'http://prismstandard.org/namespaces/basic/2.0/', - 'crossmark': 'http://crossref.org/crossmark/1.0/', - 'xml': 'http://www.w3.org/XML/1998/namespace', - 'x': 'adobe:ns:meta/', - 'calibre': 'http://calibre-ebook.com/xmp-namespace', - 'calibreSI': 'http://calibre-ebook.com/xmp-namespace-series-index', - 'calibreCC': 'http://calibre-ebook.com/xmp-namespace-custom-columns', -} +NS_MAP = {'rdf': 'http://www.w3.org/1999/02/22-rdf-syntax-ns#', + 'dc': 'http://purl.org/dc/elements/1.1/', + 'pdf': 'http://ns.adobe.com/pdf/1.3/', + 'pdfx': 'http://ns.adobe.com/pdfx/1.3/', + 'xmp': 'http://ns.adobe.com/xap/1.0/', + 'xmpidq': 'http://ns.adobe.com/xmp/Identifier/qual/1.0/', + 'xmpMM': 'http://ns.adobe.com/xap/1.0/mm/', + 'xmpRights': 'http://ns.adobe.com/xap/1.0/rights/', + 'xmpBJ': 'http://ns.adobe.com/xap/1.0/bj/', + 'xmpTPg': 'http://ns.adobe.com/xap/1.0/t/pg/', + 'xmpDM': 'http://ns.adobe.com/xmp/1.0/DynamicMedia/', + 'prism': 'http://prismstandard.org/namespaces/basic/2.0/', + 'crossmark': 'http://crossref.org/crossmark/1.0/', + 'xml': 'http://www.w3.org/XML/1998/namespace', + 'x': 'adobe:ns:meta/', + 'calibre': 'http://calibre-ebook.com/xmp-namespace', + 'calibreSI': 'http://calibre-ebook.com/xmp-namespace-series-index', + 'calibreCC': 'http://calibre-ebook.com/xmp-namespace-custom-columns'} KNOWN_ID_SCHEMES = {'isbn', 'url', 'doi'} @@ -63,7 +62,7 @@ def parse_xmp_packet(raw_bytes): pat = r'''<?xpacket\s+[^>]*?begin\s*=\s*['"]([^'"]*)['"]''' encodings = ('8', '16-le', '16-be', '32-le', '32-be') 
header = raw_bytes[:1024] - emap = {'\ufeff'.encode('utf-'+x):'utf-'+x for x in encodings} + emap = {'\ufeff'.encode('utf-'+x): 'utf-'+x for x in encodings} emap[b''] = 'utf-8' for q in encodings: m = re.search(pat.encode('utf-'+q), header) @@ -71,15 +70,19 @@ def parse_xmp_packet(raw_bytes): enc = emap.get(m.group(1), enc) break if enc is None: - return safe_xml_fromstring(raw_bytes) - raw = _xml_declaration.sub('', raw_bytes.decode(enc)) # lxml barfs if encoding declaration present in unicode string - return safe_xml_fromstring(raw) + return etree.fromstring(raw_bytes) + # lxml barfs if encoding declaration present in unicode string + raw = _xml_declaration.sub('', raw_bytes.decode(enc)) + return etree.fromstring(raw) def serialize_xmp_packet(root, encoding='utf-8'): - root.tail = '\n' + '\n'.join(repeat(' '*100, 30)) # Adobe spec recommends inserting padding at the end of the packet - raw_bytes = etree.tostring(root, encoding=encoding, pretty_print=True, with_tail=True, method='xml') - return b'<?xpacket begin="%s" id="W5M0MpCehiHzreSzNTczkc9d"?>\n%s\n<?xpacket end="w"?>' % ('\ufeff'.encode(encoding), raw_bytes) + # Adobe spec recommends inserting padding at the end of the packet + root.tail = '\n' + '\n'.join(itertools.repeat(' '*100, 30)) + raw_bytes = etree.tostring(root, encoding=encoding, pretty_print=True, + with_tail=True, method='xml') + return ('<?xpacket begin="%s" id="W5M0MpCehiHzreSzNTczkc9d"?>\n%s\n' + '<?xpacket end="w"?>' % ('\ufeff'.encode(encoding), raw_bytes)) def read_simple_property(elem): @@ -106,14 +109,15 @@ def read_sequence(parent): yield read_simple_property(item) -def uniq(vals, kmap=lambda x:x): +def uniq(vals, kmap=lambda x: x): ''' Remove all duplicates from vals, while preserving order. 
kmap must be a callable that returns a hashable value for every item in vals ''' vals = vals or () lvals = (kmap(x) for x in vals) seen = set() seen_add = seen.add - return tuple(x for x, k in zip(vals, lvals) if k not in seen and not seen_add(k)) + return tuple(x for x, k in zip(vals, lvals) if k not in seen + and not seen_add(k)) def multiple_sequences(expr, root): @@ -170,7 +174,8 @@ def read_series(root): def read_user_metadata(mi, root): from ebook_converter.utils.config import from_json - from ebook_converter.ebooks.metadata.book.json_codec import decode_is_multiple + from ebook_converter.ebooks.metadata.book.json_codec import \ + decode_is_multiple fields = set() for item in XPath('//calibre:custom_metadata')(root): for li in XPath('./rdf:Bag/rdf:li')(item): @@ -186,7 +191,7 @@ def read_user_metadata(mi, root): decode_is_multiple(fm) mi.set_user_metadata(name, fm) fields.add(name) - except: + except Exception: prints('Failed to read user metadata:', name) import traceback traceback.print_exc() @@ -194,13 +199,17 @@ def read_user_metadata(mi, root): def read_xmp_identifers(parent): ''' For example: - <rdf:li rdf:parseType="Resource"><xmpidq:Scheme>URL</xmp:idq><rdf:value>http://foo.com</rdf:value></rdf:li> + <rdf:li rdf:parseType="Resource"><xmpidq:Scheme>URL</xmp:idq> + <rdf:value>http://foo.com</rdf:value></rdf:li> or the longer form: - <rdf:li><rdf:Description><xmpidq:Scheme>URL</xmp:idq><rdf:value>http://foo.com</rdf:value></rdf:Description></rdf:li> + <rdf:li><rdf:Description><xmpidq:Scheme>URL</xmp:idq> + <rdf:value>http://foo.com</rdf:value></rdf:Description></rdf:li> ''' for li in XPath('./rdf:Bag/rdf:li')(parent): - is_resource = li.attrib.get(expand('rdf:parseType'), None) == 'Resource' - is_resource = is_resource or (len(li) == 1 and li[0].tag == expand('rdf:Description')) + is_resource = li.attrib.get(expand('rdf:parseType'), + None) == 'Resource' + is_resource = is_resource or (len(li) == 1 and + li[0].tag == expand('rdf:Description')) if not 
is_resource: yield None, li.text or '' value = XPath('descendant::rdf:value')(li) @@ -241,12 +250,15 @@ def metadata_from_xmp_packet(raw_bytes): if title.startswith(r'\376\377'): # corrupted XMP packet generated by Nitro PDF. See # https://bugs.launchpad.net/calibre/+bug/1541981 - raise ValueError('Corrupted XMP metadata packet detected, probably generated by Nitro PDF') + raise ValueError('Corrupted XMP metadata packet detected, ' + 'probably generated by Nitro PDF') mi.title = title authors = multiple_sequences('//dc:creator', root) if authors: mi.authors = authors - tags = multiple_sequences('//dc:subject', root) or multiple_sequences('//pdf:Keywords', root) + tags = multiple_sequences('//dc:subject', + root) or multiple_sequences('//pdf:Keywords', + root) if tags: mi.tags = tags comments = first_alt('//dc:description', root) @@ -256,8 +268,10 @@ def metadata_from_xmp_packet(raw_bytes): if publishers: mi.publisher = publishers[0] try: - pubdate = parse_date(first_sequence('//dc:date', root) or first_simple('//xmp:CreateDate', root), assume_utc=False) - except: + pubdate = (parse_date(first_sequence('//dc:date', root) or + first_simple('//xmp:CreateDate', root), + assume_utc=False)) + except Exception: pass else: mi.pubdate = pubdate @@ -291,7 +305,7 @@ def metadata_from_xmp_packet(raw_bytes): if val: try: setattr(mi, x, json.loads(val)) - except: + except Exception: pass languages = multiple_sequences('//dc:language', root) @@ -319,7 +333,7 @@ def metadata_from_xmp_packet(raw_bytes): identifiers[scheme] = val # Check Dublin Core for recognizable identifier types - for scheme, check_func in {'doi':check_doi, 'isbn':check_isbn}.items(): + for scheme, check_func in {'doi': check_doi, 'isbn': check_isbn}.items(): if scheme not in identifiers: val = check_func(first_simple('//dc:identifier', root)) if val: @@ -359,17 +373,21 @@ def consolidate_metadata(info_mi, info): else: prefer_info = info_date > xmp_mi.metadata_date if prefer_info: - info_mi.title, 
info_mi.authors, info_mi.tags = info_title, info_authors, info_tags + info_mi.title = info_title + info_mi.authors = info_authors + info_mi.tags = info_tags else: # We'll use the xmp tags/authors but fallback to the info ones if the - # xmp does not have tags/authors. smart_update() should have taken care of - # the rest - info_mi.authors, info_mi.tags = (info_authors if xmp_mi.is_null('authors') else xmp_mi.authors), xmp_mi.tags or info_tags + # xmp does not have tags/authors. smart_update() should have taken care + # of the rest + info_mi.authors = (info_authors if xmp_mi.is_null('authors') + else xmp_mi.authors) + info_mi.tags = xmp_mi.tags or info_tags return info_mi def nsmap(*args): - return {x:NS_MAP[x] for x in args} + return {x: NS_MAP[x] for x in args} def create_simple_property(parent, tag, value): @@ -435,7 +453,8 @@ def create_series(calibre, series, series_index): def create_user_metadata(calibre, all_user_metadata): from ebook_converter.utils.config import to_json - from ebook_converter.ebooks.metadata.book.json_codec import object_to_unicode, encode_is_multiple + from ebook_converter.ebooks.metadata.book.json_codec import \ + object_to_unicode, encode_is_multiple s = calibre.makeelement(expand('calibre:custom_metadata')) calibre.append(s) @@ -447,7 +466,7 @@ def create_user_metadata(calibre, all_user_metadata): encode_is_multiple(fm) fm = object_to_unicode(fm) fm = json.dumps(fm, default=to_json, ensure_ascii=False) - except: + except Exception: prints('Failed to write user metadata:', name) import traceback traceback.print_exc() @@ -471,7 +490,8 @@ def metadata_to_xmp_packet(mi): dc = rdf.makeelement(expand('rdf:Description'), nsmap=nsmap('dc')) dc.set(expand('rdf:about'), '') rdf.append(dc) - for prop, tag in {'title':'dc:title', 'comments':'dc:description'}.items(): + for prop, tag in {'title': 'dc:title', + 'comments': 'dc:description'}.items(): val = mi.get(prop) or '' create_alt_property(dc, tag, val) for prop, (tag, ordered) in {'authors': 
('dc:creator', True), @@ -482,18 +502,23 @@ def metadata_to_xmp_packet(mi): val = [val] create_sequence_property(dc, tag, val, ordered) if not mi.is_null('pubdate'): - create_sequence_property(dc, 'dc:date', [isoformat(mi.pubdate, as_utc=False)]) # Adobe spec recommends local time + # Adobe spec recommends local time + create_sequence_property(dc, 'dc:date', + [isoformat(mi.pubdate, as_utc=False)]) if not mi.is_null('languages'): - langs = list(filter(None, map(lambda x:lang_as_iso639_1(x) or canonicalize_lang(x), mi.languages))) + langs = list(filter(None, map(lambda x: lang_as_iso639_1(x) or + canonicalize_lang(x), mi.languages))) if langs: create_sequence_property(dc, 'dc:language', langs, ordered=False) - xmp = rdf.makeelement(expand('rdf:Description'), nsmap=nsmap('xmp', 'xmpidq')) + xmp = rdf.makeelement(expand('rdf:Description'), + nsmap=nsmap('xmp', 'xmpidq')) xmp.set(expand('rdf:about'), '') rdf.append(xmp) extra_ids = {} for x in ('prism', 'pdfx'): - p = extra_ids[x] = rdf.makeelement(expand('rdf:Description'), nsmap=nsmap(x)) + p = extra_ids[x] = rdf.makeelement(expand('rdf:Description'), + nsmap=nsmap(x)) p.set(expand('rdf:about'), '') rdf.append(p) @@ -503,7 +528,7 @@ def metadata_to_xmp_packet(mi): for scheme, val in identifiers.items(): if scheme in {'isbn', 'doi'}: for prefix, parent in extra_ids.items(): - ie = parent.makeelement(expand('%s:%s'%(prefix, scheme))) + ie = parent.makeelement(expand('%s:%s' % (prefix, scheme))) ie.text = val parent.append(ie) @@ -511,7 +536,8 @@ def metadata_to_xmp_packet(mi): d.text = isoformat(now(), as_utc=False) xmp.append(d) - calibre = rdf.makeelement(expand('rdf:Description'), nsmap=nsmap('calibre', 'calibreSI', 'calibreCC')) + calibre = rdf.makeelement(expand('rdf:Description'), + nsmap=nsmap('calibre', 'calibreSI', 'calibreCC')) calibre.set(expand('rdf:about'), '') rdf.append(calibre) if not mi.is_null('rating'): @@ -524,7 +550,8 @@ def metadata_to_xmp_packet(mi): if not mi.is_null('series'): 
create_series(calibre, mi.series, mi.series_index) if not mi.is_null('timestamp'): - create_simple_property(calibre, 'calibre:timestamp', isoformat(mi.timestamp, as_utc=False)) + create_simple_property(calibre, 'calibre:timestamp', + isoformat(mi.timestamp, as_utc=False)) for x in ('author_link_map', 'user_categories'): val = getattr(mi, x, None) if val: @@ -550,10 +577,11 @@ def find_used_namespaces(elem): def find_preferred_prefix(namespace, elems): for elem in elems: - ans = {v:k for k, v in elem.nsmap.items()}.get(namespace, None) + ans = {v: k for k, v in elem.nsmap.items()}.get(namespace, None) if ans is not None: return ans - return find_preferred_prefix(namespace, elem.iterchildren(etree.Element)) + return find_preferred_prefix(namespace, + elem.iterchildren(etree.Element)) def find_nsmap(elems): @@ -562,7 +590,7 @@ def find_nsmap(elems): used_namespaces |= find_used_namespaces(elem) ans = {} used_namespaces -= {NS_MAP['xml'], NS_MAP['x'], None, NS_MAP['rdf']} - rmap = {v:k for k, v in NS_MAP.items()} + rmap = {v: k for k, v in NS_MAP.items()} i = 0 for ns in used_namespaces: if ns in rmap: @@ -578,7 +606,10 @@ def find_nsmap(elems): def clone_into(parent, elem): - ' Clone the element, assuming that all namespace declarations are present in parent ' + """ + Clone the element, assuming that all namespace declarations are present + in parent + """ clone = parent.makeelement(elem.tag) parent.append(clone) if elem.text and not elem.text.isspace(): @@ -591,28 +622,38 @@ def clone_into(parent, elem): def merge_xmp_packet(old, new): - ''' Merge metadata present in the old packet that is not present in the new + """ + Merge metadata present in the old packet that is not present in the new one into the new one. 
Assumes the new packet was generated by - metadata_to_xmp_packet() ''' + metadata_to_xmp_packet() + """ old, new = parse_xmp_packet(old), parse_xmp_packet(new) - # As per the adobe spec all metadata items have to be present inside top-level rdf:Description containers + # As per the adobe spec all metadata items have to be present inside + # top-level rdf:Description containers item_xpath = XPath('//rdf:RDF/rdf:Description/*') # First remove all data fields that metadata_to_xmp_packet() knowns about, # since either they will have been set or if not present, imply they have # been cleared - defined_tags = {expand(prefix + ':' + scheme) for prefix in ('prism', 'pdfx') for scheme in KNOWN_ID_SCHEMES} - defined_tags |= {expand('dc:' + x) for x in ('identifier', 'title', 'creator', 'date', 'description', 'language', 'publisher', 'subject')} - defined_tags |= {expand('xmp:' + x) for x in ('MetadataDate', 'Identifier')} + defined_tags = {expand(prefix + ':' + scheme) + for prefix in ('prism', 'pdfx') + for scheme in KNOWN_ID_SCHEMES} + defined_tags |= {expand('dc:' + x) + for x in ('identifier', 'title', 'creator', 'date', + 'description', 'language', 'publisher', + 'subject')} + defined_tags |= {expand('xmp:' + x) + for x in ('MetadataDate', 'Identifier')} # For redundancy also remove all fields explicitly set in the new packet defined_tags |= {x.tag for x in item_xpath(new)} calibrens = '{%s}' % NS_MAP['calibre'] for elem in item_xpath(old): - if elem.tag in defined_tags or (elem.tag and elem.tag.startswith(calibrens)): + if elem.tag in defined_tags or (elem.tag and + elem.tag.startswith(calibrens)): elem.getparent().remove(elem) # Group all items into groups based on their namespaces - groups = defaultdict(list) + groups = collections.defaultdict(list) for item in item_xpath(new): ns = item.nsmap[item.prefix] groups[ns].append(item) @@ -626,9 +667,14 @@ def merge_xmp_packet(old, new): root = A.xmpmeta(R.RDF) rdf = root[0] - for namespace in sorted(groups, key=lambda 
x:{NS_MAP['dc']:'a', NS_MAP['xmp']:'b', NS_MAP['calibre']:'c'}.get(x, 'z'+x)): + for namespace in sorted(groups, + key=lambda x: {NS_MAP['dc']: 'a', + NS_MAP['xmp']: 'b', + NS_MAP['calibre']: 'c'}.get(x, + 'z'+x)): items = groups[namespace] - desc = rdf.makeelement(expand('rdf:Description'), nsmap=find_nsmap(items)) + desc = rdf.makeelement(expand('rdf:Description'), + nsmap=find_nsmap(items)) desc.set(expand('rdf:about'), '') rdf.append(desc) for item in items: diff --git a/ebook_converter/ebooks/mobi/mobiml.py b/ebook_converter/ebooks/mobi/mobiml.py index 07cea1c..d833d88 100644 --- a/ebook_converter/ebooks/mobi/mobiml.py +++ b/ebook_converter/ebooks/mobi/mobiml.py @@ -5,8 +5,10 @@ import copy import re import numbers from lxml import etree -from ebook_converter.ebooks.oeb.base import namespace, barename -from ebook_converter.ebooks.oeb.base import XHTML, XHTML_NS, urlnormalize + +from ebook_converter import constants as const +from ebook_converter.ebooks.oeb import base +from ebook_converter.ebooks.oeb import parse_utils from ebook_converter.ebooks.oeb.stylizer import Stylizer from ebook_converter.ebooks.oeb.transforms.flatcss import KeyMapper from ebook_converter.ebooks.mobi.utils import convert_color_for_font_tag @@ -23,7 +25,7 @@ def MBP(name): return '{%s}%s' % (MBP_NS, name) -MOBI_NSMAP = {None: XHTML_NS, 'mbp': MBP_NS} +MOBI_NSMAP = {None: const.XHTML_NS, 'mbp': const.MBP_NS} INLINE_TAGS = {'span', 'a', 'code', 'u', 's', 'big', 'strike', 'tt', 'font', 'q', 'i', 'b', 'em', 'strong', 'sup', 'sub'} HEADER_TAGS = {'h1', 'h2', 'h3', 'h4', 'h5', 'h6'} # GR: Added 'caption' to both sets @@ -129,9 +131,9 @@ class MobiMLizer(object): 'Iterate over the spine and convert it to MOBIML' for item in self.oeb.spine: stylizer = Stylizer(item.data, item.href, self.oeb, self.opts, self.profile) - body = item.data.find(XHTML('body')) - nroot = etree.Element(XHTML('html'), nsmap=MOBI_NSMAP) - nbody = etree.SubElement(nroot, XHTML('body')) + body = 
item.data.find(base.tag('xhtml', 'body')) + nroot = etree.Element(base.tag('xhtml', 'html'), nsmap=MOBI_NSMAP) + nbody = etree.SubElement(nroot, base.tag('xhtml', 'body')) self.current_spine_item = item self.mobimlize_elem(body, stylizer, BlockState(nbody), [FormatState()]) @@ -162,7 +164,7 @@ class MobiMLizer(object): lines = text.split('\n') result = lines[:1] for line in lines[1:]: - result.append(etree.Element(XHTML('br'))) + result.append(etree.Element(base.tag('xhtml', 'br'))) if line: result.append(line) return result @@ -194,7 +196,7 @@ class MobiMLizer(object): indent = (indent / abs(indent)) * self.profile.fbase if tag in NESTABLE_TAGS and not istate.rendered: para = wrapper = etree.SubElement( - parent, XHTML(tag), attrib=istate.attrib) + parent, base.tag('xhtml', tag), attrib=istate.attrib) bstate.nested.append(para) if tag == 'li' and len(istates) > 1: istates[-2].list_num += 1 @@ -203,21 +205,21 @@ class MobiMLizer(object): para = wrapper = bstate.nested[-1] elif not self.opts.mobi_ignore_margins and left > 0 and indent >= 0: ems = self.profile.mobi_ems_per_blockquote - para = wrapper = etree.SubElement(parent, XHTML('blockquote')) + para = wrapper = etree.SubElement(parent, base.tag('xhtml', 'blockquote')) para = wrapper emleft = int(round(left / self.profile.fbase)) - ems emleft = min((emleft, 10)) while emleft > ems / 2: - para = etree.SubElement(para, XHTML('blockquote')) + para = etree.SubElement(para, base.tag('xhtml', 'blockquote')) emleft -= ems else: - para = wrapper = etree.SubElement(parent, XHTML('p')) + para = wrapper = etree.SubElement(parent, base.tag('xhtml', 'p')) bstate.inline = bstate.para = para vspace = bstate.vpadding + bstate.vmargin bstate.vpadding = bstate.vmargin = 0 if tag not in TABLE_TAGS: if tag in ('ul', 'ol') and vspace > 0: - wrapper.addprevious(etree.Element(XHTML('div'), + wrapper.addprevious(etree.Element(base.tag('xhtml', 'div'), height=self.mobimlize_measure(vspace))) else: wrapper.attrib['height'] = 
self.mobimlize_measure(vspace) @@ -225,7 +227,7 @@ class MobiMLizer(object): elif tag == 'table' and vspace > 0: vspace = int(round(vspace / self.profile.fbase)) while vspace > 0: - wrapper.addprevious(etree.Element(XHTML('br'))) + wrapper.addprevious(etree.Element(base.tag('xhtml', 'br'))) vspace -= 1 if istate.halign != 'auto' and isinstance(istate.halign, (bytes, str)): if isinstance(istate.halign, bytes): @@ -237,7 +239,7 @@ class MobiMLizer(object): bstate.inline = para pstate = bstate.istate = None try: - etree.SubElement(para, XHTML(tag), attrib=istate.attrib) + etree.SubElement(para, base.tag('xhtml', tag), attrib=istate.attrib) except: print('Invalid subelement:', para, tag, istate.attrib) raise @@ -245,7 +247,7 @@ class MobiMLizer(object): para.attrib['valign'] = 'top' if istate.ids: for id_ in istate.ids: - anchor = etree.Element(XHTML('a'), attrib={'id': id_}) + anchor = etree.Element(base.tag('xhtml', 'a'), attrib={'id': id_}) if tag == 'li': try: last = bstate.body[-1][-1] @@ -262,7 +264,7 @@ class MobiMLizer(object): # This could potentially break if inserting an anchor at # this point in the markup is illegal, but I cannot think # of such a case offhand. 
- if barename(last.tag) in LEAF_TAGS: + if parse_utils.barename(last.tag) in LEAF_TAGS: last.addprevious(anchor) else: last.append(anchor) @@ -279,28 +281,28 @@ class MobiMLizer(object): elif pstate and pstate.href == href: inline = bstate.anchor else: - inline = etree.SubElement(inline, XHTML('a'), href=href) + inline = etree.SubElement(inline, base.tag('xhtml', 'a'), href=href) bstate.anchor = inline if fsize != 3: - inline = etree.SubElement(inline, XHTML('font'), + inline = etree.SubElement(inline, base.tag('xhtml', 'font'), size=str(fsize)) if istate.family == 'monospace': - inline = etree.SubElement(inline, XHTML('tt')) + inline = etree.SubElement(inline, base.tag('xhtml', 'tt')) if istate.italic: - inline = etree.SubElement(inline, XHTML('i')) + inline = etree.SubElement(inline, base.tag('xhtml', 'i')) if istate.bold: - inline = etree.SubElement(inline, XHTML('b')) + inline = etree.SubElement(inline, base.tag('xhtml', 'b')) if istate.bgcolor is not None and istate.bgcolor != 'transparent' : - inline = etree.SubElement(inline, XHTML('span'), + inline = etree.SubElement(inline, base.tag('xhtml', 'span'), bgcolor=convert_color_for_font_tag(istate.bgcolor)) if istate.fgcolor != 'black': - inline = etree.SubElement(inline, XHTML('font'), + inline = etree.SubElement(inline, base.tag('xhtml', 'font'), color=convert_color_for_font_tag(istate.fgcolor)) if istate.strikethrough: - inline = etree.SubElement(inline, XHTML('s')) + inline = etree.SubElement(inline, base.tag('xhtml', 's')) if istate.underline: - inline = etree.SubElement(inline, XHTML('u')) + inline = etree.SubElement(inline, base.tag('xhtml', 'u')) bstate.inline = inline bstate.istate = istate inline = bstate.inline @@ -318,7 +320,7 @@ class MobiMLizer(object): def mobimlize_elem(self, elem, stylizer, bstate, istates, ignore_valign=False): if not isinstance(elem.tag, (str, bytes)) \ - or namespace(elem.tag) != XHTML_NS: + or parse_utils.namespace(elem.tag) != const.XHTML_NS: return style = 
stylizer.style(elem) # <mbp:frame-set/> does not exist lalalala @@ -333,10 +335,10 @@ class MobiMLizer(object): elem.text = None elem.set('id', id_) elem.tail = tail - elem.tag = XHTML('a') + elem.tag = base.tag('xhtml', 'a') else: return - tag = barename(elem.tag) + tag = parse_utils.barename(elem.tag) istate = copy.copy(istates[-1]) istate.rendered = False istate.list_num = 0 @@ -451,7 +453,7 @@ class MobiMLizer(object): if 'width' not in istate.attrib or 'height' not in istate.attrib: href = self.current_spine_item.abshref(elem.attrib['src']) try: - item = self.oeb.manifest.hrefs[urlnormalize(href)] + item = self.oeb.manifest.hrefs[base.urlnormalize(href)] except: self.oeb.logger.warn('Failed to find image:', href) @@ -534,9 +536,9 @@ class MobiMLizer(object): isinstance(valign, numbers.Number) and valign > 0) vtag = 'sup' if issup else 'sub' if not_baseline and not ignore_valign and tag not in NOT_VTAGS and not isblock: - nroot = etree.Element(XHTML('html'), nsmap=MOBI_NSMAP) - vbstate = BlockState(etree.SubElement(nroot, XHTML('body'))) - vbstate.para = etree.SubElement(vbstate.body, XHTML('p')) + nroot = etree.Element(base.tag('xhtml', 'html'), nsmap=MOBI_NSMAP) + vbstate = BlockState(etree.SubElement(nroot, base.tag('xhtml', 'body'))) + vbstate.para = etree.SubElement(vbstate.body, base.tag('xhtml', 'p')) self.mobimlize_elem(elem, stylizer, vbstate, istates, ignore_valign=True) if len(istates) > 0: @@ -548,8 +550,8 @@ class MobiMLizer(object): self.mobimlize_content('span', '', bstate, istates) parent = bstate.para if bstate.inline is None else bstate.inline if parent is not None: - vtag = etree.SubElement(parent, XHTML(vtag)) - vtag = etree.SubElement(vtag, XHTML('small')) + vtag = etree.SubElement(parent, base.tag('xhtml', vtag)) + vtag = etree.SubElement(vtag, base.tag('xhtml', 'small')) # Add anchors for child in vbstate.body: if child is not vbstate.para: @@ -601,7 +603,7 @@ class MobiMLizer(object): para = bstate.para if para is not None and para.text 
== '\xa0' and len(para) < 1: if style.height > 2: - para.getparent().replace(para, etree.Element(XHTML('br'))) + para.getparent().replace(para, etree.Element(base.tag('xhtml', 'br'))) else: # This is too small to be rendered effectively, drop it para.getparent().remove(para) diff --git a/ebook_converter/ebooks/mobi/reader/mobi8.py b/ebook_converter/ebooks/mobi/reader/mobi8.py index a50d6bc..02b2f0e 100644 --- a/ebook_converter/ebooks/mobi/reader/mobi8.py +++ b/ebook_converter/ebooks/mobi/reader/mobi8.py @@ -8,6 +8,7 @@ import uuid from lxml import etree +from ebook_converter import constants as const from ebook_converter.ebooks.mobi.reader.headers import NULL_INDEX from ebook_converter.ebooks.mobi.reader.index import read_index from ebook_converter.ebooks.mobi.reader.ncx import read_ncx, build_toc @@ -17,7 +18,7 @@ from ebook_converter.ebooks.metadata.opf2 import Guide, OPFCreator from ebook_converter.ebooks.metadata.toc import TOC from ebook_converter.ebooks.mobi.utils import read_font_record from ebook_converter.ebooks.oeb.parse_utils import parse_html -from ebook_converter.ebooks.oeb.base import XPath, XHTML, xml2text +from ebook_converter.ebooks.oeb.base import XPath, xml2text from ebook_converter.polyglot.builtins import as_unicode @@ -553,8 +554,8 @@ class Mobi8Reader(object): seen = set() links = [] for elem in root.iterdescendants(etree.Element): - if reached and elem.tag == XHTML('a') and elem.get('href', - False): + if reached and elem.tag == const.XHTML_A and elem.get('href', + False): href = elem.get('href') href, frag = urllib.parse.urldefrag(href) href = base_href + '/' + href diff --git a/ebook_converter/ebooks/mobi/writer2/serializer.py b/ebook_converter/ebooks/mobi/writer2/serializer.py index c1f2587..6d0ae8d 100644 --- a/ebook_converter/ebooks/mobi/writer2/serializer.py +++ b/ebook_converter/ebooks/mobi/writer2/serializer.py @@ -4,16 +4,11 @@ import re import unicodedata import urllib.parse +from ebook_converter import constants as const from 
ebook_converter.ebooks.mobi.mobiml import MBP_NS from ebook_converter.ebooks.mobi.utils import is_guide_ref_start -from ebook_converter.ebooks.oeb.base import ( - OEB_DOCS, XHTML, XHTML_NS, XML_NS, namespace, prefixname, urlnormalize -) - - -__license__ = 'GPL v3' -__copyright__ = '2011, Kovid Goyal <kovid@kovidgoyal.net>' -__docformat__ = 'restructuredtext en' +from ebook_converter.ebooks.oeb import base +from ebook_converter.ebooks.oeb import parse_utils class Buf(io.BytesIO): @@ -25,9 +20,14 @@ class Buf(io.BytesIO): class Serializer(object): - NSRMAP = {'': None, XML_NS: 'xml', XHTML_NS: '', MBP_NS: 'mbp'} + NSRMAP = {'': None, + const.XML_NS: 'xml', + const.XHTML_NS: '', + MBP_NS: 'mbp'} # TODO(gryf): check why this is different than + # MBP_NS from const. - def __init__(self, oeb, images, is_periodical, write_page_breaks_after_item=True): + def __init__(self, oeb, images, is_periodical, + write_page_breaks_after_item=True): ''' Write all the HTML markup in oeb into a single in memory buffer containing a single html document with links replaced by offsets into @@ -157,7 +157,8 @@ class Serializer(object): buf.write(b'<guide>') for ref in self.oeb.guide.values(): path = urllib.parse.urldefrag(ref.href)[0] - if path not in hrefs or hrefs[path].media_type not in OEB_DOCS: + if (path not in hrefs or + hrefs[path].media_type not in base.OEB_DOCS): continue buf.write(b'<reference type="') @@ -178,28 +179,28 @@ class Serializer(object): buf.write(b'</guide>') - def serialize_href(self, href, base=None): - ''' + def serialize_href(self, href, _base=None): + """ Serialize the href attribute of an <a> or <reference> tag. It is serialized as filepos="000000000" and a pointer to its location is stored in self.href_offsets so that the correct value can be filled in at the end. 
- ''' + """ hrefs = self.oeb.manifest.hrefs try: - path, frag = urllib.parse.urldefrag(urlnormalize(href)) + path, frag = urllib.parse.urldefrag(base.urlnormalize(href)) except ValueError: # Unparseable URL return False - if path and base: - path = base.abshref(path) + if path and _base: + path = _base.abshref(path) if path and path not in hrefs: return False buf = self.buf item = hrefs[path] if path else None if item and item.spine_position is None: return False - path = item.href if item else base.href + path = item.href if item else _base.href href = '#'.join((path, frag)) if frag else path buf.write(b'filepos=') self.href_offsets[href].append(buf.tell()) @@ -219,7 +220,7 @@ class Serializer(object): if href is not None: # resolve the section url in id_offsets buf.write(b'<mbp:pagebreak />') - self.id_offsets[urlnormalize(href)] = buf.tell() + self.id_offsets[base.urlnormalize(href)] = buf.tell() if tocref.klass == "periodical": buf.write(b'<div> <div height="1em"></div>') @@ -267,7 +268,7 @@ class Serializer(object): if self.is_periodical and item.is_section_start: for section_toc in top_toc.nodes: - if urlnormalize(item.href) == section_toc.href: + if base.urlnormalize(item.href) == section_toc.href: # create section url of the form r'feed_\d+/index.html' section_url = re.sub(r'article_\d+/', '', section_toc.href) serialize_toc_level(section_toc, section_url) @@ -287,12 +288,12 @@ class Serializer(object): buf = self.buf if not item.linear: self.breaks.append(buf.tell() - 1) - self.id_offsets[urlnormalize(item.href)] = buf.tell() + self.id_offsets[base.urlnormalize(item.href)] = buf.tell() if item.is_section_start: buf.write(b'<a ></a> ') if item.is_article_start: buf.write(b'<a ></a> <a ></a>') - for elem in item.data.find(XHTML('body')): + for elem in item.data.find(base.tag('xhtml', 'body')): self.serialize_elem(elem, item) if self.write_page_breaks_after_item: buf.write(b'<mbp:pagebreak/>') @@ -306,15 +307,15 @@ class Serializer(object): def 
serialize_elem(self, elem, item, nsrmap=NSRMAP): buf = self.buf if not isinstance(elem.tag, (str, bytes)) \ - or namespace(elem.tag) not in nsrmap: + or parse_utils.namespace(elem.tag) not in nsrmap: return - tag = prefixname(elem.tag, nsrmap) + tag = base.prefixname(elem.tag, nsrmap) # Previous layers take care of @name id_ = elem.attrib.pop('id', None) if id_: href = '#'.join((item.href, id_)) offset = self.anchor_offset or buf.tell() - key = urlnormalize(href) + key = base.urlnormalize(href) # Only set this id_offset if it wasn't previously seen self.id_offsets[key] = self.id_offsets.get(key, offset) if self.anchor_offset is not None and \ @@ -326,15 +327,15 @@ class Serializer(object): buf.write(tag.encode('utf-8')) if elem.attrib: for attr, val in elem.attrib.items(): - if namespace(attr) not in nsrmap: + if parse_utils.namespace(attr) not in nsrmap: continue - attr = prefixname(attr, nsrmap) + attr = base.prefixname(attr, nsrmap) buf.write(b' ') if attr == 'href': if self.serialize_href(val, item): continue elif attr == 'src': - href = urlnormalize(item.abshref(val)) + href = base.urlnormalize(item.abshref(val)) if href in self.images: index = self.images[href] self.used_images.add(href) diff --git a/ebook_converter/ebooks/mobi/writer8/exth.py b/ebook_converter/ebooks/mobi/writer8/exth.py index 435aa23..4c3ed6e 100644 --- a/ebook_converter/ebooks/mobi/writer8/exth.py +++ b/ebook_converter/ebooks/mobi/writer8/exth.py @@ -2,6 +2,7 @@ import re from struct import pack from io import BytesIO +from ebook_converter.ebooks.oeb import base from ebook_converter.constants_old import iswindows, isosx from ebook_converter.ebooks.mobi.utils import (utf8_text, to_base) from ebook_converter.utils.localization import lang_as_iso639_1 @@ -95,9 +96,8 @@ def build_exth(metadata, prefer_author_sort=False, is_periodical=False, # Write UUID as ASIN uuid = None - from ebook_converter.ebooks.oeb.base import OPF for x in metadata['identifier']: - if (x.get(OPF('scheme'), 
None).lower() == 'uuid' or + if (x.get(base.tag('opf', 'scheme'), None).lower() == 'uuid' or str(x).startswith('urn:uuid:')): uuid = str(x).split(':')[-1] break diff --git a/ebook_converter/ebooks/odt/input.py b/ebook_converter/ebooks/odt/input.py index ab3f5e2..ba6b7bf 100644 --- a/ebook_converter/ebooks/odt/input.py +++ b/ebook_converter/ebooks/odt/input.py @@ -1,11 +1,12 @@ """ Convert an ODT file into a Open Ebook """ -import os, logging +import logging +import os -from lxml import etree from css_parser import CSSParser from css_parser.css import CSSRule +from lxml import etree from odf.odf2xhtml import ODF2XHTML from odf.opendocument import load as odLoad @@ -14,15 +15,9 @@ from odf.namespaces import TEXTNS as odTEXTNS from ebook_converter import CurrentDir, walk from ebook_converter.ebooks.oeb.base import _css_logger -from ebook_converter.utils.xml_parse import safe_xml_fromstring from ebook_converter.polyglot.builtins import as_bytes -__license__ = 'GPL v3' -__copyright__ = '2008, Kovid Goyal kovid@kovidgoyal.net' -__docformat__ = 'restructuredtext en' - - class Extract(ODF2XHTML): def extract_pictures(self, zf): @@ -46,7 +41,7 @@ class Extract(ODF2XHTML): ol.set('start', val) def fix_markup(self, html, log): - root = safe_xml_fromstring(html) + root = etree.fromstring(html) self.filter_css(root, log) self.extract_css(root, log) self.epubify_markup(root, log) diff --git a/ebook_converter/ebooks/oeb/base.py b/ebook_converter/ebooks/oeb/base.py index 2862fd9..769c87b 100644 --- a/ebook_converter/ebooks/oeb/base.py +++ b/ebook_converter/ebooks/oeb/base.py @@ -1,97 +1,45 @@ """ Basic support for manipulating OEB 1.x/2.0 content and metadata. 
""" -import os, re, logging, sys, numbers -from collections import defaultdict -from itertools import count -from operator import attrgetter -import urllib.parse +import collections +import itertools +import logging +import numbers +import operator +import os +import re import string +import sys +import urllib.parse -from lxml import etree, html +from lxml import etree +from lxml import html + +from ebook_converter import constants as const from ebook_converter import force_unicode from ebook_converter.constants_old import filesystem_encoding, __version__ -from ebook_converter.utils.xml_parse import safe_xml_fromstring from ebook_converter.ebooks.chardet import xml_to_unicode from ebook_converter.ebooks.conversion.preprocess import CSSPreProcessor from ebook_converter import (isbytestring, as_unicode, get_types_map) -from ebook_converter.ebooks.oeb.parse_utils import barename, XHTML_NS, namespace, XHTML, parse_html, NotHTML +from ebook_converter.ebooks.oeb import parse_utils from ebook_converter.utils.cleantext import clean_xml_chars from ebook_converter.utils.short_uuid import uuid4 from ebook_converter.polyglot.urllib import unquote as urlunquote -__license__ = 'GPL v3' -__copyright__ = '2008, Marshall T. 
Vandegrift <llasram@gmail.com>' -__docformat__ = 'restructuredtext en' - -XML_NS = 'http://www.w3.org/XML/1998/namespace' -OEB_DOC_NS = 'http://openebook.org/namespaces/oeb-document/1.0/' -OPF1_NS = 'http://openebook.org/namespaces/oeb-package/1.0/' -OPF2_NS = 'http://www.idpf.org/2007/opf' -OPF_NSES = {OPF1_NS, OPF2_NS} -DC09_NS = 'http://purl.org/metadata/dublin_core' -DC10_NS = 'http://purl.org/dc/elements/1.0/' -DC11_NS = 'http://purl.org/dc/elements/1.1/' -DC_NSES = {DC09_NS, DC10_NS, DC11_NS} -XSI_NS = 'http://www.w3.org/2001/XMLSchema-instance' -DCTERMS_NS = 'http://purl.org/dc/terms/' -NCX_NS = 'http://www.daisy.org/z3986/2005/ncx/' -SVG_NS = 'http://www.w3.org/2000/svg' -XLINK_NS = 'http://www.w3.org/1999/xlink' -CALIBRE_NS = 'http://calibre.kovidgoyal.net/2009/metadata' -RE_NS = 'http://exslt.org/regular-expressions' -MBP_NS = 'http://www.mobipocket.com' -EPUB_NS = 'http://www.idpf.org/2007/ops' -MATHML_NS = 'http://www.w3.org/1998/Math/MathML' - -XPNSMAP = { - 'h': XHTML_NS, 'o1': OPF1_NS, 'o2': OPF2_NS, 'd09': DC09_NS, - 'd10': DC10_NS, 'd11': DC11_NS, 'xsi': XSI_NS, 'dt': DCTERMS_NS, - 'ncx': NCX_NS, 'svg': SVG_NS, 'xl': XLINK_NS, 're': RE_NS, - 'mathml': MATHML_NS, 'mbp': MBP_NS, 'calibre': CALIBRE_NS, - 'epub':EPUB_NS -} - -OPF1_NSMAP = {'dc': DC11_NS, 'oebpackage': OPF1_NS} -OPF2_NSMAP = {'opf': OPF2_NS, 'dc': DC11_NS, 'dcterms': DCTERMS_NS, - 'xsi': XSI_NS, 'calibre': CALIBRE_NS} - - -def XML(name): - return '{%s}%s' % (XML_NS, name) - - -def OPF(name): - return '{%s}%s' % (OPF2_NS, name) - - -def DC(name): - return '{%s}%s' % (DC11_NS, name) - - -def XSI(name): - return '{%s}%s' % (XSI_NS, name) - - -def DCTERMS(name): - return '{%s}%s' % (DCTERMS_NS, name) - - -def NCX(name): - return '{%s}%s' % (NCX_NS, name) - - -def SVG(name): - return '{%s}%s' % (SVG_NS, name) - - -def XLINK(name): - return '{%s}%s' % (XLINK_NS, name) - - -def CALIBRE(name): - return '{%s}%s' % (CALIBRE_NS, name) +def tag(tag_ns, name): + tag_map = {'calibre': 
const.CALIBRE_NS, + 'dc': const.DC11_NS, + 'dcterms': const.DCTERMS_NS, + 'epub': const.EPUB_NS, + 'ncx': const.NCX_NS, + 'opf': const.OPF2_NS, + 'svg': const.SVG_NS, + 'xhtml': const.XHTML_NS, + 'xlink': const.XLINK_NS, + 'xml': const.XML_NS, + 'xsi': const.XSI_NS} + return '{%s}%s' % (tag_map[tag_ns], name) _css_url_re = re.compile(r'url\s*\([\'"]{0,1}(.*?)[\'"]{0,1}\)', re.I) @@ -99,14 +47,18 @@ _css_import_re = re.compile(r'@import "(.*?)"') _archive_re = re.compile(r'[^ ]+') # Tags that should not be self closed in epub output -self_closing_bad_tags = {'a', 'abbr', 'address', 'article', 'aside', 'audio', 'b', -'bdo', 'blockquote', 'body', 'button', 'cite', 'code', 'dd', 'del', 'details', -'dfn', 'div', 'dl', 'dt', 'em', 'fieldset', 'figcaption', 'figure', 'footer', -'h1', 'h2', 'h3', 'h4', 'h5', 'h6', 'header', 'hgroup', 'i', 'iframe', 'ins', 'kbd', -'label', 'legend', 'li', 'map', 'mark', 'meter', 'nav', 'ol', 'output', 'p', -'pre', 'progress', 'q', 'rp', 'rt', 'samp', 'section', 'select', 'small', -'span', 'strong', 'sub', 'summary', 'sup', 'textarea', 'time', 'ul', 'var', -'video', 'title', 'script', 'style'} +self_closing_bad_tags = {'a', 'abbr', 'address', 'article', 'aside', 'audio', + 'b', 'bdo', 'blockquote', 'body', 'button', 'cite', + 'code', 'dd', 'del', 'details', 'dfn', 'div', 'dl', + 'dt', 'em', 'fieldset', 'figcaption', 'figure', + 'footer', 'h1', 'h2', 'h3', 'h4', 'h5', 'h6', + 'header', 'hgroup', 'i', 'iframe', 'ins', 'kbd', + 'label', 'legend', 'li', 'map', 'mark', 'meter', + 'nav', 'ol', 'output', 'p', 'pre', 'progress', 'q', + 'rp', 'rt', 'samp', 'section', 'select', 'small', + 'span', 'strong', 'sub', 'summary', 'sup', + 'textarea', 'time', 'ul', 'var', 'video', 'title', + 'script', 'style'} def css_text(x): @@ -157,7 +109,7 @@ def itercsslinks(raw): yield match.group(1), match.start(1) -_link_attrs = set(html.defs.link_attrs) | {XLINK('href'), 'poster'} +_link_attrs = set(html.defs.link_attrs) | {tag('xlink', 'href'), 'poster'} def 
iterlinks(root, find_links_in_css=True): @@ -170,7 +122,7 @@ def iterlinks(root, find_links_in_css=True): for el in root.iter('*'): try: - tag = barename(el.tag).lower() + tag = parse_utils.barename(el.tag).lower() except Exception: continue attribs = el.attrib @@ -225,7 +177,7 @@ def make_links_absolute(root, base_url): def resolve_base_href(root): base_href = None basetags = root.xpath('//base[@href]|//h:base[@href]', - namespaces=XPNSMAP) + namespaces=const.XPNSMAP) for b in basetags: base_href = b.get('href') b.drop_tree() @@ -278,20 +230,20 @@ def rewrite_links(root, link_repl_func, resolve_base_href=False): el.attrib[attrib] = new parser = CSSParser(raiseExceptions=False, log=_css_logger, - fetcher=lambda x:(None, None)) + fetcher=lambda x: (None, None)) for el in root.iter(etree.Element): try: tag = el.tag except UnicodeDecodeError: continue - if tag == XHTML('style') and el.text and \ + if tag == parse_utils.XHTML('style') and el.text and \ (_css_url_re.search(el.text) is not None or '@import' in - el.text): + el.text): stylesheet = parser.parseString(el.text, validate=False) replaceUrls(stylesheet, link_repl_func) repl = css_text(stylesheet) - el.text = '\n'+ clean_xml_chars(repl) + '\n' + el.text = '\n' + clean_xml_chars(repl) + '\n' text = el.get('style') if text and _css_url_re.search(text) is not None: @@ -301,43 +253,41 @@ def rewrite_links(root, link_repl_func, resolve_base_href=False): # Parsing errors are raised by css_parser continue replaceUrls(stext, link_repl_func) - repl = css_text(stext).replace('\n', ' ').replace('\r', - ' ') + repl = css_text(stext).replace('\n', ' ').replace('\r', ' ') el.set('style', repl) types_map = get_types_map() -EPUB_MIME = types_map['.epub'] -XHTML_MIME = types_map['.xhtml'] -CSS_MIME = types_map['.css'] -NCX_MIME = types_map['.ncx'] -OPF_MIME = types_map['.opf'] -PAGE_MAP_MIME = 'application/oebps-page-map+xml' -OEB_DOC_MIME = 'text/x-oeb1-document' -OEB_CSS_MIME = 'text/x-oeb1-css' -OPENTYPE_MIME = 
types_map['.otf'] -GIF_MIME = types_map['.gif'] -JPEG_MIME = types_map['.jpeg'] -PNG_MIME = types_map['.png'] -SVG_MIME = types_map['.svg'] -BINARY_MIME = 'application/octet-stream' +EPUB_MIME = types_map['.epub'] +XHTML_MIME = types_map['.xhtml'] +CSS_MIME = types_map['.css'] +NCX_MIME = types_map['.ncx'] +OPF_MIME = types_map['.opf'] +PAGE_MAP_MIME = 'application/oebps-page-map+xml' +OEB_DOC_MIME = 'text/x-oeb1-document' +OEB_CSS_MIME = 'text/x-oeb1-css' +OPENTYPE_MIME = types_map['.otf'] +GIF_MIME = types_map['.gif'] +JPEG_MIME = types_map['.jpeg'] +PNG_MIME = types_map['.png'] +SVG_MIME = types_map['.svg'] +BINARY_MIME = 'application/octet-stream' -XHTML_CSS_NAMESPACE = '@namespace "%s";\n' % XHTML_NS +XHTML_CSS_NAMESPACE = '@namespace "%s";\n' % const.XHTML_NS -OEB_STYLES = {CSS_MIME, OEB_CSS_MIME, 'text/x-oeb-css', 'xhtml/css'} -OEB_DOCS = {XHTML_MIME, 'text/html', OEB_DOC_MIME, - 'text/x-oeb-document'} +OEB_STYLES = {CSS_MIME, OEB_CSS_MIME, 'text/x-oeb-css', 'xhtml/css'} +OEB_DOCS = {XHTML_MIME, 'text/html', OEB_DOC_MIME, 'text/x-oeb-document'} OEB_RASTER_IMAGES = {GIF_MIME, JPEG_MIME, PNG_MIME} -OEB_IMAGES = {GIF_MIME, JPEG_MIME, PNG_MIME, SVG_MIME} +OEB_IMAGES = {GIF_MIME, JPEG_MIME, PNG_MIME, SVG_MIME} MS_COVER_TYPE = 'other.ms-coverimage-standard' -ENTITY_RE = re.compile(r'&([a-zA-Z_:][a-zA-Z0-9.-_:]+);') -COLLAPSE_RE = re.compile(r'[ \t\r\n\v]+') -QNAME_RE = re.compile(r'^[{][^{}]+[}][^{}]+$') +ENTITY_RE = re.compile(r'&([a-zA-Z_:][a-zA-Z0-9.-_:]+);') +COLLAPSE_RE = re.compile(r'[ \t\r\n\v]+') +QNAME_RE = re.compile(r'^[{][^{}]+[}][^{}]+$') PREFIXNAME_RE = re.compile(r'^[^:]+[:][^:]+') -XMLDECL_RE = re.compile(r'^\s*<[?]xml.*?[?]>') -CSSURL_RE = re.compile(r'''url[(](?P<q>["']?)(?P<url>[^)]+)(?P=q)[)]''') +XMLDECL_RE = re.compile(r'^\s*<[?]xml.*?[?]>') +CSSURL_RE = re.compile(r'''url[(](?P<q>["']?)(?P<url>[^)]+)(?P=q)[)]''') def element(parent, *args, **kwargs): @@ -349,13 +299,13 @@ def element(parent, *args, **kwargs): def prefixname(name, nsrmap): if 
not isqname(name): return name - ns = namespace(name) + ns = parse_utils.namespace(name) if ns not in nsrmap: return name prefix = nsrmap[ns] if not prefix: - return barename(name) - return ':'.join((prefix, barename(name))) + return parse_utils.barename(name) + return ':'.join((prefix, parse_utils.barename(name))) def isprefixname(name): @@ -376,11 +326,11 @@ def isqname(name): def XPath(expr): - return etree.XPath(expr, namespaces=XPNSMAP) + return etree.XPath(expr, namespaces=const.XPNSMAP) def xpath(elem, expr): - return elem.xpath(expr, namespaces=XPNSMAP) + return elem.xpath(expr, namespaces=const.XPNSMAP) def xml2str(root, pretty_print=False, strip_comments=False, with_tail=True): @@ -390,7 +340,7 @@ def xml2str(root, pretty_print=False, strip_comments=False, with_tail=True): if x.text and '--' in x.text: x.text = x.text.replace('--', '__') ans = etree.tostring(root, encoding='utf-8', xml_declaration=True, - pretty_print=pretty_print, with_tail=with_tail) + pretty_print=pretty_print, with_tail=with_tail) if strip_comments: ans = re.compile(br'<!--.*?-->', re.DOTALL).sub(b'', ans) @@ -399,12 +349,14 @@ def xml2str(root, pretty_print=False, strip_comments=False, with_tail=True): def xml2text(elem, pretty_print=False, method='text'): - return etree.tostring(elem, method=method, encoding='unicode', with_tail=False, pretty_print=pretty_print) + return etree.tostring(elem, method=method, encoding='unicode', + with_tail=False, pretty_print=pretty_print) def escape_cdata(root): pat = re.compile(r'[<>&]') - for elem in root.iterdescendants('{%s}style' % XHTML_NS, '{%s}script' % XHTML_NS): + for elem in root.iterdescendants('{%s}style' % const.XHTML_NS, + '{%s}script' % const.XHTML_NS): if elem.text and pat.search(elem.text) is not None: elem.text = etree.CDATA(elem.text.replace(']]>', r'\]\]\>')) @@ -431,12 +383,12 @@ def serialize(data, media_type, pretty_print=False): return bytes(data) -ASCII_CHARS = frozenset(chr(x) for x in range(128)) +ASCII_CHARS = 
frozenset(chr(x) for x in range(128)) UNIBYTE_CHARS = frozenset(x.encode('ascii') for x in ASCII_CHARS) -USAFE = ('ABCDEFGHIJKLMNOPQRSTUVWXYZ' - 'abcdefghijklmnopqrstuvwxyz' - '0123456789' '_.-/~') -URL_SAFE = frozenset(USAFE) +USAFE = ('ABCDEFGHIJKLMNOPQRSTUVWXYZ' + 'abcdefghijklmnopqrstuvwxyz' + '0123456789' '_.-/~') +URL_SAFE = frozenset(USAFE) URL_SAFE_BYTES = frozenset(USAFE.encode('ascii')) URL_UNSAFE = [ASCII_CHARS - URL_SAFE, UNIBYTE_CHARS - URL_SAFE_BYTES] del USAFE @@ -466,7 +418,8 @@ def urlnormalize(href): try: parts = urllib.parse.urlparse(href) except ValueError as e: - raise ValueError('Failed to parse the URL: %r with underlying error: %s' % (href, as_unicode(e))) + raise ValueError('Failed to parse the URL: %r with underlying error: ' + '%s' % (href, as_unicode(e))) if not parts.scheme or parts.scheme == 'file': path, frag = urllib.parse.urldefrag(href) parts = ('', '', path, '', '', frag) @@ -503,8 +456,10 @@ class DummyHandler(logging.Handler): def emit(self, record): if self.log is not None: msg = self.format(record) - f = self.log.error if record.levelno >= logging.ERROR \ - else self.log.warn + if record.levelno >= logging.ERROR: + f = self.log.error + else: + self.log.warn f(msg) @@ -630,18 +585,21 @@ class Metadata(object): metadata items. 
""" - DC_TERMS = {'contributor', 'coverage', 'creator', 'date', - 'description', 'format', 'identifier', 'language', - 'publisher', 'relation', 'rights', 'source', - 'subject', 'title', 'type'} + DC_TERMS = {'contributor', 'coverage', 'creator', 'date', 'description', + 'format', 'identifier', 'language', 'publisher', 'relation', + 'rights', 'source', 'subject', 'title', 'type'} CALIBRE_TERMS = {'series', 'series_index', 'rating', 'timestamp', - 'publication_type', 'title_sort'} - OPF_ATTRS = {'role': OPF('role'), 'file-as': OPF('file-as'), - 'scheme': OPF('scheme'), 'event': OPF('event'), - 'type': XSI('type'), 'lang': XML('lang'), 'id': 'id'} - OPF1_NSMAP = {'dc': DC11_NS, 'oebpackage': OPF1_NS} - OPF2_NSMAP = {'opf': OPF2_NS, 'dc': DC11_NS, 'dcterms': DCTERMS_NS, - 'xsi': XSI_NS, 'calibre': CALIBRE_NS} + 'publication_type', 'title_sort'} + OPF_ATTRS = {'role': tag('opf', 'role'), 'file-as': tag('opf', 'file-as'), + 'scheme': tag('opf', 'scheme'), 'event': tag('opf', 'event'), + 'type': tag('xsi', 'type'), 'lang': tag('xml', 'lang'), + 'id': 'id'} + OPF1_NSMAP = {'dc': const.DC11_NS, 'oebpackage': const.OPF1_NS} + OPF2_NSMAP = {'calibre': const.CALIBRE_NS, + 'dc': const.DC11_NS, + 'dcterms': const.DCTERMS_NS, + 'opf': const.OPF2_NS, + 'xsi': const.XSI_NS} class Item(object): """An item of OEB data model metadata. 
@@ -667,13 +625,13 @@ class Metadata(object): def term_attr(self, obj): term = obj.term - if namespace(term) != DC11_NS: - term = OPF('meta') + if parse_utils.namespace(term) != const.DC11_NS: + term = tag('opf', 'meta') allowed = self.allowed if allowed is not None and term not in allowed: raise AttributeError( 'attribute %r not valid for metadata term %r' % ( - self.attr(term), barename(obj.term))) + self.attr(term), parse_utils.barename(obj.term))) return self.attr(term) def __get__(self, obj, cls): @@ -688,23 +646,25 @@ class Metadata(object): self.attrib = attrib = dict(attrib) self.nsmap = nsmap = dict(nsmap) attrib.update(kwargs) - if namespace(term) == OPF2_NS: - term = barename(term) - ns = namespace(term) - local = barename(term).lower() - if local in Metadata.DC_TERMS and (not ns or ns in DC_NSES): + if parse_utils.namespace(term) == const.OPF2_NS: + term = parse_utils.barename(term) + ns = parse_utils.namespace(term) + local = parse_utils.barename(term).lower() + if local in Metadata.DC_TERMS and (not ns or ns in const.DC_NSES): # Anything looking like Dublin Core is coerced - term = DC(local) - elif local in Metadata.CALIBRE_TERMS and ns in (CALIBRE_NS, ''): + term = tag('dc', local) + elif local in Metadata.CALIBRE_TERMS and ns in (const.CALIBRE_NS, + ''): # Ditto for Calibre-specific metadata - term = CALIBRE(local) + term = tag('calibre', local) self.term = term self.value = value for attr, value in tuple(attrib.items()): if isprefixname(value): attrib[attr] = qname(value, nsmap) nsattr = Metadata.OPF_ATTRS.get(attr, attr) - if nsattr == OPF('scheme') and namespace(term) != DC11_NS: + if (nsattr == tag('opf', 'scheme') and + parse_utils.namespace(term) != const.DC11_NS): # The opf:meta element takes @scheme, not @opf:scheme nsattr = 'scheme' if attr != nsattr: @@ -722,21 +682,29 @@ class Metadata(object): def content(self, value): self.value = value - scheme = Attribute(lambda term: 'scheme' if - term == OPF('meta') else OPF('scheme'), - 
[DC('identifier'), OPF('meta')]) - file_as = Attribute(OPF('file-as'), [DC('creator'), DC('contributor'), - DC('title')]) - role = Attribute(OPF('role'), [DC('creator'), DC('contributor')]) - event = Attribute(OPF('event'), [DC('date')]) - id = Attribute('id') - type = Attribute(XSI('type'), [DC('date'), DC('format'), - DC('type')]) - lang = Attribute(XML('lang'), [DC('contributor'), DC('coverage'), - DC('creator'), DC('publisher'), - DC('relation'), DC('rights'), - DC('source'), DC('subject'), - OPF('meta')]) + scheme = Attribute(lambda term: 'scheme' if + term == tag('opf', 'meta') else + tag('opf', 'scheme'), + [tag('dc', 'identifier'), tag('opf', 'meta')]) + file_as = Attribute(tag('opf', 'file-as'), [tag('dc', 'creator'), + tag('dc', 'contributor'), + tag('dc', 'title')]) + role = Attribute(tag('opf', 'role'), [tag('dc', 'creator'), + tag('dc', 'contributor')]) + event = Attribute(tag('opf', 'event'), [tag('dc', 'date')]) + id = Attribute('id') + type = Attribute(tag('xsi', 'type'), [tag('dc', 'date'), + tag('dc', 'format'), + tag('dc', 'type')]) + lang = Attribute(tag('xml', 'lang'), [tag('dc', 'contributor'), + tag('dc', 'coverage'), + tag('dc', 'creator'), + tag('dc', 'publisher'), + tag('dc', 'relation'), + tag('dc', 'rights'), + tag('dc', 'source'), + tag('dc', 'subject'), + tag('opf', 'meta')]) def __getitem__(self, key): return self.attrib[key] @@ -752,7 +720,7 @@ class Metadata(object): def __repr__(self): return 'Item(term=%r, value=%r, attrib=%r)' \ - % (barename(self.term), self.value, self.attrib) + % (parse_utils.barename(self.term), self.value, self.attrib) def __str__(self): return as_unicode(self.value) @@ -760,11 +728,12 @@ class Metadata(object): def to_opf1(self, dcmeta=None, xmeta=None, nsrmap={}): attrib = {} for key, value in self.attrib.items(): - if namespace(key) == OPF2_NS: - key = barename(key) + if parse_utils.namespace(key) == const.OPF2_NS: + key = parse_utils.barename(key) attrib[key] = prefixname(value, nsrmap) - if 
namespace(self.term) == DC11_NS: - name = DC(string.capwords(barename(self.term))) + if parse_utils.namespace(self.term) == const.DC11_NS: + name = tag('dc', + string.capwords(parse_utils.barename(self.term))) elem = element(dcmeta, name, attrib=attrib) elem.text = self.value else: @@ -777,27 +746,27 @@ class Metadata(object): attrib = {} for key, value in self.attrib.items(): attrib[key] = prefixname(value, nsrmap) - if namespace(self.term) == DC11_NS: + if parse_utils.namespace(self.term) == const.DC11_NS: elem = element(parent, self.term, attrib=attrib) try: elem.text = self.value - except: + except Exception: elem.text = repr(self.value) else: - elem = element(parent, OPF('meta'), attrib=attrib) + elem = element(parent, tag('opf', 'meta'), attrib=attrib) elem.attrib['name'] = prefixname(self.term, nsrmap) elem.attrib['content'] = prefixname(self.value, nsrmap) return elem def __init__(self, oeb): self.oeb = oeb - self.items = defaultdict(list) + self.items = collections.defaultdict(list) self.primary_writing_mode = None def add(self, term, value, attrib={}, nsmap={}, **kwargs): """Add a new metadata item.""" item = self.Item(term, value, attrib, nsmap, **kwargs) - items = self.items[barename(item.term)] + items = self.items[parse_utils.barename(item.term)] items.append(item) return item @@ -807,15 +776,15 @@ class Metadata(object): __iter__ = iterkeys def clear(self, key): - l = self.items[key] - for x in list(l): - l.remove(x) + val = self.items[key] + for x in list(val): + val.remove(x) def filter(self, key, predicate): - l = self.items[key] - for x in list(l): + val = self.items[key] + for x in list(val): if predicate(x): - l.remove(x) + val.remove(x) def __getitem__(self, key): return self.items[key] @@ -838,21 +807,21 @@ class Metadata(object): def _opf1_nsmap(self): nsmap = self._nsmap for key, value in nsmap.items(): - if value in OPF_NSES or value in DC_NSES: + if value in const.OPF_NSES or value in const.DC_NSES: del nsmap[key] return nsmap @property 
def _opf2_nsmap(self): nsmap = self._nsmap - nsmap.update(OPF2_NSMAP) + nsmap.update(const.OPF2_NSMAP) return nsmap def to_opf1(self, parent=None): nsmap = self._opf1_nsmap nsrmap = {value: key for key, value in nsmap.items()} elem = element(parent, 'metadata', nsmap=nsmap) - dcmeta = element(elem, 'dc-metadata', nsmap=OPF1_NSMAP) + dcmeta = element(elem, 'dc-metadata', nsmap=const.OPF1_NSMAP) xmeta = element(elem, 'x-metadata') for term in self.items: for item in self.items[term]: @@ -865,12 +834,16 @@ class Metadata(object): def to_opf2(self, parent=None): nsmap = self._opf2_nsmap nsrmap = {value: key for key, value in nsmap.items()} - elem = element(parent, OPF('metadata'), nsmap=nsmap) + elem = element(parent, tag('opf', 'metadata'), nsmap=nsmap) for term in self.items: for item in self.items[term]: item.to_opf2(elem, nsrmap=nsrmap) if self.primary_writing_mode: - elem.append(elem.makeelement(OPF('meta'), attrib={'name':'primary-writing-mode', 'content':self.primary_writing_mode})) + elem.append(elem.makeelement(tag('opf', 'meta'), + attrib={'name': + 'primary-writing-mode', + 'content': + self.primary_writing_mode})) return elem @@ -936,8 +909,8 @@ class Manifest(object): if not data: return data = xml_to_unicode(data, strip_encoding_pats=True, - assume_utf8=True, resolve_entities=True)[0] - return safe_xml_fromstring(data) + assume_utf8=True, resolve_entities=True)[0] + return etree.fromstring(data) def _parse_xhtml(self, data): orig_data = data @@ -945,11 +918,13 @@ class Manifest(object): self.oeb.log.debug('Parsing', fname, '...') self.oeb.html_preprocessor.current_href = self.href try: - data = parse_html(data, log=self.oeb.log, - decoder=self.oeb.decode, - preprocessor=self.oeb.html_preprocessor, - filename=fname, non_html_file_tags={'ncx'}) - except NotHTML: + data = parse_utils.parse_html(data, log=self.oeb.log, + decoder=self.oeb.decode, + preprocessor=self.oeb. 
+ html_preprocessor, + filename=fname, + non_html_file_tags={'ncx'}) + except parse_utils.NotHTML: return self._parse_xml(orig_data) return data @@ -981,7 +956,8 @@ class Manifest(object): data = self.oeb.decode(data) data = self.oeb.css_preprocessor(data, add_namespace=False) parser = CSSParser(loglevel=logging.WARNING, - fetcher=self.override_css_fetch or self._fetch_css, + fetcher=self.override_css_fetch or + self._fetch_css, log=_css_logger) data = parser.parseString(data, href=self.href, validate=False) data = resolveImports(data) @@ -1013,8 +989,8 @@ class Manifest(object): convert and return as an lxml.etree element in the XHTML namespace. - XML content is parsed and returned as an lxml.etree element. - - CSS and CSS-variant content is parsed and returned as a css_parser - CSS DOM stylesheet. + - CSS and CSS-variant content is parsed and returned as a + css_parser CSS DOM stylesheet. - All other content is returned as a :class:`str` or :class:`bytes` object with no special parsing. 
""" @@ -1023,7 +999,7 @@ class Manifest(object): if self._loader is None: return None data = self._loader(getattr(self, 'html_input_href', - self.href)) + self.href)) try: mt = self.media_type.lower() except Exception: @@ -1037,8 +1013,8 @@ class Manifest(object): elif mt in OEB_STYLES: data = self._parse_css(data) elif mt == 'text/plain': - self.oeb.log.warn('%s contains data in TXT format'%self.href, - 'converting to HTML') + self.oeb.log.warn('%s contains data in TXT format' % self.href, + 'converting to HTML') data = self._parse_txt(data) self.media_type = XHTML_MIME self._data = data @@ -1055,8 +1031,10 @@ class Manifest(object): def unload_data_from_memory(self, memory=None): if isinstance(self._data, bytes): if memory is None: - from ebook_converter.ptempfile import PersistentTemporaryFile - pt = PersistentTemporaryFile(suffix='_oeb_base_mem_unloader.img') + from ebook_converter.ptempfile import \ + PersistentTemporaryFile + pt = PersistentTemporaryFile(suffix='_oeb_base_mem_' + 'unloader.img') with pt: pt.write(self._data) self.oeb._temp_files.append(pt.name) @@ -1088,7 +1066,8 @@ class Manifest(object): @property def bytes_representation(self): - return serialize(self.data, self.media_type, pretty_print=self.oeb.pretty_print) + return serialize(self.data, self.media_type, + pretty_print=self.oeb.pretty_print) def __str__(self): return self.unicode_representation @@ -1107,7 +1086,11 @@ class Manifest(object): href = self.href if isinstance(href, bytes): href = force_unicode(href) - sp = self.spine_position if isinstance(self.spine_position, numbers.Number) else sys.maxsize + + if isinstance(self.spine_position, numbers.Number): + sp = self.spine_position + else: + sp = sys.maxsize return sp, (self.media_type or '').lower(), href, self.id @@ -1238,8 +1221,8 @@ class Manifest(object): return elem def to_opf2(self, parent=None): - elem = element(parent, OPF('manifest')) - for item in sorted(self.items, key=attrgetter('sort_key')): + elem = element(parent, 
tag('opf', 'manifest')) + for item in sorted(self.items, key=operator.attrgetter('sort_key')): media_type = item.media_type if media_type in OEB_DOCS: media_type = XHTML_MIME @@ -1249,7 +1232,7 @@ class Manifest(object): 'media-type': media_type} if item.fallback: attrib['fallback'] = item.fallback - element(elem, OPF('item'), attrib=attrib) + element(elem, tag('opf', 'item'), attrib=attrib) return elem @property @@ -1341,12 +1324,12 @@ class Spine(object): return elem def to_opf2(self, parent=None): - elem = element(parent, OPF('spine')) + elem = element(parent, tag('opf', 'spine')) for item in self.items: attrib = {'idref': item.id} if not item.linear: attrib['linear'] = 'no' - element(elem, OPF('itemref'), attrib=attrib) + element(elem, tag('opf', 'itemref'), attrib=attrib) return elem @@ -1394,8 +1377,7 @@ class Guide(object): self.oeb = oeb if type.lower() in self.TYPES: type = type.lower() - elif type not in self.TYPES and \ - not type.startswith('other.'): + elif type not in self.TYPES and not type.startswith('other.'): type = 'other.' 
+ type if not title and type in self.TITLES: title = oeb.translate(self.TITLES[type]) @@ -1440,7 +1422,8 @@ class Guide(object): __iter__ = iterkeys def values(self): - return sorted(self.refs.values(), key=lambda ref: ref.ORDER.get(ref.type, 10000)) + return sorted(self.refs.values(), + key=lambda ref: ref.ORDER.get(ref.type, 10000)) def items(self): for type, ref in self.refs.items(): @@ -1473,12 +1456,12 @@ class Guide(object): def to_opf2(self, parent=None): if not len(self): return - elem = element(parent, OPF('guide')) + elem = element(parent, tag('opf', 'guide')) for ref in self.refs.values(): attrib = {'type': ref.type, 'href': urlunquote(ref.href)} if ref.title: attrib['title'] = ref.title - element(elem, OPF('reference'), attrib=attrib) + element(elem, tag('opf', 'reference'), attrib=attrib) return elem @@ -1499,7 +1482,8 @@ class TOC(object): """ def __init__(self, title=None, href=None, klass=None, id=None, - play_order=None, author=None, description=None, toc_thumbnail=None): + play_order=None, author=None, description=None, + toc_thumbnail=None): self.title = title self.href = urlnormalize(href) if href else href self.klass = klass @@ -1513,9 +1497,11 @@ class TOC(object): self.description = description self.toc_thumbnail = toc_thumbnail - def add(self, title, href, klass=None, id=None, play_order=0, author=None, description=None, toc_thumbnail=None): + def add(self, title, href, klass=None, id=None, play_order=0, author=None, + description=None, toc_thumbnail=None): """Create and return a new sub-node of this node.""" - node = TOC(title, href, klass, id, play_order, author, description, toc_thumbnail) + node = TOC(title, href, klass, id, play_order, author, description, + toc_thumbnail) self.nodes.append(node) return node @@ -1583,7 +1569,8 @@ class TOC(object): """ prev = None for node in list(self.nodes): - if prev and urllib.parse.urldefrag(prev.href)[0] == urllib.parse.urldefrag(node.href)[0]: + if (prev and urllib.parse.urldefrag(prev.href)[0] 
== + urllib.parse.urldefrag(node.href)[0]): self.nodes.remove(node) prev.nodes.append(node) else: @@ -1597,7 +1584,7 @@ class TOC(object): return 1 def get_lines(self, lvl=0): - ans = [('\t'*lvl) + 'TOC: %s --> %s'%(self.title, self.href)] + ans = [('\t'*lvl) + 'TOC: %s --> %s' % (self.title, self.href)] for child in self: ans.extend(child.get_lines(lvl+1)) return ans @@ -1614,7 +1601,7 @@ class TOC(object): def to_ncx(self, parent=None): if parent is None: - parent = etree.Element(NCX('navMap')) + parent = etree.Element(tag('ncx', 'navMap')) for node in self.nodes: id = node.id or uuid_id() po = node.play_order @@ -1623,15 +1610,15 @@ class TOC(object): attrib = {'id': id, 'playOrder': str(po)} if node.klass: attrib['class'] = node.klass - point = element(parent, NCX('navPoint'), attrib=attrib) - label = etree.SubElement(point, NCX('navLabel')) + point = element(parent, tag('ncx', 'navPoint'), attrib=attrib) + label = etree.SubElement(point, tag('ncx', 'navLabel')) title = node.title if title: title = re.sub(r'\s+', ' ', title) - element(label, NCX('text')).text = title + element(label, tag('ncx', 'text')).text = title # Do not unescape this URL as ADE requires it to be escaped to # handle semi colons and other special characters in the file names - element(point, NCX('content'), src=node.href) + element(point, tag('ncx', 'content'), src=node.href) node.to_ncx(point) return parent @@ -1659,7 +1646,7 @@ class TOC(object): if y is not None: if x.href != y.href: x.play_order = getattr(href_node(x), 'play_order', - self.next_play_order()) + self.next_play_order()) y = href_node(x) if y is not None: x.play_order = y.play_order @@ -1723,8 +1710,9 @@ class PageList(object): return self.pages.remove(page) def to_ncx(self, parent=None): - plist = element(parent, NCX('pageList'), id=uuid_id()) - values = {t: count(1) for t in ('front', 'normal', 'special')} + plist = element(parent, tag('ncx', 'pageList'), id=uuid_id()) + values = {t: itertools.count(1) + for t in ('front', 
'normal', 'special')} for page in self.pages: id = page.id or uuid_id() type = page.type @@ -1732,30 +1720,31 @@ class PageList(object): attrib = {'id': id, 'value': value, 'type': type, 'playOrder': '0'} if page.klass: attrib['class'] = page.klass - ptarget = element(plist, NCX('pageTarget'), attrib=attrib) - label = element(ptarget, NCX('navLabel')) - element(label, NCX('text')).text = page.name - element(ptarget, NCX('content'), src=page.href) + ptarget = element(plist, tag('ncx', 'pageTarget'), attrib=attrib) + label = element(ptarget, tag('ncx', 'navLabel')) + element(label, tag('ncx', 'text')).text = page.name + element(ptarget, tag('ncx', 'content'), src=page.href) return plist def to_page_map(self): - pmap = etree.Element(OPF('page-map'), nsmap={None: OPF2_NS}) + pmap = etree.Element(tag('opf', 'page-map'), + nsmap={None: const.OPF2_NS}) for page in self.pages: - element(pmap, OPF('page'), name=page.name, href=page.href) + element(pmap, tag('opf', 'page'), name=page.name, href=page.href) return pmap class OEBBook(object): """Representation of a book in the IDPF OEB data model.""" - COVER_SVG_XP = XPath('h:body//svg:svg[position() = 1]') + COVER_SVG_XP = XPath('h:body//svg:svg[position() = 1]') COVER_OBJECT_XP = XPath('h:body//h:object[@data][position() = 1]') def __init__(self, logger, - html_preprocessor, - css_preprocessor=CSSPreProcessor(), - encoding='utf-8', pretty_print=False, - input_encoding='utf-8'): + html_preprocessor, + css_preprocessor=CSSPreProcessor(), + encoding='utf-8', pretty_print=False, + input_encoding='utf-8'): """Create empty book. 
Arguments: :param:`encoding`: Default encoding for textual content read @@ -1809,7 +1798,7 @@ class OEBBook(object): for path in self._temp_files: try: os.remove(path) - except: + except Exception: pass @classmethod @@ -1831,11 +1820,12 @@ class OEBBook(object): return fix_data(data) bom_enc = None if data[:4] in (b'\0\0\xfe\xff', b'\xff\xfe\0\0'): - bom_enc = {b'\0\0\xfe\xff':'utf-32-be', - b'\xff\xfe\0\0':'utf-32-le'}[data[:4]] + bom_enc = {b'\0\0\xfe\xff': 'utf-32-be', + b'\xff\xfe\0\0': 'utf-32-le'}[data[:4]] data = data[4:] elif data[:2] in (b'\xff\xfe', b'\xfe\xff'): - bom_enc = {b'\xff\xfe':'utf-16-le', 'b\xfe\xff':'utf-16-be'}[data[:2]] + bom_enc = {b'\xff\xfe': 'utf-16-le', + 'b\xfe\xff': 'utf-16-be'}[data[:2]] data = data[2:] elif data[:3] == b'\xef\xbb\xbf': bom_enc = 'utf-8' @@ -1864,13 +1854,13 @@ class OEBBook(object): are tuples of (default) filenames and lxml.etree element structures. """ package = etree.Element('package', - attrib={'unique-identifier': self.uid.id}) + attrib={'unique-identifier': self.uid.id}) self.metadata.to_opf1(package) self.manifest.to_opf1(package) self.spine.to_opf1(package) tours = element(package, 'tours') tour = element(tours, 'tour', - attrib={'id': 'chaptertour', 'title': 'Chapter Tour'}) + attrib={'id': 'chaptertour', 'title': 'Chapter Tour'}) self.toc.to_opf1(tour) self.guide.to_opf1(package) return {OPF_MIME: ('content.opf', package)} @@ -1898,7 +1888,8 @@ class OEBBook(object): if added: next += 1 selector = XPath('ncx:content/@src') - for i, elem in enumerate(xpath(ncx, '//*[@playOrder and ./ncx:content[@src]]')): + for i, elem in enumerate(xpath(ncx, '//*[@playOrder and ' + './ncx:content[@src]]')): href = urlnormalize(selector(elem)[0]) order = playorder.get(href, i) elem.attrib['playOrder'] = str(order) @@ -1907,25 +1898,26 @@ class OEBBook(object): def _to_ncx(self): lang = str(self.metadata.language[0]) lang = lang.replace('_', '-') - ncx = etree.Element(NCX('ncx'), - attrib={'version': '2005-1', XML('lang'): 
lang}, - nsmap={None: NCX_NS}) - head = etree.SubElement(ncx, NCX('head')) - etree.SubElement(head, NCX('meta'), - name='dtb:uid', content=str(self.uid)) - etree.SubElement(head, NCX('meta'), - name='dtb:depth', content=str(self.toc.depth())) + ncx = etree.Element(tag('ncx', 'ncx'), + attrib={'version': '2005-1', + tag('xml', 'lang'): lang}, + nsmap={None: const.NCX_NS}) + head = etree.SubElement(ncx, tag('ncx', 'head')) + etree.SubElement(head, tag('ncx', 'meta'), + name='dtb:uid', content=str(self.uid)) + etree.SubElement(head, tag('ncx', 'meta'), + name='dtb:depth', content=str(self.toc.depth())) generator = ''.join(['calibre (', __version__, ')']) - etree.SubElement(head, NCX('meta'), - name='dtb:generator', content=generator) - etree.SubElement(head, NCX('meta'), - name='dtb:totalPageCount', content=str(len(self.pages))) - maxpnum = etree.SubElement(head, NCX('meta'), - name='dtb:maxPageNumber', content='0') - title = etree.SubElement(ncx, NCX('docTitle')) - text = etree.SubElement(title, NCX('text')) + etree.SubElement(head, tag('ncx', 'meta'), + name='dtb:generator', content=generator) + etree.SubElement(head, tag('ncx', 'meta'), name='dtb:totalPageCount', + content=str(len(self.pages))) + maxpnum = etree.SubElement(head, tag('ncx', 'meta'), + name='dtb:maxPageNumber', content='0') + title = etree.SubElement(ncx, tag('ncx', 'docTitle')) + text = etree.SubElement(title, tag('ncx', 'text')) text.text = str(self.metadata.title[0]) - navmap = etree.SubElement(ncx, NCX('navMap')) + navmap = etree.SubElement(ncx, tag('ncx', 'navMap')) self.toc.to_ncx(navmap) if len(self.pages) > 0: plist = self.pages.to_ncx(ncx) @@ -1941,27 +1933,29 @@ class OEBBook(object): are tuples of (default) filenames and lxml.etree element structures. 
""" results = {} - package = etree.Element(OPF('package'), - attrib={'version': '2.0', 'unique-identifier': self.uid.id}, - nsmap={None: OPF2_NS}) + package = etree.Element(tag('opf', 'package'), + attrib={'version': '2.0', + 'unique-identifier': self.uid.id}, + nsmap={None: const.OPF2_NS}) self.metadata.to_opf2(package) manifest = self.manifest.to_opf2(package) spine = self.spine.to_opf2(package) self.guide.to_opf2(package) results[OPF_MIME] = ('content.opf', package) id, href = self.manifest.generate('ncx', 'toc.ncx') - etree.SubElement(manifest, OPF('item'), id=id, href=href, + etree.SubElement(manifest, tag('opf', 'item'), id=id, href=href, attrib={'media-type': NCX_MIME}) spine.attrib['toc'] = id results[NCX_MIME] = (href, self._to_ncx()) if page_map and len(self.pages) > 0: id, href = self.manifest.generate('page-map', 'page-map.xml') - etree.SubElement(manifest, OPF('item'), id=id, href=href, + etree.SubElement(manifest, tag('opf', 'item'), id=id, href=href, attrib={'media-type': PAGE_MAP_MIME}) spine.attrib['page-map'] = id results[PAGE_MAP_MIME] = (href, self.pages.to_page_map()) if self.spine.page_progression_direction in {'ltr', 'rtl'}: - spine.attrib['page-progression-direction'] = self.spine.page_progression_direction + spine.attrib['page-progression-direction'] = \ + self.spine.page_progression_direction return results @@ -1972,7 +1966,9 @@ def rel_href(base_href, href): return href if '/' not in base_href: return href - base = list(filter(lambda x: x and x != '.', os.path.dirname(os.path.normpath(base_href)).replace(os.sep, '/').split('/'))) + base = list(filter(lambda x: x and x != '.', + os.path.dirname(os.path.normpath(base_href)) + .replace(os.sep, '/').split('/'))) while True: try: idx = base.index('..') diff --git a/ebook_converter/ebooks/oeb/parse_utils.py b/ebook_converter/ebooks/oeb/parse_utils.py index 64be9f2..ef1337b 100644 --- a/ebook_converter/ebooks/oeb/parse_utils.py +++ b/ebook_converter/ebooks/oeb/parse_utils.py @@ -1,20 +1,16 @@ 
import re -from lxml import etree, html +from lxml import etree +from lxml import html +from ebook_converter import constants as const from ebook_converter import xml_replace_entities, force_unicode -from ebook_converter.utils.xml_parse import safe_xml_fromstring from ebook_converter.constants_old import filesystem_encoding from ebook_converter.ebooks.chardet import xml_to_unicode, strip_encoding_declarations -__license__ = 'GPL v3' -__copyright__ = '2011, Kovid Goyal <kovid@kovidgoyal.net>' -__docformat__ = 'restructuredtext en' - -RECOVER_PARSER = etree.XMLParser(recover=True, no_network=True, resolve_entities=False) -XHTML_NS = 'http://www.w3.org/1999/xhtml' -XMLNS_NS = 'http://www.w3.org/2000/xmlns/' +RECOVER_PARSER = etree.XMLParser(recover=True, no_network=True, + resolve_entities=False) class NotHTML(Exception): @@ -33,15 +29,15 @@ def namespace(name): def XHTML(name): - return '{%s}%s' % (XHTML_NS, name) + return '{%s}%s' % (const.XHTML_NS, name) def xpath(elem, expr): - return elem.xpath(expr, namespaces={'h':XHTML_NS}) + return elem.xpath(expr, namespaces={'h':const.XHTML_NS}) def XPath(expr): - return etree.XPath(expr, namespaces={'h':XHTML_NS}) + return etree.XPath(expr, namespaces={'h':const.XHTML_NS}) META_XP = XPath('/h:html/h:head/h:meta[@http-equiv="Content-Type"]') @@ -111,7 +107,7 @@ def _html4_parse(data): elem.text = elem.text.strip('-') data = etree.tostring(data, encoding='unicode') - data = safe_xml_fromstring(data) + data = etree.fromstring(data) return data @@ -204,14 +200,14 @@ def parse_html(data, log=None, decoder=None, preprocessor=None, # Try with more & more drastic measures to parse try: - data = safe_xml_fromstring(data, recover=False) + data = etree.fromstring(data) check_for_html5(pre, data) except (HTML5Doc, etree.XMLSyntaxError): log.debug('Initial parse failed, using more' ' forgiving parsers') raw = data = xml_replace_entities(raw) try: - data = safe_xml_fromstring(data, recover=False) + data = etree.fromstring(data) 
check_for_html5(pre, data) except (HTML5Doc, etree.XMLSyntaxError): log.debug('Parsing %s as HTML' % filename) @@ -240,7 +236,7 @@ def parse_html(data, log=None, decoder=None, preprocessor=None, if barename(data.tag) in non_html_file_tags: raise NotHTML(data.tag) log.warn('File %r does not appear to be (X)HTML'%filename) - nroot = safe_xml_fromstring('<html></html>') + nroot = etree.fromstring('<html></html>') has_body = False for child in list(data): if isinstance(child.tag, (str, bytes)) and barename(child.tag) == 'body': @@ -249,7 +245,7 @@ def parse_html(data, log=None, decoder=None, preprocessor=None, parent = nroot if not has_body: log.warn('File %r appears to be a HTML fragment'%filename) - nroot = safe_xml_fromstring('<html><body/></html>') + nroot = etree.fromstring('<html><body/></html>') parent = nroot[0] for child in list(data.iter()): oparent = child.getparent() @@ -261,16 +257,16 @@ def parse_html(data, log=None, decoder=None, preprocessor=None, # Force into the XHTML namespace if not namespace(data.tag): log.warn('Forcing', filename, 'into XHTML namespace') - data.attrib['xmlns'] = XHTML_NS + data.attrib['xmlns'] = const.XHTML_NS data = etree.tostring(data, encoding='unicode') try: - data = safe_xml_fromstring(data, recover=False) + data = etree.fromstring(data) except: data = data.replace(':=', '=').replace(':>', '>') data = data.replace('<http:/>', '') try: - data = safe_xml_fromstring(data, recover=False) + data = etree.fromstring(data) except etree.XMLSyntaxError: log.warn('Stripping comments from %s'% filename) @@ -281,17 +277,17 @@ def parse_html(data, log=None, decoder=None, preprocessor=None, '') data = data.replace("<?xml version='1.0' encoding='utf-8'??>", '') try: - data = safe_xml_fromstring(data) + data = etree.fromstring(data) except etree.XMLSyntaxError: log.warn('Stripping meta tags from %s'% filename) data = re.sub(r'<meta\s+[^>]+?>', '', data) - data = safe_xml_fromstring(data) - elif namespace(data.tag) != XHTML_NS: + data = 
etree.fromstring(data) + elif namespace(data.tag) != const.XHTML_NS: # OEB_DOC_NS, but possibly others ns = namespace(data.tag) attrib = dict(data.attrib) nroot = etree.Element(XHTML('html'), - nsmap={None: XHTML_NS}, attrib=attrib) + nsmap={None: const.XHTML_NS}, attrib=attrib) for elem in data.iterdescendants(): if isinstance(elem.tag, (str, bytes)) and \ namespace(elem.tag) == ns: @@ -301,7 +297,7 @@ def parse_html(data, log=None, decoder=None, preprocessor=None, data = nroot # Remove non default prefixes referring to the XHTML namespace - data = ensure_namespace_prefixes(data, {None: XHTML_NS}) + data = ensure_namespace_prefixes(data, {None: const.XHTML_NS}) data = merge_multiple_html_heads_and_bodies(data, log) # Ensure has a <head/> diff --git a/ebook_converter/ebooks/oeb/polish/container.py b/ebook_converter/ebooks/oeb/polish/container.py index e3b9530..2ee2957 100644 --- a/ebook_converter/ebooks/oeb/polish/container.py +++ b/ebook_converter/ebooks/oeb/polish/container.py @@ -14,7 +14,9 @@ from itertools import count import urllib.parse from css_parser import getUrls, replaceUrls +from lxml import etree +from ebook_converter import constants as const from ebook_converter import CurrentDir, walk from ebook_converter.constants_old import iswindows from ebook_converter.customize.ui import plugin_for_input_format, plugin_for_output_format @@ -34,7 +36,7 @@ from ebook_converter.ebooks.mobi import MobiError from ebook_converter.ebooks.mobi.reader.headers import MetadataHeader from ebook_converter.ebooks.mobi.tweak import set_cover from ebook_converter.ebooks.oeb.base import ( - DC11_NS, OEB_DOCS, OEB_STYLES, OPF, OPF2_NS, Manifest, itercsslinks, iterlinks, + OEB_DOCS, OEB_STYLES, Manifest, itercsslinks, iterlinks, rewrite_links, serialize, urlquote, urlunquote ) from ebook_converter.ebooks.oeb.parse_utils import NotHTML, parse_html @@ -47,13 +49,11 @@ from ebook_converter.ptempfile import PersistentTemporaryDirectory, PersistentTe from 
ebook_converter.utils.filenames import hardlink_file, nlinks_file from ebook_converter.utils.ipc.simple_worker import WorkerError, fork_job from ebook_converter.utils.logging import default_log -from ebook_converter.utils.xml_parse import safe_xml_fromstring from ebook_converter.utils.zipfile import ZipFile exists, join, relpath = os.path.exists, os.path.join, os.path.relpath OEB_FONTS = {guess_type('a.ttf'), guess_type('b.otf'), guess_type('a.woff'), 'application/x-font-ttf', 'application/x-font-otf', 'application/font-sfnt'} -OPF_NAMESPACES = {'opf':OPF2_NS, 'dc':DC11_NS} null = object() @@ -195,7 +195,7 @@ class ContainerBase(object): # {{{ data, self.used_encoding = xml_to_unicode( data, strip_encoding_pats=True, assume_utf8=True, resolve_entities=True) data = unicodedata.normalize('NFC', data) - return safe_xml_fromstring(data) + return etree.fromstring(data) def parse_xhtml(self, data, fname='<string>', force_html5_parse=False): if self.tweak_mode: @@ -324,7 +324,7 @@ class Container(ContainerBase): # {{{ item_id = 'id' + '%d'%c manifest = self.opf_xpath('//opf:manifest')[0] href = self.name_to_href(name, self.opf_name) - item = manifest.makeelement(OPF('item'), + item = manifest.makeelement(const.OPF_ITEM, id=item_id, href=href) item.set('media-type', self.mime_map[name]) self.insert_into_xml(manifest, item) @@ -380,7 +380,7 @@ class Container(ContainerBase): # {{{ if mt in OEB_DOCS: manifest = self.opf_xpath('//opf:manifest')[0] spine = self.opf_xpath('//opf:spine')[0] - si = manifest.makeelement(OPF('itemref'), idref=item_id) + si = manifest.makeelement(const.OPF_ITEMREF, idref=item_id) self.insert_into_xml(spine, si, index=spine_index) return name @@ -533,7 +533,7 @@ class Container(ContainerBase): # {{{ def opf_xpath(self, expr): ' Convenience method to evaluate an XPath expression on the OPF file, has the opf: and dc: namespace prefixes pre-defined. 
' - return self.opf.xpath(expr, namespaces=OPF_NAMESPACES) + return self.opf.xpath(expr, namespaces=const.OPF_NAMESPACES) def has_name(self, name): ''' Return True iff a file with the same canonical name as that specified exists. Unlike :meth:`exists` this method is always case-sensitive. ''' @@ -813,7 +813,8 @@ class Container(ContainerBase): # {{{ spine = self.opf_xpath('//opf:spine')[0] spine.text = tail for name, linear in spine_items: - i = spine.makeelement('{%s}itemref' % OPF_NAMESPACES['opf'], nsmap={'opf':OPF_NAMESPACES['opf']}) + i = spine.makeelement(const.OPF_ITEMREF, + nsmap={'opf': const.OPF2_NS}) i.tail = tail i.set('idref', imap[name]) spine.append(i) @@ -944,7 +945,7 @@ class Container(ContainerBase): # {{{ item_id = id_prefix + '%d'%c manifest = self.opf_xpath('//opf:manifest')[0] - item = manifest.makeelement(OPF('item'), + item = manifest.makeelement(const.OPF_ITEM, id=item_id, href=href) item.set('media-type', media_type) self.insert_into_xml(manifest, item) @@ -993,7 +994,7 @@ class Container(ContainerBase): # {{{ self.format_opf() data = serialize(data, self.mime_map[name], pretty_print=name in self.pretty_print) - if name == self.opf_name and root.nsmap.get(None) == OPF2_NS: + if name == self.opf_name and root.nsmap.get(None) == const.OPF2_NS: # Needed as I can't get lxml to output opf:role and # not output <opf:metadata> as well data = re.sub(br'(<[/]{0,1})opf:', r'\1', data) @@ -1172,7 +1173,7 @@ class EpubContainer(Container): container_path = join(self.root, 'META-INF', 'container.xml') if not exists(container_path): raise InvalidEpub('No META-INF/container.xml in epub') - container = safe_xml_fromstring(open(container_path, 'rb').read()) + container = etree.fromstring(open(container_path, 'rb').read()) opf_files = container.xpath(( r'child::ocf:rootfiles/ocf:rootfile' '[@media-type="%s" and @full-path]'%guess_type('a.opf') diff --git a/ebook_converter/ebooks/oeb/polish/css.py b/ebook_converter/ebooks/oeb/polish/css.py index 
ef7a5b7..43b209c 100644 --- a/ebook_converter/ebooks/oeb/polish/css.py +++ b/ebook_converter/ebooks/oeb/polish/css.py @@ -2,10 +2,11 @@ from collections import defaultdict from functools import partial from css_parser.css import CSSRule, CSSStyleDeclaration -from ebook_converter.css_selectors import parse, SelectorSyntaxError +from ebook_converter import constants as const from ebook_converter import force_unicode -from ebook_converter.ebooks.oeb.base import OEB_STYLES, OEB_DOCS, XHTML, css_text +from ebook_converter.css_selectors import parse, SelectorSyntaxError +from ebook_converter.ebooks.oeb.base import OEB_STYLES, OEB_DOCS, css_text from ebook_converter.ebooks.oeb.normalize_css import normalize_filter_css, normalizers from ebook_converter.ebooks.oeb.polish.pretty import pretty_script_or_style, pretty_xml_tree, serialize from ebook_converter.utils.icu import numeric_sort_key @@ -382,7 +383,7 @@ def add_stylesheet_links(container, name, text): if not sheets: return for sname in sheets: - link = head.makeelement(XHTML('link'), type='text/css', rel='stylesheet', href=container.name_to_href(sname, name)) + link = head.makeelement(const.XHTML_LINK, type='text/css', rel='stylesheet', href=container.name_to_href(sname, name)) head.append(link) pretty_xml_tree(head) return serialize(root, 'text/html') diff --git a/ebook_converter/ebooks/oeb/polish/opf.py b/ebook_converter/ebooks/oeb/polish/opf.py index b66adcb..77cd848 100644 --- a/ebook_converter/ebooks/oeb/polish/opf.py +++ b/ebook_converter/ebooks/oeb/polish/opf.py @@ -1,13 +1,9 @@ from lxml import etree -from ebook_converter.ebooks.oeb.polish.container import OPF_NAMESPACES +from ebook_converter import constants as const from ebook_converter.utils.localization import canonicalize_lang -__license__ = 'GPL v3' -__copyright__ = '2014, Kovid Goyal <kovid at kovidgoyal.net>' - - def get_book_language(container): for lang in container.opf_xpath('//dc:language'): raw = lang.text @@ -18,7 +14,7 @@ def 
get_book_language(container): def set_guide_item(container, item_type, title, name, frag=None): - ref_tag = '{%s}reference' % OPF_NAMESPACES['opf'] + ref_tag = const.OPF_REFERENCE href = None if name: href = container.name_to_href(name, container.opf_name) @@ -27,23 +23,27 @@ def set_guide_item(container, item_type, title, name, frag=None): guides = container.opf_xpath('//opf:guide') if not guides and href: - g = container.opf.makeelement('{%s}guide' % OPF_NAMESPACES['opf'], nsmap={'opf':OPF_NAMESPACES['opf']}) + g = container.opf.makeelement(const.OPF_GUIDE, + nsmap={'opf': const.OPF2_NS}) container.insert_into_xml(container.opf, g) guides = [g] for guide in guides: matches = [] for child in guide.iterchildren(etree.Element): - if child.tag == ref_tag and child.get('type', '').lower() == item_type.lower(): + if (child.tag == ref_tag and + child.get('type', '').lower() == item_type.lower()): matches.append(child) if not matches and href: - r = guide.makeelement(ref_tag, type=item_type, nsmap={'opf':OPF_NAMESPACES['opf']}) + r = guide.makeelement(ref_tag, type=item_type, + nsmap={'opf': const.OPF2_NS}) container.insert_into_xml(guide, r) matches.append(r) for m in matches: if href: - m.set('title', title), m.set('href', href), m.set('type', item_type) + m.set('title', title) + m.set('href', href) + m.set('type', item_type) else: container.remove_from_xml(m) container.dirty(container.opf_name) - diff --git a/ebook_converter/ebooks/oeb/polish/parsing.py b/ebook_converter/ebooks/oeb/polish/parsing.py index d847094..99cbd5e 100644 --- a/ebook_converter/ebooks/oeb/polish/parsing.py +++ b/ebook_converter/ebooks/oeb/polish/parsing.py @@ -1,21 +1,18 @@ import re -from lxml.etree import Element as LxmlElement +from lxml import etree import html5_parser +from ebook_converter import constants as const from ebook_converter import xml_replace_entities -from ebook_converter.utils.xml_parse import safe_xml_fromstring -from ebook_converter.ebooks.chardet import xml_to_unicode, 
strip_encoding_declarations +from ebook_converter.ebooks.chardet import strip_encoding_declarations +from ebook_converter.ebooks.chardet import xml_to_unicode from ebook_converter.utils.cleantext import clean_xml_chars -__license__ = 'GPL v3' -__copyright__ = '2013, Kovid Goyal <kovid at kovidgoyal.net>' - -XHTML_NS = 'http://www.w3.org/1999/xhtml' - - -def parse_html5(raw, decoder=None, log=None, discard_namespaces=False, line_numbers=True, linenumber_attribute=None, replace_entities=True, fix_newlines=True): +def parse_html5(raw, decoder=None, log=None, discard_namespaces=False, + line_numbers=True, linenumber_attribute=None, + replace_entities=True, fix_newlines=True): if isinstance(raw, bytes): raw = xml_to_unicode(raw)[0] if decoder is None else decoder(raw) if replace_entities: @@ -23,10 +20,14 @@ def parse_html5(raw, decoder=None, log=None, discard_namespaces=False, line_numb if fix_newlines: raw = raw.replace('\r\n', '\n').replace('\r', '\n') raw = clean_xml_chars(raw) - root = html5_parser.parse(raw, maybe_xhtml=not discard_namespaces, line_number_attr=linenumber_attribute, keep_doctype=False, sanitize_names=True) - if (discard_namespaces and root.tag != 'html') or ( - not discard_namespaces and (root.tag != '{%s}%s' % (XHTML_NS, 'html') or root.prefix)): - raise ValueError('Failed to parse correctly, root has tag: %s and prefix: %s' % (root.tag, root.prefix)) + root = html5_parser.parse(raw, maybe_xhtml=not discard_namespaces, + line_number_attr=linenumber_attribute, + keep_doctype=False, sanitize_names=True) + if ((discard_namespaces and root.tag != 'html') or + (not discard_namespaces and + (root.tag != '{%s}%s' % (const.XHTML_NS, 'html') or root.prefix))): + raise ValueError('Failed to parse correctly, root has tag: %s and ' + 'prefix: %s' % (root.tag, root.prefix)) return root @@ -48,12 +49,14 @@ def handle_private_entities(data): user_entities[match.group(1)] = val if user_entities: data = ('\n' * num_of_nl_in_pre) + data[idx:] - pat = 
re.compile(r'&(%s);'%('|'.join(user_entities.keys())))
-        data = pat.sub(lambda m:user_entities[m.group(1)], data)
+        pat = re.compile(r'&(%s);' % ('|'.join(user_entities.keys())))
+        data = pat.sub(lambda m: user_entities[m.group(1)], data)
     return data
 
 
-def parse(raw, decoder=None, log=None, line_numbers=True, linenumber_attribute=None, replace_entities=True, force_html5_parse=False):
+def parse(raw, decoder=None, log=None, line_numbers=True,
+          linenumber_attribute=None, replace_entities=True,
+          force_html5_parse=False):
     if isinstance(raw, bytes):
         raw = xml_to_unicode(raw)[0] if decoder is None else decoder(raw)
     raw = handle_private_entities(raw)
@@ -70,26 +73,32 @@ def parse(raw, decoder=None, log=None, line_numbers=True, linenumber_attribute=N
             raw = ('\n' * newlines) + raw[match.start():]
             break
 
-    raw = strip_encoding_declarations(raw, limit=10*1024, preserve_newlines=True)
+    raw = strip_encoding_declarations(raw, limit=10*1024,
+                                      preserve_newlines=True)
     if force_html5_parse:
-        return parse_html5(raw, log=log, line_numbers=line_numbers, linenumber_attribute=linenumber_attribute, replace_entities=False, fix_newlines=False)
+        return parse_html5(raw, log=log, line_numbers=line_numbers,
+                           linenumber_attribute=linenumber_attribute,
+                           replace_entities=False, fix_newlines=False)
     try:
-        ans = safe_xml_fromstring(raw, recover=False)
-        if ans.tag != '{%s}html' % XHTML_NS:
+        ans = etree.fromstring(raw)
+        if ans.tag != '{%s}html' % const.XHTML_NS:
             raise ValueError('Root tag is not <html> in the XHTML namespace')
         if linenumber_attribute:
-            for elem in ans.iter(LxmlElement):
+            for elem in ans.iter(etree.Element):
                 if elem.sourceline is not None:
                     elem.set(linenumber_attribute, str(elem.sourceline))
         return ans
     except Exception:
         if log is not None:
             log.exception('Failed to parse as XML, parsing as tag soup')
-        return parse_html5(raw, 
log=log, line_numbers=line_numbers, + linenumber_attribute=linenumber_attribute, + replace_entities=False, fix_newlines=False) if __name__ == '__main__': - from lxml import etree - root = parse_html5('\n<html><head><title>a\n

 \nb', discard_namespaces=False) + root = parse_html5('\na\n

 ' + '\nb', + discard_namespaces=False) print(etree.tostring(root, encoding='utf-8')) print() diff --git a/ebook_converter/ebooks/oeb/polish/pretty.py b/ebook_converter/ebooks/oeb/polish/pretty.py index 402a546..8620f9e 100644 --- a/ebook_converter/ebooks/oeb/polish/pretty.py +++ b/ebook_converter/ebooks/oeb/polish/pretty.py @@ -2,10 +2,10 @@ import textwrap # from lxml.etree import Element +from ebook_converter import constants as const from ebook_converter import force_unicode -from ebook_converter.ebooks.oeb.base import ( - serialize, OEB_DOCS, barename, OEB_STYLES, XPNSMAP, XHTML, SVG) -from ebook_converter.ebooks.oeb.polish.container import OPF_NAMESPACES +from ebook_converter.ebooks.oeb import parse_utils +from ebook_converter.ebooks.oeb.base import serialize, OEB_DOCS, OEB_STYLES from ebook_converter.ebooks.oeb.polish.utils import guess_type from ebook_converter.utils.icu import sort_key @@ -38,15 +38,15 @@ def pretty_opf(root): # Put all dc: tags first starting with title and author. Preserve order for # the rest. 
def dckey(x): - return {'title':0, 'creator':1}.get(barename(x.tag), 2) - for metadata in root.xpath('//opf:metadata', namespaces=OPF_NAMESPACES): - dc_tags = metadata.xpath('./*[namespace-uri()="%s"]' % OPF_NAMESPACES['dc']) + return {'title':0, 'creator':1}.get(parse_utils.barename(x.tag), 2) + for metadata in root.xpath('//opf:metadata', namespaces=const.OPF_NAMESPACES): + dc_tags = metadata.xpath('./*[namespace-uri()="%s"]' % const.DC11_NS) dc_tags.sort(key=dckey) for x in reversed(dc_tags): metadata.insert(0, x) # Group items in the manifest - spine_ids = root.xpath('//opf:spine/opf:itemref/@idref', namespaces=OPF_NAMESPACES) + spine_ids = root.xpath('//opf:spine/opf:itemref/@idref', namespaces=const.OPF_NAMESPACES) spine_ids = {x:i for i, x in enumerate(spine_ids)} def manifest_key(x): @@ -75,7 +75,7 @@ def pretty_opf(root): i = sort_key(href) return (cat, i) - for manifest in root.xpath('//opf:manifest', namespaces=OPF_NAMESPACES): + for manifest in root.xpath('//opf:manifest', namespaces=const.OPF_NAMESPACES): try: children = sorted(manifest, key=manifest_key) except AttributeError: @@ -84,19 +84,11 @@ def pretty_opf(root): manifest.insert(0, x) -SVG_TAG = SVG('svg') -BLOCK_TAGS = frozenset(map(XHTML, ( - 'address', 'article', 'aside', 'audio', 'blockquote', 'body', 'canvas', 'col', 'colgroup', 'dd', - 'div', 'dl', 'dt', 'fieldset', 'figcaption', 'figure', 'footer', 'form', - 'h1', 'h2', 'h3', 'h4', 'h5', 'h6', 'header', 'hgroup', 'hr', 'li', - 'noscript', 'ol', 'output', 'p', 'pre', 'script', 'section', 'style', 'table', 'tbody', 'td', - 'tfoot', 'th', 'thead', 'tr', 'ul', 'video', 'img'))) | {SVG_TAG} - def isblock(x): if callable(x.tag) or not x.tag: return True - if x.tag in BLOCK_TAGS: + if x.tag in const.XHTML_BLOCK_TAGS | {const.SVG_SVG}: return True return False @@ -141,12 +133,12 @@ def pretty_block(parent, level=1, indent=' '): that contain only other block tags ''' if not parent.text or isspace(parent.text): parent.text = '' - nn = '\n' if 
hasattr(parent.tag, 'strip') and barename(parent.tag) in {'tr', 'td', 'th'} else '\n\n' + nn = '\n' if hasattr(parent.tag, 'strip') and parse_utils.barename(parent.tag) in {'tr', 'td', 'th'} else '\n\n' parent.text = parent.text + nn + (indent * level) for i, child in enumerate(parent): if isblock(child) and has_only_blocks(child): pretty_block(child, level=level+1, indent=indent) - elif child.tag == SVG_TAG: + elif child.tag == const.SVG_SVG: pretty_xml_tree(child, level=level, indent=indent) l = level if i == len(parent) - 1: @@ -172,13 +164,13 @@ def pretty_html_tree(container, root): child.tail = '\n\n' if hasattr(child.tag, 'endswith') and child.tag.endswith('}head'): pretty_xml_tree(child) - for body in root.findall('h:body', namespaces=XPNSMAP): + for body in root.findall('h:body', namespaces=const.XPNSMAP): pretty_block(body) # Special case the handling of a body that contains a single block tag # with all content. In this case we prettify the containing block tag # even if it has non block children. 
if (len(body) == 1 and not callable(body[0].tag) and isblock(body[0]) and not has_only_blocks( - body[0]) and barename(body[0].tag) not in ( + body[0]) and parse_utils.barename(body[0].tag) not in ( 'pre', 'p', 'h1', 'h2', 'h3', 'h4', 'h5', 'h6') and len(body[0]) > 0): pretty_block(body[0], level=2) diff --git a/ebook_converter/ebooks/oeb/polish/split.py b/ebook_converter/ebooks/oeb/polish/split.py index 568aefa..36b8a67 100644 --- a/ebook_converter/ebooks/oeb/polish/split.py +++ b/ebook_converter/ebooks/oeb/polish/split.py @@ -1,7 +1,11 @@ -import copy, os, re +import copy +import os +import re import urllib.parse -from ebook_converter.ebooks.oeb.base import barename, XPNSMAP, XPath, OPF, XHTML, OEB_DOCS +from ebook_converter import constants as const +from ebook_converter.ebooks.oeb import base +from ebook_converter.ebooks.oeb import parse_utils from ebook_converter.ebooks.oeb.polish.errors import MalformedMarkup from ebook_converter.ebooks.oeb.polish.toc import node_from_loc from ebook_converter.ebooks.oeb.polish.replace import LinkRebaser @@ -35,7 +39,7 @@ def adjust_split_point(split_point, log): parent = sp.getparent() if ( parent is None or - barename(parent.tag) in {'body', 'html'} or + parse_utils.barename(parent.tag) in {'body', 'html'} or (parent.text and parent.text.strip()) or parent.index(sp) > 0 ): @@ -49,7 +53,7 @@ def adjust_split_point(split_point, log): def get_body(root): - return root.find('h:body', namespaces=XPNSMAP) + return root.find('h:body', namespaces=const.XPNSMAP) def do_split(split_point, log, before=True): @@ -113,7 +117,7 @@ def do_split(split_point, log, before=True): nix_element(elem) # Tree 2 - ancestors = frozenset(XPath('ancestor::*')(split_point2)) + ancestors = frozenset(base.XPath('ancestor::*')(split_point2)) for elem in tuple(body2.iterdescendants()): if elem is split_point2: if not before: @@ -251,7 +255,7 @@ def split(container, name, loc_or_xpath, before=True, totals=None): break index = spine.index(spine_item) + 1 - si 
= spine.makeelement(OPF('itemref'), idref=manifest_item.get('id')) + si = spine.makeelement(base.tag('opf', 'itemref'), idref=manifest_item.get('id')) if not linear: si.set('linear', 'no') container.insert_into_xml(spine, si, index=index) @@ -268,7 +272,7 @@ def multisplit(container, name, xpath, before=True): :param before: If True the splits occur before the identified element otherwise after it. ''' root = container.parsed(name) - nodes = root.xpath(xpath, namespaces=XPNSMAP) + nodes = root.xpath(xpath, namespaces=const.XPNSMAP) if not nodes: raise AbortError('The expression %s did not match any nodes' % xpath) for split_point in nodes: @@ -329,7 +333,7 @@ def all_anchors(root): def all_stylesheets(container, name): - for link in XPath('//h:head/h:link[@href]')(container.parsed(name)): + for link in base.XPath('//h:head/h:link[@href]')(container.parsed(name)): name = container.href_to_name(link.get('href'), name) typ = link.get('type', 'text/css') if typ == 'text/css': @@ -358,14 +362,14 @@ def merge_html(container, names, master, insert_page_breaks=False): root = p(master) # Ensure master has a - head = root.find('h:head', namespaces=XPNSMAP) + head = root.find('h:head', namespaces=const.XPNSMAP) if head is None: - head = root.makeelement(XHTML('head')) + head = root.makeelement(base.tag('xhtml', 'head')) container.insert_into_xml(root, head, 0) seen_anchors = all_anchors(root) seen_stylesheets = set(all_stylesheets(container, master)) - master_body = p(master).findall('h:body', namespaces=XPNSMAP)[-1] + master_body = p(master).findall('h:body', namespaces=const.XPNSMAP)[-1] master_base = os.path.dirname(master) anchor_map = {n:{} for n in names if n != master} first_anchor_map = {} @@ -377,7 +381,7 @@ def merge_html(container, names, master, insert_page_breaks=False): for sheet in all_stylesheets(container, name): if sheet not in seen_stylesheets: seen_stylesheets.add(sheet) - link = head.makeelement(XHTML('link'), rel='stylesheet', type='text/css', 
href=container.name_to_href(sheet, master)) + link = head.makeelement(base.tag('xhtml', 'link'), rel='stylesheet', type='text/css', href=container.name_to_href(sheet, master)) container.insert_into_xml(head, link) # Rebase links if master is in a different directory @@ -386,7 +390,7 @@ def merge_html(container, names, master, insert_page_breaks=False): root = p(name) children = [] - for body in p(name).findall('h:body', namespaces=XPNSMAP): + for body in p(name).findall('h:body', namespaces=const.XPNSMAP): children.append(body.text if body.text and body.text.strip() else '\n\n') children.extend(body) @@ -396,7 +400,7 @@ def merge_html(container, names, master, insert_page_breaks=False): break if isinstance(first_child, (str, bytes)): # body contained only text, no tags - first_child = body.makeelement(XHTML('p')) + first_child = body.makeelement(base.tag('xhtml', 'p')) first_child.text, children[0] = children[0], first_child amap = anchor_map[name] @@ -424,7 +428,7 @@ def merge_html(container, names, master, insert_page_breaks=False): amap[''] = first_child.get('id') # Fix links that point to local changed anchors - for a in XPath('//h:a[starts-with(@href, "#")]')(root): + for a in base.XPath('//h:a[starts-with(@href, "#")]')(root): q = a.get('href')[1:] if q in amap: a.set('href', '#' + amap[q]) @@ -472,10 +476,10 @@ def merge_css(container, names, master): # Remove links to merged stylesheets in the html files, replacing with a # link to the master sheet for name, mt in container.mime_map.items(): - if mt in OEB_DOCS: + if mt in base.OEB_DOCS: removed = False root = p(name) - for link in XPath('//h:link[@href]')(root): + for link in base.XPath('//h:link[@href]')(root): q = container.href_to_name(link.get('href'), name) if q in merged: container.remove_from_xml(link) @@ -483,9 +487,9 @@ def merge_css(container, names, master): if removed: container.dirty(name) if removed and master not in set(all_stylesheets(container, name)): - head = root.find('h:head', 
namespaces=XPNSMAP) + head = root.find('h:head', namespaces=const.XPNSMAP) if head is not None: - link = head.makeelement(XHTML('link'), type='text/css', rel='stylesheet', href=container.name_to_href(master, name)) + link = head.makeelement(base.tag('xhtml', 'link'), type='text/css', rel='stylesheet', href=container.name_to_href(master, name)) container.insert_into_xml(head, link) diff --git a/ebook_converter/ebooks/oeb/polish/toc.py b/ebook_converter/ebooks/oeb/polish/toc.py index 15f94b4..42af230 100644 --- a/ebook_converter/ebooks/oeb/polish/toc.py +++ b/ebook_converter/ebooks/oeb/polish/toc.py @@ -1,16 +1,16 @@ -import re -from collections import Counter, OrderedDict -from functools import partial -from operator import itemgetter +import collections +import functools +import operator import pkg_resources +import re import urllib.parse from lxml import etree from lxml.builder import ElementMaker from ebook_converter import __version__ -from ebook_converter.ebooks.oeb.base import ( - XPath, uuid_id, xml2text, NCX, NCX_NS, XML, XHTML, XHTML_NS, serialize, EPUB_NS, XML_NS, OEB_DOCS) +from ebook_converter import constants as const +from ebook_converter.ebooks.oeb import base from ebook_converter.ebooks.oeb.polish.errors import MalformedMarkup from ebook_converter.ebooks.oeb.polish.utils import guess_type, extract from ebook_converter.ebooks.oeb.polish.opf import set_guide_item, get_book_language @@ -18,10 +18,6 @@ from ebook_converter.ebooks.oeb.polish.pretty import pretty_html_tree from ebook_converter.utils.localization import get_lang, canonicalize_lang, lang_as_iso639_1 -__license__ = 'GPL v3' -__copyright__ = '2013, Kovid Goyal ' -__docformat__ = 'restructuredtext en' - ns = etree.FunctionNamespace('calibre_xpath_extensions') ns.prefix = 'calibre' ns['lower-case'] = lambda c, x: x.lower() if hasattr(x, 'lower') else x @@ -81,7 +77,8 @@ class TOC(object): seen = set() remove = [] for child in self: - key = child.title if only_text else (child.title, child.dest, 
(child.frag or None)) + key = child.title if only_text else (child.title, child.dest, + (child.frag or None)) if key in seen: remove.append(child) else: @@ -104,7 +101,7 @@ class TOC(object): def get_lines(self, lvl=0): frag = ('#'+self.frag) if self.frag else '' - ans = [('\t'*lvl) + 'TOC: %s --> %s%s'%(self.title, self.dest, frag)] + ans = [('\t'*lvl) + 'TOC: %s --> %s%s' % (self.title, self.dest, frag)] for child in self: ans.extend(child.get_lines(lvl+1)) return ans @@ -113,10 +110,8 @@ class TOC(object): return '\n'.join(self.get_lines()) def to_dict(self, node_counter=None): - ans = { - 'title':self.title, 'dest':self.dest, 'frag':self.frag, - 'children':[c.to_dict(node_counter) for c in self.children] - } + ans = {'title': self.title, 'dest': self.dest, 'frag': self.frag, + 'children': [c.to_dict(node_counter) for c in self.children]} if self.dest_exists is not None: ans['dest_exists'] = self.dest_exists if self.dest_error is not None: @@ -131,7 +126,7 @@ class TOC(object): def child_xpath(tag, name): - return tag.xpath('./*[calibre:lower-case(local-name()) = "%s"]'%name) + return tag.xpath('./*[calibre:lower-case(local-name()) = "%s"]' % name) def add_from_navpoint(container, navpoint, parent, ncx_name): @@ -142,7 +137,7 @@ def add_from_navpoint(container, navpoint, parent, ncx_name): text = '' for txt in child_xpath(nl, 'text'): text += etree.tostring(txt, method='text', - encoding='unicode', with_tail=False) + encoding='unicode', with_tail=False) content = child_xpath(navpoint, 'content') if content: content = content[0] @@ -154,7 +149,8 @@ def add_from_navpoint(container, navpoint, parent, ncx_name): def process_ncx_node(container, node, toc_parent, ncx_name): - for navpoint in node.xpath('./*[calibre:lower-case(local-name()) = "navpoint"]'): + for navpoint in node.xpath('./*[calibre:lower-case(local-name()) ' + '= "navpoint"]'): child = add_from_navpoint(container, navpoint, toc_parent, ncx_name) if child is not None: process_ncx_node(container, 
navpoint, child, ncx_name) @@ -171,29 +167,38 @@ def parse_ncx(container, ncx_name): if attr.endswith('lang'): toc_root.lang = str(val) break - for uid in root.xpath('//*[calibre:lower-case(local-name()) = "meta" and @name="dtb:uid"]/@content'): + for uid in root.xpath('//*[calibre:lower-case(local-name()) = "meta" and ' + '@name="dtb:uid"]/@content'): if uid: toc_root.uid = str(uid) break for pl in root.xpath('//*[calibre:lower-case(local-name()) = "pagelist"]'): - for pt in pl.xpath('descendant::*[calibre:lower-case(local-name()) = "pagetarget"]'): + for pt in pl.xpath('descendant::*[calibre:lower-case(local-name()) = ' + '"pagetarget"]'): pagenum = pt.get('value') if pagenum: - href = pt.xpath('descendant::*[calibre:lower-case(local-name()) = "content"]/@src') + href = pt.xpath('descendant::*[calibre:lower-case(local-name()' + ') = "content"]/@src') if href: dest = container.href_to_name(href[0], base=ncx_name) frag = urllib.parse.urlparse(href[0]).fragment or None - toc_root.page_list.append({'dest': dest, 'pagenum': pagenum, 'frag': frag}) + toc_root.page_list.append({'dest': dest, + 'pagenum': pagenum, + 'frag': frag}) return toc_root def add_from_li(container, li, parent, nav_name): dest = frag = text = None - for x in li.iterchildren(XHTML('a'), XHTML('span')): - text = etree.tostring(x, method='text', encoding='unicode', with_tail=False).strip() or ' '.join(x.xpath('descendant-or-self::*/@title')).strip() + for x in li.iterchildren(base.tag('xhtml', 'a'), + base.tag('xhtml', 'span')): + text = (etree.tostring(x, method='text', encoding='unicode', + with_tail=False).strip() or + ' '.join(x.xpath('descendant-or-self::*/@title')).strip()) href = x.get('href') if href: - dest = nav_name if href.startswith('#') else container.href_to_name(href, base=nav_name) + dest = (nav_name if href.startswith('#') else + container.href_to_name(href, base=nav_name)) frag = urllib.parse.urlparse(href).fragment or None break return parent.add(text or None, dest or None, frag 
or None) @@ -207,9 +212,9 @@ def first_child(parent, tagname): def process_nav_node(container, node, toc_parent, nav_name): - for li in node.iterchildren(XHTML('li')): + for li in node.iterchildren(base.tag('xhtml', 'li')): child = add_from_li(container, li, toc_parent, nav_name) - ol = first_child(li, XHTML('ol')) + ol = first_child(li, base.tag('xhtml', 'ol')) if child is not None and ol is not None: process_nav_node(container, ol, child, nav_name) @@ -218,14 +223,16 @@ def parse_nav(container, nav_name): root = container.parsed(nav_name) toc_root = TOC() toc_root.lang = toc_root.uid = None - et = '{%s}type' % EPUB_NS - for nav in root.iterdescendants(XHTML('nav')): - if nav.get(et) == 'toc': - ol = first_child(nav, XHTML('ol')) + xhtml = functools.partial(base.tag, 'xhtml') + for nav in root.iterdescendants(base.tag('xhtml', 'nav')): + if nav.get(base.tag('epub', 'type')) == 'toc': + ol = first_child(nav, base.tag('xhtml', 'ol')) if ol is not None: process_nav_node(container, ol, toc_root, nav_name) - for h in nav.iterchildren(*map(XHTML, 'h1 h2 h3 h4 h5 h6'.split())): - text = etree.tostring(h, method='text', encoding='unicode', with_tail=False) or h.get('title') + for h in nav.iterchildren(*map(xhtml, + 'h1 h2 h3 h4 h5 h6'.split())): + text = etree.tostring(h, method='text', encoding='unicode', + with_tail=False) or h.get('title') if text: toc_root.toc_title = text break @@ -235,7 +242,7 @@ def parse_nav(container, nav_name): def verify_toc_destinations(container, toc): anchor_map = {} - anchor_xpath = XPath('//*/@id|//h:a/@name') + anchor_xpath = base.XPath('//*/@id|//h:a/@name') for item in toc.iterdescendants(): name = item.dest if not name: @@ -284,7 +291,8 @@ def get_x_toc(container, find_toc, parse_toc, verify_destinations=True): ans.lang = ans.uid = None return ans toc = find_toc(container) - ans = empty_toc() if toc is None or not container.has_name(toc) else parse_toc(container, toc) + ans = (empty_toc() if toc is None or not container.has_name(toc) 
else
+           parse_toc(container, toc))
     ans.toc_file_name = toc if toc and container.has_name(toc) else None
     if verify_destinations:
         verify_toc_destinations(container, ans)
@@ -294,11 +302,14 @@ def get_x_toc(container, find_toc, parse_toc, verify_destinations=True):
 def get_toc(container, verify_destinations=True):
     ver = container.opf_version_parsed
     if ver.major < 3:
-        return get_x_toc(container, find_existing_ncx_toc, parse_ncx, verify_destinations=verify_destinations)
+        return get_x_toc(container, find_existing_ncx_toc, parse_ncx,
+                         verify_destinations=verify_destinations)
     else:
-        ans = get_x_toc(container, find_existing_nav_toc, parse_nav, verify_destinations=verify_destinations)
+        ans = get_x_toc(container, find_existing_nav_toc, parse_nav,
+                        verify_destinations=verify_destinations)
         if len(ans) == 0:
-            ans = get_x_toc(container, find_existing_ncx_toc, parse_ncx, verify_destinations=verify_destinations)
+            ans = get_x_toc(container, find_existing_ncx_toc, parse_ncx,
+                            verify_destinations=verify_destinations)
     return ans
@@ -308,25 +319,33 @@ def get_guide_landmarks(container):
         href, frag = href.partition('#')[::2]
         name = container.href_to_name(href, container.opf_name)
         if container.has_name(name):
-            yield {'dest':name, 'frag':frag, 'title':title or '', 'type':rtype or ''}
+            yield {'dest': name,
+                   'frag': frag,
+                   'title': title or '',
+                   'type': rtype or ''}
 
 
 def get_nav_landmarks(container):
     nav = find_existing_nav_toc(container)
     if nav and container.has_name(nav):
         root = container.parsed(nav)
-        et = '{%s}type' % EPUB_NS
-        for elem in root.iterdescendants(XHTML('nav')):
+        et = base.tag('epub', 'type')
+        for elem in root.iterdescendants(base.tag('xhtml', 'nav')):
             if elem.get(et) == 'landmarks':
-                for li in elem.iterdescendants(XHTML('li')):
-                    for a in li.iterdescendants(XHTML('a')):
+                for li in elem.iterdescendants(base.tag('xhtml', 'li')):
+                    for a in li.iterdescendants(base.tag('xhtml', 'a')):
                         href, rtype = a.get('href'), a.get(et)
                         if href:
-                            title = etree.tostring(a, 
method='text', encoding='unicode', with_tail=False).strip() + title = etree.tostring(a, method='text', + encoding='unicode', + with_tail=False).strip() href, frag = href.partition('#')[::2] name = container.href_to_name(href, nav) if container.has_name(name): - yield {'dest':name, 'frag':frag, 'title':title or '', 'type':rtype or ''} + yield {'dest': name, + 'frag': frag, + 'title': title or '', + 'type': rtype or ''} break @@ -344,7 +363,7 @@ def ensure_id(elem, all_ids): elem_id = elem.get('id') if elem_id: return False, elem_id - if elem.tag == XHTML('a'): + if elem.tag == base.tag('xhtml', 'a'): anchor = elem.get('name', None) if anchor: elem.set('id', anchor) @@ -361,7 +380,7 @@ def ensure_id(elem, all_ids): def elem_to_toc_text(elem): - text = xml2text(elem).strip() + text = base.xml2text(elem).strip() if not text: text = elem.get('title', '') if not text: @@ -375,7 +394,7 @@ def elem_to_toc_text(elem): def item_at_top(elem): try: - body = XPath('//h:body')(elem.getroottree().getroot())[0] + body = base.XPath('//h:body')(elem.getroottree().getroot())[0] except (TypeError, IndexError, KeyError, AttributeError): return False tree = body.getroottree() @@ -387,7 +406,7 @@ def item_at_top(elem): try: if el.tag.endswith('}img') or (el.text and el.text.strip()): return False - except: + except Exception: return False if not path.startswith(epath): # Only check tail of non-parent elements @@ -404,24 +423,26 @@ def from_xpaths(container, xpaths): Table of Contents from the ``

``, ``

`` and ``

`` tags. ''' tocroot = TOC() - xpaths = [XPath(xp) for xp in xpaths] + xpaths = [base.XPath(xp) for xp in xpaths] # Find those levels that have no elements in all spine items - maps = OrderedDict() + maps = collections.OrderedDict() empty_levels = {i+1 for i, xp in enumerate(xpaths)} for spinepath in container.spine_items: name = container.abspath_to_name(spinepath) root = container.parsed(name) - level_item_map = maps[name] = {i+1:frozenset(xp(root)) for i, xp in enumerate(xpaths)} + level_item_map = maps[name] = {i + 1: frozenset(xp(root)) + for i, xp in enumerate(xpaths)} for lvl, elems in level_item_map.items(): if elems: empty_levels.discard(lvl) # Remove empty levels from all level_maps if empty_levels: for name, lmap in tuple(maps.items()): - lmap = {lvl:items for lvl, items in lmap.items() if lvl not in empty_levels} - lmap = sorted(lmap.items(), key=itemgetter(0)) - lmap = {i+1:items for i, (l, items) in enumerate(lmap)} + lmap = {lvl: items for lvl, items in lmap.items() + if lvl not in empty_levels} + lmap = sorted(lmap.items(), key=operator.itemgetter(0)) + lmap = {i + 1: items for i, (l, items) in enumerate(lmap)} maps[name] = lmap node_level_map = {tocroot: 0} @@ -434,13 +455,15 @@ def from_xpaths(container, xpaths): if child is None: return node lvl = node_level_map[child] - return node if lvl > limit else child if lvl == limit else process_node(child) + return (node if lvl > limit else + child if lvl == limit else process_node(child)) return process_node(tocroot) for name, level_item_map in maps.items(): root = container.parsed(name) - item_level_map = {e:i for i, elems in level_item_map.items() for e in elems} + item_level_map = {e: i for i, elems in level_item_map.items() + for e in elems} item_dirtied = False all_ids = set(root.xpath('//*/@id')) @@ -470,7 +493,7 @@ def from_links(container): Generate a Table of Contents from links in the book. 
''' toc = TOC() - link_path = XPath('//h:a[@href]') + link_path = base.XPath('//h:a[@href]') seen_titles, seen_dests = set(), set() for name, is_linear in container.spine_names: root = container.parsed(name) @@ -506,7 +529,7 @@ def find_text(node): pat = re.compile(r'\s+') for child in node: if isinstance(child, etree._Element): - text = xml2text(child).strip() + text = base.xml2text(child).strip() text = pat.sub(' ', text) if len(text) < 1: continue @@ -526,7 +549,7 @@ def from_files(container): for i, spinepath in enumerate(container.spine_items): name = container.abspath_to_name(spinepath) root = container.parsed(name) - body = XPath('//h:body')(root) + body = base.XPath('//h:body')(root) if not body: continue text = find_text(body[0]) @@ -576,42 +599,46 @@ def add_id(container, name, loc, totals=None): def create_ncx(toc, to_href, btitle, lang, uid): lang = lang.replace('_', '-') - ncx = etree.Element(NCX('ncx'), - attrib={'version': '2005-1', XML('lang'): lang}, - nsmap={None: NCX_NS}) - head = etree.SubElement(ncx, NCX('head')) - etree.SubElement(head, NCX('meta'), - name='dtb:uid', content=str(uid)) - etree.SubElement(head, NCX('meta'), - name='dtb:depth', content=str(toc.depth)) + ncx = etree.Element(base.tag('ncx', 'ncx'), + attrib={'version': '2005-1', + base.tag('xml', 'lang'): lang}, + nsmap={None: const.NCX_NS}) + head = etree.SubElement(ncx, base.tag('ncx', 'head')) + etree.SubElement(head, base.tag('ncx', 'meta'), + name='dtb:uid', content=str(uid)) + etree.SubElement(head, base.tag('ncx', 'meta'), + name='dtb:depth', content=str(toc.depth)) generator = ''.join(['calibre (', __version__, ')']) - etree.SubElement(head, NCX('meta'), - name='dtb:generator', content=generator) - etree.SubElement(head, NCX('meta'), name='dtb:totalPageCount', content='0') - etree.SubElement(head, NCX('meta'), name='dtb:maxPageNumber', content='0') - title = etree.SubElement(ncx, NCX('docTitle')) - text = etree.SubElement(title, NCX('text')) + etree.SubElement(head, 
base.tag('ncx', 'meta'), + name='dtb:generator', content=generator) + etree.SubElement(head, base.tag('ncx', 'meta'), name='dtb:totalPageCount', + content='0') + etree.SubElement(head, base.tag('ncx', 'meta'), name='dtb:maxPageNumber', + content='0') + title = etree.SubElement(ncx, base.tag('ncx', 'docTitle')) + text = etree.SubElement(title, base.tag('ncx', 'text')) text.text = btitle - navmap = etree.SubElement(ncx, NCX('navMap')) + navmap = etree.SubElement(ncx, base.tag('ncx', 'navMap')) spat = re.compile(r'\s+') - play_order = Counter() + play_order = collections.Counter() def process_node(xml_parent, toc_parent): for child in toc_parent: play_order['c'] += 1 - point = etree.SubElement(xml_parent, NCX('navPoint'), id='num_%d' % play_order['c'], - playOrder=str(play_order['c'])) - label = etree.SubElement(point, NCX('navLabel')) + point = etree.SubElement(xml_parent, base.tag('ncx', 'navPoint'), + id='num_%d' % play_order['c'], + playOrder=str(play_order['c'])) + label = etree.SubElement(point, base.tag('ncx', 'navLabel')) title = child.title if title: title = spat.sub(' ', title) - etree.SubElement(label, NCX('text')).text = title + etree.SubElement(label, base.tag('ncx', 'text')).text = title if child.dest: href = to_href(child.dest) if child.frag: href += '#'+child.frag - etree.SubElement(point, NCX('content'), src=href) + etree.SubElement(point, base.tag('ncx', 'content'), src=href) process_node(point, child) process_node(navmap, toc) @@ -622,41 +649,43 @@ def commit_ncx_toc(container, toc, lang=None, uid=None): tocname = find_existing_ncx_toc(container) if tocname is None: item = container.generate_item('toc.ncx', id_prefix='toc') - tocname = container.href_to_name(item.get('href'), base=container.opf_name) + tocname = container.href_to_name(item.get('href'), + base=container.opf_name) ncx_id = item.get('id') [s.set('toc', ncx_id) for s in container.opf_xpath('//opf:spine')] if not lang: lang = get_lang() - for l in container.opf_xpath('//dc:language'): - 
l = canonicalize_lang(xml2text(l).strip())
-        if l:
-            lang = l
-            lang = lang_as_iso639_1(l) or l
+    for _l in container.opf_xpath('//dc:language'):
+        _l = canonicalize_lang(base.xml2text(_l).strip())
+        if _l:
+            lang = _l
+            lang = lang_as_iso639_1(_l) or _l
             break
         lang = lang_as_iso639_1(lang) or lang
 
     if not uid:
-        uid = uuid_id()
+        uid = base.uuid_id()
         eid = container.opf.get('unique-identifier', None)
         if eid:
-            m = container.opf_xpath('//*[@id="%s"]'%eid)
+            m = container.opf_xpath('//*[@id="%s"]' % eid)
             if m:
-                uid = xml2text(m[0])
+                uid = base.xml2text(m[0])
     title = 'Table of Contents'
     m = container.opf_xpath('//dc:title')
     if m:
-        x = xml2text(m[0]).strip()
+        x = base.xml2text(m[0]).strip()
         title = x or title
-    to_href = partial(container.name_to_href, base=tocname)
+    to_href = functools.partial(container.name_to_href, base=tocname)
     root = create_ncx(toc, to_href, title, lang, uid)
     container.replace(tocname, root)
     container.pretty_print.add(tocname)
 
 
 def ensure_single_nav_of_type(root, ntype='toc'):
-    et = '{%s}type' % EPUB_NS
-    navs = [n for n in root.iterdescendants(XHTML('nav')) if n.get(et) == ntype]
+    et = base.tag('epub', 'type')
+    navs = [n for n in root.iterdescendants(base.tag('xhtml', 'nav'))
+            if n.get(et) == ntype]
     for x in navs[1:]:
         extract(x)
     if navs:
@@ -667,13 +696,14 @@ def ensure_single_nav_of_type(root, ntype='toc'):
         nav.attrib.update(attrib)
         nav.tail = tail
     else:
-        nav = root.makeelement(XHTML('nav'))
-        first_child(root, XHTML('body')).append(nav)
-        nav.set('{%s}type' % EPUB_NS, ntype)
+        nav = root.makeelement(base.tag('xhtml', 'nav'))
+        first_child(root, base.tag('xhtml', 'body')).append(nav)
+        nav.set(et, ntype)
     return nav
 
 
-def commit_nav_toc(container, toc, lang=None, landmarks=None, previous_nav=None):
+def commit_nav_toc(container, toc, lang=None, landmarks=None,
+                   previous_nav=None):
     from ebook_converter.ebooks.oeb.polish.pretty import pretty_xml_tree
     tocname = find_existing_nav_toc(container)
     if previous_nav is not None:
@@ -684,7 +714,8 @@ def 
commit_nav_toc(container, toc, lang=None, landmarks=None, previous_nav=None) if tocname is None: item = container.generate_item('nav.xhtml', id_prefix='nav') item.set('properties', 'nav') - tocname = container.href_to_name(item.get('href'), base=container.opf_name) + tocname = container.href_to_name(item.get('href'), + base=container.opf_name) if previous_nav is not None: root = previous_nav[1] else: @@ -698,24 +729,25 @@ def commit_nav_toc(container, toc, lang=None, landmarks=None, previous_nav=None) if lang: lang = lang_as_iso639_1(lang) or lang root.set('lang', lang) - root.set('{%s}lang' % XML_NS, lang) + root.set(base.tag('xml', 'lang'), lang) nav = ensure_single_nav_of_type(root, 'toc') if toc.toc_title: - nav.append(nav.makeelement(XHTML('h1'))) + nav.append(nav.makeelement(base.tag('xhtml', 'h1'))) nav[-1].text = toc.toc_title - rnode = nav.makeelement(XHTML('ol')) + rnode = nav.makeelement(base.tag('xhtml', 'ol')) nav.append(rnode) - to_href = partial(container.name_to_href, base=tocname) + to_href = functools.partial(container.name_to_href, base=tocname) spat = re.compile(r'\s+') def process_node(xml_parent, toc_parent): for child in toc_parent: - li = xml_parent.makeelement(XHTML('li')) + li = xml_parent.makeelement(base.tag('xhtml', 'li')) xml_parent.append(li) title = child.title or '' title = spat.sub(' ', title).strip() - a = li.makeelement(XHTML('a' if child.dest else 'span')) + a = li.makeelement(base.tag('xhtml', 'a' + if child.dest else 'span')) a.text = title li.append(a) if child.dest: @@ -724,14 +756,14 @@ def commit_nav_toc(container, toc, lang=None, landmarks=None, previous_nav=None) href += '#'+child.frag a.set('href', href) if len(child): - ol = li.makeelement(XHTML('ol')) + ol = li.makeelement(base.tag('xhtml', 'ol')) li.append(ol) process_node(ol, child) process_node(rnode, toc) pretty_xml_tree(nav) def collapse_li(parent): - for li in parent.iterdescendants(XHTML('li')): + for li in parent.iterdescendants(base.tag('xhtml', 'li')): if 
len(li) == 1: li.text = None li[0].tail = None @@ -739,9 +771,9 @@ def commit_nav_toc(container, toc, lang=None, landmarks=None, previous_nav=None) nav.tail = '\n' def create_li(ol, entry): - li = ol.makeelement(XHTML('li')) + li = ol.makeelement(base.tag('xhtml', 'li')) ol.append(li) - a = li.makeelement(XHTML('a')) + a = li.makeelement(base.tag('xhtml', 'a')) li.append(a) href = container.name_to_href(entry['dest'], tocname) if entry['frag']: @@ -752,12 +784,13 @@ def commit_nav_toc(container, toc, lang=None, landmarks=None, previous_nav=None) if landmarks is not None: nav = ensure_single_nav_of_type(root, 'landmarks') nav.set('hidden', '') - ol = nav.makeelement(XHTML('ol')) + ol = nav.makeelement(base.tag('xhtml', 'ol')) nav.append(ol) for entry in landmarks: - if entry['type'] and container.has_name(entry['dest']) and container.mime_map[entry['dest']] in OEB_DOCS: + if (entry['type'] and container.has_name(entry['dest']) and + container.mime_map[entry['dest']] in base.OEB_DOCS): a = create_li(ol, entry) - a.set('{%s}type' % EPUB_NS, entry['type']) + a.set(base.tag('epub', 'type'), entry['type']) a.text = entry['title'] or None pretty_xml_tree(nav) collapse_li(nav) @@ -765,10 +798,11 @@ def commit_nav_toc(container, toc, lang=None, landmarks=None, previous_nav=None) if toc.page_list: nav = ensure_single_nav_of_type(root, 'page-list') nav.set('hidden', '') - ol = nav.makeelement(XHTML('ol')) + ol = nav.makeelement(base.tag('xhtml', 'ol')) nav.append(ol) for entry in toc.page_list: - if container.has_name(entry['dest']) and container.mime_map[entry['dest']] in OEB_DOCS: + if (container.has_name(entry['dest']) and + container.mime_map[entry['dest']] in base.OEB_DOCS): a = create_li(ol, entry) a.text = str(entry['pagenum']) pretty_xml_tree(nav) @@ -785,11 +819,12 @@ def commit_toc(container, toc, lang=None, uid=None): def remove_names_from_toc(container, names): changed = [] names = frozenset(names) - for find_toc, parse_toc, commit_toc in ( - 
(find_existing_ncx_toc, parse_ncx, commit_ncx_toc), - (find_existing_nav_toc, parse_nav, commit_nav_toc), - ): - toc = get_x_toc(container, find_toc, parse_toc, verify_destinations=False) + for find_toc, parse_toc, commit_toc in ((find_existing_ncx_toc, + parse_ncx, commit_ncx_toc), + (find_existing_nav_toc, + parse_nav, commit_nav_toc)): + toc = get_x_toc(container, find_toc, parse_toc, + verify_destinations=False) if len(toc) > 0: remove = [] for node in toc.iterdescendants(): @@ -805,15 +840,16 @@ def remove_names_from_toc(container, names): def find_inline_toc(container): for name, linear in container.spine_names: - if container.parsed(name).xpath('//*[local-name()="body" and @id="calibre_generated_inline_toc"]'): + if container.parsed(name).xpath('//*[local-name()="body" and @id=' + '"calibre_generated_inline_toc"]'): return name def toc_to_html(toc, container, toc_name, title, lang=None): def process_node(html_parent, toc, level=1, indent=' ', style_level=2): - li = html_parent.makeelement(XHTML('li')) - li.tail = '\n'+ (indent*level) + li = html_parent.makeelement(base.tag('xhtml', 'li')) + li.tail = '\n' + (indent * level) html_parent.append(li) name, frag = toc.dest, toc.frag href = '#' @@ -821,32 +857,29 @@ def toc_to_html(toc, container, toc_name, title, lang=None): href = container.name_to_href(name, toc_name) if frag: href += '#' + frag - a = li.makeelement(XHTML('a'), href=href) + a = li.makeelement(base.tag('xhtml', 'a'), href=href) a.text = toc.title li.append(a) if len(toc) > 0: - parent = li.makeelement(XHTML('ul')) + parent = li.makeelement(base.tag('xhtml', 'ul')) parent.set('class', 'level%d' % (style_level)) li.append(parent) a.tail = '\n\n' + (indent*(level+2)) parent.text = '\n'+(indent*(level+3)) parent.tail = '\n\n' + (indent*(level+1)) for child in toc: - process_node(parent, child, level+3, style_level=style_level + 1) + process_node(parent, child, level+3, + style_level=style_level + 1) parent[-1].tail = '\n' + (indent*(level+2)) - E = 
ElementMaker(namespace=XHTML_NS, nsmap={None:XHTML_NS}) - html = E.html( - E.head( - E.title(title), - E.style(P('templates/inline_toc_styles.css', data=True), type='text/css'), - ), - E.body( - E.h2(title), - E.ul(), - id="calibre_generated_inline_toc", - ) - ) + E = ElementMaker(namespace=const.XHTML_NS, nsmap={None: const.XHTML_NS}) + # TODO(gryf): revisit lack of css. + css_f = pkg_resources.resource_filename('ebook_converter', + 'data/inline_toc_styles.css') + html = E.html(E.head(E.title(title), + E.style(css_f, type='text/css')), + E.body(E.h2(title), E.ul(), + id="calibre_generated_inline_toc")) ul = html[1][1] ul.set('class', 'level1') @@ -859,11 +892,12 @@ def toc_to_html(toc, container, toc_name, title, lang=None): def create_inline_toc(container, title=None): - ''' - Create an inline (HTML) Table of Contents from an existing NCX Table of Contents. + """ + Create an inline (HTML) Table of Contents from an existing NCX Table of + Contents. :param title: The title for this table of contents. - ''' + """ lang = get_book_language(container) default_title = 'Table of Contents' title = title or default_title @@ -874,7 +908,7 @@ def create_inline_toc(container, title=None): name = toc_name html = toc_to_html(toc, container, name, title, lang) - raw = serialize(html, 'text/html') + raw = base.serialize(html, 'text/html') if name is None: name, c = 'toc.xhtml', 0 while container.has_name(name): @@ -884,5 +918,6 @@ def create_inline_toc(container, title=None): else: with container.open(name, 'wb') as f: f.write(raw) - set_guide_item(container, 'toc', title, name, frag='calibre_generated_inline_toc') + set_guide_item(container, 'toc', title, name, + frag='calibre_generated_inline_toc') return name diff --git a/ebook_converter/ebooks/oeb/reader.py b/ebook_converter/ebooks/oeb/reader.py index 4139b1b..f5a02f7 100644 --- a/ebook_converter/ebooks/oeb/reader.py +++ b/ebook_converter/ebooks/oeb/reader.py @@ -1,21 +1,21 @@ """ Container-/OPF-based input OEBBook reader. 
""" -import sys, os, uuid, copy, re, io -from collections import defaultdict +import collections +import copy +import io +import os +import re +import sys import urllib.parse +import uuid from lxml import etree -from ebook_converter.ebooks.oeb.base import OPF1_NS, OPF2_NS, OPF2_NSMAP, DC11_NS, \ - DC_NSES, OPF, xml2text, XHTML_MIME -from ebook_converter.ebooks.oeb.base import OEB_DOCS, OEB_STYLES, OEB_IMAGES, \ - PAGE_MAP_MIME, JPEG_MIME, NCX_MIME, SVG_MIME -from ebook_converter.ebooks.oeb.base import XMLDECL_RE, COLLAPSE_RE, \ - MS_COVER_TYPE, iterlinks -from ebook_converter.ebooks.oeb.base import namespace, barename, XPath, xpath, \ - urlnormalize, BINARY_MIME, \ - OEBError, OEBBook, DirContainer +from ebook_converter import constants as const +from ebook_converter.ebooks.oeb import base +from ebook_converter.ebooks.oeb import parse_utils +from ebook_converter.ebooks.metadata import opf2 as opf_meta from ebook_converter.ebooks.oeb.writer import OEBWriter from ebook_converter.utils.xml_parse import safe_xml_fromstring from ebook_converter.utils.cleantext import clean_xml_chars @@ -26,18 +26,13 @@ from ebook_converter import guess_type, xml_replace_entities from ebook_converter.polyglot.urllib import unquote -__all__ = ['OEBReader'] -__license__ = 'GPL v3' -__copyright__ = '2008, Marshall T. Vandegrift ' - - class OEBReader(object): """Read an OEBPS 1.x or OPF/OPS 2.0 file collection.""" - COVER_SVG_XP = XPath('h:body//svg:svg[position() = 1]') - COVER_OBJECT_XP = XPath('h:body//h:object[@data][position() = 1]') + COVER_SVG_XP = base.XPath('h:body//svg:svg[position() = 1]') + COVER_OBJECT_XP = base.XPath('h:body//h:object[@data][position() = 1]') - Container = DirContainer + Container = base.DirContainer """Container type used to access book files. 
Override in sub-classes.""" DEFAULT_PROFILE = 'PRS505' @@ -75,61 +70,67 @@ class OEBReader(object): for elem in opf.iter(tag=etree.Element): nsmap.update(elem.nsmap) for elem in opf.iter(tag=etree.Element): - if namespace(elem.tag) in ('', OPF1_NS) and ':' not in barename(elem.tag): - elem.tag = OPF(barename(elem.tag)) - nsmap.update(OPF2_NSMAP) + if (parse_utils.namespace(elem.tag) in ('', const.OPF1_NS) and + ':' not in parse_utils.barename(elem.tag)): + elem.tag = base.tag('opf', parse_utils.barename(elem.tag)) + nsmap.update(const.OPF2_NSMAP) attrib = dict(opf.attrib) - nroot = etree.Element(OPF('package'), - nsmap={None: OPF2_NS}, attrib=attrib) - metadata = etree.SubElement(nroot, OPF('metadata'), nsmap=nsmap) - ignored = (OPF('dc-metadata'), OPF('x-metadata')) - for elem in xpath(opf, 'o2:metadata//*'): + nroot = etree.Element(base.tag('opf', 'package'), + nsmap={None: const.OPF2_NS}, attrib=attrib) + metadata = etree.SubElement(nroot, base.tag('opf', 'metadata'), + nsmap=nsmap) + ignored = (base.tag('opf', 'dc-metadata'), base.tag('opf', 'x-metadata')) + for elem in base.xpath(opf, 'o2:metadata//*'): if elem.tag in ignored: continue - if namespace(elem.tag) in DC_NSES: - tag = barename(elem.tag).lower() - elem.tag = '{%s}%s' % (DC11_NS, tag) + if parse_utils.namespace(elem.tag) in const.DC_NSES: + tag = parse_utils.barename(elem.tag).lower() + elem.tag = '{%s}%s' % (const.DC11_NS, tag) if elem.tag.startswith('dc:'): tag = elem.tag.partition(':')[-1].lower() - elem.tag = '{%s}%s' % (DC11_NS, tag) + elem.tag = '{%s}%s' % (const.DC11_NS, tag) metadata.append(elem) - for element in xpath(opf, 'o2:metadata//o2:meta'): + for element in base.xpath(opf, 'o2:metadata//o2:meta'): metadata.append(element) for tag in ('o2:manifest', 'o2:spine', 'o2:tours', 'o2:guide'): - for element in xpath(opf, tag): + for element in base.xpath(opf, tag): nroot.append(element) return nroot def _read_opf(self): data = self.oeb.container.read(None) data = self.oeb.decode(data) - data = 
XMLDECL_RE.sub('', data) + data = base.XMLDECL_RE.sub('', data) data = re.sub(r'http://openebook.org/namespaces/oeb-package/1.0(/*)', - OPF1_NS, data) + const.OPF1_NS, data) try: - opf = safe_xml_fromstring(data) + opf = etree.fromstring(data) except etree.XMLSyntaxError: data = xml_replace_entities(clean_xml_chars(data), encoding=None) try: - opf = safe_xml_fromstring(data) + opf = etree.fromstring(data) self.logger.warn('OPF contains invalid HTML named entities') except etree.XMLSyntaxError: data = re.sub(r'(?is).+', '', data) data = data.replace('', - '') - opf = safe_xml_fromstring(data) + '') + opf = etree.fromstring(data) self.logger.warn('OPF contains invalid tours section') - ns = namespace(opf.tag) - if ns not in ('', OPF1_NS, OPF2_NS): - raise OEBError('Invalid namespace %r for OPF document' % ns) + ns = parse_utils.namespace(opf.tag) + if ns not in ('', const.OPF1_NS, const.OPF2_NS): + raise base.OEBError('Invalid namespace %r for OPF document' % ns) opf = self._clean_opf(opf) return opf def _metadata_from_opf(self, opf): from ebook_converter.ebooks.metadata.opf2 import OPF - from ebook_converter.ebooks.oeb.transforms.metadata import meta_info_to_oeb_metadata - stream = io.BytesIO(etree.tostring(opf, xml_declaration=True, encoding='utf-8')) + from ebook_converter.ebooks.oeb.transforms.metadata import \ + meta_info_to_oeb_metadata + stream = io.BytesIO(etree.tostring(opf, xml_declaration=True, + encoding='utf-8')) + # o = opf_meta.OPF(stream) o = OPF(stream) pwm = o.primary_writing_mode if pwm: @@ -139,8 +140,8 @@ class OEBReader(object): mi.language = get_lang().replace('_', '-') self.oeb.metadata.add('language', mi.language) if not mi.book_producer: - mi.book_producer = '%(a)s (%(v)s) [http://%(a)s-ebook.com]'%\ - dict(a=__appname__, v=__version__) + mi.book_producer = ('%(a)s (%(v)s) [http://%(a)s-ebook.com]' % + dict(a=__appname__, v=__version__)) meta_info_to_oeb_metadata(mi, self.oeb.metadata, self.logger) m = self.oeb.metadata m.add('identifier', 
str(uuid.uuid4()), id='uuid_id', scheme='uuid') @@ -162,16 +163,16 @@ class OEBReader(object): data. ''' bad = [] - check = OEB_DOCS.union(OEB_STYLES) + check = base.OEB_DOCS.union(base.OEB_STYLES) for item in list(self.oeb.manifest.values()): if item.media_type in check: try: item.data except KeyboardInterrupt: raise - except: - self.logger.exception('Failed to parse content in %s'% - item.href) + except Exception: + self.logger.exception('Failed to parse content in %s' % + item.href) bad.append(item) self.oeb.manifest.remove(item) return bad @@ -181,25 +182,28 @@ class OEBReader(object): manifest = self.oeb.manifest known = set(manifest.hrefs) unchecked = set(manifest.values()) - cdoc = OEB_DOCS|OEB_STYLES + cdoc = base.OEB_DOCS | base.OEB_STYLES invalid = set() while unchecked: new = set() for item in unchecked: data = None - if (item.media_type in cdoc or item.media_type[-4:] in ('/xml', '+xml')): + if (item.media_type in cdoc or + item.media_type[-4:] in ('/xml', '+xml')): try: data = item.data - except: + except Exception: self.oeb.log.exception('Failed to read from manifest ' - 'entry with id: %s, ignoring'%item.id) + 'entry with id: %s, ignoring' % + item.id) invalid.add(item) continue if data is None: continue - if (item.media_type in OEB_DOCS or item.media_type[-4:] in ('/xml', '+xml')): - hrefs = [r[2] for r in iterlinks(data)] + if (item.media_type in base.OEB_DOCS or + item.media_type[-4:] in ('/xml', '+xml')): + hrefs = [r[2] for r in base.iterlinks(data)] for href in hrefs: if isinstance(href, bytes): href = href.decode('utf-8') @@ -207,22 +211,22 @@ class OEBReader(object): if not href: continue try: - href = item.abshref(urlnormalize(href)) + href = item.abshref(base.urlnormalize(href)) scheme = urllib.parse.urlparse(href).scheme - except: - self.oeb.log.exception( - 'Skipping invalid href: %r'%href) + except Exception: + self.oeb.log.exception('Skipping invalid href: ' + '%r' % href) continue if not scheme and href not in known: new.add(href) - 
elif item.media_type in OEB_STYLES: + elif item.media_type in base.OEB_STYLES: try: urls = list(css_parser.getUrls(data)) - except: + except Exception: urls = [] for url in urls: href, _ = urllib.parse.urldefrag(url) - href = item.abshref(urlnormalize(href)) + href = item.abshref(base.urlnormalize(href)) scheme = urllib.parse.urlparse(href).scheme if not scheme and href not in known: new.add(href) @@ -232,7 +236,7 @@ class OEBReader(object): known.add(href) is_invalid = False for item in invalid: - if href == item.abshref(urlnormalize(href)): + if href == item.abshref(base.urlnormalize(href)): is_invalid = True break if is_invalid: @@ -243,11 +247,12 @@ class OEBReader(object): warned.add(href) continue if href not in warned: - self.logger.warn('Referenced file %r not in manifest' % href) + self.logger.warn('Referenced file %r not in manifest' % + href) warned.add(href) id, _ = manifest.generate(id='added') guessed = guess_type(href)[0] - media_type = guessed or BINARY_MIME + media_type = guessed or base.BINARY_MIME added = manifest.add(id, href, media_type) unchecked.add(added) @@ -256,7 +261,7 @@ class OEBReader(object): def _manifest_from_opf(self, opf): manifest = self.oeb.manifest - for elem in xpath(opf, '/o2:package/o2:manifest/o2:item'): + for elem in base.xpath(opf, '/o2:package/o2:manifest/o2:item'): id = elem.get('id') href = elem.get('href') media_type = elem.get('media-type', None) @@ -264,7 +269,7 @@ class OEBReader(object): media_type = elem.get('mediatype', None) if not media_type or media_type == 'text/xml': guessed = guess_type(href)[0] - media_type = guessed or media_type or BINARY_MIME + media_type = guessed or media_type or base.BINARY_MIME if hasattr(media_type, 'lower'): media_type = media_type.lower() fallback = elem.get('fallback') @@ -285,12 +290,12 @@ class OEBReader(object): manifest = self.oeb.manifest spine = self.oeb.spine unchecked = set(spine) - selector = XPath('h:body//h:a/@href') + selector = base.XPath('h:body//h:a/@href') 
extras = set() while unchecked: new = set() for item in unchecked: - if item.media_type not in OEB_DOCS: + if item.media_type not in base.OEB_DOCS: # TODO: handle fallback chains continue for href in selector(item.data): @@ -298,20 +303,21 @@ class OEBReader(object): if not href: continue try: - href = item.abshref(urlnormalize(href)) + href = item.abshref(base.urlnormalize(href)) except ValueError: # Malformed URL continue if href not in manifest.hrefs: continue found = manifest.hrefs[href] - if found.media_type not in OEB_DOCS or \ + if found.media_type not in base.OEB_DOCS or \ found in spine or found in extras: continue new.add(found) extras.update(new) unchecked = new version = int(self.oeb.version[0]) - removed_items_to_ignore = getattr(self.oeb, 'removed_items_to_ignore', ()) + removed_items_to_ignore = getattr(self.oeb, 'removed_items_to_ignore', + ()) for item in sorted(extras): if item.href in removed_items_to_ignore: continue @@ -323,34 +329,38 @@ class OEBReader(object): def _spine_from_opf(self, opf): spine = self.oeb.spine manifest = self.oeb.manifest - for elem in xpath(opf, '/o2:package/o2:spine/o2:itemref'): + for elem in base.xpath(opf, '/o2:package/o2:spine/o2:itemref'): idref = elem.get('idref') if idref not in manifest.ids: self.logger.warn('Spine item %r not found' % idref) continue item = manifest.ids[idref] - if item.media_type.lower() in OEB_DOCS and hasattr(item.data, 'xpath') and not getattr(item.data, 'tag', '').endswith('}ncx'): + if (item.media_type.lower() in base.OEB_DOCS and + hasattr(item.data, 'xpath') and not + getattr(item.data, 'tag', '').endswith('}ncx')): spine.add(item, elem.get('linear')) else: - if hasattr(item.data, 'tag') and item.data.tag and item.data.tag.endswith('}html'): - item.media_type = XHTML_MIME + if (hasattr(item.data, 'tag') and + item.data.tag and item.data.tag.endswith('}html')): + item.media_type = base.XHTML_MIME spine.add(item, elem.get('linear')) else: self.oeb.log.warn('The item %s is not a XML 
document.' - ' Removing it from spine.'%item.href) + ' Removing it from spine.' % item.href) if len(spine) == 0: - raise OEBError("Spine is empty") + raise base.OEBError("Spine is empty") self._spine_add_extra() - for val in xpath(opf, '/o2:package/o2:spine/@page-progression-direction'): + for val in base.xpath(opf, + '/o2:package/o2:spine/@page-progression-direction'): if val in {'ltr', 'rtl'}: spine.page_progression_direction = val def _guide_from_opf(self, opf): guide = self.oeb.guide manifest = self.oeb.manifest - for elem in xpath(opf, '/o2:package/o2:guide/o2:reference'): + for elem in base.xpath(opf, '/o2:package/o2:guide/o2:reference'): ref_href = elem.get('href') - path = urlnormalize(urllib.parse.urldefrag(ref_href)[0]) + path = base.urlnormalize(urllib.parse.urldefrag(ref_href)[0]) if path not in manifest.hrefs: corrected_href = None for href in manifest.hrefs: @@ -366,7 +376,7 @@ class OEBReader(object): guide.add(typ, elem.get('title'), ref_href) def _find_ncx(self, opf): - result = xpath(opf, '/o2:package/o2:spine/@toc') + result = base.xpath(opf, '/o2:package/o2:spine/@toc') if result: id = result[0] if id not in self.oeb.manifest.ids: @@ -375,30 +385,33 @@ class OEBReader(object): self.oeb.manifest.remove(item) return item for item in self.oeb.manifest.values(): - if item.media_type == NCX_MIME: + if item.media_type == base.NCX_MIME: self.oeb.manifest.remove(item) return item return None def _toc_from_navpoint(self, item, toc, navpoint): - children = xpath(navpoint, 'ncx:navPoint') + children = base.xpath(navpoint, 'ncx:navPoint') for child in children: - title = ''.join(xpath(child, 'ncx:navLabel/ncx:text/text()')) - title = COLLAPSE_RE.sub(' ', title.strip()) - href = xpath(child, 'ncx:content/@src') + title = ''.join(base.xpath(child, 'ncx:navLabel/ncx:text/text()')) + title = base.COLLAPSE_RE.sub(' ', title.strip()) + href = base.xpath(child, 'ncx:content/@src') if not title: self._toc_from_navpoint(item, toc, child) continue - if (not href or 
not href[0]) and not xpath(child, 'ncx:navPoint'): + if (not href or not href[0]) and not base.xpath(child, 'ncx:navPoint'): # This node is useless continue - href = item.abshref(urlnormalize(href[0])) if href and href[0] else '' + if href and href[0]: + href = item.abshref(base.urlnormalize(href[0])) + else: + href = '' path, _ = urllib.parse.urldefrag(href) if path and path not in self.oeb.manifest.hrefs: - path = urlnormalize(path) + path = base.urlnormalize(path) if href and path not in self.oeb.manifest.hrefs: self.logger.warn('TOC reference %r not found' % href) - gc = xpath(child, 'ncx:navPoint') + gc = base.xpath(child, 'ncx:navPoint') if not gc: # This node is useless continue @@ -406,36 +419,40 @@ class OEBReader(object): klass = child.get('class', 'chapter') try: - po = int(child.get('playOrder', self.oeb.toc.next_play_order())) - except: + po = int(child.get('playOrder', + self.oeb.toc.next_play_order())) + except Exception: po = self.oeb.toc.next_play_order() - authorElement = xpath(child, - 'descendant::calibre:meta[@name = "author"]') + authorElement = base.xpath(child, + 'descendant::calibre:meta[@name = "author"]') if authorElement: author = authorElement[0].text else: author = None - descriptionElement = xpath(child, - 'descendant::calibre:meta[@name = "description"]') + descriptionElement = base.xpath(child, + 'descendant::calibre:meta[@name = ' + '"description"]') if descriptionElement: description = etree.tostring(descriptionElement[0], - method='text', encoding='unicode').strip() + method='text', + encoding='unicode').strip() if not description: description = None else: description = None - index_image = xpath(child, - 'descendant::calibre:meta[@name = "toc_thumbnail"]') + index_image = base.xpath(child, + 'descendant::calibre:meta[@name = ' + '"toc_thumbnail"]') toc_thumbnail = (index_image[0].text if index_image else None) if not toc_thumbnail or not toc_thumbnail.strip(): toc_thumbnail = None node = toc.add(title, href, id=id, klass=klass, 
- play_order=po, description=description, author=author, - toc_thumbnail=toc_thumbnail) + play_order=po, description=description, + author=author, toc_thumbnail=toc_thumbnail) self._toc_from_navpoint(item, node, child) @@ -444,31 +461,31 @@ class OEBReader(object): return False self.log.debug('Reading TOC from NCX...') ncx = item.data - title = ''.join(xpath(ncx, 'ncx:docTitle/ncx:text/text()')) - title = COLLAPSE_RE.sub(' ', title.strip()) + title = ''.join(base.xpath(ncx, 'ncx:docTitle/ncx:text/text()')) + title = base.COLLAPSE_RE.sub(' ', title.strip()) title = title or str(self.oeb.metadata.title[0]) toc = self.oeb.toc toc.title = title - navmaps = xpath(ncx, 'ncx:navMap') + navmaps = base.xpath(ncx, 'ncx:navMap') for navmap in navmaps: self._toc_from_navpoint(item, toc, navmap) return True def _toc_from_tour(self, opf): - result = xpath(opf, 'o2:tours/o2:tour') + result = base.xpath(opf, 'o2:tours/o2:tour') if not result: return False self.log.debug('Reading TOC from tour...') tour = result[0] toc = self.oeb.toc toc.title = tour.get('title') - sites = xpath(tour, 'o2:site') + sites = base.xpath(tour, 'o2:site') for site in sites: title = site.get('title') href = site.get('href') if not title or not href: continue - path, _ = urllib.parse.urldefrag(urlnormalize(href)) + path, _ = urllib.parse.urldefrag(base.urlnormalize(href)) if path not in self.oeb.manifest.hrefs: self.logger.warn('TOC reference %r not found' % href) continue @@ -484,23 +501,23 @@ class OEBReader(object): item = self.oeb.manifest.hrefs[itempath] html = item.data if frag: - elems = xpath(html, './/*[@id="%s"]' % frag) + elems = base.xpath(html, './/*[@id="%s"]' % frag) if not elems: - elems = xpath(html, './/*[@name="%s"]' % frag) + elems = base.xpath(html, './/*[@name="%s"]' % frag) elem = elems[0] if elems else html - while elem != html and not xpath(elem, './/h:a[@href]'): + while elem != html and not base.xpath(elem, './/h:a[@href]'): elem = elem.getparent() html = elem - titles = 
defaultdict(list) + titles = collections.defaultdict(list) order = [] - for anchor in xpath(html, './/h:a[@href]'): + for anchor in base.xpath(html, './/h:a[@href]'): href = anchor.attrib['href'] - href = item.abshref(urlnormalize(href)) + href = item.abshref(base.urlnormalize(href)) path, frag = urllib.parse.urldefrag(href) if path not in self.oeb.manifest.hrefs: continue - title = xml2text(anchor) - title = COLLAPSE_RE.sub(' ', title.strip()) + title = base.xml2text(anchor) + title = base.COLLAPSE_RE.sub(' ', title.strip()) if href not in titles: order.append(href) titles[href].append(title) @@ -518,15 +535,15 @@ class OEBReader(object): if not item.linear: continue html = item.data - title = ''.join(xpath(html, '/h:html/h:head/h:title/text()')) - title = COLLAPSE_RE.sub(' ', title.strip()) + title = ''.join(base.xpath(html, '/h:html/h:head/h:title/text()')) + title = base.COLLAPSE_RE.sub(' ', title.strip()) if title: titles.append(title) headers.append('(unlabled)') for tag in ('h1', 'h2', 'h3', 'h4', 'h5', 'strong'): expr = '/h:html/h:body//h:%s[position()=1]/text()' - header = ''.join(xpath(html, expr % tag)) - header = COLLAPSE_RE.sub(' ', header.strip()) + header = ''.join(base.xpath(html, expr % tag)) + header = base.COLLAPSE_RE.sub(' ', header.strip()) if header: headers[-1] = header break @@ -558,17 +575,17 @@ class OEBReader(object): ncx = item.data if ncx is None: return False - ptargets = xpath(ncx, 'ncx:pageList/ncx:pageTarget') + ptargets = base.xpath(ncx, 'ncx:pageList/ncx:pageTarget') if not ptargets: return False pages = self.oeb.pages for ptarget in ptargets: - name = ''.join(xpath(ptarget, 'ncx:navLabel/ncx:text/text()')) - name = COLLAPSE_RE.sub(' ', name.strip()) - href = xpath(ptarget, 'ncx:content/@src') + name = ''.join(base.xpath(ptarget, 'ncx:navLabel/ncx:text/text()')) + name = base.COLLAPSE_RE.sub(' ', name.strip()) + href = base.xpath(ptarget, 'ncx:content/@src') if not href: continue - href = item.abshref(urlnormalize(href[0])) + href 
= item.abshref(base.urlnormalize(href[0])) id = ptarget.get('id') type = ptarget.get('type', 'normal') klass = ptarget.get('class') @@ -576,7 +593,7 @@ class OEBReader(object): return True def _find_page_map(self, opf): - result = xpath(opf, '/o2:package/o2:spine/@page-map') + result = base.xpath(opf, '/o2:package/o2:spine/@page-map') if result: id = result[0] if id not in self.oeb.manifest.ids: @@ -585,7 +602,7 @@ class OEBReader(object): self.oeb.manifest.remove(item) return item for item in self.oeb.manifest.values(): - if item.media_type == PAGE_MAP_MIME: + if item.media_type == base.PAGE_MAP_MIME: self.oeb.manifest.remove(item) return item return None @@ -596,13 +613,13 @@ class OEBReader(object): return False pmap = item.data pages = self.oeb.pages - for page in xpath(pmap, 'o2:page'): + for page in base.xpath(pmap, 'o2:page'): name = page.get('name', '') href = page.get('href') if not href: continue - name = COLLAPSE_RE.sub(' ', name.strip()) - href = item.abshref(urlnormalize(href)) + name = base.COLLAPSE_RE.sub(' ', name.strip()) + href = item.abshref(base.urlnormalize(href)) type = 'normal' if not name: type = 'special' @@ -628,14 +645,14 @@ class OEBReader(object): if not data: data = b'' id, href = self.oeb.manifest.generate('cover', 'cover.jpg') - item = self.oeb.manifest.add(id, href, JPEG_MIME, data=data) + item = self.oeb.manifest.add(id, href, base.JPEG_MIME, data=data) return item def _locate_cover_image(self): if self.oeb.metadata.cover: id = str(self.oeb.metadata.cover[0]) item = self.oeb.manifest.ids.get(id, None) - if item is not None and item.media_type in OEB_IMAGES: + if item is not None and item.media_type in base.OEB_IMAGES: return item else: self.logger.warn('Invalid cover image @id %r' % id) @@ -644,27 +661,27 @@ class OEBReader(object): href = self.oeb.guide['cover'].href item = self.oeb.manifest.hrefs[href] media_type = item.media_type - if media_type in OEB_IMAGES: + if media_type in base.OEB_IMAGES: return item - elif media_type in 
OEB_DOCS: + elif media_type in base.OEB_DOCS: hcover = item html = hcover.data - if MS_COVER_TYPE in self.oeb.guide: - href = self.oeb.guide[MS_COVER_TYPE].href + if base.MS_COVER_TYPE in self.oeb.guide: + href = self.oeb.guide[base.MS_COVER_TYPE].href item = self.oeb.manifest.hrefs.get(href, None) - if item is not None and item.media_type in OEB_IMAGES: + if item is not None and item.media_type in base.OEB_IMAGES: return item if self.COVER_SVG_XP(html): svg = copy.deepcopy(self.COVER_SVG_XP(html)[0]) href = os.path.splitext(hcover.href)[0] + '.svg' id, href = self.oeb.manifest.generate(hcover.id, href) - item = self.oeb.manifest.add(id, href, SVG_MIME, data=svg) + item = self.oeb.manifest.add(id, href, base.SVG_MIME, data=svg) return item if self.COVER_OBJECT_XP(html): object = self.COVER_OBJECT_XP(html)[0] href = hcover.abshref(object.get('data')) item = self.oeb.manifest.hrefs.get(href, None) - if item is not None and item.media_type in OEB_IMAGES: + if item is not None and item.media_type in base.OEB_IMAGES: return item return self._cover_from_html(hcover) @@ -687,7 +704,8 @@ class OEBReader(object): items = [x for x in self.oeb.manifest if x.href == href] for x in items: if x not in self.oeb.spine: - self.oeb.log.warn('Removing duplicate manifest item with id:', x.id) + self.oeb.log.warn('Removing duplicate manifest item with ' + 'id:', x.id) self.oeb.manifest.remove_duplicate_item(x) def _all_from_opf(self, opf): @@ -706,7 +724,7 @@ class OEBReader(object): def main(argv=sys.argv): reader = OEBReader() for arg in argv[1:]: - oeb = reader(OEBBook(), arg) + oeb = reader(base.OEBBook(), arg) for name, doc in oeb.to_opf1().values(): print(etree.tostring(doc, pretty_print=True)) for name, doc in oeb.to_opf2(page_map=True).values(): diff --git a/ebook_converter/ebooks/oeb/stylizer.py b/ebook_converter/ebooks/oeb/stylizer.py index 178579e..cfef868 100644 --- a/ebook_converter/ebooks/oeb/stylizer.py +++ b/ebook_converter/ebooks/oeb/stylizer.py @@ -10,17 +10,16 @@ 
from css_parser.css import (CSSStyleRule, CSSPageRule, CSSFontFaceRule, cssproperties) from css_parser import (profile as cssprofiles, parseString, parseStyle, log as css_parser_log, CSSParser, profiles, replaceUrls) + +from ebook_converter import constants as const from ebook_converter import force_unicode, as_unicode from ebook_converter.ebooks import unit_convert -from ebook_converter.ebooks.oeb.base import XHTML, XHTML_NS, CSS_MIME, OEB_STYLES, xpath, urlnormalize +from ebook_converter.ebooks.oeb import base from ebook_converter.ebooks.oeb.normalize_css import DEFAULTS, normalizers from ebook_converter.css_selectors import Select, SelectorError, INAPPROPRIATE_PSEUDO_CLASSES from ebook_converter.tinycss.media3 import CSSMedia3Parser -__license__ = 'GPL v3' -__copyright__ = '2008, Marshall T. Vandegrift ' - css_parser_log.setLevel(logging.WARN) _html_css_stylesheet = None @@ -208,7 +207,7 @@ class Stylizer(object): stylesheets = [html_css_stylesheet()] if base_css: stylesheets.append(parseString(base_css, validate=False)) - style_tags = xpath(tree, '//*[local-name()="style" or local-name()="link"]') + style_tags = base.xpath(tree, '//*[local-name()="style" or local-name()="link"]') # Add css_parser parsing profiles from output_profile for profile in self.opts.output_profile.extra_css_modules: @@ -219,7 +218,7 @@ class Stylizer(object): parser = CSSParser(fetcher=self._fetch_css_file, log=logging.getLogger('calibre.css')) for elem in style_tags: - if (elem.tag == XHTML('style') and elem.get('type', CSS_MIME) in OEB_STYLES and media_ok(elem.get('media'))): + if (elem.tag == base.tag('xhtml', 'style') and elem.get('type', base.CSS_MIME) in base.OEB_STYLES and media_ok(elem.get('media'))): text = elem.text if elem.text else '' for x in elem: t = getattr(x, 'text', None) @@ -245,7 +244,7 @@ class Stylizer(object): self.logger.warn('Ignoring missing stylesheet in @import rule:', rule.href) continue sitem = hrefs[ihref] - if sitem.media_type not in OEB_STYLES: + if 
sitem.media_type not in base.OEB_STYLES: self.logger.warn('CSS @import of non-CSS file %r' % rule.href) continue stylesheets.append(sitem.data) @@ -254,11 +253,11 @@ class Stylizer(object): replaceUrls(stylesheet, item.abshref, ignoreImportRules=True) stylesheets.append(stylesheet) - elif (elem.tag == XHTML('link') and elem.get('href') and elem.get( + elif (elem.tag == base.tag('xhtml', 'link') and elem.get('href') and elem.get( 'rel', 'stylesheet').lower() == 'stylesheet' and elem.get( - 'type', CSS_MIME).lower() in OEB_STYLES and media_ok(elem.get('media')) + 'type', base.CSS_MIME).lower() in base.OEB_STYLES and media_ok(elem.get('media')) ): - href = urlnormalize(elem.attrib['href']) + href = base.urlnormalize(elem.attrib['href']) path = item.abshref(href) sitem = oeb.manifest.hrefs.get(path, None) if sitem is None: @@ -326,7 +325,8 @@ class Stylizer(object): special_text = ''.join(punctuation_chars) + \ (text[0] if text else '') - span = x.makeelement('{%s}span' % XHTML_NS) + span = x.makeelement('{%s}span' % + const.XHTML_NS) span.text = special_text span.set('data-fake-first-letter', '1') span.tail = text[1:] @@ -340,10 +340,10 @@ class Stylizer(object): else: for elem in matches: self.style(elem)._update_cssdict(cssdict) - for elem in xpath(tree, '//h:*[@style]'): + for elem in base.xpath(tree, '//h:*[@style]'): self.style(elem)._apply_style_attr(url_replacer=item.abshref) num_pat = re.compile(r'[0-9.]+$') - for elem in xpath(tree, '//h:img[@width or @height]'): + for elem in base.xpath(tree, '//h:img[@width or @height]'): style = self.style(elem) # Check if either height or width is not default is_styled = style._style.get('width', 'auto') != 'auto' or \ @@ -370,7 +370,7 @@ class Stylizer(object): self.logger.warn('CSS import of missing file %r' % path) return (None, None) item = hrefs[path] - if item.media_type not in OEB_STYLES: + if item.media_type not in base.OEB_STYLES: self.logger.warn('CSS import of non-CSS file %r' % path) return (None, None) data = 
item.data.cssText diff --git a/ebook_converter/ebooks/oeb/transforms/cover.py b/ebook_converter/ebooks/oeb/transforms/cover.py index bbc23be..f03e52c 100644 --- a/ebook_converter/ebooks/oeb/transforms/cover.py +++ b/ebook_converter/ebooks/oeb/transforms/cover.py @@ -1,66 +1,61 @@ import textwrap import urllib.parse +from lxml import etree + from ebook_converter import guess_type from ebook_converter.utils.imghdr import identify -from ebook_converter.utils.xml_parse import safe_xml_fromstring from ebook_converter.polyglot.urllib import unquote -__license__ = 'GPL v3' -__copyright__ = '2010, Kovid Goyal ' -__docformat__ = 'restructuredtext en' - - class CoverManager(object): SVG_TEMPLATE = textwrap.dedent('''\ - - - - - Cover - - - -
- - - -
- - - ''') + + + + + Cover + + + +
+ + + +
+ +''') NONSVG_TEMPLATE = textwrap.dedent('''\ - - - - - Cover - - - -
- cover -
- - + + + + + Cover + + + +
+ cover +
+ + ''') def __init__(self, no_default_cover=False, no_svg_cover=False, - preserve_aspect_ratio=False, fixed_size=None): + preserve_aspect_ratio=False, fixed_size=None): self.no_default_cover = no_default_cover self.no_svg_cover = no_svg_cover self.preserve_aspect_ratio = preserve_aspect_ratio @@ -72,9 +67,9 @@ class CoverManager(object): style = 'style="height: 100%%"' else: width, height = fixed_size - style = 'style="height: %s; width: %s"'%(height, width) + style = 'style="height: %s; width: %s"' % (height, width) self.non_svg_template = self.NONSVG_TEMPLATE.replace('__style__', - style) + style) def __call__(self, oeb, opts, log): self.oeb = oeb @@ -108,22 +103,23 @@ class CoverManager(object): # if self.preserve_aspect_ratio: # width, height = 600, 800 self.svg_template = self.svg_template.replace('__viewbox__', - '0 0 %d %d'%(width, height)) + '0 0 %d %d' % + (width, height)) self.svg_template = self.svg_template.replace('__width__', - str(width)) + str(width)) self.svg_template = self.svg_template.replace('__height__', - str(height)) + str(height)) if href is not None: templ = self.non_svg_template if self.no_svg_cover \ else self.svg_template - tp = templ%unquote(href) + tp = templ % unquote(href) id, href = m.generate('titlepage', 'titlepage.xhtml') item = m.add(id, href, guess_type('t.xhtml')[0], - data=safe_xml_fromstring(tp)) + data=etree.fromstring(tp)) else: - item = self.oeb.manifest.hrefs[ - urllib.parse.urldefrag(self.oeb.guide['titlepage'].href)[0]] + key = urllib.parse.urldefrag(self.oeb.guide['titlepage'].href)[0] + item = self.oeb.manifest.hrefs[key] if item is not None: self.oeb.spine.insert(0, item, True) if 'cover' not in self.oeb.guide.refs: diff --git a/ebook_converter/ebooks/oeb/transforms/flatcss.py b/ebook_converter/ebooks/oeb/transforms/flatcss.py index 3696e0a..6d29be3 100644 --- a/ebook_converter/ebooks/oeb/transforms/flatcss.py +++ b/ebook_converter/ebooks/oeb/transforms/flatcss.py @@ -1,26 +1,27 @@ """ CSS flattening transform. 
""" -import re, operator, math, numbers -from collections import defaultdict -from xml.dom import SyntaxErr +import collections +import math +import numbers +import operator +import re +from xml import dom from lxml import etree import css_parser -from css_parser.css import Property +from css_parser import css as cp_css +from ebook_converter import constants as const from ebook_converter import guess_type from ebook_converter.ebooks import unit_convert -from ebook_converter.ebooks.oeb.base import (XHTML, XHTML_NS, CSS_MIME, OEB_STYLES, - namespace, barename, XPath, css_text) +from ebook_converter.ebooks.oeb import base +from ebook_converter.ebooks.oeb import parse_utils + from ebook_converter.ebooks.oeb.stylizer import Stylizer from ebook_converter.utils.filenames import ascii_filename, ascii_text -from ebook_converter.utils.icu import numeric_sort_key -__license__ = 'GPL v3' -__copyright__ = '2008, Marshall T. Vandegrift ' - COLLAPSE = re.compile(r'[ \t\r\n\v]+') STRIPNUM = re.compile(r'[-0-9]+$') @@ -121,7 +122,7 @@ class EmbedFontsCSSRules(object): return None if not self.href: iid, href = oeb.manifest.generate('page_styles', 'page_styles.css') - rules = [css_text(x) for x in self.rules] + rules = [base.css_text(x) for x in self.rules] rules = '\n\n'.join(rules) sheet = css_parser.parseString(rules, validate=False) self.href = oeb.manifest.add(iid, href, guess_type(href)[0], @@ -186,7 +187,7 @@ class CSSFlattener(object): for item in oeb.manifest.values(): # Make all links to resources absolute, as these sheets will be # consolidated into a single stylesheet at the root of the document - if item.media_type in OEB_STYLES: + if item.media_type in base.OEB_STYLES: css_parser.replaceUrls(item.data, item.abshref, ignoreImportRules=True) @@ -273,7 +274,7 @@ class CSSFlattener(object): css = '' for item in self.items: html = item.data - body = html.find(XHTML('body')) + body = html.find(base.tag('xhtml', 'body')) if 'style' in html.attrib: b = body.attrib.get('style', 
'') body.set('style', html.get('style') + ';' + b) @@ -310,11 +311,11 @@ class CSSFlattener(object): sizes[csize] += len(COLLAPSE.sub(' ', child.tail)) def baseline_spine(self): - sizes = defaultdict(float) + sizes = collections.defaultdict(float) for item in self.items: html = item.data stylizer = self.stylizers[item] - body = html.find(XHTML('body')) + body = html.find(base.tag('xhtml', 'body')) fsize = self.context.source.fbase self.baseline_node(body, stylizer, sizes, fsize) try: @@ -351,9 +352,9 @@ class CSSFlattener(object): def flatten_node(self, node, stylizer, names, styles, pseudo_styles, psize, item_id, recurse=True): if not isinstance(node.tag, (str, bytes)) \ - or namespace(node.tag) != XHTML_NS: + or parse_utils.namespace(node.tag) != const.XHTML_NS: return - tag = barename(node.tag) + tag = parse_utils.barename(node.tag) style = stylizer.style(node) cssdict = style.cssdict() try: @@ -375,7 +376,7 @@ class CSSFlattener(object): if 'margin-left' not in cssdict and 'margin-right' not in cssdict: cssdict['margin-left'] = cssdict['margin-right'] = 'auto' else: - for table in node.iterchildren(XHTML("table")): + for table in node.iterchildren(base.tag('xhtml', "table")): ts = stylizer.style(table) if ts.get('margin-left') is None and ts.get('margin-right') is None: ts.set('margin-left', 'auto') @@ -391,11 +392,12 @@ class CSSFlattener(object): if cssdict.get('vertical-align') == 'inherit': cssdict['vertical-align'] = node.attrib['valign'] del node.attrib['valign'] - if node.tag == XHTML('font'): + if node.tag == base.tag('xhtml', 'font'): tags = ['descendant::h:%s'%x for x in ('p', 'div', 'table', 'h1', 'h2', 'h3', 'h4', 'h5', 'h6', 'ol', 'ul', 'dl', 'blockquote')] - tag = 'div' if XPath('|'.join(tags))(node) else 'span' - node.tag = XHTML(tag) + # TODO(gryf): this will override tag from line 355. On purpose? 
+ tag = 'div' if base.XPath('|'.join(tags))(node) else 'span' + node.tag = base.tag('xhtml', tag) if 'size' in node.attrib: def force_int(raw): return int(re.search(r'([0-9+-]+)', raw).group(1)) @@ -425,14 +427,14 @@ class CSSFlattener(object): del node.attrib['face'] if 'color' in node.attrib: try: - cssdict['color'] = Property('color', node.attrib['color']).value - except (ValueError, SyntaxErr): + cssdict['color'] = cp_css.Property('color', node.attrib['color']).value + except (ValueError, dom.SyntaxErr): pass del node.attrib['color'] if 'bgcolor' in node.attrib: try: - cssdict['background-color'] = Property('background-color', node.attrib['bgcolor']).value - except (ValueError, SyntaxErr): + cssdict['background-color'] = cp_css.Property('background-color', node.attrib['bgcolor']).value + except (ValueError, dom.SyntaxErr): pass del node.attrib['bgcolor'] if tag == 'ol' and 'type' in node.attrib: @@ -573,7 +575,7 @@ class CSSFlattener(object): def flatten_head(self, item, href, global_href): html = item.data - head = html.find(XHTML('head')) + head = html.find(base.tag('xhtml', 'head')) def safe_lower(x): try: @@ -583,39 +585,39 @@ class CSSFlattener(object): return x for node in html.xpath('//*[local-name()="style" or local-name()="link"]'): - if node.tag == XHTML('link') \ + if node.tag == base.tag('xhtml', 'link') \ and safe_lower(node.get('rel', 'stylesheet')) == 'stylesheet' \ - and safe_lower(node.get('type', CSS_MIME)) in OEB_STYLES: + and safe_lower(node.get('type', base.CSS_MIME)) in base.OEB_STYLES: node.getparent().remove(node) - elif node.tag == XHTML('style') \ - and node.get('type', CSS_MIME) in OEB_STYLES: + elif node.tag == base.tag('xhtml', 'style') \ + and node.get('type', base.CSS_MIME) in base.OEB_STYLES: node.getparent().remove(node) href = item.relhref(href) - l = etree.SubElement(head, XHTML('link'), - rel='stylesheet', type=CSS_MIME, href=href) + l = etree.SubElement(head, base.tag('xhtml', 'link'), + rel='stylesheet', type=base.CSS_MIME, 
href=href) l.tail='\n' if global_href: href = item.relhref(global_href) - l = etree.SubElement(head, XHTML('link'), - rel='stylesheet', type=CSS_MIME, href=href) + l = etree.SubElement(head, base.tag('xhtml', 'link'), + rel='stylesheet', type=base.CSS_MIME, href=href) l.tail = '\n' def replace_css(self, css): manifest = self.oeb.manifest for item in manifest.values(): - if item.media_type in OEB_STYLES: + if item.media_type in base.OEB_STYLES: manifest.remove(item) id, href = manifest.generate('css', 'stylesheet.css') sheet = css_parser.parseString(css, validate=False) if self.transform_css_rules: from ebook_converter.ebooks.css_transform_rules import transform_sheet transform_sheet(self.transform_css_rules, sheet) - item = manifest.add(id, href, CSS_MIME, data=sheet) + item = manifest.add(id, href, base.CSS_MIME, data=sheet) self.oeb.manifest.main_stylesheet = item return href def collect_global_css(self): - global_css = defaultdict(list) + global_css = collections.defaultdict(list) for item in self.items: stylizer = self.stylizers[item] if float(self.context.margin_top) >= 0: @@ -627,7 +629,7 @@ class CSSFlattener(object): items = sorted(stylizer.page_rule.items()) css = ';\n'.join("%s: %s" % (key, val) for key, val in items) css = ('@page {\n%s\n}\n'%css) if items else '' - rules = [css_text(r) for r in stylizer.font_face_rules + self.embed_font_rules] + rules = [base.css_text(r) for r in stylizer.font_face_rules + self.embed_font_rules] raw = '\n\n'.join(rules) css += '\n\n' + raw global_css[css].append(item) @@ -642,7 +644,7 @@ class CSSFlattener(object): if self.transform_css_rules: from ebook_converter.ebooks.css_transform_rules import transform_sheet transform_sheet(self.transform_css_rules, sheet) - manifest.add(id_, href, CSS_MIME, data=sheet) + manifest.add(id_, href, base.CSS_MIME, data=sheet) gc_map[css] = href ans = {} @@ -652,8 +654,8 @@ class CSSFlattener(object): return ans def flatten_spine(self): - names = defaultdict(int) - styles, pseudo_styles 
= {}, defaultdict(dict) + names = collections.defaultdict(int) + styles, pseudo_styles = {}, collections.defaultdict(dict) for item in self.items: html = item.data stylizer = self.stylizers[item] @@ -661,7 +663,7 @@ class CSSFlattener(object): self.specializer(item, stylizer) fsize = self.context.dest.fbase self.flatten_node(html, stylizer, names, styles, pseudo_styles, fsize, item.id, recurse=False) - self.flatten_node(html.find(XHTML('body')), stylizer, names, styles, pseudo_styles, fsize, item.id) + self.flatten_node(html.find(base.tag('xhtml', 'body')), stylizer, names, styles, pseudo_styles, fsize, item.id) items = sorted(((key, val) for (val, key) in styles.items())) # :hover must come after link and :active must come after :hover psels = sorted(pseudo_styles, key=lambda x : diff --git a/ebook_converter/ebooks/oeb/transforms/htmltoc.py b/ebook_converter/ebooks/oeb/transforms/htmltoc.py index 8c555f6..1f65c56 100644 --- a/ebook_converter/ebooks/oeb/transforms/htmltoc.py +++ b/ebook_converter/ebooks/oeb/transforms/htmltoc.py @@ -1,46 +1,20 @@ """ HTML-TOC-adding transform. """ -from ebook_converter.ebooks.oeb.base import XML, XHTML, XHTML_NS -from ebook_converter.ebooks.oeb.base import XHTML_MIME, CSS_MIME -from ebook_converter.ebooks.oeb.base import element, XPath +from ebook_converter import constants as const +from ebook_converter.ebooks.oeb import base -__all__ = ['HTMLTOCAdder'] -__license__ = 'GPL v3' -__copyright__ = '2008, Marshall T. 
Vandegrift ' - DEFAULT_TITLE = 'Table of Contents' +STYLE_CSS = {'nested': '.calibre_toc_header {\n text-align: center;\n}\n' + '.calibre_toc_block {\n margin-left: 1.2em;\n text-indent: ' + '-1.2em;\n}\n.calibre_toc_block .calibre_toc_block {\n ' + 'margin-left: 2.4em;\n}\n.calibre_toc_block .calibre_toc_block ' + '.calibre_toc_block {\n margin-left: 3.6em;\n}\n', -STYLE_CSS = { - 'nested': """ -.calibre_toc_header { - text-align: center; -} -.calibre_toc_block { - margin-left: 1.2em; - text-indent: -1.2em; -} -.calibre_toc_block .calibre_toc_block { - margin-left: 2.4em; -} -.calibre_toc_block .calibre_toc_block .calibre_toc_block { - margin-left: 3.6em; -} -""", - - 'centered': """ -.calibre_toc_header { - text-align: center; -} -.calibre_toc_block { - text-align: center; -} -body > .calibre_toc_block { - margin-top: 1.2em; -} -""" - } + 'centered': '.calibre_toc_header {\n text-align: center;\n}\n' + '.calibre_toc_block {\n text-align: center;\n}\nbody > ' + '.calibre_toc_block {\n margin-top: 1.2em;\n}\n'} class HTMLTOCAdder(object): @@ -71,7 +45,7 @@ class HTMLTOCAdder(object): if href in oeb.manifest.hrefs: item = oeb.manifest.hrefs[href] if (hasattr(item.data, 'xpath') and - XPath('//h:a[@href]')(item.data)): + base.XPath('//h:a[@href]')(item.data)): if oeb.spine.index(item) < 0: if self.position == 'end': oeb.spine.add(item, linear=False) @@ -91,23 +65,24 @@ class HTMLTOCAdder(object): oeb.logger.error('Unknown TOC style %r' % style) style = 'nested' id, css_href = oeb.manifest.generate('tocstyle', 'tocstyle.css') - oeb.manifest.add(id, css_href, CSS_MIME, data=STYLE_CSS[style]) + oeb.manifest.add(id, css_href, base.CSS_MIME, data=STYLE_CSS[style]) language = str(oeb.metadata.language[0]) - contents = element(None, XHTML('html'), nsmap={None: XHTML_NS}, - attrib={XML('lang'): language}) - head = element(contents, XHTML('head')) - htitle = element(head, XHTML('title')) + contents = base.element(None, base.tag('xhtml', 'html'), + nsmap={None: 
const.XHTML_NS}, + attrib={base.tag('xml', 'lang'): language}) + head = base.element(contents, base.tag('xhtml', 'head')) + htitle = base.element(head, base.tag('xhtml', 'title')) htitle.text = title - element(head, XHTML('link'), rel='stylesheet', type=CSS_MIME, - href=css_href) - body = element(contents, XHTML('body'), - attrib={'class': 'calibre_toc'}) - h1 = element(body, XHTML('h2'), - attrib={'class': 'calibre_toc_header'}) + base.element(head, base.tag('xhtml', 'link'), rel='stylesheet', + type=base.CSS_MIME, href=css_href) + body = base.element(contents, base.tag('xhtml', 'body'), + attrib={'class': 'calibre_toc'}) + h1 = base.element(body, base.tag('xhtml', 'h2'), + attrib={'class': 'calibre_toc_header'}) h1.text = title self.add_toc_level(body, oeb.toc) id, href = oeb.manifest.generate('contents', 'contents.xhtml') - item = oeb.manifest.add(id, href, XHTML_MIME, data=contents) + item = oeb.manifest.add(id, href, base.XHTML_MIME, data=contents) if self.position == 'end': oeb.spine.add(item, linear=False) else: @@ -116,10 +91,10 @@ class HTMLTOCAdder(object): def add_toc_level(self, elem, toc): for node in toc: - block = element(elem, XHTML('div'), - attrib={'class': 'calibre_toc_block'}) - line = element(block, XHTML('a'), - attrib={'href': node.href, - 'class': 'calibre_toc_line'}) + block = base.element(elem, base.tag('xhtml', 'div'), + attrib={'class': 'calibre_toc_block'}) + line = base.element(block, base.tag('xhtml', 'a'), + attrib={'href': node.href, + 'class': 'calibre_toc_line'}) line.text = node.title self.add_toc_level(block, node) diff --git a/ebook_converter/ebooks/oeb/transforms/jacket.py b/ebook_converter/ebooks/oeb/transforms/jacket.py index 0d1a88b..61a0dbf 100644 --- a/ebook_converter/ebooks/oeb/transforms/jacket.py +++ b/ebook_converter/ebooks/oeb/transforms/jacket.py @@ -4,9 +4,10 @@ from string import Formatter import pkg_resources import urllib.parse +from ebook_converter import constants as const from ebook_converter import 
guess_type, strftime from ebook_converter.constants_old import iswindows -from ebook_converter.ebooks.oeb.base import XPath, XHTML_NS, XHTML, xml2text, urlnormalize +from ebook_converter.ebooks.oeb.base import XPath, xml2text, urlnormalize from ebook_converter.library.comments import comments_to_html, markdown from ebook_converter.utils.date import is_date_undefined, as_local_time from ebook_converter.ebooks.chardet import strip_encoding_declarations @@ -303,7 +304,7 @@ def render_jacket(mi, output_profile, 'tags_label': 'Tags', 'title': title, 'title_str': title_str, - 'xmlns': XHTML_NS} + 'xmlns': const.XHTML_NS} for key in mi.custom_field_keys(): m = mi.get_user_metadata(key, False) or {} @@ -370,7 +371,7 @@ def render_jacket(mi, output_profile, # We cannot use data-calibre-rescale 100 on the body tag as that will just # give the body tag a font size of 1em, which is useless. for body in root.xpath('//*[local-name()="body"]'): - fw = body.makeelement(XHTML('div')) + fw = body.makeelement(const.XHTML_DIV) fw.set('data-calibre-rescale', '100') for child in body: fw.append(child) @@ -387,9 +388,9 @@ def linearize_jacket(oeb): for x in oeb.spine[:4]: if XPath(JACKET_XPATH)(x.data): for e in XPath('//h:table|//h:tr|//h:th')(x.data): - e.tag = XHTML('div') + e.tag = const.XHTML_DIV for e in XPath('//h:td')(x.data): - e.tag = XHTML('span') + e.tag = const.XHTML_SPAN break diff --git a/ebook_converter/ebooks/oeb/transforms/manglecase.py b/ebook_converter/ebooks/oeb/transforms/manglecase.py index 67b6493..2edf957 100644 --- a/ebook_converter/ebooks/oeb/transforms/manglecase.py +++ b/ebook_converter/ebooks/oeb/transforms/manglecase.py @@ -5,9 +5,9 @@ import string from lxml import etree -from ebook_converter.ebooks.oeb.base import XHTML, XHTML_NS -from ebook_converter.ebooks.oeb.base import CSS_MIME -from ebook_converter.ebooks.oeb.base import namespace +from ebook_converter import constants as const +from ebook_converter.ebooks.oeb import base +from 
ebook_converter.ebooks.oeb import parse_utils from ebook_converter.ebooks.oeb.stylizer import Stylizer @@ -43,15 +43,16 @@ class CaseMangler(object): def mangle_spine(self): id, href = self.oeb.manifest.generate('manglecase', 'manglecase.css') - self.oeb.manifest.add(id, href, CSS_MIME, data=CASE_MANGLER_CSS) + self.oeb.manifest.add(id, href, base.CSS_MIME, data=CASE_MANGLER_CSS) for item in self.oeb.spine: html = item.data relhref = item.relhref(href) - etree.SubElement(html.find(XHTML('head')), XHTML('link'), - rel='stylesheet', href=relhref, type=CSS_MIME) + etree.SubElement(html.find(base.tag('xhtml', 'head')), + base.tag('xhtml', 'link'), rel='stylesheet', + href=relhref, type=base.CSS_MIME) stylizer = Stylizer(html, item.href, self.oeb, self.opts, self.profile) - self.mangle_elem(html.find(XHTML('body')), stylizer) + self.mangle_elem(html.find(base.tag('xhtml', 'body')), stylizer) def text_transform(self, transform, text): if transform == 'capitalize': @@ -85,7 +86,8 @@ class CaseMangler(object): else: last.tail = text else: - child = elem.makeelement(XHTML('span'), attrib=attrib) + child = elem.makeelement(base.tag('xhtml', 'span'), + attrib=attrib) child.text = text.upper() if last is None: elem.insert(0, child) @@ -99,7 +101,7 @@ class CaseMangler(object): def mangle_elem(self, elem, stylizer): if not isinstance(elem.tag, (str, bytes)) or \ - namespace(elem.tag) != XHTML_NS: + parse_utils.namespace(elem.tag) != const.XHTML_NS: return children = list(elem) style = stylizer.style(elem) diff --git a/ebook_converter/ebooks/oeb/transforms/metadata.py b/ebook_converter/ebooks/oeb/transforms/metadata.py index c08a840..be550b6 100644 --- a/ebook_converter/ebooks/oeb/transforms/metadata.py +++ b/ebook_converter/ebooks/oeb/transforms/metadata.py @@ -1,15 +1,12 @@ -import os, re +import os +import re + +from ebook_converter.ebooks.oeb import base from ebook_converter.utils.date import isoformat, now from ebook_converter import guess_type -__license__ = 'GPL v3' 
-__copyright__ = '2009, Kovid Goyal ' -__docformat__ = 'restructuredtext en' - - def meta_info_to_oeb_metadata(mi, m, log, override_input_metadata=False): - from ebook_converter.ebooks.oeb.base import OPF if not mi.is_null('title'): m.clear('title') m.add('title', mi.title) @@ -19,17 +16,17 @@ def meta_info_to_oeb_metadata(mi, m, log, override_input_metadata=False): m.clear('title_sort') m.add('title_sort', mi.title_sort) if not mi.is_null('authors'): - m.filter('creator', lambda x : x.role.lower() in ['aut', '']) + m.filter('creator', lambda x: x.role.lower() in ['aut', '']) for a in mi.authors: - attrib = {'role':'aut'} + attrib = {'role': 'aut'} if mi.author_sort: - attrib[OPF('file-as')] = mi.author_sort + attrib[base.tag('opf', 'file-as')] = mi.author_sort m.add('creator', a, attrib=attrib) if not mi.is_null('book_producer'): - m.filter('contributor', lambda x : x.role.lower() == 'bkp') + m.filter('contributor', lambda x: x.role.lower() == 'bkp') m.add('contributor', mi.book_producer, role='bkp') elif override_input_metadata: - m.filter('contributor', lambda x : x.role.lower() == 'bkp') + m.filter('contributor', lambda x: x.role.lower() == 'bkp') if not mi.is_null('comments'): m.clear('description') m.add('description', mi.comments) @@ -71,7 +68,7 @@ def meta_info_to_oeb_metadata(mi, m, log, override_input_metadata=False): m.clear('series_index') if not mi.is_null('rating'): m.clear('rating') - m.add('rating', '%.2f'%mi.rating) + m.add('rating', '%.2f' % mi.rating) elif override_input_metadata: m.clear('rating') if not mi.is_null('tags'): @@ -101,23 +98,25 @@ class MergeMetadata(object): 'Merge in user metadata, including cover' def __call__(self, oeb, mi, opts, override_input_metadata=False): + _oim = override_input_metadata self.oeb, self.log = oeb, oeb.log m = self.oeb.metadata self.log('Merging user specified metadata...') meta_info_to_oeb_metadata(mi, m, oeb.log, - override_input_metadata=override_input_metadata) + override_input_metadata=_oim) cover_id = 
self.set_cover(mi, opts.prefer_metadata_cover) m.clear('cover') if cover_id is not None: m.add('cover', cover_id) if mi.uuid is not None: - m.filter('identifier', lambda x:x.id=='uuid_id') + m.filter('identifier', lambda x: x.id == 'uuid_id') self.oeb.metadata.add('identifier', mi.uuid, id='uuid_id', scheme='uuid') self.oeb.uid = self.oeb.metadata.identifier[-1] if mi.application_id is not None: - m.filter('identifier', lambda x:x.scheme=='calibre') - self.oeb.metadata.add('identifier', mi.application_id, scheme='calibre') + m.filter('identifier', lambda x: x.scheme == 'calibre') + self.oeb.metadata.add('identifier', mi.application_id, + scheme='calibre') def set_cover(self, mi, prefer_metadata_cover): cdata, ext = b'', 'jpg' @@ -138,7 +137,8 @@ class MergeMetadata(object): if cdata: self.oeb.guide.remove('cover') self.oeb.guide.remove('titlepage') - elif self.oeb.plumber_output_format in {'mobi', 'azw3'} and old_cover is not None: + elif (self.oeb.plumber_output_format in {'mobi', 'azw3'} and + old_cover is not None): # The amazon formats dont support html cover pages, so remove them # even if no cover was specified. 
self.oeb.guide.remove('titlepage') @@ -156,7 +156,9 @@ class MergeMetadata(object): new_cover_item = None if cdata: id, href = self.oeb.manifest.generate('cover', 'cover.'+ext) - new_cover_item = self.oeb.manifest.add(id, href, guess_type('cover.'+ext)[0], data=cdata) + new_cover_item = self.oeb.manifest.add(id, href, + guess_type('cover.'+ext)[0], + data=cdata) self.oeb.guide.add('cover', 'Cover', href) if do_remove_old_cover: self.remove_old_cover(item, new_cover_item.href) @@ -186,7 +188,8 @@ class MergeMetadata(object): if href == cover_item.href: if new_cover_href is not None: replacement_href = item.relhref(new_cover_href) - attr = 'src' if img.tag.endswith('img') else XLINK('href') + attr = ('src' if img.tag.endswith('img') + else XLINK('href')) img.set(attr, replacement_href) else: p = img.getparent() @@ -202,13 +205,14 @@ class MergeMetadata(object): for item in affected_items: body = XPath('//h:body')(item.data) if body: - text = etree.tostring(body[0], method='text', encoding='unicode') + text = etree.tostring(body[0], method='text', + encoding='unicode') else: text = '' text = re.sub(r'\s+', '', text) if not text and not XPath('//h:img|//svg:svg')(item.data): - self.log('Removing %s as it is a wrapper around' - ' the cover image'%item.href) + self.log('Removing %s as it is a wrapper around the cover ' + 'image' % item.href) self.oeb.spine.remove(item) self.oeb.manifest.remove(item) self.oeb.guide.remove_by_href(item.href) diff --git a/ebook_converter/ebooks/oeb/transforms/page_margin.py b/ebook_converter/ebooks/oeb/transforms/page_margin.py index 8c4e232..bfd81c3 100644 --- a/ebook_converter/ebooks/oeb/transforms/page_margin.py +++ b/ebook_converter/ebooks/oeb/transforms/page_margin.py @@ -1,7 +1,8 @@ import numbers from collections import Counter -from ebook_converter.ebooks.oeb.base import barename, XPath +from ebook_converter.ebooks.oeb import parse_utils +from ebook_converter.ebooks.oeb.base import XPath __license__ = 'GPL v3' @@ -142,7 +143,7 @@ 
class RemoveFakeMargins(object): for p in paras(body): level = level_of(p, body) - level = '%s_%d'%(barename(p.tag), level) + level = '%s_%d' % (parse_utils.barename(p.tag), level) if level not in self.levels: self.levels[level] = [] self.levels[level].append(p) diff --git a/ebook_converter/ebooks/oeb/transforms/rasterize.py b/ebook_converter/ebooks/oeb/transforms/rasterize.py index 074a255..df90c2d 100644 --- a/ebook_converter/ebooks/oeb/transforms/rasterize.py +++ b/ebook_converter/ebooks/oeb/transforms/rasterize.py @@ -5,10 +5,8 @@ import os import re import urllib.parse -# from PyQt5.Qt import ( - # Qt, QByteArray, QBuffer, QIODevice, QColor, QImage, QPainter, QSvgRenderer) - -from ebook_converter.ebooks.oeb.base import XHTML, XLINK +from ebook_converter import constants as const +from ebook_converter.ebooks.oeb import base from ebook_converter.ebooks.oeb.base import SVG_MIME, PNG_MIME from ebook_converter.ebooks.oeb.base import xml2str, xpath from ebook_converter.ebooks.oeb.base import urlnormalize @@ -17,10 +15,7 @@ from ebook_converter.ptempfile import PersistentTemporaryFile from ebook_converter.utils.imghdr import what -__license__ = 'GPL v3' -__copyright__ = '2008, Marshall T. 
Vandegrift ' - -IMAGE_TAGS = {XHTML('img'), XHTML('object')} +IMAGE_TAGS = {base.tag('xhtml', 'img'), base.tag('xhtml', 'object')} KEEP_ATTRS = {'class', 'style', 'width', 'height', 'align'} @@ -113,7 +108,7 @@ class SVGRasterizer(object): svg = item.data hrefs = self.oeb.manifest.hrefs for elem in xpath(svg, '//svg:*[@xl:href]'): - href = urlnormalize(elem.attrib[XLINK('href')]) + href = urlnormalize(elem.attrib[base.tag('xlink', 'href')]) path = urllib.parse.urldefrag(href)[0] if not path: continue @@ -126,7 +121,7 @@ class SVGRasterizer(object): with PersistentTemporaryFile(suffix='.'+ext) as pt: pt.write(data) self.temp_files.append(pt.name) - elem.attrib[XLINK('href')] = pt.name + elem.attrib[base.tag('xlink', 'href')] = pt.name return svg def stylizer(self, item): @@ -171,7 +166,7 @@ class SVGRasterizer(object): href = os.path.splitext(item.href)[0] + '.png' id, href = manifest.generate(item.id, href) manifest.add(id, href, PNG_MIME, data=data) - img = elem.makeelement(XHTML('img'), src=item.relhref(href)) + img = elem.makeelement(base.tag('xhtml', 'img'), src=item.relhref(href)) elem.getparent().replace(elem, img) for prop in ('width', 'height'): if prop in elem.attrib: @@ -208,7 +203,7 @@ class SVGRasterizer(object): id, href = manifest.generate(svgitem.id, href) manifest.add(id, href, PNG_MIME, data=data) self.images[key] = href - elem.tag = XHTML('img') + elem.tag = base.tag('xhtml', 'img') for attr in elem.attrib: if attr not in KEEP_ATTRS: del elem.attrib[attr] diff --git a/ebook_converter/ebooks/oeb/transforms/split.py b/ebook_converter/ebooks/oeb/transforms/split.py index 6cce60b..b20f32b 100644 --- a/ebook_converter/ebooks/oeb/transforms/split.py +++ b/ebook_converter/ebooks/oeb/transforms/split.py @@ -10,10 +10,11 @@ import urllib.parse from lxml.etree import XPath as _XPath from lxml import etree +from ebook_converter import constants as const from ebook_converter import as_unicode, force_unicode from ebook_converter.ebooks.epub import rules -from 
ebook_converter.ebooks.oeb.base import (OEB_STYLES, XPNSMAP as NAMESPACES, - rewrite_links, XHTML, urlnormalize) +from ebook_converter.ebooks.oeb.base import \ + OEB_STYLES, rewrite_links, urlnormalize from ebook_converter.ebooks.oeb.polish.split import do_split from ebook_converter.polyglot.urllib import unquote from ebook_converter.css_selectors import Select, SelectorError @@ -22,7 +23,7 @@ from ebook_converter.css_selectors import Select, SelectorError __license__ = 'GPL v3' __copyright__ = '2008, Kovid Goyal kovid@kovidgoyal.net' __docformat__ = 'restructuredtext en' -XPath = functools.partial(_XPath, namespaces=NAMESPACES) +XPath = functools.partial(_XPath, namespaces=const.XPNSMAP) SPLIT_POINT_ATTR = 'csp' @@ -104,7 +105,7 @@ class Split(object): select = Select(item.data) if not self.page_break_selectors: return [], [] - body = item.data.xpath('//h:body', namespaces=NAMESPACES) + body = item.data.xpath('//h:body', namespaces=const.XPNSMAP) if not body: return [], [] descendants = frozenset(body[0].iterdescendants('*')) @@ -268,13 +269,13 @@ class FlowSplitter(object): if body is not None: existing_ids = frozenset(body.xpath('//*/@id')) for x in ids - existing_ids: - body.insert(0, body.makeelement(XHTML('div'), id=x, style='height:0pt')) + body.insert(0, body.makeelement(const.XHTML_div, id=x, style='height:0pt')) ids = set() trees.append(tree) self.trees = trees def get_body(self, root): - body = root.xpath('//h:body', namespaces=NAMESPACES) + body = root.xpath('//h:body', namespaces=const.XPNSMAP) if not body: return None return body[0] @@ -296,7 +297,7 @@ class FlowSplitter(object): etree.tostring(body, method='text', encoding='unicode')) if len(txt) > 1: return False - for img in root.xpath('//h:img', namespaces=NAMESPACES): + for img in root.xpath('//h:img', namespaces=const.XPNSMAP): if img.get('style', '') != 'display:none': return False if root.xpath('//*[local-name() = "svg"]'): @@ -401,7 +402,7 @@ class FlowSplitter(object): '//h:br', '//h:li', ): 
- elems = root.xpath(path, namespaces=NAMESPACES) + elems = root.xpath(path, namespaces=const.XPNSMAP) elem = pick_elem(elems) if elem is not None: try: @@ -436,7 +437,7 @@ class FlowSplitter(object): spine_pos = self.item.spine_position for current, tree in zip(*map(reversed, (self.files, self.trees))): - for a in tree.getroot().xpath('//h:a[@href]', namespaces=NAMESPACES): + for a in tree.getroot().xpath('//h:a[@href]', namespaces=const.XPNSMAP): href = a.get('href').strip() if href.startswith('#'): anchor = href[1:] diff --git a/ebook_converter/ebooks/oeb/transforms/structure.py b/ebook_converter/ebooks/oeb/transforms/structure.py index d3049f2..9b042fd 100644 --- a/ebook_converter/ebooks/oeb/transforms/structure.py +++ b/ebook_converter/ebooks/oeb/transforms/structure.py @@ -1,22 +1,19 @@ +import collections import re -import uuid import urllib.parse +import uuid from lxml import etree -from collections import OrderedDict, Counter -from ebook_converter.ebooks.oeb.base import XPNSMAP, TOC, XHTML, xml2text, barename +from ebook_converter import constants as const +from ebook_converter.ebooks.oeb import parse_utils +from ebook_converter.ebooks.oeb.base import TOC, xml2text from ebook_converter.ebooks import ConversionError -__license__ = 'GPL v3' -__copyright__ = '2009, Kovid Goyal ' -__docformat__ = 'restructuredtext en' - - def XPath(x): try: - return etree.XPath(x, namespaces=XPNSMAP) + return etree.XPath(x, namespaces=const.XPNSMAP) except etree.XPathSyntaxError: raise ConversionError( 'The syntax of the XPath expression %s is invalid.' 
% repr(x)) @@ -84,7 +81,7 @@ class DetectStructure(object): try: prev = next(elem.itersiblings(tag=etree.Element, preceding=True)) - if (barename(elem.tag) in {'h1', 'h2'} and barename( + if (parse_utils.barename(elem.tag) in {'h1', 'h2'} and parse_utils.barename( prev.tag) in {'h1', 'h2'} and (not prev.tail or not prev.tail.split())): # We have two adjacent headings, do not put a page @@ -165,7 +162,7 @@ class DetectStructure(object): chapter_mark = self.opts.chapter_mark page_break_before = 'display: block; page-break-before: always' page_break_after = 'display: block; page-break-after: always' - c = Counter() + c = collections.Counter() for item, elem in self.detected_chapters: c[item] += 1 text = xml2text(elem).strip() @@ -174,7 +171,7 @@ class DetectStructure(object): if chapter_mark == 'none': continue if chapter_mark == 'rule': - mark = elem.makeelement(XHTML('hr')) + mark = elem.makeelement(const.XHTML_HR) elif chapter_mark == 'pagebreak': if c[item] < 3 and at_start(elem): # For the first two elements in this item, check if they @@ -184,9 +181,9 @@ class DetectStructure(object): # feedbooks epubs match both a heading tag and its # containing div with the default chapter expression. 
continue - mark = elem.makeelement(XHTML('div'), style=page_break_after) + mark = elem.makeelement(const.XHTML_DIV, style=page_break_after) else: # chapter_mark == 'both': - mark = elem.makeelement(XHTML('hr'), style=page_break_before) + mark = elem.makeelement(const.XHTML_HR, style=page_break_before) try: elem.addprevious(mark) except TypeError: @@ -254,8 +251,8 @@ class DetectStructure(object): return text, href def add_leveled_toc_items(self): - added = OrderedDict() - added2 = OrderedDict() + added = collections.OrderedDict() + added2 = collections.OrderedDict() counter = 1 def find_matches(expr, doc): diff --git a/ebook_converter/ebooks/pdf/pdftohtml.py b/ebook_converter/ebooks/pdf/pdftohtml.py index d10cd82..554dc37 100644 --- a/ebook_converter/ebooks/pdf/pdftohtml.py +++ b/ebook_converter/ebooks/pdf/pdftohtml.py @@ -5,10 +5,10 @@ import shutil import subprocess import sys +from lxml import etree + from ebook_converter import CurrentDir, xml_replace_entities, prints -from ebook_converter.constants_old import ( - filesystem_encoding, isbsd, islinux, isosx, iswindows -) +from ebook_converter.constants_old import isbsd, islinux, isosx, iswindows from ebook_converter.ebooks import ConversionError, DRMError from ebook_converter.ebooks.chardet import xml_to_unicode from ebook_converter.ptempfile import PersistentTemporaryFile @@ -26,10 +26,13 @@ def popen(cmd, **kw): if isosx and hasattr(sys, 'frameworks_dir'): - base = os.path.join(os.path.dirname(sys.frameworks_dir), 'utils.app', 'Contents', 'MacOS') + base = os.path.join(os.path.dirname(sys.frameworks_dir), 'utils.app', + 'Contents', 'MacOS') PDFTOHTML = os.path.join(base, PDFTOHTML) if iswindows and hasattr(sys, 'frozen'): - base = sys.extensions_location if hasattr(sys, 'new_app_layout') else os.path.dirname(sys.executable) + base = os.path.dirname(sys.executable) + if hasattr(sys, 'new_app_layout'): + base = sys.extensions_location PDFTOHTML = os.path.join(base, 'pdftohtml.exe') if (islinux or isbsd) and 
getattr(sys, 'frozen', False): PDFTOHTML = os.path.join(sys.executables_location, 'bin', 'pdftohtml') @@ -55,7 +58,7 @@ def pdftohtml(output_dir, pdf_path, no_images, as_xml=False): exe = PDFTOHTML cmd = [exe, '-enc', 'UTF-8', '-noframes', '-p', '-nomerge', - '-nodrm', a(pdfsrc), a(index)] + '-nodrm', a(pdfsrc), a(index)] if isbsd: cmd.remove('-nodrm') @@ -67,7 +70,7 @@ def pdftohtml(output_dir, pdf_path, no_images, as_xml=False): logf = PersistentTemporaryFile('pdftohtml_log') try: p = popen(cmd, stderr=logf._fd, stdout=logf._fd, - stdin=subprocess.PIPE) + stdin=subprocess.PIPE) except OSError as err: if err.errno == errno.ENOENT: raise ConversionError('Could not find pdftohtml, check it is ' @@ -79,7 +82,8 @@ def pdftohtml(output_dir, pdf_path, no_images, as_xml=False): logf.close() out = open(logf.name, 'rb').read().decode('utf-8', 'replace').strip() if ret != 0: - raise ConversionError('pdftohtml failed with return code: %d\n%s' % (ret, out)) + raise ConversionError('pdftohtml failed with return code: ' + '%d\n%s' % (ret, out)) if out: prints("pdftohtml log:") prints(out) @@ -90,22 +94,27 @@ def pdftohtml(output_dir, pdf_path, no_images, as_xml=False): with open(index, 'r+b') as i: raw = i.read().decode('utf-8', 'replace') raw = flip_images(raw) - raw = raw.replace('\n \n = 0.20 output self closing
tags, this - # breaks the pdf heuristics regexps, so replace them + # versions of pdftohtml >= 0.20 output self closing
tags, + # this breaks the pdf heuristics regexps, so replace them raw = raw.replace('
', '
') - raw = re.sub(r' 2: - root = create_ncx(toc, (lambda x:x), 'pdftohtml', 'en', 'pdftohtml') + root = create_ncx(toc, (lambda x: x), 'pdftohtml', 'en', + 'pdftohtml') with open(os.path.join(output_dir, 'toc.ncx'), 'wb') as f: - f.write(etree.tostring(root, pretty_print=True, with_tail=False, encoding='utf-8', xml_declaration=True)) + f.write(etree.tostring(root, pretty_print=True, + with_tail=False, encoding='utf-8', + xml_declaration=True)) def flip_image(img, flip): - from ebook_converter.utils.img import flip_image, image_and_format_from_data, image_to_data + from ebook_converter.utils.img import image_to_data + from ebook_converter.utils.img import image_and_format_from_data + from ebook_converter.utils.img import flip_image with open(img, 'r+b') as f: img, fmt = image_and_format_from_data(f.read()) img = flip_image(img, horizontal='x' in flip, vertical='y' in flip) @@ -170,5 +183,5 @@ def flip_images(raw): if not os.path.exists(img): continue flip_image(img, flip) - raw = re.sub(r'\s*', '', raw, flags=re.I|re.DOTALL) + raw = re.sub(r'\s*', '', raw, flags=re.I | re.DOTALL) return raw diff --git a/ebook_converter/ebooks/txt/markdownml.py b/ebook_converter/ebooks/txt/markdownml.py index 1954179..0b862ee 100644 --- a/ebook_converter/ebooks/txt/markdownml.py +++ b/ebook_converter/ebooks/txt/markdownml.py @@ -5,8 +5,9 @@ import re from functools import partial +from ebook_converter import constants as const from ebook_converter.ebooks.htmlz.oeb2html import OEB2HTML -from ebook_converter.ebooks.oeb.base import XHTML, XHTML_NS, barename, namespace, rewrite_links +from ebook_converter.ebooks.oeb.base import XHTML, barename, namespace, rewrite_links from ebook_converter.ebooks.oeb.stylizer import Stylizer @@ -110,9 +111,9 @@ class MarkdownMLizer(OEB2HTML): # We can only processes tags. If there isn't a tag return any text. 
if not isinstance(elem.tag, (str, bytes)) \ - or namespace(elem.tag) != XHTML_NS: + or namespace(elem.tag) != const.XHTML_NS: p = elem.getparent() - if p is not None and isinstance(p.tag, (str, bytes)) and namespace(p.tag) == XHTML_NS \ + if p is not None and isinstance(p.tag, (str, bytes)) and namespace(p.tag) == const.XHTML_NS \ and elem.tail: return [elem.tail] return [''] diff --git a/ebook_converter/ebooks/txt/textileml.py b/ebook_converter/ebooks/txt/textileml.py index 54e90d3..7b6f626 100644 --- a/ebook_converter/ebooks/txt/textileml.py +++ b/ebook_converter/ebooks/txt/textileml.py @@ -5,8 +5,10 @@ import re from functools import partial +from ebook_converter import constants as const from ebook_converter.ebooks.htmlz.oeb2html import OEB2HTML -from ebook_converter.ebooks.oeb.base import XHTML, XHTML_NS, barename, namespace, rewrite_links +from ebook_converter.ebooks.oeb.base import XHTML, barename, namespace, \ + rewrite_links from ebook_converter.ebooks.oeb.stylizer import Stylizer from ebook_converter.ebooks import unit_convert from ebook_converter.ebooks.textile.unsmarten import unsmarten @@ -225,9 +227,9 @@ class TextileMLizer(OEB2HTML): # We can only processes tags. If there isn't a tag return any text. 
if not isinstance(elem.tag, (str, bytes)) \ - or namespace(elem.tag) != XHTML_NS: + or namespace(elem.tag) != const.XHTML_NS: p = elem.getparent() - if p is not None and isinstance(p.tag, (str, bytes)) and namespace(p.tag) == XHTML_NS \ + if p is not None and isinstance(p.tag, (str, bytes)) and namespace(p.tag) == const.XHTML_NS \ and elem.tail: return [elem.tail] return [''] diff --git a/ebook_converter/ebooks/txt/txtml.py b/ebook_converter/ebooks/txt/txtml.py index 206b5a6..9b17a11 100644 --- a/ebook_converter/ebooks/txt/txtml.py +++ b/ebook_converter/ebooks/txt/txtml.py @@ -5,10 +5,11 @@ import re from lxml import etree +from ebook_converter import constants as const +from ebook_converter.ebooks.oeb import base +from ebook_converter.ebooks.oeb import parse_utils +from ebook_converter.ebooks.oeb.stylizer import Stylizer -__license__ = 'GPL 3' -__copyright__ = '2009, John Schember ' -__docformat__ = 'restructuredtext en' BLOCK_TAGS = [ 'div', @@ -60,9 +61,6 @@ class TXTMLizer(object): return self.mlize_spine() def mlize_spine(self): - from ebook_converter.ebooks.oeb.base import XHTML - from ebook_converter.ebooks.oeb.stylizer import Stylizer - from ebook_converter.utils.xml_parse import safe_xml_fromstring output = [u''] output.append(self.get_toc()) for item in self.oeb_book.spine: @@ -72,9 +70,11 @@ class TXTMLizer(object): x.text = x.text.replace('--', '__') content = etree.tostring(item.data, encoding='unicode') content = self.remove_newlines(content) - content = safe_xml_fromstring(content) - stylizer = Stylizer(content, item.href, self.oeb_book, self.opts, self.opts.output_profile) - output += self.dump_text(content.find(XHTML('body')), stylizer, item) + content = etree.fromstring(content) + stylizer = Stylizer(content, item.href, self.oeb_book, self.opts, + self.opts.output_profile) + output += self.dump_text(content.find(base.tag('xhtml', 'body')), + stylizer, item) output += '\n\n\n\n\n\n' output = ''.join(output) output = '\n'.join(l.rstrip() for l in 
output.splitlines()) @@ -130,8 +130,12 @@ class TXTMLizer(object): text = re.sub('\n[ ]+\n', '\n\n', text) if self.opts.remove_paragraph_spacing: text = re.sub('\n{2,}', '\n', text) - text = re.sub(r'(?msu)^(?P[^\t\n]+?)$', lambda mo: u'%s\n\n' % mo.group('t'), text) - text = re.sub(r'(?msu)(?P[^\n])\n+(?P[^\t\n]+?)(?=\n)', lambda mo: '%s\n\n\n\n\n\n%s' % (mo.group('b'), mo.group('t')), text) + text = re.sub(r'(?msu)^(?P[^\t\n]+?)$', lambda mo: u'%s\n\n' % + mo.group('t'), text) + text = re.sub(r'(?msu)(?P[^\n])\n+(?P[^\t\n]+?)(?=\n)', + lambda mo: '%s\n\n\n\n\n\n%s' % (mo.group('b'), + mo.group('t')), + text) else: text = re.sub('\n{7,}', '\n\n\n\n\n\n', text) @@ -146,7 +150,8 @@ class TXTMLizer(object): if self.opts.max_line_length: max_length = self.opts.max_line_length - if self.opts.max_line_length < 25 and not self.opts.force_max_line_length: + if (self.opts.max_line_length < 25 and not + self.opts.force_max_line_length): max_length = 25 short_lines = [] lines = text.splitlines() @@ -186,13 +191,13 @@ class TXTMLizer(object): @stylizer: The style information attached to the element. @page: OEB page used to determine absolute urls. ''' - from ebook_converter.ebooks.oeb.base import XHTML_NS, barename, namespace if not isinstance(elem.tag, (str, bytes)) \ - or namespace(elem.tag) != XHTML_NS: + or parse_utils.namespace(elem.tag) != const.XHTML_NS: p = elem.getparent() - if p is not None and isinstance(p.tag, (str, bytes)) and namespace(p.tag) == XHTML_NS \ - and elem.tail: + if (p is not None and isinstance(p.tag, (str, bytes)) and + parse_utils.namespace(p.tag) == const.XHTML_NS and + elem.tail): return [elem.tail] return [''] @@ -205,14 +210,15 @@ class TXTMLizer(object): return [elem.tail] return [''] - tag = barename(elem.tag) + tag = parse_utils.barename(elem.tag) tag_id = elem.attrib.get('id', None) in_block = False in_heading = False # Are we in a heading? # This can either be a heading tag or a TOC item. 
- if tag in HEADING_TAGS or '%s#%s' % (page.href, tag_id) in self.toc_ids: + if tag in HEADING_TAGS or '%s#%s' % (page.href, + tag_id) in self.toc_ids: in_heading = True if not self.last_was_heading: text.append('\n\n\n\n\n\n') @@ -234,7 +240,7 @@ class TXTMLizer(object): ems = int(round((float(style.marginTop) / style.fontSize) - 1)) if ems >= 1: text.append('\n' * ems) - except: + except Exception: pass # Process tags that contain text. diff --git a/ebook_converter/startup.py b/ebook_converter/startup.py index bfa6ce8..fbfb960 100644 --- a/ebook_converter/startup.py +++ b/ebook_converter/startup.py @@ -10,7 +10,7 @@ import builtins import locale import sys -from ebook_converter import constants +from ebook_converter import constants_old # For backwards compat with some third party plugins builtins.__dict__['dynamic_property'] = lambda func: func(None) @@ -41,8 +41,8 @@ if not _run_once: # # Platform specific modules - if constants.iswindows: - winutil, winutilerror = constants.plugins['winutil'] + if constants_old.iswindows: + winutil, winutilerror = constants_old.plugins['winutil'] if not winutil: raise RuntimeError('Failed to load the winutil plugin: %s'%winutilerror) if len(sys.argv) > 1 and not isinstance(sys.argv[1], str): @@ -57,8 +57,8 @@ if not _run_once: # # Convert command line arguments to unicode - enc = constants.preferred_encoding - if constants.isosx: + enc = constants_old.preferred_encoding + if constants_old.isosx: enc = 'utf-8' for i in range(1, len(sys.argv)): if not isinstance(sys.argv[i], str): @@ -66,7 +66,7 @@ if not _run_once: # # Ensure that the max number of open files is at least 1024 - if constants.iswindows: + if constants_old.iswindows: # See https://msdn.microsoft.com/en-us/library/6e3b887c.aspx if hasattr(winutil, 'setmaxstdio'): winutil.setmaxstdio(max(1024, winutil.getmaxstdio())) @@ -77,7 +77,7 @@ if not _run_once: try: resource.setrlimit(resource.RLIMIT_NOFILE, (min(1024, hard), hard)) except Exception: - if constants.DEBUG: + 
if constants_old.DEBUG: import traceback traceback.print_exc() @@ -122,7 +122,7 @@ if not _run_once: bound_signal.connect(slot, **kw) builtins.__dict__['connect_lambda'] = connect_lambda - if constants.islinux or constants.isosx or constants.isfreebsd: + if constants_old.islinux or constants_old.isosx or constants_old.isfreebsd: # Name all threads at the OS level created using the threading module, see # http://bugs.python.org/issue15500 import threading @@ -140,7 +140,7 @@ if not _run_once: if name: if isinstance(name, str): name = name.encode('ascii', 'replace').decode('ascii') - constants.plugins['speedup'][0].set_thread_name(name[:15]) + constants_old.plugins['speedup'][0].set_thread_name(name[:15]) except Exception: pass # Don't care about failure to set name threading.Thread.start = new_start @@ -152,7 +152,7 @@ def test_lopen(): n = 'f\xe4llen' print('testing open()') - if constants.iswindows: + if constants_old.iswindows: import msvcrt, win32api def assert_not_inheritable(f): diff --git a/ebook_converter/utils/xml_parse.py b/ebook_converter/utils/xml_parse.py index c83bd5a..2b9a8ef 100644 --- a/ebook_converter/utils/xml_parse.py +++ b/ebook_converter/utils/xml_parse.py @@ -1,3 +1,7 @@ +import os +import tempfile +import unittest + from lxml import etree @@ -24,7 +28,6 @@ def safe_xml_fromstring(string_or_bytes, recover=True): def find_tests(): - import unittest, tempfile, os class TestXMLParse(unittest.TestCase): @@ -37,9 +40,11 @@ def find_tests(): os.remove(self.temp_file) def test_safe_xml_fromstring(self): - templ = ''' ]>&e;''' + templ = ' ]>&e;' external = 'file:///' + self.temp_file.replace(os.sep, '/') - self.assertEqual(etree.fromstring(templ.format(id='SYSTEM', val=external)).text, 'external') + self.assertEqual(etree.fromstring(templ.format(id='SYSTEM', + val=external)).text, + 'external') for eid, val, expected in ( ('', 'normal entity', 'normal entity'), ('', external, external), @@ -50,7 +55,8 @@ def find_tests(): ('PUBLIC', external, None), 
('PUBLIC', 'http://example.com', None), ): - got = getattr(safe_xml_fromstring(templ.format(id=eid, val=val)), 'text', None) + got = getattr(etree.fromstring(templ.format(id=eid, val=val)), + 'text', None) self.assertEqual(got, expected) return unittest.defaultTestLoader.loadTestsFromTestCase(TestXMLParse) diff --git a/ebook_converter/utils/zipfile.py b/ebook_converter/utils/zipfile.py index d4dc785..b08d006 100644 --- a/ebook_converter/utils/zipfile.py +++ b/ebook_converter/utils/zipfile.py @@ -8,7 +8,7 @@ from contextlib import closing from tempfile import SpooledTemporaryFile from ebook_converter import sanitize_file_name -from ebook_converter.constants import filesystem_encoding +from ebook_converter.constants_old import filesystem_encoding from ebook_converter.ebooks.chardet import detect from ebook_converter.polyglot.builtins import as_bytes