mirror of
https://github.com/gryf/ebook-converter.git
synced 2026-02-17 06:35:45 +01:00
39 lines
947 B
Python
39 lines
947 B
Python
"""
|
|
Read meta information from TXT files
|
|
"""
|
|
import re, os
|
|
|
|
from ebook_converter.ebooks.metadata import MetaInformation
|
|
|
|
|
|
__license__ = 'GPL v3'
|
|
__copyright__ = '2009, John Schember <john@nachtimwald.com>'
|
|
|
|
|
|
def get_metadata(stream, extract_cover=True):
|
|
'''
|
|
Return metadata as a L{MetaInfo} object
|
|
'''
|
|
name = getattr(stream, 'name', '').rpartition('.')[0]
|
|
if name:
|
|
name = os.path.basename(name)
|
|
mi = MetaInformation(name or 'Unknown', ['Unknown'])
|
|
stream.seek(0)
|
|
|
|
mdata = ''
|
|
for x in range(0, 4):
|
|
line = stream.readline().decode('utf-8', 'replace')
|
|
if not line:
|
|
break
|
|
else:
|
|
mdata += line
|
|
|
|
mdata = mdata[:1024]
|
|
|
|
mo = re.search('(?u)^[ ]*(?P<title>.+)[ ]*(\n{3}|(\r\n){3}|\r{3})[ ]*(?P<author>.+)[ ]*(\n|\r\n|\r)$', mdata)
|
|
if mo is not None:
|
|
mi.title = mo.group('title')
|
|
mi.authors = mo.group('author').split(',')
|
|
|
|
return mi
|