Major improvements to epub parser

This commit is contained in:
BasioMeusPuga
2018-03-10 15:56:04 +05:30
parent 51d00bb9b5
commit ed8f676a05
9 changed files with 117 additions and 60 deletions

View File

@@ -35,7 +35,10 @@ class ParseEPUB:
def read_book(self):
self.book_ref = EPUB(self.filename)
self.book_ref.read_epub()
contents_found = self.book_ref.read_epub()
if not contents_found:
print('Cannot process: ' + self.filename)
return
self.book = self.book_ref.book
def get_title(self):
@@ -45,19 +48,16 @@ class ParseEPUB:
return self.book['author']
def get_year(self):
return 9999
return self.book['year']
def get_cover_image(self):
try:
return self.book['cover']
except KeyError:
return None
return self.book['cover']
def get_isbn(self):
return self.book['isbn']
def get_tags(self):
return None
return self.book['tags']
def get_contents(self):
extract_path = os.path.join(self.temp_dir, self.file_md5)