forked from LiveCarta/BookConverter
epub converter: change to html.parser
This commit is contained in:
@@ -90,7 +90,8 @@ class EpubPostprocessor:
|
|||||||
nodes = dict()
|
nodes = dict()
|
||||||
for item in self.ebooklib_book.get_items_of_type(ebooklib.ITEM_DOCUMENT):
|
for item in self.ebooklib_book.get_items_of_type(ebooklib.ITEM_DOCUMENT):
|
||||||
html_body_text = item.get_body_content()
|
html_body_text = item.get_body_content()
|
||||||
soup = BeautifulSoup(html_body_text, features='lxml')
|
# html.parser closes tags if needed
|
||||||
|
soup = BeautifulSoup(html_body_text, features='html.parser')
|
||||||
nodes[item.file_name] = soup
|
nodes[item.file_name] = soup
|
||||||
|
|
||||||
return nodes
|
return nodes
|
||||||
|
|||||||
Reference in New Issue
Block a user