Ignore bs4 XMLParsedAsHTMLWarning as per #894 from mcepl

2025-12-06 08:52:55 +01:00 · 2024-03-22 13:01:00 -05:00 · 2024-03-22 13:01:00 -05:00 · dbe6c6105c
commit dbe6c6105c
parent 04231eecfe
1 changed files with 5 additions and 2 deletions
--- a/fanficfare/epubutils.py
+++ b/fanficfare/epubutils.py
@@ -10,6 +10,7 @@ logger = logging.getLogger(__name__)

 import os
 import re
+import warnings
 from collections import defaultdict
 from zipfile import ZipFile, ZIP_STORED, ZIP_DEFLATED
 from xml.dom.minidom import parseString
@@ -460,8 +461,10 @@ def make_soup(data):

    ## soup and re-soup because BS4/html5lib is more forgiving of
    ## incorrectly nested tags that way.
-    soup = bs4.BeautifulSoup(data,'html5lib')
-    soup = bs4.BeautifulSoup(unicode(soup),'html5lib')
+    with warnings.catch_warnings():
+        warnings.simplefilter("ignore")
+        soup = bs4.BeautifulSoup(data,'html5lib')
+        soup = bs4.BeautifulSoup(unicode(soup),'html5lib')

    for ns in soup.find_all('fff_hide_noscript'):
        ns.name = 'noscript'