From cfd073fb5c9406ef05179476bb20a6bd2c2d3ebc Mon Sep 17 00:00:00 2001 From: David Lynch Date: Thu, 6 Mar 2025 22:31:23 -0600 Subject: [PATCH] Fix an error in _soup if parsed content doesn't have a <head> --- sites/__init__.py | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/sites/__init__.py b/sites/__init__.py index 394bad5..933cb11 100644 --- a/sites/__init__.py +++ b/sites/__init__.py @@ -207,7 +207,7 @@ class Site: text = url fallback_base = '' soup = BeautifulSoup(text, method) - return soup, soup.head.base and soup.head.base.get('href') or fallback_base + return soup, (soup.head and soup.head.base) and soup.head.base.get('href') or fallback_base def _form_in_soup(self, soup): if soup.name == 'form': @@ -247,7 +247,7 @@ class Site: return data, form.attrs.get('action'), form.attrs.get('method', 'get').lower() def _new_tag(self, *args, **kw): - soup, nobase = self._soup('') + soup = BeautifulSoup("", self.options.get('parser')) return soup.new_tag(*args, **kw) def _join_url(self, *args, **kwargs):