mirror of
git://github.com/kovidgoyal/calibre.git
synced 2026-05-05 04:13:47 +02:00
Update NYTimes
This commit is contained in:
parent
d025bc327d
commit
1af85ad42e
2 changed files with 8 additions and 0 deletions
|
|
@@ -240,6 +240,7 @@ def decode_url_date(self, url):
|
|||
dict(attrs={'class': lambda x: x and 'skip-to-text-link' in x.split()}),
|
||||
dict(attrs={'class': lambda x: x and 'sharetools' in x.split()}),
|
||||
dict(attrs={'class': lambda x: x and 'ad' in x.split()}),
|
||||
dict(attrs={'class': lambda x: x and 'visually-hidden' in x.split()}),
|
||||
dict(name='div', attrs={'class': re.compile('toolsList')}), # bits
|
||||
dict(name='div', attrs={
|
||||
'class': re.compile('postNavigation')}), # bits
|
||||
|
|
@@ -1061,6 +1062,9 @@ def postprocess_html(self, soup, first_fetch):
|
|||
aside.extract()
|
||||
soup = self.strip_anchors(soup, True)
|
||||
|
||||
for t in soup.findAll('time', attrs={'class':'dateline'}):
|
||||
t.name = 'div'
|
||||
|
||||
if soup.find('div', attrs={'id': 'blogcontent'}) is None:
|
||||
if first_fetch:
|
||||
aside = soup.find('div', 'aside')
|
||||
|
|
|
|||
|
|
@@ -240,6 +240,7 @@ def decode_url_date(self, url):
|
|||
dict(attrs={'class': lambda x: x and 'skip-to-text-link' in x.split()}),
|
||||
dict(attrs={'class': lambda x: x and 'sharetools' in x.split()}),
|
||||
dict(attrs={'class': lambda x: x and 'ad' in x.split()}),
|
||||
dict(attrs={'class': lambda x: x and 'visually-hidden' in x.split()}),
|
||||
dict(name='div', attrs={'class': re.compile('toolsList')}), # bits
|
||||
dict(name='div', attrs={
|
||||
'class': re.compile('postNavigation')}), # bits
|
||||
|
|
@@ -1069,6 +1070,9 @@ def postprocess_html(self, soup, first_fetch):
|
|||
aside.extract()
|
||||
soup = self.strip_anchors(soup, True)
|
||||
|
||||
for t in soup.findAll('time', attrs={'class':'dateline'}):
|
||||
t.name = 'div'
|
||||
|
||||
if soup.find('div', attrs={'id': 'blogcontent'}) is None:
|
||||
if first_fetch:
|
||||
aside = soup.find('div', 'aside')
|
||||
|
|
|
|||
Loading…
Reference in a new issue