Remove site: www.wuxiaworld.xyz - domain name parked somewhere questionable for 2+ years

Jim Miller 2025-11-30 10:58:18 -06:00
parent 5e644098f9
commit 9627e6e62c
4 changed files with 0 additions and 188 deletions

@@ -4537,11 +4537,3 @@ extracharacters:Wolverine,Rogue
website_encodings:Windows-1252,utf8
[www.wuxiaworld.xyz]
use_basic_cache:true
## Was wuxiaworld.co
## Note that wuxiaworld.co != wuxiaworld.com
## When dedup_order_chapter_list:true, use a heuristic algorithm
## specific to wuxiaworld.xyz to order and dedup the chapter list.
dedup_order_chapter_list:false
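
This was a per-site override, so even though it shipped disabled, a user could enable it from personal.ini in the usual FanFicFare override fashion -- a sketch, assuming the stock section name:

[www.wuxiaworld.xyz]
## hypothetical user override: heuristic sort + dedup of the chapter list
dedup_order_chapter_list:true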

@@ -118,7 +118,6 @@ from . import adapter_alternatehistorycom
from . import adapter_wattpadcom
from . import adapter_novelonlinefullcom
from . import adapter_wwwnovelallcom
from . import adapter_wuxiaworldxyz
from . import adapter_hentaifoundrycom
from . import adapter_mugglenetfanfictioncom
from . import adapter_swiorgru

@@ -1,171 +0,0 @@
# -*- coding: utf-8 -*-
# Copyright 2020 FanFicFare team
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
#
from __future__ import absolute_import
import logging
import re

# py2 vs py3 transition
from ..six.moves.urllib import parse as urlparse

from .base_adapter import BaseSiteAdapter, makeDate
from fanficfare.htmlcleanup import stripHTML
from .. import exceptions as exceptions

logger = logging.getLogger(__name__)

def getClass():
    return WuxiaWorldXyzSiteAdapter

class WuxiaWorldXyzSiteAdapter(BaseSiteAdapter):

    DATE_FORMAT = '%Y-%m-%d %H:%M'

    def __init__(self, config, url):
        BaseSiteAdapter.__init__(self, config, url)
        self.story.setMetadata('siteabbrev', 'wuxco')

        # get storyId from url--url validation guarantees query correct
        match = re.match(self.getSiteURLPattern(), url)
        if not match:
            raise exceptions.InvalidStoryURL(url, self.getSiteDomain(), self.getSiteExampleURLs())

        story_id = match.group('id')
        self.story.setMetadata('storyId', story_id)
        self._setURL('https://%s/%s/' % (self.getSiteDomain(), story_id))

    @staticmethod
    def getSiteDomain():
        return 'www.wuxiaworld.xyz'

    @classmethod
    def getAcceptDomains(cls):
        return ['www.wuxiaworld.xyz', 'm.wuxiaworld.xyz',
                'www.wuxiaworld.co', 'm.wuxiaworld.co']

    @classmethod
    def getConfigSections(cls):
        "Only needs to be overridden if the adapter has additional ini sections."
        return cls.getAcceptDomains()

    @classmethod
    def getSiteExampleURLs(cls):
        return 'https://%s/story-name' % cls.getSiteDomain()

    def getSiteURLPattern(self):
        return r'https?://(www|m)\.wuxiaworld\.(xyz|co)/(?P<id>[^/]+)(/)?'
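    ## For illustration (hypothetical URLs, not from the original
    ## source), the pattern accepts story pages such as:
    ##   https://www.wuxiaworld.xyz/some-story-slug/
    ##   http://m.wuxiaworld.co/some-story-slug
    ## capturing the slug as the 'id' group used for storyId above.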
    def extractChapterUrlsAndMetadata(self):
        logger.debug('URL: %s', self.url)
        data = self.get_request(self.url)
        soup = self.make_soup(data)

        self.setCoverImage(self.url, soup.select_one('img.cover')['src'])

        author = soup.select_one('div.info div span').get_text()
        self.story.setMetadata('title', soup.select_one('h3.title').get_text())
        self.story.setMetadata('author', author)
        self.story.setMetadata('authorId', author)
        ## site doesn't have authorUrl links.

        ## getting status
        status_label = soup.find('h3', string='Status:')
        status = stripHTML(status_label.nextSibling)
        if status == 'Completed':
            self.story.setMetadata('status', 'Completed')
        else:
            self.story.setMetadata('status', 'In-Progress')

        ### No dates given now?
        # chapter_info = soup.select_one('.chapter-wrapper')
        # date = makeDate(chapter_info.select_one('.update-time').get_text(), self.DATE_FORMAT)
        # if date:
        #     self.story.setMetadata('dateUpdated', date)

        intro = soup.select_one('div.desc-text')
        if intro.strong:
            intro.strong.decompose()
        self.setDescription(self.url, intro)

        def get_chapters(toc_soup):
            ## skip grayed out "In preparation" chapters -- couldn't make
            ## the :not() work in the same select.
            chapter_info = toc_soup.select_one('div#list-chapter')
            return [ ch for ch in chapter_info.select('li span ~ a')
                     if not (ch.has_attr('style') and 'color:Gray;' in ch['style']) ]
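        ## Assumed TOC markup, reconstructed from the selectors above
        ## (illustrative only):
        ##   <li><span>12</span> <a href="/story/chapter-12">Chapter 12 Foo</a></li>
        ##   <li><span>13</span> <a style="color:Gray;" href="#">Chapter 13 (In preparation)</a></li>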
        chapters = get_chapters(soup)
        next_toc_page_url = soup.select_one('li.next a')
        while next_toc_page_url:
            logger.debug("TOC list next page: %s" % next_toc_page_url['href'])
            toc_soup = self.make_soup(self.get_request('https://%s%s' % (self.getSiteDomain(), next_toc_page_url['href'])))
            chapters.extend(get_chapters(toc_soup))
            next_toc_page_url = toc_soup.select_one('li.next a')
        if self.getConfig("dedup_order_chapter_list", False):
            # Sort and deduplicate chapters (some stories are in
            # incorrect order and/or contain duplicates)
            chapters_data = []
            numbers_regex = re.compile(r'[^0-9\.]') # strip everything except digits and the decimal point
            for ch in chapters:
                chapter_title = stripHTML(ch)
                chapter_url = ch['href']
                if chapter_title.startswith('Chapter'):
                    target_number = chapter_title.split()[1]
                else:
                    target_number = chapter_title.split()[0]
                try:
                    number = float(re.sub(numbers_regex, '', target_number))
                except ValueError:
                    continue # Cannot parse chapter number
                chapters_data.append((number, chapter_title, chapter_url))
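            ## Worked example with hypothetical titles:
            ##   'Chapter 105: The Duel' -> split()[1] = '105:' -> '105' -> 105.0
            ##   '12.5 Interlude'        -> split()[0] = '12.5' -> 12.5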
            chapters_data.sort(key=lambda ch: ch[0])

            for index, chapter in enumerate(chapters_data):
                if index > 0:
                    # Skip chapters that repeat the previous chapter's
                    # name or number
                    if chapter[1] == chapters_data[index-1][1] or chapter[0] == chapters_data[index-1][0]:
                        continue
                title = chapter[1]
                url = urlparse.urljoin(self.url, chapter[2])
                self.add_chapter(title, url)
        else:
            ## normal operation
            for ch in chapters:
                self.add_chapter(stripHTML(ch), urlparse.urljoin(self.url, ch['href']))
    def getChapterText(self, url):
        logger.debug('Getting chapter text from: %s', url)
        data = self.get_request(url)
        soup = self.make_soup(data)

        content = soup.select_one('div#chapter-content')

        ## Remove the site's trailing report-an-error blurb:
        # <div align="left">
        #   If you find any errors ( broken links, non-standard content,
        #   etc.. ), Please let us know &lt; report chapter &gt; so we
        #   can fix it as soon as possible.
        # </div>
        report_div = content.select_one('div:last-child')
        if report_div and 'broken links, non-standard content, etc' in stripHTML(report_div):
            report_div.decompose()

        return self.utf8FromSoup(url, content)
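
The dedup heuristic is self-contained enough to demonstrate outside the adapter. A minimal standalone sketch of the same sort/skip logic (made-up titles and URLs; not part of the removed file):

import re

def dedup_order(titles_and_urls):
    numbers_regex = re.compile(r'[^0-9\.]')  # keep digits and '.'
    data = []
    for title, url in titles_and_urls:
        # 'Chapter N ...' -> token after 'Chapter'; otherwise first token
        target = title.split()[1] if title.startswith('Chapter') else title.split()[0]
        try:
            number = float(numbers_regex.sub('', target))
        except ValueError:
            continue  # cannot parse a chapter number
        data.append((number, title, url))
    data.sort(key=lambda ch: ch[0])  # stable sort by chapter number
    result = []
    for i, ch in enumerate(data):
        # skip entries repeating the previous name or number
        if i > 0 and (ch[1] == data[i-1][1] or ch[0] == data[i-1][0]):
            continue
        result.append(ch)
    return result

chapters = [('Chapter 2 Rivals', '/c2'), ('Chapter 1 Start', '/c1'),
            ('Chapter 2 Rivals', '/c2-dup'), ('Chapter 2.5 Interlude', '/c2.5')]
for number, title, url in dedup_order(chapters):
    print(number, title, url)
# 1.0 Chapter 1 Start /c1
# 2.0 Chapter 2 Rivals /c2
# 2.5 Chapter 2.5 Interlude /c2.5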

@@ -4510,11 +4510,3 @@ extracharacters:Wolverine,Rogue
website_encodings:Windows-1252,utf8
[www.wuxiaworld.xyz]
use_basic_cache:true
## Was wuxiaworld.co
## Note that wuxiaworld.co != wuxiaworld.com
## When dedup_order_chapter_list:true, use a heuristic algorithm
## specific to wuxiaworld.xyz to order and dedup the chapter list.
dedup_order_chapter_list:false