From 1fe2e72b30e60e39b0bd63a3c802b5f09ff1c809 Mon Sep 17 00:00:00 2001
From: David Lynch <kemayo@gmail.com>
Date: Thu, 12 Oct 2017 17:40:26 -0500
Subject: [PATCH] Site handler for fiction.live

---
 sites/fictionlive.py | 84 ++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 84 insertions(+)
 create mode 100644 sites/fictionlive.py
diff --git a/sites/fictionlive.py b/sites/fictionlive.py
new file mode 100644
index 0000000..def19aa
--- /dev/null
+++ b/sites/fictionlive.py
@@ -0,0 +1,84 @@
+#!/usr/bin/python
+
+import itertools
+import datetime
+import re
+from . import register, Site, Section, Chapter
+
+
+@register
+class FictionLive(Site):
+    """fiction.live: stories are assembled chapter by chapter from the site's JSON API"""
+    @staticmethod
+    def matches(url):
+        """Return the story URL (trimmed to its id) if `url` is a fiction.live story, else None."""
+        # e.g. https://fiction.live/stories/Descendant-of-a-Demon-Lord/SBBA49fQavNQMWxFT
+        match = re.match(r'^(https?://fiction\.live/stories/[^\/]+/[0-9a-zA-Z]+)/?.*', url)
+        return match.group(1) if match else None
+
+    def extract(self, url):
+        """Pull the work id (the path component after the story slug) out of `url` and extract it."""
+        workid = re.match(r'^https?://fiction\.live/stories/[^\/]+/([0-9a-zA-Z]+)/?.*', url).group(1)
+        return self._extract_work(workid)
+
+    def _extract_work(self, workid):
+        """Fetch the story node for `workid` and return a Section holding one Chapter per bookmark."""
+        response = self.session.get('https://fiction.live/api/node/{}'.format(workid)).json()
+
+        story = Section(
+            title=response['t'],
+            author=response['u'][0]['n'],
+            url='https://fiction.live/stories/{}/{}'.format(response['t'].replace(' ', '-'), workid)
+        )
+
+        # There's a summary in `d` and `b`.
+
+        # Bracket the bookmarks with sentinel timestamps so every real chapter has a neighbour on each side
+        chapters = ({'ct': 0},) + tuple(c for c in response['bm'] if not c['title'].startswith('#special')) + ({'ct': 9999999999999999},)
+        for prevc, currc, nextc in contextiterate(chapters):
+            # Bookmark keys: `id`, `title`, `ct`, `isFirst`
+            # https://fiction.live/api/anonkun/chapters/SBBA49fQavNQMWxFT/0/1448245168594
+            # https://fiction.live/api/anonkun/chapters/SBBA49fQavNQMWxFT/1449266444062/1449615394752
+            # https://fiction.live/api/anonkun/chapters/SBBA49fQavNQMWxFT/1502823848216/9999999999999998
+            # i.e. format is [current timestamp] / [next timestamp - 1]
+            chapter_url = 'https://fiction.live/api/anonkun/chapters/{}/{}/{}'.format(workid, currc['ct'], nextc['ct'] - 1)
+            print("Extracting chapter from", chapter_url)
+            data = self.session.get(chapter_url).json()
+            html = []
+
+            updated = currc['ct']  # chapter date ends up as the newest `ct` seen in its segments
+            for segment in (d for d in data if not d.get('t', '').startswith('#special')):
+                updated = max(updated, segment['ct'])
+                if segment['nt'] == 'chapter':
+                    html.extend(('<div>', segment['b'].replace('<br>', '<br/>'), '</div>'))
+                elif segment['nt'] == 'choice':
+                    votes = {}
+                    for votechoices in segment['votes'].values():
+                        if isinstance(votechoices, int):  # a lone vote is a bare index, not a list of them
+                            votechoices = (votechoices,)
+                        for choice in votechoices:
+                            choice = segment['choices'][int(choice)]
+                            votes[choice] = votes.get(choice, 0) + 1
+                    choices = sorted(((count, text) for text, count in votes.items()), reverse=True)
+                    html.append('<hr/><ul>')
+                    for votecount, choice in choices:
+                        html.append('<li>{}: {}</li>'.format(choice, votecount))
+                    html.append('</ul><hr/>')
+
+            story.add(Chapter(
+                title=currc['title'],
+                contents='\n'.join(html),
+                date=datetime.datetime.fromtimestamp(updated / 1000.0)  # `ct` is divided down from milliseconds
+            ))
+
+        return story
+
+
+# Three-wide sliding window, adapted from the `pairwise` recipe in the itertools docs
+def contextiterate(iterable):
+    "s -> (s0,s1,s2), (s1,s2,s3), (s2,s3,s4), ..."
+    behind, here, ahead = itertools.tee(iterable, 3)
+    next(here, None)  # `here` runs one item in front of `behind`
+    for _ in range(2):  # `ahead` runs two items in front of `behind`
+        next(ahead, None)
+    return zip(behind, here, ahead)