From c0459faa4398e77211507d6a92b4696ef9555b0a Mon Sep 17 00:00:00 2001
From: sigizmund <sigizmund@gmail.com>
Date: Tue, 15 Dec 2009 15:23:48 +0000
Subject: [PATCH 01/94] added

---
 BeautifulSoup.py | 1711 ++++++++++++++++++++++++++++++++++++++++++++++
 constants.py     |  135 ++++
 downaloder.py    |   74 ++
 ffa.py           |  187 +++++
 fictionalley.py  |   75 ++
 ficwad.py        |   97 +++
 output.py        |  136 ++++
 7 files changed, 2415 insertions(+)
 create mode 100644 BeautifulSoup.py
 create mode 100644 constants.py
 create mode 100644 downaloder.py
 create mode 100644 ffa.py
 create mode 100644 fictionalley.py
 create mode 100644 ficwad.py
 create mode 100644 output.py

diff --git a/BeautifulSoup.py b/BeautifulSoup.py
new file mode 100644
index 00000000..458f08a1
--- /dev/null
+++ b/BeautifulSoup.py
@@ -0,0 +1,1711 @@
+"""Beautiful Soup
+Elixir and Tonic
+"The Screen-Scraper's Friend"
+v3.0.0
+http://www.crummy.com/software/BeautifulSoup/
+
+Beautiful Soup parses a (possibly invalid) XML or HTML document into a
+tree representation. It provides methods and Pythonic idioms that make
+it easy to navigate, search, and modify the tree.
+
+A well-formed XML/HTML document yields a well-formed data
+structure. An ill-formed XML/HTML document yields a correspondingly
+ill-formed data structure. If your document is only locally
+well-formed, you can use this library to find and process the
+well-formed part of it.
+
+Beautiful Soup works with Python 2.2 and up. It has no external
+dependencies, but you'll have more success at converting data to UTF-8
+if you also install these three packages:
+
+* chardet, for auto-detecting character encodings
+  http://chardet.feedparser.org/
+* cjkcodecs and iconv_codec, which add more encodings to the ones supported
+  by stock Python.
+  http://cjkpython.i18n.org/
+
+Beautiful Soup defines classes for two main parsing strategies:
+    
+ * BeautifulStoneSoup, for parsing XML, SGML, or your domain-specific
+   language that kind of looks like XML.
+
+ * BeautifulSoup, for parsing run-of-the-mill HTML code, be it valid
+   or invalid. This class has web browser-like heuristics for
+   obtaining a sensible parse tree in the face of common HTML errors.
+
+Beautiful Soup also defines a class (UnicodeDammit) for autodetecting
+the encoding of an HTML or XML document, and converting it to
+Unicode. Much of this code is taken from Mark Pilgrim's Universal Feed Parser.
+
+For more than you ever wanted to know about Beautiful Soup, see the
+documentation:
+http://www.crummy.com/software/BeautifulSoup/documentation.html
+
+"""
+from __future__ import generators
+
+__author__ = "Leonard Richardson (leonardr@segfault.org)"
+__version__ = "3.0.0"
+__date__ = "$Date: 2004/10/18 00:14:20 $"
+__copyright__ = "Copyright (c) 2004-2005 Leonard Richardson"
+__license__ = "PSF"
+
+from sgmllib import SGMLParser, SGMLParseError
+import codecs
+import types
+import re
+import sgmllib
+from htmlentitydefs import name2codepoint
+
+#This code makes Beautiful Soup able to parse XML with namespaces
+sgmllib.tagfind = re.compile('[a-zA-Z][-_.:a-zA-Z0-9]*')
+
+DEFAULT_OUTPUT_ENCODING = "utf-8"
+
+# First, the classes that represent markup elements.
+
+class PageElement:
+    """Contains the navigational information for some part of the page
+    (either a tag or a piece of text)"""
+
+    def setup(self, parent=None, previous=None):
+        """Sets up the initial relations between this element and
+        other elements."""        
+        self.parent = parent
+        self.previous = previous
+        self.next = None
+        self.previousSibling = None
+        self.nextSibling = None
+        if self.parent and self.parent.contents:
+            self.previousSibling = self.parent.contents[-1]
+            self.previousSibling.nextSibling = self
+
+    def replaceWith(self, replaceWith):
+        """Puts `replaceWith` (a string or an element) where this element
+        is in its parent's contents, and removes this element from the tree."""
+        oldParent = self.parent
+        siblings = oldParent.contents
+        if replaceWith is self:
+            return
+        if getattr(replaceWith, 'parent', None) is not None:
+            # Detach first: if it is an earlier sibling, our index shifts.
+            replaceWith.extract()
+        # Locate by identity; list.index() would stop at an equal twin.
+        myIndex = [id(sibling) for sibling in siblings].index(id(self))
+        self.extract()
+        oldParent.insert(myIndex, replaceWith)
+
+    def extract(self):
+        """Destructively rips this element out of the tree."""
+        if self.parent:
+            # Remove by identity: list.remove() compares with ==, so it
+            # could drop an equal-looking sibling instead of this element.
+            siblings = self.parent.contents
+            for i in range(len(siblings)):
+                if siblings[i] is self:
+                    del siblings[i]
+                    break
+
+        #Find the two elements that would be next to each other if
+        #this element (and any children) hadn't been parsed. Connect
+        #the two.
+        lastChild = self._lastRecursiveChild()
+        nextElement = lastChild.next
+
+        if self.previous:
+            self.previous.next = nextElement
+        if nextElement:
+            nextElement.previous = self.previous
+        self.previous = None
+        lastChild.next = None
+
+        self.parent = None
+        if self.previousSibling:
+            self.previousSibling.nextSibling = self.nextSibling
+        if self.nextSibling:
+            self.nextSibling.previousSibling = self.previousSibling
+        self.previousSibling = self.nextSibling = None
+
+    def _lastRecursiveChild(self):
+        "Finds the last element beneath this object to be parsed."
+        lastChild = self
+        while hasattr(lastChild, 'contents') and lastChild.contents:
+            lastChild = lastChild.contents[-1]
+        return lastChild
+
+    def insert(self, position, newChild):
+        """Inserts `newChild` (a string or an element) into this object's
+        contents at `position`, detaching it from any previous parent."""
+        if (isinstance(newChild, basestring)
+            or isinstance(newChild, unicode)) \
+            and not isinstance(newChild, NavigableString):
+            newChild = NavigableString(newChild)
+
+        position =  min(position, len(self.contents))
+        if hasattr(newChild, 'parent') and newChild.parent is not None:
+            # We're 'inserting' an element that's already one
+            # of this object's children.
+            if newChild.parent is self:
+                earlier = [id(c) for c in self.contents[:position]]
+                if id(newChild) in earlier:
+                    # Furthermore we're moving it further down the
+                    # list of this object's children. That means that
+                    # when we extract this element, our target index
+                    # will jump down one.
+                    position = position - 1
+            newChild.extract()
+
+        newChild.parent = self
+        if position == 0:
+            newChild.previousSibling = None
+            newChild.previous = self
+        else:
+            previousChild = self.contents[position-1]
+            newChild.previousSibling = previousChild
+            newChild.previousSibling.nextSibling = newChild
+            newChild.previous = previousChild._lastRecursiveChild()
+        if newChild.previous:
+            newChild.previous.next = newChild
+
+        newChildsLastElement = newChild._lastRecursiveChild()
+        if position >= len(self.contents):
+            newChild.nextSibling = None
+            parent = self
+            parentsNextSibling = None
+            while not parentsNextSibling:
+                parentsNextSibling = parent.nextSibling
+                parent = parent.parent
+                if not parent: # This is the last element in the document.
+                    break
+            newChildsLastElement.next = parentsNextSibling or None
+        else:
+            nextChild = self.contents[position]
+            newChild.nextSibling = nextChild
+            if newChild.nextSibling:
+                newChild.nextSibling.previousSibling = newChild
+            newChildsLastElement.next = nextChild
+
+        if newChildsLastElement.next:
+            newChildsLastElement.next.previous = newChildsLastElement
+        self.contents.insert(position, newChild)
+
+    def findNext(self, name=None, attrs={}, text=None, **kwargs):
+        """Returns the first item that matches the given criteria and
+        appears after this Tag in the document."""
+        return self._findOne(self.findAllNext, name, attrs, text, **kwargs)
+
+    def findAllNext(self, name=None, attrs={}, text=None, limit=None,
+                    **kwargs):
+        """Returns all matching items that appear after this Tag."""
+        return self._findAll(name, attrs, text, limit, self.nextGenerator,
+                             **kwargs)
+
+    def findNextSibling(self, name=None, attrs={}, text=None, **kwargs):
+        """Returns the closest sibling to this Tag that matches the
+        given criteria and appears after this Tag in the document."""
+        return self._findOne(self.findNextSiblings, name, attrs, text,
+                             **kwargs)
+
+    def findNextSiblings(self, name=None, attrs={}, text=None, limit=None,
+                         **kwargs):
+        """Returns the siblings of this Tag that match the given
+        criteria and appear after this Tag in the document."""
+        return self._findAll(name, attrs, text, limit,
+                             self.nextSiblingGenerator, **kwargs)
+
+    def findPrevious(self, name=None, attrs={}, text=None, **kwargs):
+        """Returns the first item that matches the given criteria and
+        appears before this Tag in the document."""
+        return self._findOne(self.findAllPrevious, name, attrs, text, **kwargs)
+
+    def findAllPrevious(self, name=None, attrs={}, text=None, limit=None,
+                        **kwargs):
+        """Returns all items that match the given criteria and appear
+        before this Tag in the document."""
+        return self._findAll(name, attrs, text, limit, self.previousGenerator,
+                           **kwargs)
+
+    def findPreviousSibling(self, name=None, attrs={}, text=None, **kwargs):
+        """Returns the closest sibling to this Tag that matches the
+        given criteria and appears before this Tag in the document."""
+        return self._findOne(self.findPreviousSiblings, name, attrs, text,
+                             **kwargs)
+
+    def findPreviousSiblings(self, name=None, attrs={}, text=None,
+                             limit=None, **kwargs):
+        """Returns the siblings of this Tag that match the given
+        criteria and appear before this Tag in the document."""
+        return self._findAll(name, attrs, text, limit,
+                             self.previousSiblingGenerator, **kwargs)
+
+    def findParent(self, name=None, attrs={}, **kwargs):
+        """Returns the closest parent of this Tag that matches the given
+        criteria, or None. Keyword arguments are extra attribute filters."""
+        # NOTE: We can't use _findOne because findParents takes a different
+        # set of arguments.
+        r = None
+        l = self.findParents(name, attrs, 1, **kwargs)
+        if l:
+            r = l[0]
+        return r
+
+    def findParents(self, name=None, attrs={}, limit=None, **kwargs):
+        """Returns the parents of this Tag that match the given
+        criteria."""
+
+        return self._findAll(name, attrs, None, limit, self.parentGenerator,
+                             **kwargs)
+
+    #These methods do the real heavy lifting.
+
+    def _findOne(self, method, name, attrs, text, **kwargs):
+        r = None
+        l = method(name, attrs, text, 1, **kwargs)
+        if l:
+            r = l[0]
+        return r
+    
+    def _findAll(self, name, attrs, text, limit, generator, **kwargs):
+        "Iterates over a generator looking for things that match."
+
+        if isinstance(name, SoupStrainer):
+            strainer = name
+        else:
+            # Build a SoupStrainer
+            strainer = SoupStrainer(name, attrs, text, **kwargs)
+        results = ResultSet(strainer)
+        g = generator()
+        while True:
+            try:
+                i = g.next()
+            except StopIteration:
+                break
+            if i:
+                found = strainer.search(i)
+                if found:
+                    results.append(found)
+                    if limit and len(results) >= limit:
+                        break
+        return results
+
+    #These Generators can be used to navigate starting from both
+    #NavigableStrings and Tags.                
+    def nextGenerator(self):
+        i = self
+        while i:
+            i = i.next
+            yield i
+
+    def nextSiblingGenerator(self):
+        i = self
+        while i:
+            i = i.nextSibling
+            yield i
+
+    def previousGenerator(self):
+        i = self
+        while i:
+            i = i.previous
+            yield i
+
+    def previousSiblingGenerator(self):
+        i = self
+        while i:
+            i = i.previousSibling
+            yield i
+
+    def parentGenerator(self):
+        i = self
+        while i:
+            i = i.parent
+            yield i
+
+    # Utility methods
+    def substituteEncoding(self, str, encoding=None):
+        encoding = encoding or "utf-8"
+        return str.replace("%SOUP-ENCODING%", encoding)    
+
+    def toEncoding(self, s, encoding=None):
+        """Encodes an object to a string in some encoding, or to Unicode
+        when no encoding is given. Non-strings go through str()/unicode()."""
+        if isinstance(s, unicode):
+            if encoding:
+                s = s.encode(encoding)
+        elif isinstance(s, str):
+            if encoding:
+                s = s.encode(encoding)
+            else:
+                s = unicode(s)
+        else:
+            if encoding:
+                s  = self.toEncoding(str(s), encoding)
+            else:
+                s = unicode(s)
+        return s
+
+class NavigableString(unicode, PageElement):
+    """A text node: a unicode string that is also a PageElement."""
+    def __getattr__(self, attr):
+        """text.string gives you text. This is for backwards
+        compatibility for Navigable*String, but for CData* it lets you
+        get the string without the CData wrapper."""
+        if attr == 'string':
+            return self
+        raise AttributeError, "'%s' object has no attribute '%s'" % (self.__class__.__name__, attr)
+
+    def __unicode__(self):
+        """Returns this node rendered as Unicode (no byte encoding)."""
+        return self.__str__(None)
+
+    def __str__(self, encoding=DEFAULT_OUTPUT_ENCODING):
+        if encoding:
+            return self.encode(encoding)
+        else:
+            return self
+        
+class CData(NavigableString):
+
+    def __str__(self, encoding=DEFAULT_OUTPUT_ENCODING):
+        return "<![CDATA[%s]]>" % NavigableString.__str__(self, encoding)
+
+class ProcessingInstruction(NavigableString):
+    def __str__(self, encoding=DEFAULT_OUTPUT_ENCODING):
+        output = self
+        if "%SOUP-ENCODING%" in output:
+            output = self.substituteEncoding(output, encoding)
+        return "<?%s?>" % self.toEncoding(output, encoding)
+
+class Comment(NavigableString):
+    def __str__(self, encoding=DEFAULT_OUTPUT_ENCODING):
+        return "<!--%s-->" % NavigableString.__str__(self, encoding)    
+
+class Declaration(NavigableString):
+    def __str__(self, encoding=DEFAULT_OUTPUT_ENCODING):
+        return "<!%s>" % NavigableString.__str__(self, encoding)        
+
+class Tag(PageElement):
+
+    """Represents a found HTML tag with its attributes and contents."""
+
+    def __init__(self, parser, name, attrs=None, parent=None,
+                 previous=None):
+        "Basic constructor."
+
+        # We don't actually store the parser object: that lets extracted
+        # chunks be garbage-collected
+        self.parserClass = parser.__class__
+        self.isSelfClosing = parser.isSelfClosingTag(name)
+        self.name = name
+        if attrs == None:
+            attrs = []
+        self.attrs = attrs
+        self.contents = []
+        self.setup(parent, previous)
+        self.hidden = False
+        self.containsSubstitutions = False
+
+    def get(self, key, default=None):
+        """Returns the value of the 'key' attribute for the tag, or
+        the value given for 'default' if it doesn't have that
+        attribute."""
+        return self._getAttrMap().get(key, default)    
+
+    def has_key(self, key):
+        return self._getAttrMap().has_key(key)
+
+    def __getitem__(self, key):
+        """tag[key] returns the value of the 'key' attribute for the tag,
+        and throws an exception if it's not there."""
+        return self._getAttrMap()[key]
+
+    def __iter__(self):
+        "Iterating over a tag iterates over its contents."
+        return iter(self.contents)
+
+    def __len__(self):
+        "The length of a tag is the length of its list of contents."
+        return len(self.contents)
+
+    def __contains__(self, x):
+        return x in self.contents
+
+    def __nonzero__(self):
+        "A tag is non-None even if it has no contents."
+        return True
+
+    def __setitem__(self, key, value):        
+        """Setting tag[key] sets the value of the 'key' attribute for the
+        tag."""
+        self._getAttrMap()
+        self.attrMap[key] = value
+        found = False
+        for i in range(0, len(self.attrs)):
+            if self.attrs[i][0] == key:
+                self.attrs[i] = (key, value)
+                found = True
+        if not found:
+            self.attrs.append((key, value))
+        self._getAttrMap()[key] = value
+
+    def __delitem__(self, key):
+        "Deleting tag[key] deletes all 'key' attributes for the tag."
+        # Rebuild the list instead of calling remove() while iterating:
+        # removing during iteration skips the element after each match,
+        # so a duplicated attribute (legal in bad HTML) could survive.
+        self.attrs[:] = [item for item in self.attrs if item[0] != key]
+        # Keep the cached attribute map in step with the list.
+        self._getAttrMap()
+        if self.attrMap.has_key(key):
+            del self.attrMap[key]
+
+    def __call__(self, *args, **kwargs):
+        """Calling a tag like a function is the same as calling its
+        findAll() method. Eg. tag('a') returns a list of all the A tags
+        found within this tag."""
+        return apply(self.findAll, args, kwargs)
+
+    def __getattr__(self, tag):
+        #print "Getattr %s.%s" % (self.__class__, tag)
+        if len(tag) > 3 and tag.rfind('Tag') == len(tag)-3:
+            return self.find(tag[:-3])
+        elif tag.find('__') != 0:
+            return self.find(tag)
+
+    def __eq__(self, other):
+        """Returns true iff this tag has the same name, the same attributes,
+        and the same contents (recursively) as the given tag.
+
+        NOTE: right now this will return false if two tags have the
+        same attributes in a different order. Should this be fixed?"""
+        if not hasattr(other, 'name') or not hasattr(other, 'attrs') or not hasattr(other, 'contents') or self.name != other.name or self.attrs != other.attrs or len(self) != len(other):
+            return False
+        for i in range(0, len(self.contents)):
+            if self.contents[i] != other.contents[i]:
+                return False
+        return True
+
+    def __ne__(self, other):
+        """Returns true iff this tag is not identical to the other tag,
+        as defined in __eq__."""
+        return not self == other
+
+    def __repr__(self, encoding=DEFAULT_OUTPUT_ENCODING):
+        """Renders this tag as a string."""
+        return self.__str__(encoding)
+
+    def __unicode__(self):
+        return self.__str__(None)
+
+    def __str__(self, encoding=DEFAULT_OUTPUT_ENCODING,
+                prettyPrint=False, indentLevel=0):
+        """Returns a string or Unicode representation of this tag and
+        its contents. To get Unicode, pass None for encoding.
+        With prettyPrint, output is indented starting at indentLevel.
+        NOTE: since Python's HTML parser consumes whitespace, this
+        method is not certain to reproduce the whitespace present in
+        the original string."""
+
+        encodedName = self.toEncoding(self.name, encoding)
+
+        attrs = []
+        if self.attrs:
+            for key, val in self.attrs:
+                fmt = '%s="%s"'
+                if isString(val):
+                    if self.containsSubstitutions and '%SOUP-ENCODING%' in val:
+                        val = self.substituteEncoding(val, encoding)
+                    if '"' in val:
+                        fmt = "%s='%s'"
+                        # Both quote kinds present: escape the single quotes
+                        # with a numeric reference, valid in HTML and XML.
+                        if "'" in val:
+                            val = val.replace("'", "&#39;")
+                attrs.append(fmt % (self.toEncoding(key, encoding),
+                                    self.toEncoding(val, encoding)))
+        close = ''
+        closeTag = ''
+        if self.isSelfClosing:
+            close = ' /'
+        else:
+            closeTag = '</%s>' % encodedName
+
+        indentTag, indentContents = 0, 0
+        if prettyPrint:
+            indentTag = indentLevel
+            space = (' ' * (indentTag-1))
+            indentContents = indentTag + 1
+        contents = self.renderContents(encoding, prettyPrint, indentContents)
+        if self.hidden:
+            s = contents
+        else:
+            s = []
+            attributeString = ''
+            if attrs:
+                attributeString = ' ' + ' '.join(attrs)
+            if prettyPrint:
+                s.append(space)
+            s.append('<%s%s%s>' % (encodedName, attributeString, close))
+            if prettyPrint:
+                s.append("\n")
+            s.append(contents)
+            if prettyPrint and contents and contents[-1] != "\n":
+                s.append("\n")
+            if prettyPrint and closeTag:
+                s.append(space)
+            s.append(closeTag)
+            if prettyPrint and closeTag and self.nextSibling:
+                s.append("\n")
+            s = ''.join(s)
+        return s
+
+    def prettify(self, encoding=DEFAULT_OUTPUT_ENCODING):
+        return self.__str__(encoding, True)
+
+    def renderContents(self, encoding=DEFAULT_OUTPUT_ENCODING,
+                       prettyPrint=False, indentLevel=0):
+        """Renders the contents of this tag as a string in the given
+        encoding. If encoding is None, returns a Unicode string.."""
+        s=[]
+        for c in self:
+            text = None
+            if isinstance(c, NavigableString):
+                text = c.__str__(encoding)
+            elif isinstance(c, Tag):
+                s.append(c.__str__(encoding, prettyPrint, indentLevel))
+            if text and prettyPrint:
+                text = text.strip()              
+            if text:
+                if prettyPrint:
+                    s.append(" " * (indentLevel-1))
+                s.append(text)
+                if prettyPrint:
+                    s.append("\n")
+        return ''.join(s)    
+
+    #Soup methods
+
+    def find(self, name=None, attrs={}, recursive=True, text=None,
+              **kwargs):
+        """Return only the first child of this Tag matching the given
+        criteria, or None. Keyword arguments are extra attribute filters."""
+        r = None
+        l = self.findAll(name, attrs, recursive, text, 1, **kwargs)
+        if l:
+            r = l[0]
+        return r
+    findChild = find
+
+    def findAll(self, name=None, attrs={}, recursive=True, text=None,
+                limit=None, **kwargs):
+        """Extracts a list of Tag objects that match the given
+        criteria.  You can specify the name of the Tag and any
+        attributes you want the Tag to have.
+
+        The value of a key-value pair in the 'attrs' map can be a
+        string, a list of strings, a regular expression object, or a
+        callable that takes a string and returns whether or not the
+        string matches for some custom definition of 'matches'. The
+        same is true of the tag name."""
+        generator = self.recursiveChildGenerator
+        if not recursive:
+            generator = self.childGenerator
+        return self._findAll(name, attrs, text, limit, generator, **kwargs)
+    findAllChildren = findAll
+    
+    #Utility methods
+
+    def append(self, tag):
+        """Appends the given tag to this tag's contents list; nothing else is updated."""
+        self.contents.append(tag)
+
+    #Private methods
+
+    def _getAttrMap(self):
+        """Initializes a map representation of this tag's attributes, if
+        not already initialized. Reads __dict__ to bypass __getattr__."""
+        if not self.__dict__.get('attrMap'):
+            self.attrMap = {}
+            for (key, value) in self.attrs:
+                self.attrMap[key] = value
+        return self.attrMap
+
+    #Generator methods
+    def childGenerator(self):
+        for i in range(0, len(self.contents)):
+            yield self.contents[i]
+        raise StopIteration
+    
+    def recursiveChildGenerator(self):
+        stack = [(self, 0)]
+        while stack:
+            tag, start = stack.pop()
+            if isinstance(tag, Tag):            
+                for i in range(start, len(tag.contents)):
+                    a = tag.contents[i]
+                    yield a
+                    if isinstance(a, Tag) and tag.contents:
+                        if i < len(tag.contents) - 1:
+                            stack.append((tag, i+1))
+                        stack.append((a, 0))
+                        break
+        raise StopIteration
+
+# Next, a couple classes to represent queries and their results.
+class SoupStrainer:
+    """Encapsulates a number of ways of matching a markup element (tag or
+    text)."""
+
+    def __init__(self, name=None, attrs={}, text=None, **kwargs):
+        self.name=name
+        self.attrs=attrs.copy()
+        self.attrs.update(kwargs)
+        self.text = text
+
+    def __str__(self):
+        if self.text:
+            return self.text
+        else:
+            return "%s|%s" % (self.name, self.attrs)
+    
+    def searchTag(self, markupName=None, markupAttrs={}):
+        found = None
+        markup = None
+        if isinstance(markupName, Tag):
+            markup = markupName
+            markupAttrs = markup
+        callFunctionWithTagData = callable(self.name) \
+                                and not isinstance(markupName, Tag)
+
+        if (not self.name) \
+               or callFunctionWithTagData \
+               or (markup and self._matches(markup, self.name)) \
+               or (not markup and self._matches(markupName, self.name)):
+            if callFunctionWithTagData:
+                match = self.name(markupName, markupAttrs)
+            else:
+                match = True            
+                markupAttrMap = None
+                for attr, matchAgainst in self.attrs.items():
+                    if not markupAttrMap:
+                         if hasattr(markupAttrs, 'get'):
+                            markupAttrMap = markupAttrs
+                         else:
+                            markupAttrMap = {}
+                            for k,v in markupAttrs:
+                                markupAttrMap[k] = v
+                    attrValue = markupAttrMap.get(attr)
+                    if not self._matches(attrValue, matchAgainst):
+                        match = False
+                        break
+            if match:
+                if markup:
+                    found = markup
+                else:
+                    found = markupName
+        return found
+
+    def search(self, markup):
+        #print 'looking for %s in %s' % (self, markup)
+        found = None
+        # If given a list of items, scan it for a text element that
+        # matches.        
+        if isList(markup) and not isinstance(markup, Tag):
+            for element in markup:
+                if isinstance(element, NavigableString) \
+                       and self.search(element):
+                    found = element
+                    break
+        # If it's a Tag, make sure its name or attributes match.
+        # Don't bother with Tags if we're searching for text.
+        elif isinstance(markup, Tag):
+            if not self.text:
+                found = self.searchTag(markup)
+        # If it's text, make sure the text matches.
+        elif isinstance(markup, NavigableString) or \
+                 isString(markup):
+            if self._matches(markup, self.text):
+                found = markup
+        else:
+            raise Exception, "I don't know how to match against a %s" \
+                  % markup.__class__
+        return found
+        
+    def _matches(self, markup, matchAgainst):
+        "Returns a true value if `markup` satisfies the `matchAgainst` criterion."
+        result = False
+        if matchAgainst == True and type(matchAgainst) == types.BooleanType:
+            result = markup != None
+        elif callable(matchAgainst):
+            result = matchAgainst(markup)
+        else:
+            #Custom match methods take the tag as an argument, but all
+            #other ways of matching match the tag name as a string.
+            if isinstance(markup, Tag):
+                markup = markup.name
+            if markup and not isString(markup):
+                markup = unicode(markup)
+            #Now we know that chunk is either a string, or None.
+            if hasattr(matchAgainst, 'match'):
+                # It's a regexp object.
+                result = markup and matchAgainst.search(markup)
+            elif isList(matchAgainst):
+                result = markup in matchAgainst
+            elif hasattr(matchAgainst, 'items'):
+                # It's a map: match if the string is one of its keys.
+                result = matchAgainst.has_key(markup)
+            elif matchAgainst and isString(markup):
+                if isinstance(markup, unicode):
+                    matchAgainst = unicode(matchAgainst)
+                else:
+                    matchAgainst = str(matchAgainst)
+            if not result:
+                result = matchAgainst == markup
+        return result
+
+class ResultSet(list):
+    """A ResultSet is just a list that keeps track of the SoupStrainer
+    that created it (stored on the `source` attribute)."""
+    def __init__(self, source):
+        list.__init__(self)  # initialize this list, not a throwaway one
+        self.source = source
+
+# Now, some helper functions.
+
+def isList(l):
+    """Convenience method that works with all 2.x versions of Python
+    to determine whether or not something is listlike."""
+    return hasattr(l, '__iter__') \
+           or (type(l) in (types.ListType, types.TupleType))
+
+def isString(s):
+    """Convenience method that works with all 2.x versions of Python
+    to determine whether or not something is stringlike."""
+    try:
+        return isinstance(s, unicode) or isinstance(s, basestring)
+    except NameError:  # interpreter lacks unicode/basestring
+        return isinstance(s, str)
+
+def buildTagMap(default, *args):
+    """Turns a list of maps, lists, or scalars into a single map.
+    Used to build the SELF_CLOSING_TAGS, NESTABLE_TAGS, and
+    NESTING_RESET_TAGS maps out of lists and partial maps."""
+    built = {}
+    for portion in args:
+        if hasattr(portion, 'items'):
+            #It's a map. Merge it.
+            for k,v in portion.items():
+                built[k] = v
+        elif isList(portion):
+            #It's a list. Map each item to the default.
+            for k in portion:
+                built[k] = default
+        else:
+            #It's a scalar. Map it to the default.
+            built[portion] = default
+    return built
+
+# Now, the parser classes.
+
+class BeautifulStoneSoup(Tag, SGMLParser):
+
+    """This class contains the basic parser and search code. It defines
+    a parser that knows nothing about tag behavior except for the
+    following:
+   
+      You can't close a tag without closing all the tags it encloses.
+      That is, "<foo><bar></foo>" actually means
+      "<foo><bar></bar></foo>".
+
+    [Another possible explanation is "<foo><bar /></foo>", but since
+    this class defines no SELF_CLOSING_TAGS, it will never use that
+    explanation.]
+
+    This class is useful for parsing XML or made-up markup languages,
+    or when BeautifulSoup makes an assumption counter to what you were
+    expecting."""
+
+    XML_ENTITY_LIST = {}  # entities handle_entityref converts in XML_ENTITIES mode
+    for i in ["quot", "apos", "amp", "lt", "gt"]:
+        XML_ENTITY_LIST[i] = True 
+
+    SELF_CLOSING_TAGS = {}   # consulted by isSelfClosingTag
+    NESTABLE_TAGS = {}       # tag name -> its nesting reset triggers (see _smartPop)
+    RESET_NESTING_TAGS = {}  # tags that reset nesting (see _smartPop)
+    QUOTE_TAGS = {}          # tags inside which unknown_starttag keeps markup as text
+
+    MARKUP_MASSAGE = [(re.compile('(<[^<>]*)/>'),  # '<br/>' becomes '<br />'
+                       lambda x: x.group(1) + ' />'),
+                      (re.compile('<!\s+([^<>]*)>'),  # '<! --x-->' becomes '<!--x-->'
+                       lambda x: '<!' + x.group(1) + '>')
+                      ]
+
+    ROOT_TAG_NAME = u'[document]'  # name the soup object gives itself in reset()
+
+    HTML_ENTITIES = "html"  # the two values compared against convertEntities
+    XML_ENTITIES = "xml"
+
+    def __init__(self, markup="", parseOnlyThese=None, fromEncoding=None,
+                 markupMassage=True, smartQuotesTo=XML_ENTITIES,
+                 convertEntities=None, selfClosingTags=None):
+        """The Soup object is initialized as the 'root tag', and the
+        provided markup (which can be a string or a file-like object)
+        is fed into the underlying parser. 
+
+        sgmllib will process most bad HTML, and the BeautifulSoup
+        class has some tricks for dealing with some HTML that kills
+        sgmllib, but Beautiful Soup can nonetheless choke or lose data
+        if your data uses self-closing tags or declarations
+        incorrectly.
+
+        By default, Beautiful Soup uses regexes to sanitize input,
+        avoiding the vast majority of these problems. If the problems
+        don't apply to you, pass in False for markupMassage, and
+        you'll get better performance.
+
+        The default parser massage techniques fix the two most common
+        instances of invalid HTML that choke sgmllib:
+
+         <br/> (No space between the tag name and the closing '/>')
+         <! --Comment--> (Extraneous whitespace in declaration)
+
+        You can pass in a custom list of (RE object, replace method)
+        tuples as markupMassage to get Beautiful Soup to scrub your
+        input the way you want."""
+
+        self.parseOnlyThese = parseOnlyThese  # optional filter on top-level tags and text
+        self.fromEncoding = fromEncoding      # first encoding _feed asks UnicodeDammit to try
+        self.smartQuotesTo = smartQuotesTo
+        self.convertEntities = convertEntities
+        if self.convertEntities:
+            # It doesn't make sense to convert encoded characters to
+            # entities even while you're converting entities to Unicode.
+            # Just convert it all to Unicode.
+            self.smartQuotesTo = None
+        self.instanceSelfClosingTags = buildTagMap(None, selfClosingTags)
+        SGMLParser.__init__(self)
+            
+        if hasattr(markup, 'read'):        # It's a file-type object.
+            markup = markup.read()
+        self.markup = markup
+        self.markupMassage = markupMassage
+        try:
+            self._feed()
+        except StopParsing:  # a handler already re-fed the document (see start_meta)
+            pass
+        self.markup = None                 # The markup can now be GCed
+        
+    def _feed(self, inDocumentEncoding=None):
+        # Decode self.markup to Unicode, massage it, then parse it into a fresh tree.
+        markup = self.markup
+        if isinstance(markup, unicode):
+            if not hasattr(self, 'originalEncoding'):
+                self.originalEncoding = None
+        else:
+            dammit = UnicodeDammit\
+                     (markup, [self.fromEncoding, inDocumentEncoding],
+                      smartQuotesTo=self.smartQuotesTo)
+            markup = dammit.unicode
+            self.originalEncoding = dammit.originalEncoding
+        if markup:
+            if self.markupMassage:
+                if not isList(self.markupMassage):  # e.g. True: use the class defaults
+                    self.markupMassage = self.MARKUP_MASSAGE            
+                for fix, m in self.markupMassage:  # (compiled regex, replacement) pairs
+                    markup = fix.sub(m, markup)
+        self.reset()  # discard any tree and parser state built so far
+
+        SGMLParser.feed(self, markup)
+        # Close out any unfinished strings and close all the open tags.
+        self.endData()
+        while self.currentTag.name != self.ROOT_TAG_NAME:
+            self.popTag()
+
+    def __getattr__(self, methodName):
+        """Resolves a missing attribute: 'start_', 'end_' and 'do_' names
+        go to SGMLParser, any other non-dunder name goes to Tag."""
+        #print "__getattr__ called on %s.%s" % (self.__class__, methodName)
+        isParserHook = methodName.startswith('start_') \
+                       or methodName.startswith('end_') \
+                       or methodName.startswith('do_')
+        if isParserHook:
+            return SGMLParser.__getattr__(self, methodName)
+        if methodName.startswith('__'):
+            raise AttributeError
+        return Tag.__getattr__(self, methodName)
+
+    def isSelfClosingTag(self, name):
+        """Tells whether this parser treats 'name' as a self-closing
+        tag, either class-wide or for this instance only."""
+        return name in self.SELF_CLOSING_TAGS \
+               or name in self.instanceSelfClosingTags
+            
+    def reset(self):  # return the soup and the parser to an empty starting state
+        Tag.__init__(self, self, self.ROOT_TAG_NAME)  # self doubles as the parser argument
+        self.hidden = 1
+        SGMLParser.reset(self)
+        self.currentData = []   # text pieces buffered by handle_data
+        self.currentTag = None
+        self.tagStack = []      # open tags, innermost last
+        self.quoteStack = []    # names of open QUOTE_TAGS, innermost last
+        self.pushTag(self)      # the soup itself sits at the bottom of the stack
+    
+    def popTag(self):  # close the innermost open tag; returns the new current tag
+        tag = self.tagStack.pop()  # 'tag' itself is only used by the debug print below
+        # Tags with just one string-owning child get the child as a
+        # 'string' property, so that soup.tag.string is shorthand for
+        # soup.tag.contents[0]
+        if len(self.currentTag.contents) == 1 and \
+           isinstance(self.currentTag.contents[0], NavigableString):
+            self.currentTag.string = self.currentTag.contents[0]
+
+        #print "Pop", tag.name
+        if self.tagStack:  # when the stack is empty, currentTag is left unchanged
+            self.currentTag = self.tagStack[-1]
+        return self.currentTag
+
+    def pushTag(self, tag):  # open 'tag' under the current tag and make it current
+        #print "Push", tag.name
+        if self.currentTag:
+            self.currentTag.append(tag)
+        self.tagStack.append(tag)
+        self.currentTag = self.tagStack[-1]
+
+    def endData(self, containerClass=NavigableString):  # flush buffered text into the tree
+        if self.currentData:
+            currentData = ''.join(self.currentData)
+            if not currentData.strip():  # whitespace-only text collapses to '\n' or ' '
+                if '\n' in currentData:
+                    currentData = '\n'
+                else:
+                    currentData = ' '
+            self.currentData = []
+            if self.parseOnlyThese and len(self.tagStack) <= 1 and \
+                   (not self.parseOnlyThese.text or \
+                    not self.parseOnlyThese.search(currentData)):
+                return  # top-level text that the parseOnlyThese filter does not accept
+            o = containerClass(currentData)
+            o.setup(self.currentTag, self.previous)
+            if self.previous:
+                self.previous.next = o  # chain nodes in parse order via previous/next
+            self.previous = o
+            self.currentTag.contents.append(o)
+
+
+    def _popToTag(self, name, inclusivePop=True):
+        """Pops the tag stack up to and including the most recent
+        instance of the given tag. If inclusivePop is false, pops the tag
+        stack up to but *not* including the most recent instance of
+        the given tag. Returns the last popTag() result (None if no pop)."""
+        #print "Popping to %s" % name
+        if name == self.ROOT_TAG_NAME:  # the root tag is never popped
+            return            
+
+        numPops = 0
+        mostRecentTag = None
+        for i in range(len(self.tagStack)-1, 0, -1):  # innermost first; index 0 is skipped
+            if name == self.tagStack[i].name:
+                numPops = len(self.tagStack)-i
+                break
+        if not inclusivePop:
+            numPops = numPops - 1
+
+        for i in range(0, numPops):
+            mostRecentTag = self.popTag()
+        return mostRecentTag    
+
+    def _smartPop(self, name):
+
+        """We need to pop up to the previous tag of this type, unless
+        one of this tag's nesting reset triggers comes between this
+        tag and the previous tag of this type, OR unless this tag is a
+        generic nesting trigger and another generic nesting trigger
+        comes between this tag and the previous tag of this type.
+
+        Examples:
+         <p>Foo<b>Bar<p> should pop to 'p', not 'b'.
+         <p>Foo<table>Bar<p> should pop to 'table', not 'p'.
+         <p>Foo<table><tr>Bar<p> should pop to 'tr', not 'p'.
+         <p>Foo<b>Bar<p> should pop to 'p', not 'b'.
+
+         <li><ul><li> *<li>* should pop to 'ul', not the first 'li'.
+         <tr><table><tr> *<tr>* should pop to 'table', not the first 'tr'
+         <td><tr><td> *<td>* should pop to 'tr', not the first 'td'
+        """
+
+        nestingResetTriggers = self.NESTABLE_TAGS.get(name)  # None unless 'name' is nestable
+        isNestable = nestingResetTriggers != None
+        isResetNesting = self.RESET_NESTING_TAGS.has_key(name)
+        popTo = None
+        inclusive = True
+        for i in range(len(self.tagStack)-1, 0, -1):  # innermost first; index 0 is skipped
+            p = self.tagStack[i]
+            if (not p or p.name == name) and not isNestable:
+                #Non-nestable tags get popped to the top or to their
+                #last occurrence.
+                popTo = name
+                break
+            if (nestingResetTriggers != None
+                and p.name in nestingResetTriggers) \
+                or (nestingResetTriggers == None and isResetNesting
+                    and self.RESET_NESTING_TAGS.has_key(p.name)):
+                
+                #If we encounter one of the nesting reset triggers
+                #peculiar to this tag, or we encounter another tag
+                #that causes nesting to reset, pop up to but not
+                #including that tag.
+                popTo = p.name
+                inclusive = False
+                break
+            p = p.parent  # no effect: p is reassigned at the top of the next iteration
+        if popTo:
+            self._popToTag(popTo, inclusive)
+
+    def unknown_starttag(self, name, attrs, selfClosing=0):  # returns the new Tag, or None
+        #print "Start tag %s" % name
+        if self.quoteStack:
+            #Inside a quote tag: this is not a real tag, so re-emit it as text.
+            #print "<%s> is not real!" % name
+            attrs = ''.join(map(lambda(x, y): ' %s="%s"' % (x, y), attrs))
+            self.handle_data('<%s%s>' % (name, attrs))
+            return        
+        self.endData()
+
+        if not self.isSelfClosingTag(name) and not selfClosing:
+            self._smartPop(name)  # implicitly close tags this one cannot nest inside
+
+        if self.parseOnlyThese and len(self.tagStack) <= 1 \
+               and (self.parseOnlyThese.text or not self.parseOnlyThese.searchTag(name, attrs)):
+            return  # top-level tag that the parseOnlyThese filter does not accept
+
+        tag = Tag(self, name, attrs, self.currentTag, self.previous)
+        if self.previous:
+            self.previous.next = tag  # chain nodes in parse order via previous/next
+        self.previous = tag
+        self.pushTag(tag)
+        if selfClosing or self.isSelfClosingTag(name):
+            self.popTag()                
+        if name in self.QUOTE_TAGS:
+            #print "Beginning quote (%s)" % name
+            self.quoteStack.append(name)
+            self.literal = 1
+        return tag
+
+    def unknown_endtag(self, name):  # close 'name' along with anything still open inside it
+        #print "End tag %s" % name
+        if self.quoteStack and self.quoteStack[-1] != name:
+            #Inside a quote tag only its own end tag is real; keep this one as text.
+            #print "</%s> is not real!" % name
+            self.handle_data('</%s>' % name)
+            return
+        self.endData()
+        self._popToTag(name)
+        if self.quoteStack and self.quoteStack[-1] == name:
+            self.quoteStack.pop()
+            self.literal = (len(self.quoteStack) > 0)  # stays set while quote tags remain open
+
+    def handle_data(self, data):  # buffer text; endData() later joins and stores it
+        self.currentData.append(data)
+
+    def _toStringSubclass(self, text, subclass):
+        """Adds a certain piece of text to the tree as a NavigableString
+        subclass."""
+        self.endData()          # flush whatever text was buffered before this node
+        self.handle_data(text)
+        self.endData(subclass)  # store 'text' on its own, wrapped in 'subclass'
+
+    def handle_pi(self, text):
+        """Stores a processing instruction as a ProcessingInstruction
+        object. One beginning with 'xml' is replaced by a canonical
+        declaration holding a %SOUP-ENCODING% slot to be filled later."""
+        if text.startswith("xml"):
+            text = "xml version='1.0' encoding='%SOUP-ENCODING%'"
+        self._toStringSubclass(text, ProcessingInstruction)
+
+    def handle_comment(self, text):
+        "Handle comments as Comment objects."
+        self._toStringSubclass(text, Comment)  # pending text is flushed first
+
+    def handle_charref(self, ref):
+        """Buffers a numeric character reference: as the character itself
+        when entity conversion is on, otherwise as the '&#...;' text."""
+        convertingModes = [self.HTML_ENTITIES, self.XML_ENTITIES]
+        if self.convertEntities not in convertingModes:
+            self.handle_data('&#%s;' % ref)
+            return
+        self.handle_data(unichr(int(ref)))
+
+    def handle_entityref(self, ref):
+        """Buffers a named entity reference as data. The entity becomes
+        its Unicode character when conversion applies to it and its
+        code point is known; otherwise the '&name;' text is kept."""
+        data = '&%s;' % ref
+        mode = self.convertEntities
+        # HTML mode converts every known entity; XML mode converts only
+        # the entities named in XML_ENTITY_LIST.
+        convertible = mode == self.HTML_ENTITIES or \
+                      (mode == self.XML_ENTITIES and \
+                       self.XML_ENTITY_LIST.get(ref))
+        # Entity names without a known code point keep their text form.
+        if convertible and name2codepoint.has_key(ref):
+            data = unichr(name2codepoint[ref])
+        self.handle_data(data)
+        
+    def handle_decl(self, data):
+        "Handle DOCTYPEs and the like as Declaration objects."
+        self._toStringSubclass(data, Declaration)  # pending text is flushed first
+
+    def parse_declaration(self, i):
+        """Treat a bogus SGML declaration as raw data. Treat a CDATA
+        declaration as a CData object."""
+        j = None
+        if self.rawdata[i:i+9] == '<![CDATA[':
+             k = self.rawdata.find(']]>', i)
+             if k == -1:  # unterminated CDATA: take everything to the end of the input
+                 k = len(self.rawdata)
+             data = self.rawdata[i+9:k]
+             j = k+3  # just past the ']]>' terminator
+             self._toStringSubclass(data, CData)
+        else:
+            try:
+                j = SGMLParser.parse_declaration(self, i)
+            except SGMLParseError:
+                toHandle = self.rawdata[i:]  # unparseable: keep the rest of the input as text
+                self.handle_data(toHandle)
+                j = i + len(toHandle)
+        return j
+
+class BeautifulSoup(BeautifulStoneSoup):
+
+    """This parser knows the following facts about HTML:
+
+    * Some tags have no closing tag and should be interpreted as being
+      closed as soon as they are encountered.
+
+    * The text inside some tags (e.g. 'script') may contain tags which
+      are not really part of the document and which should be parsed
+      as text, not tags. If you want to parse the text as tags, you can
+      always fetch it and parse it explicitly.
+
+    * Tag nesting rules:
+
+      Most tags can't be nested at all. For instance, the occurrence of
+      a <p> tag should implicitly close the previous <p> tag.
+
+       <p>Para1<p>Para2
+        should be transformed into:
+       <p>Para1</p><p>Para2
+
+      Some tags can be nested arbitrarily. For instance, the occurrence
+      of a <blockquote> tag should _not_ implicitly close the previous
+      <blockquote> tag.
+
+       Alice said: <blockquote>Bob said: <blockquote>Blah
+        should NOT be transformed into:
+       Alice said: <blockquote>Bob said: </blockquote><blockquote>Blah
+
+      Some tags can be nested, but the nesting is reset by the
+      interposition of other tags. For instance, a <tr> tag should
+      implicitly close the previous <tr> tag within the same <table>,
+      but not close a <tr> tag in another table.
+
+       <table><tr>Blah<tr>Blah
+        should be transformed into:
+       <table><tr>Blah</tr><tr>Blah
+        but,
+       <tr>Blah<table><tr>Blah
+        should NOT be transformed into
+       <tr>Blah<table></tr><tr>Blah
+
+    Differing assumptions about tag nesting rules are a major source
+    of problems with the BeautifulSoup class. If BeautifulSoup is not
+    treating as nestable a tag your page author treats as nestable,
+    try ICantBelieveItsBeautifulSoup, MinimalSoup, or
+    BeautifulStoneSoup before writing your own subclass."""
+
+    def __init__(self, *args, **kwargs):
+        # HTML input turns smart quotes into HTML entities unless told otherwise.
+        kwargs.setdefault('smartQuotesTo', self.HTML_ENTITIES)
+        BeautifulStoneSoup.__init__(self, *args, **kwargs)
+
+    SELF_CLOSING_TAGS = buildTagMap(None,
+                                    ['br' , 'hr', 'input', 'img', 'meta',
+                                    'spacer', 'link', 'frame', 'base'])
+
+    QUOTE_TAGS = {'script': None}  # markup inside <script> is kept as literal text
+    
+    #According to the HTML standard, each of these inline tags can
+    #contain another tag of the same type. Furthermore, it's common
+    #to actually use these tags this way.
+    NESTABLE_INLINE_TAGS = ['span', 'font', 'q', 'object', 'bdo', 'sub', 'sup',
+                            'center']
+
+    #According to the HTML standard, these block tags can contain
+    #another tag of the same type. Furthermore, it's common
+    #to actually use these tags this way.
+    NESTABLE_BLOCK_TAGS = ['blockquote', 'div', 'fieldset', 'ins', 'del']
+
+    #Lists can nest, with restrictions: each tag maps to the tags that reset its nesting.
+    NESTABLE_LIST_TAGS = { 'ol' : [],
+                           'ul' : [],
+                           'li' : ['ul', 'ol'],
+                           'dl' : [],
+                           'dd' : ['dl'],
+                           'dt' : ['dl'] }
+
+    #Tables can nest, with restrictions: each tag maps to the tags that reset its nesting.
+    NESTABLE_TABLE_TAGS = {'table' : [], 
+                           'tr' : ['table', 'tbody', 'tfoot', 'thead'],
+                           'td' : ['tr'],
+                           'th' : ['tr'],
+                           'thead' : ['table'],
+                           'tbody' : ['table'],
+                           'tfoot' : ['table'],
+                           }
+
+    NON_NESTABLE_BLOCK_TAGS = ['address', 'form', 'p', 'pre']
+
+    #If one of these tags is encountered, all tags up to the next tag of
+    #this type are popped. (_smartPop only tests the keys of this map.)
+    RESET_NESTING_TAGS = buildTagMap(None, NESTABLE_BLOCK_TAGS, 'noscript',
+                                     NON_NESTABLE_BLOCK_TAGS,
+                                     NESTABLE_LIST_TAGS,
+                                     NESTABLE_TABLE_TAGS)
+
+    NESTABLE_TAGS = buildTagMap([], NESTABLE_INLINE_TAGS, NESTABLE_BLOCK_TAGS,
+                                NESTABLE_LIST_TAGS, NESTABLE_TABLE_TAGS)
+
+    # Finds the charset in a META tag: group 1 ends at 'charset=', group 3 is its value.
+    CHARSET_RE = re.compile("((^|;)\s*charset=)([^;]*)")
+
+    def start_meta(self, attrs):
+        """Beautiful Soup can detect a charset included in a META tag,
+        try to convert the document to that charset, and re-parse the
+        document from the beginning (raising StopParsing afterwards)."""
+        httpEquiv = None
+        contentType = None
+        contentTypeIndex = None
+        tagNeedsEncodingSubstitution = False
+
+        for i in range(0, len(attrs)):
+            key, value = attrs[i]
+            key = key.lower()
+            if key == 'http-equiv':
+                httpEquiv = value
+            elif key == 'content':
+                contentType = value
+                contentTypeIndex = i
+
+        if httpEquiv and contentType: # It's an interesting meta tag.
+            match = self.CHARSET_RE.search(contentType)
+            if match:
+                if getattr(self, 'declaredHTMLEncoding') or \
+                       (self.originalEncoding == self.fromEncoding):
+                    # This is our second pass through the document, or
+                    # else an encoding was specified explicitly and it
+                    # worked. Rewrite the 'content' value, wherever it sits.
+                    newAttr = self.CHARSET_RE.sub\
+                              (lambda m: m.group(1) +
+                               "%SOUP-ENCODING%", contentType)
+                    attrs[contentTypeIndex] = (attrs[contentTypeIndex][0],
+                                               newAttr)
+                    tagNeedsEncodingSubstitution = True
+                else:
+                    # This is our first pass through the document.
+                    # Go through it again with the new information.
+                    newCharset = match.group(3)
+                    if newCharset and newCharset != self.originalEncoding:
+                        self.declaredHTMLEncoding = newCharset
+                        self._feed(self.declaredHTMLEncoding)
+                        raise StopParsing
+        tag = self.unknown_starttag("meta", attrs)
+        if tagNeedsEncodingSubstitution:
+            tag.containsSubstitutions = True
+
+class StopParsing(Exception):  # raised by start_meta; caught in BeautifulStoneSoup.__init__
+    pass
+   
+class ICantBelieveItsBeautifulSoup(BeautifulSoup):
+
+    """The BeautifulSoup class is oriented towards skipping over
+    common HTML errors like unclosed tags. However, sometimes it makes
+    errors of its own. For instance, consider this fragment:
+
+     <b>Foo<b>Bar</b></b>
+
+    This is perfectly valid (if bizarre) HTML. However, the
+    BeautifulSoup class will implicitly close the first b tag when it
+    encounters the second 'b'. It will think the author wrote
+    "<b>Foo<b>Bar", and didn't close the first 'b' tag, because
+    there's no real-world reason to bold something that's already
+    bold. When it encounters '</b></b>' it will close two more 'b'
+    tags, for a grand total of three tags closed instead of two. This
+    can throw off the rest of your document structure. The same is
+    true of a number of other tags, listed below.
+
+    It's much more common for someone to forget to close a 'b' tag
+    than to actually use nested 'b' tags, and the BeautifulSoup class
+    handles the common case. This class handles the not-so-common
+    case: where you can't believe someone wrote what they did, but
+    it's valid HTML and BeautifulSoup screwed up by assuming it
+    wouldn't be."""
+
+    I_CANT_BELIEVE_THEYRE_NESTABLE_INLINE_TAGS = \
+     ['em', 'big', 'i', 'small', 'tt', 'abbr', 'acronym', 'strong',
+      'cite', 'code', 'dfn', 'kbd', 'samp', 'strong', 'var', 'b',
+      'big']  # 'strong' and 'big' appear twice; they collapse to one key each below
+
+    I_CANT_BELIEVE_THEYRE_NESTABLE_BLOCK_TAGS = ['noscript']
+
+    NESTABLE_TAGS = buildTagMap([], BeautifulSoup.NESTABLE_TAGS,
+                                I_CANT_BELIEVE_THEYRE_NESTABLE_BLOCK_TAGS,
+                                I_CANT_BELIEVE_THEYRE_NESTABLE_INLINE_TAGS)
+
+class MinimalSoup(BeautifulSoup):
+    """The MinimalSoup class is for parsing HTML that contains
+    pathologically bad markup. It makes no assumptions about tag
+    nesting, but it does know which tags are self-closing, that
+    <script> tags contain Javascript and should not be parsed, that
+    META tags may contain encoding information, and so on.
+
+    This also makes it better for subclassing than BeautifulStoneSoup
+    or BeautifulSoup."""
+    
+    RESET_NESTING_TAGS = buildTagMap('noscript')  # NOTE(review): 'noscript' is taken as `default`, so this is {}; confirm buildTagMap(None, 'noscript') was not intended
+    NESTABLE_TAGS = {}
+
+class BeautifulSOAP(BeautifulStoneSoup):
+    """This class will push a tag with only a single string child into
+    the tag's parent as an attribute. The attribute's name is the tag
+    name, and the value is the string child. An example should give
+    the flavor of the change:
+
+    <foo><bar>baz</bar></foo>
+     =>
+    <foo bar="baz"><bar>baz</bar></foo>
+
+    You can then access fooTag['bar'] instead of fooTag.barTag.string.
+
+    This is, of course, useful for scraping structures that tend to
+    use subelements instead of attributes, such as SOAP messages. Note
+    that it modifies its input, so don't print the modified version
+    out.
+
+    I'm not sure how many people really want to use this class; let me
+    know if you do. Mainly I like the name."""
+
+    def popTag(self):  # returns the new current tag, like the base class method
+        if len(self.tagStack) > 1:
+            tag = self.tagStack[-1]
+            parent = self.tagStack[-2]
+            parent._getAttrMap()
+            if (isinstance(tag, Tag) and len(tag.contents) == 1 and
+                isinstance(tag.contents[0], NavigableString) and 
+                not parent.attrMap.has_key(tag.name)):  # never overwrite an existing attribute
+                parent[tag.name] = tag.contents[0]
+        return BeautifulStoneSoup.popTag(self)
+
+#Enterprise class names! It has come to our attention that some people
+#think the names of the Beautiful Soup parser classes are too silly
+#and "unprofessional" for use in enterprise screen-scraping. We feel
+#your pain! For such-minded folk, the Beautiful Soup Consortium And
+#All-Night Kosher Bakery recommends renaming this file to
+#"RobustParser.py" (or, in cases of extreme enterprisitude,
+#"RobustParserBeanInterface.class") and using the following
+#enterprise-friendly class aliases:
+class RobustXMLParser(BeautifulStoneSoup):  # alias for BeautifulStoneSoup
+    pass
+class RobustHTMLParser(BeautifulSoup):  # alias for BeautifulSoup
+    pass
+class RobustWackAssHTMLParser(ICantBelieveItsBeautifulSoup):  # alias for ICantBelieveItsBeautifulSoup
+    pass
+class RobustInsanelyWackAssHTMLParser(MinimalSoup):  # alias for MinimalSoup
+    pass
+class SimplifyingSOAPParser(BeautifulSOAP):  # alias for BeautifulSOAP
+    pass
+
+######################################################
+#
+# Bonus library: Unicode, Dammit
+#
+# This class forces XML data into a standard format (usually to UTF-8
+# or Unicode).  It is heavily based on code from Mark Pilgrim's
+# Universal Feed Parser. It does not rewrite the XML or HTML to
+# reflect a new encoding: that happens in BeautifulStoneSoup.handle_pi
+# (XML) and BeautifulSoup.start_meta (HTML).
+
+# Autodetects character encodings.
+# Download from http://chardet.feedparser.org/
+try:
+    import chardet
+#    import chardet.constants
+#    chardet.constants._debug = 1
+except Exception:
+    chardet = None
+# chardet stays None only when the import fails; UnicodeDammit checks it before use.
+
+# cjkcodecs and iconv_codec make Python know about more character encodings.
+# Both are available from http://cjkpython.i18n.org/
+# They're built in if you use Python 2.4.
+try:
+    import cjkcodecs.aliases
+except:
+    pass
+try:
+    import iconv_codec
+except:
+    pass
+
+class UnicodeDammit:
+    """A class for detecting the encoding of a *ML document and
+    converting it to a Unicode string. If the source encoding is
+    windows-1252, can replace MS smart quotes with their HTML or XML
+    equivalents."""
+
+    # This dictionary maps commonly seen values for "charset" in HTML
+    # meta tags to the corresponding Python codec names. It only covers
+    # values that aren't in Python's aliases and can't be determined
+    # by the heuristics in find_codec.
+    CHARSET_ALIASES = { "macintosh" : "mac-roman",
+                        "x-sjis" : "shift-jis" }
+    
+    def __init__(self, markup, overrideEncodings=[],
+                 smartQuotesTo='xml'):
+        """Decodes 'markup' into self.unicode, trying 'overrideEncodings'
+        first; the codec that worked is kept in self.originalEncoding."""
+        self.markup, documentEncoding, sniffedEncoding = \
+                     self._detectEncoding(markup)
+        self.smartQuotesTo = smartQuotesTo
+        self.triedEncodings = []
+        if isinstance(markup, unicode):
+            self.unicode, self.originalEncoding = markup, None
+            return  # already Unicode; __init__ must not return a value
+        u = None
+        for proposedEncoding in overrideEncodings:
+            u = self._convertFrom(proposedEncoding)
+            if u: break
+        if not u:
+            for proposedEncoding in (documentEncoding, sniffedEncoding):
+                u = self._convertFrom(proposedEncoding)
+                if u: break
+        # If no luck and we have auto-detection library, try that:
+        if not u and chardet and not isinstance(self.markup, unicode):
+            u = self._convertFrom(chardet.detect(self.markup)['encoding'])
+        # As a last resort, try utf-8 and windows-1252:
+        if not u:
+            for proposed_encoding in ("utf-8", "windows-1252"):
+                u = self._convertFrom(proposed_encoding)
+                if u: break
+        self.unicode = u
+        if not u: self.originalEncoding = None
+
+    def _subMSChar(self, orig):
+        """Returns the MS_CHARS replacement for a MS smart quote
+        character, expanding tuple entries into an XML or HTML entity."""
+        replacement = self.MS_CHARS.get(orig)
+        if type(replacement) != types.TupleType:
+            # Plain (or missing) entries are handed back untouched.
+            return replacement
+        if self.smartQuotesTo == 'xml':
+            return '&#x%s;' % replacement[1]
+        return '&%s;' % replacement[0]
+
+    def _convertFrom(self, proposed):
+        """Tries to decode self.markup with the 'proposed' encoding.
+        Returns the Unicode markup, or None if no usable encoding name
+        was given, it was already tried, or decoding fails."""
+        proposed = self.find_codec(proposed)
+        if not proposed or proposed in self.triedEncodings:
+            return None
+        self.triedEncodings.append(proposed)
+        markup = self.markup
+
+        # Convert smart quotes to HTML if coming from an encoding
+        # that might have them. The name is compared in lower case
+        # because declared encodings reach here lower-cased.
+        if self.smartQuotesTo and proposed.lower() in ("windows-1252",
+                                                      "iso-8859-1",
+                                                      "iso-8859-2"):
+            markup = re.compile("([\x80-\x9f])").sub \
+                     (lambda x: self._subMSChar(x.group(1)),
+                      markup)
+        try:
+            u = self._toUnicode(markup, proposed)
+        except Exception:
+            return None
+        # Success: remember the decoded text and the codec that worked.
+        self.markup = u
+        self.originalEncoding = proposed
+        return self.markup
+
+    def _toUnicode(self, data, encoding):
+        '''Decodes the byte string 'data' into Unicode.
+        %encoding is a string recognized by encodings.aliases; it is
+        overridden when 'data' starts with a Byte Order Mark.'''
+
+        # A UTF-16 BOM only counts when at least four bytes are
+        # present and the two bytes after it are not both NUL
+        # (otherwise the little-endian one would really be a
+        # UTF-32LE BOM).
+        maybeUtf16 = (len(data) >= 4) and (data[2:4] != '\x00\x00')
+        if maybeUtf16 and data[:2] == '\xfe\xff':
+            encoding, data = 'utf-16be', data[2:]
+        elif maybeUtf16 and data[:2] == '\xff\xfe':
+            encoding, data = 'utf-16le', data[2:]
+        else:
+            # Otherwise strip the first of these BOMs that matches.
+            for bom, bomEncoding in (('\xef\xbb\xbf', 'utf-8'),
+                                     ('\x00\x00\xfe\xff', 'utf-32be'),
+                                     ('\xff\xfe\x00\x00', 'utf-32le')):
+                if data[:len(bom)] == bom:
+                    encoding, data = bomEncoding, data[len(bom):]
+                    break
+
+        return unicode(data, encoding)
+    
+    def _detectEncoding(self, xml_data):
+        """Given a document, tries to detect its XML encoding."""
+        xml_encoding = sniffed_xml_encoding = None
+        try:
+            if xml_data[:4] == '\x4c\x6f\xa7\x94':
+                # EBCDIC
+                xml_data = self._ebcdic_to_ascii(xml_data)
+            elif xml_data[:4] == '\x00\x3c\x00\x3f':
+                # UTF-16BE
+                sniffed_xml_encoding = 'utf-16be'
+                xml_data = unicode(xml_data, 'utf-16be').encode('utf-8')  # re-encoded as UTF-8
+            elif (len(xml_data) >= 4) and (xml_data[:2] == '\xfe\xff') \
+                     and (xml_data[2:4] != '\x00\x00'):
+                # UTF-16BE with BOM
+                sniffed_xml_encoding = 'utf-16be'
+                xml_data = unicode(xml_data[2:], 'utf-16be').encode('utf-8')
+            elif xml_data[:4] == '\x3c\x00\x3f\x00':
+                # UTF-16LE
+                sniffed_xml_encoding = 'utf-16le'
+                xml_data = unicode(xml_data, 'utf-16le').encode('utf-8')
+            elif (len(xml_data) >= 4) and (xml_data[:2] == '\xff\xfe') and \
+                     (xml_data[2:4] != '\x00\x00'):
+                # UTF-16LE with BOM
+                sniffed_xml_encoding = 'utf-16le'
+                xml_data = unicode(xml_data[2:], 'utf-16le').encode('utf-8')
+            elif xml_data[:4] == '\x00\x00\x00\x3c':
+                # UTF-32BE
+                sniffed_xml_encoding = 'utf-32be'
+                xml_data = unicode(xml_data, 'utf-32be').encode('utf-8')
+            elif xml_data[:4] == '\x3c\x00\x00\x00':
+                # UTF-32LE
+                sniffed_xml_encoding = 'utf-32le'
+                xml_data = unicode(xml_data, 'utf-32le').encode('utf-8')
+            elif xml_data[:4] == '\x00\x00\xfe\xff':
+                # UTF-32BE with BOM
+                sniffed_xml_encoding = 'utf-32be'
+                xml_data = unicode(xml_data[4:], 'utf-32be').encode('utf-8')
+            elif xml_data[:4] == '\xff\xfe\x00\x00':
+                # UTF-32LE with BOM
+                sniffed_xml_encoding = 'utf-32le'
+                xml_data = unicode(xml_data[4:], 'utf-32le').encode('utf-8')
+            elif xml_data[:3] == '\xef\xbb\xbf':
+                # UTF-8 with BOM
+                sniffed_xml_encoding = 'utf-8'
+                xml_data = unicode(xml_data[3:], 'utf-8').encode('utf-8')
+            else:
+                sniffed_xml_encoding = 'ascii'  # none of the prefixes above matched
+                pass
+            xml_encoding_match = re.compile \
+                                 ('^<\?.*encoding=[\'"](.*?)[\'"].*\?>')\
+                                 .match(xml_data)
+        except:  # any failure above is treated as "no encoding declaration found"
+            xml_encoding_match = None
+        if xml_encoding_match:
+            xml_encoding = xml_encoding_match.groups()[0].lower()
+            if sniffed_xml_encoding and \
+               (xml_encoding in ('iso-10646-ucs-2', 'ucs-2', 'csunicode',
+                                 'iso-10646-ucs-4', 'ucs-4', 'csucs4',
+                                 'utf-16', 'utf-32', 'utf_16', 'utf_32',
+                                 'utf16', 'u16')):
+                xml_encoding = sniffed_xml_encoding  # the sniffed name replaces these labels
+        return xml_data, xml_encoding, sniffed_xml_encoding  # (data, declared, sniffed)
+
+
+    def find_codec(self, charset):
+        return self._codec(self.CHARSET_ALIASES.get(charset, charset)) \
+               or (charset and self._codec(charset.replace("-", ""))) \
+               or (charset and self._codec(charset.replace("-", "_"))) \
+               or charset
+
+    def _codec(self, charset):
+        if not charset: return charset 
+        codec = None
+        try:
+            codecs.lookup(charset)
+            codec = charset
+        except LookupError:
+            pass
+        return codec
+
+    EBCDIC_TO_ASCII_MAP = None
+    def _ebcdic_to_ascii(self, s):
+        c = self.__class__
+        if not c.EBCDIC_TO_ASCII_MAP:
+            emap = (0,1,2,3,156,9,134,127,151,141,142,11,12,13,14,15,
+                    16,17,18,19,157,133,8,135,24,25,146,143,28,29,30,31,
+                    128,129,130,131,132,10,23,27,136,137,138,139,140,5,6,7,
+                    144,145,22,147,148,149,150,4,152,153,154,155,20,21,158,26,
+                    32,160,161,162,163,164,165,166,167,168,91,46,60,40,43,33,
+                    38,169,170,171,172,173,174,175,176,177,93,36,42,41,59,94,
+                    45,47,178,179,180,181,182,183,184,185,124,44,37,95,62,63,
+                    186,187,188,189,190,191,192,193,194,96,58,35,64,39,61,34,
+                    195,97,98,99,100,101,102,103,104,105,196,197,198,199,200,
+                    201,202,106,107,108,109,110,111,112,113,114,203,204,205,
+                    206,207,208,209,126,115,116,117,118,119,120,121,122,210,
+                    211,212,213,214,215,216,217,218,219,220,221,222,223,224,
+                    225,226,227,228,229,230,231,123,65,66,67,68,69,70,71,72,
+                    73,232,233,234,235,236,237,125,74,75,76,77,78,79,80,81,
+                    82,238,239,240,241,242,243,92,159,83,84,85,86,87,88,89,
+                    90,244,245,246,247,248,249,48,49,50,51,52,53,54,55,56,57,
+                    250,251,252,253,254,255)
+            import string
+            c.EBCDIC_TO_ASCII_MAP = string.maketrans( \
+            ''.join(map(chr, range(256))), ''.join(map(chr, emap)))
+        return s.translate(c.EBCDIC_TO_ASCII_MAP)
+
+    MS_CHARS = { '\x80' : ('euro', '20AC'),  # byte -> (entity name, hex code point), or a literal replacement
+                 '\x81' : ' ',
+                 '\x82' : ('sbquo', '201A'),
+                 '\x83' : ('fnof', '192'),
+                 '\x84' : ('bdquo', '201E'),
+                 '\x85' : ('hellip', '2026'),
+                 '\x86' : ('dagger', '2020'),
+                 '\x87' : ('Dagger', '2021'),
+                 '\x88' : ('circ', '2C6'),
+                 '\x89' : ('permil', '2030'),
+                 '\x8A' : ('Scaron', '160'),
+                 '\x8B' : ('lsaquo', '2039'),
+                 '\x8C' : ('OElig', '152'),
+                 '\x8D' : '?',
+                 '\x8E' : ('#x17D', '17D'),
+                 '\x8F' : '?',
+                 '\x90' : '?',
+                 '\x91' : ('lsquo', '2018'),
+                 '\x92' : ('rsquo', '2019'),
+                 '\x93' : ('ldquo', '201C'),
+                 '\x94' : ('rdquo', '201D'),
+                 '\x95' : ('bull', '2022'),
+                 '\x96' : ('ndash', '2013'),
+                 '\x97' : ('mdash', '2014'),
+                 '\x98' : ('tilde', '2DC'),
+                 '\x99' : ('trade', '2122'),
+                 '\x9a' : ('scaron', '161'),
+                 '\x9b' : ('rsaquo', '203A'),
+                 '\x9c' : ('oelig', '153'),
+                 '\x9d' : '?',
+                 '\x9e' : ('#x17E', '17E'),
+                 '\x9f' : ('Yuml', '178'),}  # U+0178; the code point was previously left empty
+
+#######################################################################
+
+
+#By default, act as an HTML pretty-printer.
+if __name__ == '__main__':
+    import sys
+    soup = BeautifulStoneSoup(sys.stdin.read())
+    print soup.prettify()
diff --git a/constants.py b/constants.py
new file mode 100644
index 00000000..9fba0cc9
--- /dev/null
+++ b/constants.py
@@ -0,0 +1,135 @@
+CSS = '''body { margin-left: 5%; margin-right: 5%; margin-top: 5%; margin-bottom: 5%; text-align: justify; }
+pre { font-size: x-small; }
+h1 { text-align: center; }
+h2 { text-align: center; }
+h3 { text-align: center; }
+h4 { text-align: center; }
+h5 { text-align: center; }
+h6 { text-align: center; }
+.CI {
+    text-align:center;
+    margin-top:0px;
+    margin-bottom:0px;
+    padding:0px;
+    }
+.center   {text-align: center;}
+.smcap    {font-variant: small-caps;}
+.u        {text-decoration: underline;}
+.bold     {font-weight: bold;}
+'''
+
+MIMETYPE = '''application/epub+zip'''
+
+CONTAINER = '''<?xml version="1.0"?>
+<container version="1.0" xmlns="urn:oasis:names:tc:opendocument:xmlns:container">
+  <rootfiles>
+    <rootfile full-path="OEBPS/content.opf" media-type="application/oebps-package+xml"/>
+  </rootfiles>
+</container>
+'''
+
+CONTENT_START = '''<?xml version="1.0"?>
+<package version="2.0" xmlns="http://www.idpf.org/2007/opf"
+         unique-identifier="BookId-Epub-%s">
+ <metadata xmlns:dc="http://purl.org/dc/elements/1.1/"
+           xmlns:opf="http://www.idpf.org/2007/opf">
+   <dc:title>%s</dc:title> 
+   <dc:creator opf:role="aut">%s</dc:creator>
+   <dc:language>en-UK</dc:language> 
+   <dc:rights></dc:rights> 
+   <dc:publisher>sgzmd</dc:publisher> 
+   <dc:identifier id="BookId">urn:uuid:sigizmund.com062820072147132</dc:identifier>
+ </metadata>
+ <manifest>
+  <item id="ncx" href="toc.ncx" media-type="text/xml" />
+  <item id="style" href="stylesheet.css" media-type="text/css" />
+'''
+
+CONTENT_ITEM = '<item id="%s" href="%s" media-type="application/xhtml+xml" />'
+
+CONTENT_END_MANIFEST = '''</manifest>
+<spine toc="ncx">
+'''
+
+CONTENT_ITEMREF = '''<itemref idref="%s" />'''
+
+CONTENT_END = '''</spine>
+</package>
+'''
+
+TOC_START = '''<?xml version="1.0" encoding="UTF-8"?>
+<ncx xmlns="http://www.daisy.org/z3986/2005/ncx/" version="2005-1">
+  <head>
+    <meta name="dtb:uid" content="sigizmund.com062820072147132"/>
+    <meta name="dtb:depth" content="1"/>
+    <meta name="dtb:totalPageCount" content="0"/>
+    <meta name="dtb:maxPageNumber" content="0"/>
+  </head>
+  <docTitle>
+    <text>%s</text>
+  </docTitle>
+  <navMap>
+'''
+
+TOC_ITEM = '''<navPoint id="%s" playOrder="%d">
+  <navLabel>
+    <text>%s</text>
+  </navLabel>
+  <content src="%s"/>
+</navPoint>
+'''
+
+TOC_END = '''</navMap>
+</ncx>
+'''
+
+XHTML_START = '''<?xml version="1.0" encoding="iso-8859-1"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.1//EN" "http://www.w3.org/TR/xhtml11/DTD/xhtml11.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml">
+<head>
+<title>%s</title>
+<link href="stylesheet.css" type="text/css" rel="stylesheet" />
+</head>
+<body>
+<div>
+<h3>%s</h3>
+'''
+
+XHTML_END = '''</div>
+</body>
+</html>
+'''
+
+acceptable_elements = ['a', 'abbr', 'acronym', 'address', 'area', 'b', 'big',
+      'blockquote', 'br', 'center', 'cite', 'code', 'col',
+      'colgroup', 'dd', 'del', 'dfn', 'dir', 'div', 'dl', 'dt', 'em',
+      'font', 'h1', 'h2', 'h3', 'h4', 'h5', 'h6', 'i', 
+      'ins', 'kbd', 'label', 'li', 'ol', 
+      'p', 'pre', 'q', 's', 'samp', 'small', 'span', 'strike',
+      'strong', 'sub', 'sup', 'u', 'ul']
+
+acceptable_attributes = ['href']
+
+entities = { '&ndash;' : ' - ', '&mdash;' : ' - ', '&rdquo;' : '"', '&ldquo;' : '"', '&rsquo;' : '\'', '&lsquo;' : '\'', '&quot;' : '"' }
+
+FB2_PROLOGUE = '<FictionBook>'
+FB2_DESCRIPTION = '''<description>
+<title-info>
+  <genre>fanfiction</genre>
+  <author>
+  <first-name></first-name>
+  <middle-name></middle-name>
+  <last-name>%s</last-name>
+  </author>
+  <book-title>%s</book-title>
+  <lang>eng</lang>
+</title-info>
+<document-info>
+  <author>
+  <nickname>sgzmd</nickname>
+  </author>
+<date value="%s">%s</date>
+<id>sgzmd_%s</id>
+<version>2.0</version>
+</document-info>
+</description>'''
diff --git a/downaloder.py b/downaloder.py
new file mode 100644
index 00000000..220a2c23
--- /dev/null
+++ b/downaloder.py
@@ -0,0 +1,74 @@
+import os
+import re
+import sys
+import shutil
+import os.path
+import getpass
+import urllib as u
+import pprint as pp
+import urllib2 as u2
+import urlparse as up
+import BeautifulSoup as bs
+import htmlentitydefs as hdefs
+
+import ffa
+import ficwad
+import output
+import fictionalley
+
+class FanficLoader:
+	'''A controller class which handles the interaction between various specific downloaders and writers'''
+	booksDirectory = "books"
+	
+	def __init__(self, adapter, writerClass):
+		self.adapter = adapter
+		self.writerClass = writerClass
+		
+	def download(self):
+		urls = self.adapter.extractIndividualUrls()
+		self.writer = self.writerClass(self.booksDirectory, self.adapter.getStoryName(), self.adapter.getAuthorName())
+		
+		for u,n in urls:
+			text = self.adapter.getText(u)
+			self.writer.writeChapter(n, text)
+		
+		self.writer.finalise()
+	
+
+if __name__ == '__main__':
+	(url, format) = sys.argv[1:]	# exactly two arguments: <story url> <format>
+	
+	if type(url) is unicode:
+		print('URL is unicode')
+		url = url.encode('latin1')
+	
+	adapter = None
+	writerClass = None
+	
+	if url.find('fanficauthors') != -1:
+		adapter = ffa.FFA(url)
+	elif url.find('fictionalley') != -1:
+		adapter = fictionalley.FictionAlley(url)
+	elif url.find('ficwad') != -1:
+		adapter = ficwad.FicWad(url)
+	else:
+		print >> sys.stderr, "Oi! I can haz not appropriate adapter for URL %s!" % url
+		sys.exit(1)
+	
+	if format == 'epub':
+		writerClass = output.EPubFanficWriter
+	
+	if adapter.requiresLogin(url):
+		print("Meow, URL %s requires you to haz been logged in! Please can I haz this datas?" % url)
+		sys.stdout.write("Can I haz ur login? ")
+		login = sys.stdin.readline().strip()
+		password = getpass.getpass(prompt='Can I haz ur password? ')
+		# getpass keeps the password off the screen; never echo it back.
+		print("Login: `%s`" % login)
+		adapter.setLogin(login)
+		adapter.setPassword(password)
+		
+	
+	loader = FanficLoader(adapter, writerClass)
+	loader.download()
+	
\ No newline at end of file
diff --git a/ffa.py b/ffa.py
new file mode 100644
index 00000000..9153d2be
--- /dev/null
+++ b/ffa.py
@@ -0,0 +1,187 @@
+import os
+import re
+import sys
+import cgi
+import uuid
+import shutil
+import base64
+import os.path
+import urllib as u
+import pprint as pp
+import urllib2 as u2
+import urlparse as up
+import BeautifulSoup as bs
+import htmlentitydefs as hdefs
+
+from constants import *
+
+from ficwad import *
+
+class FFA:
+	storyName = None
+	
+	def __init__(self):
+		self.grabUrl = re.compile('(\<option.+value=\")(.+?)\"\>(.+?)\<')
+		self.grabAuthor = re.compile('.+pemail.+\'(\w+)')
+	
+	def getPasswordLine(self):
+		return '<input type="password" name="pass"'
+		
+	def getLoginScript(self):
+		return '/scripts/login.php'
+		
+	def getLoginPasswordOthers(self):
+		login = dict(login = 'name', password = 'pass')
+		other = dict(submit = 'Log In', remember='yes')
+		return (login, other)
+	
+	def getPrintableUrl(self, url):
+		return url + '?print=yes'
+	
+	def _findIndex(self, lines, what, start):
+		for i in range(start, len(lines)):
+			if lines[i].find(what) != -1:
+				return i
+		return -1
+	
+	def extractIndividualUrls(self, data, host, first, fetch = False):
+		lines = data.split('\n')
+		
+		optionLines = filter(lambda x : x.find('<option value="') != -1, lines)
+		
+		authorLines = filter(lambda x : x.find('pemail') != -1, lines)
+		for al in authorLines:
+			m = self.grabAuthor.match(al)
+			if m != None:
+				self.authorName = m.group(1)
+				break
+				
+		
+		optionsLines = optionLines[:len(optionLines)/2]
+		
+		storyName = first.split("/")[1]
+		
+		result = []
+		urls = []
+		for line in optionLines:
+			m = self.grabUrl.match(line)
+			u = m.group(2)
+			if u.find('" selected="selected') != -1:
+				u = u.replace('" selected="selected', '')
+			
+			if u in urls:
+				continue
+			else:
+				urls.append(u)
+			
+			result.append((self.getPrintableUrl(storyName + "/" + u), m.group(3)))
+		
+		self.soup = bs.BeautifulSoup(data)
+		titles = self.soup.findAll(name = 'title', recursive=True)
+		if len(titles) > 0:
+			title = titles[0]
+			print(title)
+			(website, rest) = title.string.split('::')
+			story_chapter = rest.split("-")
+			
+			story = story_chapter[0].strip()
+			self.storyName = story
+		
+		return result
+	
+	def getStoryName(self):
+		return self.storyName
+	
+	def getAuthorName(self):
+		return self.authorName
+	
+	def getText(self, data, fetch = False):
+		lines = data.split('\n')
+		begin = self._findIndex(lines, '</select>', 0)+1
+		if begin == 0:
+			begiun = self._findIndex(lines, '<div><p>', 24)
+		
+		if begin == 0:
+			print('BAD start')
+			pp.pprint(lines)
+			sys.abort()
+		end = self._findIndex(lines, '<form action="index.php"><div class="topandbotline"', begin)
+		print('<!-- ========= begin=%d, end=%d ============= -->' % (begin, end))
+		return "\n".join(lines[begin:end])
+
+class Downloader:
+	login = None
+	password = None
+	url = None
+	host = None
+	first = None
+	opener = None
+	
+	writer = None
+	
+	def __init__(self, url, login, password):
+		self.login = login
+		self.password = password
+		self.url = url
+
+		self.infoProvider = FicWad() #FFA()
+
+		parse = up.urlparse(url)
+		self.host = parse.scheme + '://' + parse.netloc
+		self.first = parse.path;
+		
+		self.loginUrl = self.host + self.infoProvider.getLoginScript()
+		
+		self.opener = u2.build_opener(u2.HTTPCookieProcessor())
+		
+	
+	def _loginRequired(self):
+		print('is login required?')
+		resp = self.opener.open(self.url)
+		data = resp.read()
+		if data.find(self.infoProvider.getPasswordLine()) != -1:
+			print('yep')
+			return True
+		else:
+			print('nada')
+			return False
+		
+	def _login(self):
+		(login, data) = self.infoProvider.getLoginPasswordOthers()
+
+		data[login['login']] = self.login
+		data[login['password']] = self.password
+		
+		urlvals = u.urlencode(data)
+		req = self.opener.open(self.loginUrl, urlvals)
+		
+		if req.read().find(self.infoProvider.getPasswordLine()) != -1:
+			return False
+		else:
+			return True
+	
+	def _getContent(self, url):
+		print("<!-- Opening %s -->" % url)
+		return self.opener.open(url).read()
+	
+	def download(self):
+		first = self._getContent(self.host + self.first)
+		urls = self.infoProvider.extractIndividualUrls(first, self.host, self.first)
+		
+		self.writer = EPubFanficWriter("books", self.infoProvider.getStoryName(), self.infoProvider.getAuthorName())
+		
+		for u,n in urls:
+			text = self.infoProvider.getText(self._getContent(self.host+"/"+u))
+			self.writer.writeChapter(n, text)
+		
+		self.writer.finalise()
+		
+
+if __name__ == '__main__':
+	f = Downloader(sys.argv[1], 'sigizmund', '***************')
+	if f._loginRequired():
+		f._login()
+	f.download()
+	
+	
+	
\ No newline at end of file
diff --git a/fictionalley.py b/fictionalley.py
new file mode 100644
index 00000000..6ccc5ad8
--- /dev/null
+++ b/fictionalley.py
@@ -0,0 +1,75 @@
+import os
+import re
+import sys
+import shutil
+import os.path
+import urllib as u
+import pprint as pp
+import urllib2 as u2
+import urlparse as up
+import BeautifulSoup as bs
+import htmlentitydefs as hdefs
+
+class FictionAlley:
+	'''Adapter for fictionalley.org story index pages.'''
+	def __init__(self):
+		# The page parsing below never determines the author, so callers may
+		# assign authorName themselves; default both names so reads never fail.
+		self.storyName = None
+		self.authorName = None
+	
+	def extractIndividualUrls(self, data, host, contents):
+		'''Parse index HTML `data`; return a list of (url, title) chapter pairs.
+		`host` and `contents` are not used here.'''
+		soup = bs.BeautifulStoneSoup(data)
+		
+		# Story name is everything after the first '-' in the page <title>.
+		title = soup.find('title').string
+		self.storyName = "-".join(title.split('-')[1:]).strip()
+		
+		print('Story "%s" by %s' % (self.storyName, self.authorName))
+		
+		links = soup.findAll('a', { 'class' : 'chapterlink' } )
+		return [(a['href'], a.string) for a in links]
+	
+	def getStoryName(self):
+		return self.storyName
+
+	def getAuthorName(self):
+		return self.authorName
+	
+	def getText(self, data, fetch = False):
+		'''Return the prettified <div id="storytext"> of chapter HTML `data`,
+		or '<html/>' when the page has no such div. `fetch` is not used.'''
+		soup = bs.BeautifulStoneSoup(data)
+		div = soup.find('div', {'id' : 'storytext'})
+		if div is None:
+			return '<html/>'
+		
+		return div.prettify()
+	
+	def getPrintableUrl(self, url):
+		return url
+	
+	def getPasswordLine(self):
+		return 'opaopapassword'
+
+	def getLoginScript(self):
+		return 'opaopaloginscript'
+
+	def getLoginPasswordOthers(self):
+		'''Return (credential field names, extra form fields) for a login POST.'''
+		login = dict(login = 'name', password = 'pass')
+		other = dict(submit = 'Log In', remember='yes')
+		return (login, other)
+
+		
+if __name__ == '__main__':
+	url = 'http://www.fictionalley.org/authors/drt/DA.html'
+	data = u2.urlopen(url).read()
+	host = up.urlparse(url).netloc
+	fw = FictionAlley()
+	fw.authorName = 'DrT'
+	urls = fw.extractIndividualUrls(data, host, url)
+	pp.pprint(urls)
+	print(fw.getText(data))
\ No newline at end of file
diff --git a/ficwad.py b/ficwad.py
new file mode 100644
index 00000000..1861dab2
--- /dev/null
+++ b/ficwad.py
@@ -0,0 +1,97 @@
+import os
+import re
+import sys
+import shutil
+import os.path
+import urllib as u
+import pprint as pp
+import urllib2 as u2
+import urlparse as up
+import BeautifulSoup as bs
+import htmlentitydefs as hdefs
+
+class FicWad:
+	def __init__(self, url):
+		self.url = url
+		self.host = up.urlparse(url).netloc
+	
+	def requiresLogin(self, url):
+		return False
+	
+	def performLogin(self, url):
+		pass
+		
+	def setLogin(self, login):
+		self.login = login
+	
+	def setPassword(self, password):
+		self.password = password
+	
+	def extractIndividualUrls(self):
+		data = u2.urlopen(self.url).read()
+		soup = bs.BeautifulStoneSoup(data)
+		
+		title = soup.find('title').string
+		self.storyName = title.split('::')[0].strip()
+		
+		author = soup.find('span', {'class' : 'author'})
+		self.authorName = author.a.string
+		
+		print('Story "%s" by %s' % (self.storyName, self.authorName))
+		
+		select = soup.find('select', { 'name' : 'goto' } )
+		
+		allOptions = select.findAll('option')
+		result = []
+		for o in allOptions:
+			url = o['value']
+#			if type(url) is unicode:
+#				url = url.encode('utf-8')
+			title = o.string
+			result.append((url,title))
+			
+		return result
+	
+	def getStoryName(self):
+		return self.storyName
+
+	def getAuthorName(self):
+		return self.authorName
+	
+	def getText(self, url):
+		print(type(url))
+		if url.find('http://') == -1:
+			url = 'http://' + self.host + '/' + url
+		
+		data = u2.urlopen(url).read()
+		
+		soup = bs.BeautifulStoneSoup(data)
+		div = soup.find('div', {'id' : 'storytext'})
+		if None == div:
+			return '<html/>'
+		
+		return div.prettify()
+	
+	def getPrintableUrl(self, url):
+		return url
+	
+	def getPasswordLine(self):
+		return 'opaopapassword'
+
+	def getLoginScript(self):
+		return 'opaopaloginscript'
+
+	def getLoginPasswordOthers(self):
+		login = dict(login = 'name', password = 'pass')
+		other = dict(submit = 'Log In', remember='yes')
+		return (login, other)
+
+		
+if __name__ == '__main__':
+	# Manual smoke test; FicWad downloads the pages itself from the URL.
+	url = 'http://www.ficwad.com/story/14536'
+	fw = FicWad(url)
+	urls = fw.extractIndividualUrls()
+	pp.pprint(urls)
+	if urls:
+		print(fw.getText(urls[0][0]))
\ No newline at end of file
diff --git a/output.py b/output.py
new file mode 100644
index 00000000..72c39fea
--- /dev/null
+++ b/output.py
@@ -0,0 +1,136 @@
+import os
+import re
+import sys
+import cgi
+import uuid
+import shutil
+import base64
+import os.path
+import urllib as u
+import pprint as pp
+import urllib2 as u2
+import urlparse as up
+import BeautifulSoup as bs
+import htmlentitydefs as hdefs
+
+from constants import *
+
+class FanficWriter:
+	def __init__(self):
+		pass
+		
+	def writeChapter(self, title, text):
+		pass
+	
+	def finalise(self):
+		pass
+
+class HTMLWriter(FanficWriter):
+	def __init__(self, base, name, author):
+		pass
+
+	def writeChapter(self, title, text):
+		pass
+	
+	def finalise(self):
+		pass
+
+class EPubFanficWriter(FanficWriter):
+	chapters = []
+	
+	def __init__(self, base, name, author):
+		'''Create a fresh <base>/<name with "_" for spaces> tree holding the static EPUB files.'''
+		self.basePath = base
+		self.name = name.replace(" ", "_")
+		self.storyTitle = name
+		self.directory = self.basePath + '/' + self.name
+		self.authorName = author
+		self.chapters = []	# per instance; the class-level list is shared by every writer
+		if os.path.exists(self.directory):
+			shutil.rmtree(self.directory)
+		
+		os.makedirs(self.directory)	# unlike mkdir, also creates a missing base directory
+		
+		os.mkdir(self.directory + '/META-INF')
+		os.mkdir(self.directory + '/OEBPS')
+		
+		print >> open(self.directory + '/mimetype', 'w'), MIMETYPE
+		print >> open(self.directory + '/META-INF/container.xml', 'w'), CONTAINER
+		print >> open(self.directory + '/OEBPS/stylesheet.css', 'w'), CSS
+
+	def _removeEntities(self, text):
+		for e in entities:
+			v = entities[e]
+			text = text.replace(e, v)
+		
+		return text
+	
+	def writeChapter(self, title, text):
+		fileName = base64.b64encode(title) + ".xhtml"
+		filePath = self.directory + "/OEBPS/" + fileName
+		f = open(filePath, 'w')
+		
+		text = self._removeEntities(text)
+		
+		self.soup = bs.BeautifulStoneSoup(text)
+
+		allTags = self.soup.findAll(recursive=True)
+		for t in allTags:
+			for attr in t._getAttrMap().keys():
+				if attr not in acceptable_attributes:
+					del t[attr]
+	    
+		allPs = self.soup.findAll(recursive=True)
+		for p in allPs:
+			if p.string != None and (len(p.string.strip()) == 0 or p.string.strip() == '&nbsp;' ) :
+				p.extract()
+				
+		allBrs = self.soup.findAll(recursive=True, name = ["br", "hr"])
+		for br in allBrs:
+			if (br.string != None and len(br.string.strip()) != 0) or (br.contents != None):
+				br.name = 'p'
+
+#		cleanup(self.soup )
+		
+		text = self.soup.prettify()
+		
+		print >> f, XHTML_START % (title, title)
+		print >> f, text
+		print >> f, XHTML_END
+		
+		self.chapters.append((title, fileName))
+	
+	def finalise(self):
+		
+		### writing table of contents -- ncx file
+		
+		tocFilePath = self.directory + "/OEBPS/toc.ncx"
+		toc = open(tocFilePath, 'w')
+		print >> toc, TOC_START % self.storyTitle
+
+		### writing content -- opf file
+		opfFilePath = self.directory + "/OEBPS/content.opf"
+		opf = open(opfFilePath, 'w')
+		
+		print >> opf, CONTENT_START % (uuid.uuid4().urn, self.storyTitle, self.authorName)
+
+		ids = []
+		
+		i = 0
+		for t,f in self.chapters:
+			chapterId = base64.b64encode(t)
+			print >> toc, TOC_ITEM % (chapterId, i, cgi.escape(t), f)
+			
+			print >> opf, CONTENT_ITEM % (chapterId, f)
+			
+			ids.append(chapterId)
+			
+			i = i + 1
+		
+		print >> toc, TOC_END
+		print >> opf, CONTENT_END_MANIFEST		
+		
+		for chapterId in ids:
+			print >> opf, CONTENT_ITEMREF % chapterId
+		
+		print >> opf, CONTENT_END
\ No newline at end of file

From a9748061f0b602f682f9ea96680ab8a565662998 Mon Sep 17 00:00:00 2001
From: sigizmund <sigizmund@gmail.com>
Date: Tue, 15 Dec 2009 15:26:45 +0000
Subject: [PATCH 02/94] minor changes

---
 downaloder.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/downaloder.py b/downaloder.py
index 220a2c23..66951aba 100644
--- a/downaloder.py
+++ b/downaloder.py
@@ -54,7 +54,7 @@ if __name__ == '__main__':
 	else:
 		print >> sys.stderr, "Oi! I can haz not appropriate adapter for URL %s!" % url
 		sys.exit(1)
-	
+
 	if format == 'epub':
 		writerClass = output.EPubFanficWriter
 	

From 6ef95c634d4d791ad6c4f137c8ec92119680a20f Mon Sep 17 00:00:00 2001
From: sigizmund <sigizmund@gmail.com>
Date: Thu, 17 Dec 2009 11:26:55 +0000
Subject: [PATCH 03/94] FFA changed, architecture changed, not quite ready yet

---
 constants.py  |   2 +-
 downaloder.py |   3 +
 ffa.py        | 289 +++++++++++++++++++++++++-------------------------
 ficwad.py     |   1 -
 output.py     |  30 ++++--
 5 files changed, 174 insertions(+), 151 deletions(-)

diff --git a/constants.py b/constants.py
index 9fba0cc9..6387cb70 100644
--- a/constants.py
+++ b/constants.py
@@ -83,7 +83,7 @@ TOC_END = '''</navMap>
 </ncx>
 '''
 
-XHTML_START = '''<?xml version="1.0" encoding="iso-8859-1"?>
+XHTML_START = '''<?xml version="1.0" encoding="UTF-8"?>
 <!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.1//EN" "http://www.w3.org/TR/xhtml11/DTD/xhtml11.dtd">
 <html xmlns="http://www.w3.org/1999/xhtml">
 <head>
diff --git a/downaloder.py b/downaloder.py
index 66951aba..48311aeb 100644
--- a/downaloder.py
+++ b/downaloder.py
@@ -28,7 +28,10 @@ class FanficLoader:
 		urls = self.adapter.extractIndividualUrls()
 		self.writer = self.writerClass(self.booksDirectory, self.adapter.getStoryName(), self.adapter.getAuthorName())
 		
+		i = 0
 		for u,n in urls:
+			print('Downloading chapter %d/%d' % (i, len(urls)))
+			i = i+1
 			text = self.adapter.getText(u)
 			self.writer.writeChapter(n, text)
 		
diff --git a/ffa.py b/ffa.py
index 9153d2be..1bd35b07 100644
--- a/ffa.py
+++ b/ffa.py
@@ -1,3 +1,5 @@
+# -*- coding: utf-8 -*-
+
 import os
 import re
 import sys
@@ -6,182 +8,183 @@ import uuid
 import shutil
 import base64
 import os.path
+import logging
+import unittest
 import urllib as u
 import pprint as pp
 import urllib2 as u2
+import login_password
 import urlparse as up
 import BeautifulSoup as bs
 import htmlentitydefs as hdefs
 
 from constants import *
 
-from ficwad import *
-
 class FFA:
-	storyName = None
+	def __init__(self, url):
+		self.url = url
+		parsedUrl = up.urlparse(url)
+		self.host = parsedUrl.netloc
+		self.path = parsedUrl.path
+		self.opener = u2.build_opener(u2.HTTPCookieProcessor())
 	
-	def __init__(self):
-		self.grabUrl = re.compile('(\<option.+value=\")(.+?)\"\>(.+?)\<')
-		self.grabAuthor = re.compile('.+pemail.+\'(\w+)')
+		logging.debug("Created FFA: url=%s" % (self.url))
 	
-	def getPasswordLine(self):
-		return '<input type="password" name="pass"'
+	def _getLoginScript(self):
+		return self.path
+
+	def requiresLogin(self, url = None):
+		resp = self.opener.open(self.url)
+		data = resp.read()
+		if data.find('<legend>Please login to continue</legend>') != -1:
+			return True
+		else:
+			return False
+ 
+	def performLogin(self, url = None):
+		if url == None:
+			url = self.url
 		
-	def getLoginScript(self):
-		return '/scripts/login.php'
+		data = {}
 		
-	def getLoginPasswordOthers(self):
-		login = dict(login = 'name', password = 'pass')
-		other = dict(submit = 'Log In', remember='yes')
-		return (login, other)
+		data['username'] = self.login
+		data['password'] = self.password
+		data['submit'] = 'Submit'
+		
+		urlvals = u.urlencode(data)
+		loginUrl = 'http://' + self.host + self._getLoginScript()
+		logging.debug("Will now login to URL %s" % loginUrl)
+		
+		req = self.opener.open(loginUrl, urlvals)
+		
+		if self.requiresLogin():
+			return False
+		else:
+			return True
 	
-	def getPrintableUrl(self, url):
-		return url + '?print=yes'
-	
-	def _findIndex(self, lines, what, start):
-		for i in range(start, len(lines)):
-			if lines[i].find(what) != -1:
-				return i
-		return -1
-	
-	def extractIndividualUrls(self, data, host, first, fetch = False):
+	def extractIndividualUrls(self):
+		data = self.opener.open(self.url).read()
+		soup = bs.BeautifulStoneSoup(data)
+
+		self.author = soup.find('a', {'href' : '/contact/'}).string
+		self.storyName = str(soup.find('h1', {'class' : 'textCenter'}).contents[0]).strip()
+		
+		logging.debug("Story `%s` by `%s`" % (self.storyName, self.author))
+		
+		selector = soup.find('select', {'class' : 'tinput'})
+		options = selector.findAll('option')
+		
+		urls = []
+		
+		for o in options:
+			title = o.string
+			url = o['value']
+			
+			urls.append((url,title))
+		
+		return urls
+
+	def getText(self, url):
+		if url.find('http://') == -1:
+			url = 'http://' + self.host + '/' + url
+		
+		data = self.opener.open(url).read()
+		
 		lines = data.split('\n')
 		
-		optionLines = filter(lambda x : x.find('<option value="') != -1, lines)
+		emit = False
 		
-		authorLines = filter(lambda x : x.find('pemail') != -1, lines)
-		for al in authorLines:
-			m = self.grabAuthor.match(al)
-			if m != None:
-				self.authorName = m.group(1)
-				break
-				
+		post = ''
 		
-		optionsLines = optionLines[:len(optionLines)/2]
-		
-		storyName = first.split("/")[1]
-		
-		result = []
-		urls = []
-		for line in optionLines:
-			m = self.grabUrl.match(line)
-			u = m.group(2)
-			if u.find('" selected="selected') != -1:
-				u = u.replace('" selected="selected', '')
-			
-			if u in urls:
+		for l in lines:
+			if l.find('</div></form>') != -1:
+				logging.debug('emit = True')
+				emit = True
 				continue
-			else:
-				urls.append(u)
+			elif l.find('<form action="#">') != -1:
+				logging.debug('emit = False')
+				if emit:
+					break
+				else:
+					emit = False
 			
-			result.append((self.getPrintableUrl(storyName + "/" + u), m.group(3)))
+			if emit:
+				post = post + l + '\n'
 		
-		self.soup = bs.BeautifulSoup(data)
-		titles = self.soup.findAll(name = 'title', recursive=True)
-		if len(titles) > 0:
-			title = titles[0]
-			print(title)
-			(website, rest) = title.string.split('::')
-			story_chapter = rest.split("-")
-			
-			story = story_chapter[0].strip()
-			self.storyName = story
-		
-		return result
+		return post
+
+	def setLogin(self, login):
+		self.login = login
+
+	def setPassword(self, password):
+		self.password = password
 	
 	def getStoryName(self):
 		return self.storyName
-	
+		
 	def getAuthorName(self):
-		return self.authorName
-	
-	def getText(self, data, fetch = False):
-		lines = data.split('\n')
-		begin = self._findIndex(lines, '</select>', 0)+1
-		if begin == 0:
-			begiun = self._findIndex(lines, '<div><p>', 24)
-		
-		if begin == 0:
-			print('BAD start')
-			pp.pprint(lines)
-			sys.abort()
-		end = self._findIndex(lines, '<form action="index.php"><div class="topandbotline"', begin)
-		print('<!-- ========= begin=%d, end=%d ============= -->' % (begin, end))
-		return "\n".join(lines[begin:end])
+		return self.author
 
-class Downloader:
-	login = None
-	password = None
-	url = None
-	host = None
-	first = None
-	opener = None
-	
-	writer = None
-	
-	def __init__(self, url, login, password):
-		self.login = login
-		self.password = password
-		self.url = url
+	def getPrintableUrl(self, url):
+		return url
 
-		self.infoProvider = FicWad() #FFA()
-
-		parse = up.urlparse(url)
-		self.host = parse.scheme + '://' + parse.netloc
-		self.first = parse.path;
-		
-		self.loginUrl = self.host + self.infoProvider.getLoginScript()
-		
-		self.opener = u2.build_opener(u2.HTTPCookieProcessor())
-		
+class FFA_UnitTests(unittest.TestCase):
+	def setUp(self):
+		logging.basicConfig(level=logging.DEBUG)
+		pass
 	
-	def _loginRequired(self):
-		print('is login required?')
-		resp = self.opener.open(self.url)
-		data = resp.read()
-		if data.find(self.infoProvider.getPasswordLine()) != -1:
-			print('yep')
-			return True
-		else:
-			print('nada')
-			return False
-		
-	def _login(self):
-		(login, data) = self.infoProvider.getLoginPasswordOthers()
-
-		data[login['login']] = self.login
-		data[login['password']] = self.password
-		
-		urlvals = u.urlencode(data)
-		req = self.opener.open(self.loginUrl, urlvals)
-		
-		if req.read().find(self.infoProvider.getPasswordLine()) != -1:
-			return False
-		else:
-			return True
+	def testRequiresLoginNeg(self):
+		f = FFA('http://jeconais.fanficauthors.net/Happily_Ever_After/Introduction/')
+		self.assertFalse(f.requiresLogin())
 	
-	def _getContent(self, url):
-		print("<!-- Opening %s -->" % url)
-		return self.opener.open(url).read()
+	def testRequiresLogin(self):
+		f = FFA('http://jeconais.fanficauthors.net/Rons_Harem/Rons_Harem/')
+		self.assertTrue(f.requiresLogin())
 	
-	def download(self):
-		first = self._getContent(self.host + self.first)
-		urls = self.infoProvider.extractIndividualUrls(first, self.host, self.first)
+	def testPerformLogin(self):
+		f = FFA('http://jeconais.fanficauthors.net/Rons_Harem/Rons_Harem/')
 		
-		self.writer = EPubFanficWriter("books", self.infoProvider.getStoryName(), self.infoProvider.getAuthorName())
+		if login_password != None:
+			f.setLogin(login_password.login)
+			f.setPassword(login_password.password)
 		
-		for u,n in urls:
-			text = self.infoProvider.getText(self._getContent(self.host+"/"+u))
-			self.writer.writeChapter(n, text)
+		self.assertTrue(f.performLogin(None))
 		
-		self.writer.finalise()
+	def testExtractURLsAuthorStoryName(self):
+		f = FFA('http://draco664.fanficauthors.net/Apprentice_Potter/Prologue/')
+		f.extractIndividualUrls()
+		
+		self.assertEquals('Draco664', f.getAuthorName())
+		self.assertEquals('Apprentice Potter', f.getStoryName())
+	
+	def testExtractUrls(self):
+		f = FFA('http://draco664.fanficauthors.net/Apprentice_Potter/Prologue/')
+		urls = f.extractIndividualUrls()
+		self.assertEquals(25, len(urls))
+		
+		self.assertEquals('Grievances', urls[2][1])
+		self.assertEquals('/Apprentice_Potter/Prologue/', urls[0][0])
+	
+	def testGetText(self):
+		f = FFA('http://jeconais.fanficauthors.net/Happily_Ever_After/Introduction/')
+		data = f.getText('http://jeconais.fanficauthors.net/Happily_Ever_After/Introduction/')
+		
+		self.assertTrue(data.find('smiled slightly, and settled back in her rocking chair') != -1)
+		
+	def testGetTextLogin(self):
+		url = 'http://viridian.fanficauthors.net/Out_of_the_Darkness_A_Jinchuurikis_Tale/A_Harrowing_Escape/'
+		f = FFA(url)
+		
+		if login_password != None:
+			f.setLogin(login_password.login)
+			f.setPassword(login_password.password)
+		
+		if f.requiresLogin():
+			f.performLogin()
+		
+		data = f.getText(url)
+		seek = 'So Hokage-sama” I said, “this is how we came'
+		self.assertTrue(data.find(seek) != -1)
 		
-
 if __name__ == '__main__':
-	f = Downloader(sys.argv[1], 'sigizmund', '***************')
-	if f._loginRequired():
-		f._login()
-	f.download()
-	
-	
-	
\ No newline at end of file
+	unittest.main()
\ No newline at end of file
diff --git a/ficwad.py b/ficwad.py
index 1861dab2..23622c29 100644
--- a/ficwad.py
+++ b/ficwad.py
@@ -59,7 +59,6 @@ class FicWad:
 		return self.authorName
 	
 	def getText(self, url):
-		print(type(url))
 		if url.find('http://') == -1:
 			url = 'http://' + self.host + '/' + url
 		
diff --git a/output.py b/output.py
index 72c39fea..894fdefd 100644
--- a/output.py
+++ b/output.py
@@ -1,11 +1,15 @@
+# -*- coding: utf-8 -*-
+
 import os
 import re
 import sys
 import cgi
 import uuid
+import codecs
 import shutil
 import base64
 import os.path
+import zipfile
 import urllib as u
 import pprint as pp
 import urllib2 as u2
@@ -15,6 +19,9 @@ import htmlentitydefs as hdefs
 
 from constants import *
 
+import zipdir
+
+
 class FanficWriter:
 	def __init__(self):
 		pass
@@ -54,9 +61,9 @@ class EPubFanficWriter(FanficWriter):
 		os.mkdir(self.directory + '/META-INF')
 		os.mkdir(self.directory + '/OEBPS')
 		
-		print >> open(self.directory + '/mimetype', 'w'), MIMETYPE
-		print >> open(self.directory + '/META-INF/container.xml', 'w'), CONTAINER
-		print >> open(self.directory + '/OEBPS/stylesheet.css', 'w'), CSS
+		print >> codecs.open(self.directory + '/mimetype', 'w', 'utf-8'), MIMETYPE
+		print >> codecs.open(self.directory + '/META-INF/container.xml', 'w', 'utf-8'), CONTAINER
+		print >> codecs.open(self.directory + '/OEBPS/stylesheet.css', 'w', 'utf-8'), CSS
 
 	def _removeEntities(self, text):
 		for e in entities:
@@ -68,6 +75,7 @@ class EPubFanficWriter(FanficWriter):
 	def writeChapter(self, title, text):
 		fileName = base64.b64encode(title) + ".xhtml"
 		filePath = self.directory + "/OEBPS/" + fileName
+		
 		f = open(filePath, 'w')
 		
 		text = self._removeEntities(text)
@@ -93,21 +101,24 @@ class EPubFanficWriter(FanficWriter):
 #		cleanup(self.soup )
 		
 		text = self.soup.prettify()
+		print(text)
 		
 		print >> f, XHTML_START % (title, title)
-		print >> f, text
+		f.write(text)
 		print >> f, XHTML_END
 		
 		self.chapters.append((title, fileName))
 	
 	def finalise(self):
-		
+		print("Finalising...")
 		### writing table of contents -- ncx file
 		
 		tocFilePath = self.directory + "/OEBPS/toc.ncx"
 		toc = open(tocFilePath, 'w')
 		print >> toc, TOC_START % self.storyTitle
 
+		print("Printing toc and refs")
+
 		### writing content -- opf file
 		opfFilePath = self.directory + "/OEBPS/content.opf"
 		opf = open(opfFilePath, 'w')
@@ -126,6 +137,8 @@ class EPubFanficWriter(FanficWriter):
 			ids.append(chapterId)
 			
 			i = i + 1
+			
+		print('Toc and refs printed, proceesing to ref-ids....')
 		
 		print >> toc, TOC_END
 		print >> opf, CONTENT_END_MANIFEST		
@@ -133,4 +146,9 @@ class EPubFanficWriter(FanficWriter):
 		for chapterId in ids:
 			print >> opf, CONTENT_ITEMREF % chapterId
 		
-		print >> opf, CONTENT_END
\ No newline at end of file
+		print >> opf, CONTENT_END
+		
+		print('Finished')
+		
+		filename = self.directory + '.epub'
+		zipdir.toZip(filename, self.directory)
\ No newline at end of file

From 861d1561d94a8a41f2d6eef3c990a4ff340d0076 Mon Sep 17 00:00:00 2001
From: sigizmund <sigizmund@gmail.com>
Date: Thu, 17 Dec 2009 11:29:10 +0000
Subject: [PATCH 04/94] test change

---
 output.py | 3 +--
 1 file changed, 1 insertion(+), 2 deletions(-)

diff --git a/output.py b/output.py
index 894fdefd..d2107fe5 100644
--- a/output.py
+++ b/output.py
@@ -21,7 +21,6 @@ from constants import *
 
 import zipdir
 
-
 class FanficWriter:
 	def __init__(self):
 		pass
@@ -151,4 +150,4 @@ class EPubFanficWriter(FanficWriter):
 		print('Finished')
 		
 		filename = self.directory + '.epub'
-		zipdir.toZip(filename, self.directory)
\ No newline at end of file
+		zipdir.toZip(filename, self.directory)

From 259c0f3650307d541448a77c62025341e58f6213 Mon Sep 17 00:00:00 2001
From: sigizmund <sigizmund@gmail.com>
Date: Thu, 17 Dec 2009 11:30:23 +0000
Subject: [PATCH 05/94] sample change

---
 output.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/output.py b/output.py
index d2107fe5..bd82a6e3 100644
--- a/output.py
+++ b/output.py
@@ -148,6 +148,6 @@ class EPubFanficWriter(FanficWriter):
 		print >> opf, CONTENT_END
 		
 		print('Finished')
-		
+
 		filename = self.directory + '.epub'
 		zipdir.toZip(filename, self.directory)

From bcf82e263206a9bed4bdd9e78f20dd1b4e343630 Mon Sep 17 00:00:00 2001
From: sigizmund <sigizmund@gmail.com>
Date: Thu, 17 Dec 2009 11:34:15 +0000
Subject: [PATCH 06/94] zipdir added

---
 zipdir.py | 41 +++++++++++++++++++++++++++++++++++++++++
 1 file changed, 41 insertions(+)
 create mode 100644 zipdir.py

diff --git a/zipdir.py b/zipdir.py
new file mode 100644
index 00000000..1b54cf97
--- /dev/null
+++ b/zipdir.py
@@ -0,0 +1,41 @@
+import os
+import zipfile
+
+def toZip(filename, directory):
+	zippedHelp = zipfile.ZipFile(filename, "w", compression=zipfile.ZIP_DEFLATED)
+	lst = os.listdir(directory)
+	
+	for entity in lst:
+		if entity.startswith('.'):
+			continue
+
+		each = os.path.join(directory,entity)
+		print(each)
+
+		if os.path.isfile(each):
+			print(each)
+			zippedHelp.write(each, arcname=entity)
+		else:
+			addFolderToZip(zippedHelp,entity, each)
+ 	
+	zippedHelp.close()
+
+def addFolderToZip(zippedHelp,folder,fpath):
+	print('addFolderToZip(%s)' % folder)
+	
+	if folder == '.' or folder == '..':
+		return
+	
+	folderFiles = os.listdir(fpath)
+	for f in folderFiles:
+		print('------%s' % f)
+		if os.path.isfile(fpath + '/' + f):
+			print('basename=%s' % os.path.basename(fpath + '/' + f))
+			zippedHelp.write(fpath + '/' + f, folder + '/' + f, zipfile.ZIP_DEFLATED)
+		elif os.path.isdir(f):
+			addFolderToZip(zippedHelp,f)
+
+if __name__ == '__main__':
+	toZip('sample.epub', "books/Harry's_Second_Chance:_Back_From_the_Future")
+	z = zipfile.ZipFile('sample.epub', 'r')
+	print(z.namelist())
\ No newline at end of file

From 5adcf131b370a16843fd8b5753de9fe657fb1c1c Mon Sep 17 00:00:00 2001
From: kirillov <kirillov@niceholdsure-lm.london.corp.yahoo.com>
Date: Thu, 17 Dec 2009 12:38:15 +0000
Subject: [PATCH 07/94] fanfiction.net support added

---
 ffnet.py | 123 +++++++++++++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 123 insertions(+)
 create mode 100644 ffnet.py

diff --git a/ffnet.py b/ffnet.py
new file mode 100644
index 00000000..9e511819
--- /dev/null
+++ b/ffnet.py
@@ -0,0 +1,123 @@
+# -*- coding: utf-8 -*-
+
+import os
+import re
+import sys
+import cgi
+import uuid
+import shutil
+import base64
+import os.path
+import logging
+import unittest
+import urllib as u
+import pprint as pp
+import urllib2 as u2
+import login_password
+import urlparse as up
+import BeautifulSoup as bs
+import htmlentitydefs as hdefs
+
+from constants import *
+
+class FFNet:
+	def __init__(self, url):
+		self.url = url
+		parsedUrl = up.urlparse(url)
+		self.host = parsedUrl.netloc
+		self.path = parsedUrl.path
+		
+		(empty, s, self.storyId, chapter) = self.path.split('/')
+		
+		logging.debug('self.storyId=%s, chapter=%s' % (self.storyId, chapter))
+		
+		self.opener = u2.build_opener(u2.HTTPCookieProcessor())
+	
+		logging.debug("Created FF.Net: url=%s" % (self.url))
+	
+	def _getLoginScript(self):
+		return self.path
+
+	def requiresLogin(self, url = None):
+		return False
+
+	def performLogin(self, url = None):
+		return True
+	
+	def extractIndividualUrls(self):
+		data = self.opener.open(self.url).read().decode('utf-8')
+
+		urls = []
+		lines = data.split('\n')
+		for l in lines:
+			if l.find("<img src='http://c.fanfiction.net/static/ficons/script.png' width=16 height=16  border=0  align=absmiddle>") != -1:
+				s2 = bs.BeautifulStoneSoup(l)
+				self.storyName = s2.find('b').string
+			elif l.find("<a href='/u/") != -1:
+				s2 = bs.BeautifulStoneSoup(l)
+				self.authorName = s2.a.string
+			elif l.find("<SELECT title='chapter navigation'") != -1:
+				if len(urls) > 0:
+					continue
+				u = l.decode('utf-8')
+				u = u.replace("&#187;", "-")
+				s2 = bs.BeautifulSoup(u)
+				options = s2.findAll('option')
+				for o in options:
+					url = 'http://fanfiction.net/s/' + self.storyId + '/' + o['value']
+					title = o.string
+					logging.debug('URL = `%s`, Title = `%s`' % (url, title))
+					urls.append((url,title))
+		
+		return urls
+	
+	def getText(self, url):
+		data = self.opener.open(url).read().decode('utf-8')
+		lines = data.split('\n')
+		for l in lines:
+			if l.find('<!-- start story -->') != -1:
+				s2 = bs.BeautifulStoneSoup(l)
+				return s2.div.prettify()
+		
+		
+	def setLogin(self, login):
+		self.login = login
+
+	def setPassword(self, password):
+		self.password = password
+
+	def getStoryName(self):
+		return self.storyName
+
+	def getAuthorName(self):
+		return self.authorName
+
+class FFA_UnitTests(unittest.TestCase):
+	def setUp(self):
+		logging.basicConfig(level=logging.DEBUG)
+		pass
+	
+	def testChaptersAuthStory(self):
+		f = FFNet('http://www.fanfiction.net/s/5257563/1')
+		f.extractIndividualUrls()
+		
+		self.assertEquals('Beka0502', f.getAuthorName())
+		self.assertEquals("Draco's Redemption", f.getStoryName())
+
+	def testChaptersCountNames(self):
+		f = FFNet('http://www.fanfiction.net/s/5257563/1')
+		urls = f.extractIndividualUrls()
+		
+		self.assertEquals(8, len(urls))
+	
+	def testGetText(self):
+		url = 'http://www.fanfiction.net/s/5257563/1'
+		f = FFNet(url)
+		text = f.getText(url)
+		self.assertTrue(text.find('He was just about to look at some photos when he heard a crack') != -1)
+	
+	def getPrintableUrl(self, url):
+		return url
+	
+if __name__ == '__main__':
+	unittest.main()
\ No newline at end of file

From 41caae6226f68160c1b6e610f8b414078b35d75f Mon Sep 17 00:00:00 2001
From: sigizmund <sigizmund@gmail.com>
Date: Thu, 17 Dec 2009 12:38:34 +0000
Subject: [PATCH 08/94] fanfiction.net support added

---
 downaloder.py | 3 +++
 1 file changed, 3 insertions(+)

diff --git a/downaloder.py b/downaloder.py
index 48311aeb..58c375a3 100644
--- a/downaloder.py
+++ b/downaloder.py
@@ -12,6 +12,7 @@ import BeautifulSoup as bs
 import htmlentitydefs as hdefs
 
 import ffa
+import ffnet
 import ficwad
 import output
 import fictionalley
@@ -54,6 +55,8 @@ if __name__ == '__main__':
 		adapter = fictionalley.FictionAlley(url)
 	elif url.find('ficwad') != -1:
 		adapter = ficwad.FicWad(url)
+	elif url.find('fanfiction.net') != -1:
+		adapter = ffnet.FFNet(url)
 	else:
 		print >> sys.stderr, "Oi! I can haz not appropriate adapter for URL %s!" % url
 		sys.exit(1)

From fd2ccb30ffbbd55ab0188fbdd703b20f56729866 Mon Sep 17 00:00:00 2001
From: sigizmund <sigizmund@gmail.com>
Date: Thu, 17 Dec 2009 12:45:12 +0000
Subject: [PATCH 09/94] login_password

---
 ffa.py | 7 ++++++-
 1 file changed, 6 insertions(+), 1 deletion(-)

diff --git a/ffa.py b/ffa.py
index 1bd35b07..da4a374a 100644
--- a/ffa.py
+++ b/ffa.py
@@ -13,13 +13,18 @@ import unittest
 import urllib as u
 import pprint as pp
 import urllib2 as u2
-import login_password
 import urlparse as up
 import BeautifulSoup as bs
 import htmlentitydefs as hdefs
 
 from constants import *
 
+try:
+	import login_password
+except:
+	# tough luck
+	pass
+
 class FFA:
 	def __init__(self, url):
 		self.url = url

From 6e73e5dc11dd44294d5d298b07c75cecde27eab5 Mon Sep 17 00:00:00 2001
From: sigizmund <sigizmund@gmail.com>
Date: Thu, 17 Dec 2009 12:46:06 +0000
Subject: [PATCH 10/94] login_password again

---
 ffnet.py | 7 ++++++-
 1 file changed, 6 insertions(+), 1 deletion(-)

diff --git a/ffnet.py b/ffnet.py
index 9e511819..bc2f7a2e 100644
--- a/ffnet.py
+++ b/ffnet.py
@@ -13,13 +13,18 @@ import unittest
 import urllib as u
 import pprint as pp
 import urllib2 as u2
-import login_password
 import urlparse as up
 import BeautifulSoup as bs
 import htmlentitydefs as hdefs
 
 from constants import *
 
+try:
+	import login_password
+except:
+	# tough luck
+	pass
+
 class FFNet:
 	def __init__(self, url):
 		self.url = url

From d2d183430dfeba81cad2312e9fbdc891df6f562c Mon Sep 17 00:00:00 2001
From: sigizmund <sigizmund@gmail.com>
Date: Thu, 17 Dec 2009 12:53:59 +0000
Subject: [PATCH 11/94] Small changes to make it work on other machines. Why
 is there no Python 2.6 on Ubuntu?

---
 ffa.py    | 1 +
 zipdir.py | 4 +---
 2 files changed, 2 insertions(+), 3 deletions(-)

diff --git a/ffa.py b/ffa.py
index da4a374a..1a5a7387 100644
--- a/ffa.py
+++ b/ffa.py
@@ -93,6 +93,7 @@ class FFA:
 		if url.find('http://') == -1:
 			url = 'http://' + self.host + '/' + url
 		
+		logging.info('Downloading: %s' % url)
 		data = self.opener.open(url).read()
 		
 		lines = data.split('\n')
diff --git a/zipdir.py b/zipdir.py
index 1b54cf97..cd9b493b 100644
--- a/zipdir.py
+++ b/zipdir.py
@@ -28,7 +28,6 @@ def addFolderToZip(zippedHelp,folder,fpath):
 	
 	folderFiles = os.listdir(fpath)
 	for f in folderFiles:
-		print('------%s' % f)
 		if os.path.isfile(fpath + '/' + f):
 			print('basename=%s' % os.path.basename(fpath + '/' + f))
 			zippedHelp.write(fpath + '/' + f, folder + '/' + f, zipfile.ZIP_DEFLATED)
@@ -37,5 +36,4 @@ def addFolderToZip(zippedHelp,folder,fpath):
 
 if __name__ == '__main__':
 	toZip('sample.epub', "books/Harry's_Second_Chance:_Back_From_the_Future")
-	z = zipfile.ZipFile('sample.epub', 'r')
-	print(z.namelist())
\ No newline at end of file
+	z = zipfile.ZipFile('sample.epub', 'r')
\ No newline at end of file

From f55e6d3c05be0a0e718213aad8ed18da2b18c224 Mon Sep 17 00:00:00 2001
From: sigizmund <sigizmund@gmail.com>
Date: Thu, 17 Dec 2009 13:37:13 +0000
Subject: [PATCH 12/94] epub zip is now produced correctly, also TOC works with
 Stanza now

---
 constants.py |  2 +-
 output.py    | 10 ++++++++--
 zipdir.py    |  6 +++---
 3 files changed, 12 insertions(+), 6 deletions(-)

diff --git a/constants.py b/constants.py
index 6387cb70..27515658 100644
--- a/constants.py
+++ b/constants.py
@@ -41,7 +41,7 @@ CONTENT_START = '''<?xml version="1.0"?>
    <dc:identifier id="BookId">urn:uuid:sigizmund.com062820072147132</dc:identifier>
  </metadata>
  <manifest>
-  <item id="ncx" href="toc.ncx" media-type="text/xml" />
+  <item id="ncx" href="toc.ncx" media-type="application/x-dtbncx+xml"/>
   <item id="style" href="stylesheet.css" media-type="text/css" />
 '''
 
diff --git a/output.py b/output.py
index bd82a6e3..3159fe78 100644
--- a/output.py
+++ b/output.py
@@ -69,6 +69,8 @@ class EPubFanficWriter(FanficWriter):
 			v = entities[e]
 			text = text.replace(e, v)
 		
+		text = text.replace('&', '&amp;')
+		
 		return text
 	
 	def writeChapter(self, title, text):
@@ -100,9 +102,10 @@ class EPubFanficWriter(FanficWriter):
 #		cleanup(self.soup )
 		
 		text = self.soup.prettify()
-		print(text)
 		
-		print >> f, XHTML_START % (title, title)
+		tt = self._removeEntities(title)
+		
+		print >> f, XHTML_START % (tt, tt)
 		f.write(text)
 		print >> f, XHTML_END
 		
@@ -147,6 +150,9 @@ class EPubFanficWriter(FanficWriter):
 		
 		print >> opf, CONTENT_END
 		
+		opf.close()
+		toc.close()
+		
 		print('Finished')
 
 		filename = self.directory + '.epub'
diff --git a/zipdir.py b/zipdir.py
index cd9b493b..e5d596e7 100644
--- a/zipdir.py
+++ b/zipdir.py
@@ -21,7 +21,7 @@ def toZip(filename, directory):
 	zippedHelp.close()
 
 def addFolderToZip(zippedHelp,folder,fpath):
-	print('addFolderToZip(%s)' % folder)
+	#print('addFolderToZip(%s)' % folder)
 	
 	if folder == '.' or folder == '..':
 		return
@@ -29,11 +29,11 @@ def addFolderToZip(zippedHelp,folder,fpath):
 	folderFiles = os.listdir(fpath)
 	for f in folderFiles:
 		if os.path.isfile(fpath + '/' + f):
-			print('basename=%s' % os.path.basename(fpath + '/' + f))
+			#print('basename=%s' % os.path.basename(fpath + '/' + f))
 			zippedHelp.write(fpath + '/' + f, folder + '/' + f, zipfile.ZIP_DEFLATED)
 		elif os.path.isdir(f):
 			addFolderToZip(zippedHelp,f)
 
 if __name__ == '__main__':
-	toZip('sample.epub', "books/Harry's_Second_Chance:_Back_From_the_Future")
+	toZip('sample.epub', "books/A_Time_To_Reflect")
 	z = zipfile.ZipFile('sample.epub', 'r')
\ No newline at end of file

From 8c621d6a59136f28ca69ae26c80d423c3a0671da Mon Sep 17 00:00:00 2001
From: sigizmund <sigizmund@gmail.com>
Date: Thu, 17 Dec 2009 13:44:07 +0000
Subject: [PATCH 13/94] Small bug in ff.net parsing was fixed

---
 ffnet.py | 8 +++++++-
 1 file changed, 7 insertions(+), 1 deletion(-)

diff --git a/ffnet.py b/ffnet.py
index bc2f7a2e..faf7b334 100644
--- a/ffnet.py
+++ b/ffnet.py
@@ -32,7 +32,13 @@ class FFNet:
 		self.host = parsedUrl.netloc
 		self.path = parsedUrl.path
 		
-		(empty, s, self.storyId, chapter) = self.path.split('/')
+		if self.path.startswith('/'):
+			self.path = self.path[1:]
+		
+		if self.path.endswith('/'):
+			self.path = self.path[:-1]
+		
+		(s, self.storyId, chapter) = self.path.split('/')
 		
 		logging.debug('self.storyId=%s, chapter=%s' % (self.storyId, chapter))
 		

From a01e0e2ed6e61a9ef8c6bd064aebac8b458c9a44 Mon Sep 17 00:00:00 2001
From: sigizmund <sigizmund@gmail.com>
Date: Thu, 17 Dec 2009 14:37:31 +0000
Subject: [PATCH 14/94] Fixed a few problems, including the slash in the filename

---
 downaloder.py |  4 ++++
 output.py     | 37 +++++++++++++++++++++++++++++++------
 2 files changed, 35 insertions(+), 6 deletions(-)

diff --git a/downaloder.py b/downaloder.py
index 58c375a3..10dde292 100644
--- a/downaloder.py
+++ b/downaloder.py
@@ -53,6 +53,8 @@ if __name__ == '__main__':
 		adapter = ffa.FFA(url)
 	elif url.find('fictionalley') != -1:
 		adapter = fictionalley.FictionAlley(url)
+		print >> sys.stderr, "FictionAlley adapter is broken, try to find this fic on fanfiction.net or fanficauthors"
+		sys.exit(0)
 	elif url.find('ficwad') != -1:
 		adapter = ficwad.FicWad(url)
 	elif url.find('fanfiction.net') != -1:
@@ -63,6 +65,8 @@ if __name__ == '__main__':
 
 	if format == 'epub':
 		writerClass = output.EPubFanficWriter
+	elif format == 'html':
+		writerClass = output.HTMLWriter
 	
 	if adapter.requiresLogin(url):
 		print("Meow, URL %s requires you to haz been logged in! Please can I haz this datas?" % url)
diff --git a/output.py b/output.py
index 3159fe78..222618c9 100644
--- a/output.py
+++ b/output.py
@@ -7,6 +7,7 @@ import cgi
 import uuid
 import codecs
 import shutil
+import string
 import base64
 import os.path
 import zipfile
@@ -17,9 +18,11 @@ import urlparse as up
 import BeautifulSoup as bs
 import htmlentitydefs as hdefs
 
+import zipdir
+import html_constants
 from constants import *
 
-import zipdir
+
 
 class FanficWriter:
 	def __init__(self):
@@ -32,14 +35,36 @@ class FanficWriter:
 		pass
 
 class HTMLWriter(FanficWriter):
+	body = ''
+	
 	def __init__(self, base, name, author):
-		pass
-
+		self.basePath = base
+		self.name = name.replace(" ", "_")
+		self.storyTitle = name
+		self.fileName = self.basePath + '/' + self.name + '.html'
+		self.authorName = author
+		
+		if os.path.exists(self.fileName):
+			os.remove(self.fileName)
+		
+		
+		self.xhtmlTemplate = string.Template(html_constants.XHTML_START)
+		self.chapterStartTemplate = string.Template(html_constants.XHTML_CHAPTER_START)
+		
 	def writeChapter(self, title, text):
-		pass
+		title = title.decode('utf-8')
+		text = text.decode('utf-8')
+		self.body = self.body + '\n' + self.chapterStartTemplate.substitute({'chapter' : title})
+		self.body = self.body + '\n' + text
 	
 	def finalise(self):
-		pass
+		html = self.xhtmlTemplate.substitute({'title' : self.storyTitle, 'author' : self.authorName, 'body' : self.body})
+		soup = bs.BeautifulSoup(html)
+		result = soup.prettify()
+		
+		f = open(self.fileName, 'w')
+		f.write(result)
+		f.close()
 
 class EPubFanficWriter(FanficWriter):
 	chapters = []
@@ -74,7 +99,7 @@ class EPubFanficWriter(FanficWriter):
 		return text
 	
 	def writeChapter(self, title, text):
-		fileName = base64.b64encode(title) + ".xhtml"
+		fileName = base64.b64encode(title).replace('/', '_') + ".xhtml"
 		filePath = self.directory + "/OEBPS/" + fileName
 		
 		f = open(filePath, 'w')

From 59697f1a755dfd5c91530829e9e144668f50073d Mon Sep 17 00:00:00 2001
From: sigizmund <sigizmund@gmail.com>
Date: Thu, 17 Dec 2009 15:16:51 +0000
Subject: [PATCH 15/94] Added adapter.py, now all working adapters must
 implement FanfictionSiteAdapter interface

---
 adapter.py | 30 ++++++++++++++++++++++++++++++
 ffa.py     |  3 ++-
 ffnet.py   |  3 ++-
 ficwad.py  |  8 +++++---
 4 files changed, 39 insertions(+), 5 deletions(-)
 create mode 100644 adapter.py

diff --git a/adapter.py b/adapter.py
new file mode 100644
index 00000000..41e040d9
--- /dev/null
+++ b/adapter.py
@@ -0,0 +1,30 @@
+class FanfictionSiteAdapter:
+	def __init__(self, url):
+		pass
+	
+	def requiresLogin(self, url = None):
+		pass
+	
+	def performLogin(self, url = None):
+		pass
+	
+	def extractIndividualUrls(self):
+		pass
+		
+	def getText(self, url):
+		pass
+
+	def setLogin(self, login):
+		pass
+
+	def setPassword(self, password):
+		pass
+
+	def getStoryName(self):
+		pass
+
+	def getAuthorName(self):
+		pass
+
+	def getPrintableUrl(self, url):
+		pass
\ No newline at end of file
diff --git a/ffa.py b/ffa.py
index 1a5a7387..b8c307ec 100644
--- a/ffa.py
+++ b/ffa.py
@@ -18,6 +18,7 @@ import BeautifulSoup as bs
 import htmlentitydefs as hdefs
 
 from constants import *
+from adapter import *
 
 try:
 	import login_password
@@ -25,7 +26,7 @@ except:
 	# tough luck
 	pass
 
-class FFA:
+class FFA(FanfictionSiteAdapter):
 	def __init__(self, url):
 		self.url = url
 		parsedUrl = up.urlparse(url)
diff --git a/ffnet.py b/ffnet.py
index faf7b334..4ea30115 100644
--- a/ffnet.py
+++ b/ffnet.py
@@ -18,6 +18,7 @@ import BeautifulSoup as bs
 import htmlentitydefs as hdefs
 
 from constants import *
+from adapter import *
 
 try:
 	import login_password
@@ -25,7 +26,7 @@ except:
 	# tough luck
 	pass
 
-class FFNet:
+class FFNet(FanfictionSiteAdapter):
 	def __init__(self, url):
 		self.url = url
 		parsedUrl = up.urlparse(url)
diff --git a/ficwad.py b/ficwad.py
index 23622c29..35b3b76e 100644
--- a/ficwad.py
+++ b/ficwad.py
@@ -10,7 +10,9 @@ import urlparse as up
 import BeautifulSoup as bs
 import htmlentitydefs as hdefs
 
-class FicWad:
+from adapter import *
+
+class FicWad(FanfictionSiteAdapter):
 	def __init__(self, url):
 		self.url = url
 		self.host = up.urlparse(url).netloc
@@ -90,7 +92,7 @@ if __name__ == '__main__':
 	url = 'http://www.ficwad.com/story/14536'
 	data = u2.urlopen(url).read()
 	host = up.urlparse(url).netloc
-	fw = FicWad()
-	urls = fw.extractIndividualUrls(data, host, url)
+	fw = FicWad(url)
+	urls = fw.extractIndividualUrls()
 	pp.pprint(urls)
 	print(fw.getText(data))
\ No newline at end of file

From 2352ba6dfcf99acd7c88ac5b094004cdd2aac608 Mon Sep 17 00:00:00 2001
From: sigizmund <sigizmund@gmail.com>
Date: Thu, 17 Dec 2009 15:18:31 +0000
Subject: [PATCH 16/94] forgot about html_constants

---
 html_constants.py | 17 +++++++++++++++++
 1 file changed, 17 insertions(+)
 create mode 100644 html_constants.py

diff --git a/html_constants.py b/html_constants.py
new file mode 100644
index 00000000..c698e8f4
--- /dev/null
+++ b/html_constants.py
@@ -0,0 +1,17 @@
+XHTML_START = '''<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.1//EN" "http://www.w3.org/TR/xhtml11/DTD/xhtml11.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml">
+<head>
+<title>${title} by ${author}</title>
+<link href="stylesheet.css" type="text/css" rel="stylesheet" />
+</head>
+<body>
+<div>
+<h1>${title} by ${author}</h1>
+${body}
+</body></html>
+'''
+
+XHTML_CHAPTER_START = '''<h2>${chapter}</h2>'''
+
+XHTML_END = ''''''

From 028c2df521c00c600044eff83a781b92dac9378b Mon Sep 17 00:00:00 2001
From: sigizmund <sigizmund@gmail.com>
Date: Thu, 17 Dec 2009 15:32:05 +0000
Subject: [PATCH 17/94] Fixed a problem with &#[digits]; for fanfiction.net.
 Just why can't BeautifulSoup handle them?

---
 ffnet.py | 15 ++++++++++++---
 1 file changed, 12 insertions(+), 3 deletions(-)

diff --git a/ffnet.py b/ffnet.py
index 4ea30115..5b252543 100644
--- a/ffnet.py
+++ b/ffnet.py
@@ -33,6 +33,10 @@ class FFNet(FanfictionSiteAdapter):
 		self.host = parsedUrl.netloc
 		self.path = parsedUrl.path
 		
+		spl = self.path.split('/')
+		if len(spl) == 5:
+			self.path = "/".join(spl[1:-1])
+		
 		if self.path.startswith('/'):
 			self.path = self.path[1:]
 		
@@ -72,7 +76,7 @@ class FFNet(FanfictionSiteAdapter):
 				if len(urls) > 0:
 					continue
 				u = l.decode('utf-8')
-				u = u.replace("&#187;", "-")
+				u = re.sub('&\#[0-9]+;', ' ', u)
 				s2 = bs.BeautifulSoup(u)
 				options = s2.findAll('option')
 				for o in options:
@@ -128,8 +132,13 @@ class FFA_UnitTests(unittest.TestCase):
 		text = f.getText(url)
 		self.assertTrue(text.find('He was just about to look at some photos when he heard a crack') != -1)
 	
-	def getPrintableUrl(self, url):
-		return url
+	def testBrokenWands(self):
+		url = 'http://www.fanfiction.net/s/1527263/30/Harry_Potter_and_Broken_Wands'
+		f = FFNet(url)
+		text = f.getText(url)
+		
+		urls = f.extractIndividualUrls()
+		
 	
 if __name__ == '__main__':
 	unittest.main()
\ No newline at end of file

From 615228a2acfe21e9dd24e3d51641d32dfe5f5b51 Mon Sep 17 00:00:00 2001
From: sigizmund <sigizmund@gmail.com>
Date: Fri, 18 Dec 2009 11:23:37 +0000
Subject: [PATCH 18/94] changed slightly to make it work with AppEngine

---
 __init__.py   |  0
 downaloder.py | 12 +++++++++---
 ffnet.py      | 21 ++++++++++++++++++---
 output.py     | 23 +++++++++++++++++------
 4 files changed, 44 insertions(+), 12 deletions(-)
 create mode 100644 __init__.py

diff --git a/__init__.py b/__init__.py
new file mode 100644
index 00000000..e69de29b
diff --git a/downaloder.py b/downaloder.py
index 10dde292..8c520ce6 100644
--- a/downaloder.py
+++ b/downaloder.py
@@ -21,22 +21,28 @@ class FanficLoader:
 	'''A controller class which handles the interaction between various specific downloaders and writers'''
 	booksDirectory = "books"
 	
-	def __init__(self, adapter, writerClass):
+	def __init__(self, adapter, writerClass, quiet = False, inmemory = False):
 		self.adapter = adapter
 		self.writerClass = writerClass
+		self.quiet = quiet
+		self.inmemory = inmemory
 		
 	def download(self):
 		urls = self.adapter.extractIndividualUrls()
-		self.writer = self.writerClass(self.booksDirectory, self.adapter.getStoryName(), self.adapter.getAuthorName())
+		self.writer = self.writerClass(self.booksDirectory, self.adapter.getStoryName(), self.adapter.getAuthorName(), inmemory=self.inmemory)
 		
 		i = 0
 		for u,n in urls:
-			print('Downloading chapter %d/%d' % (i, len(urls)))
+			if not self.quiet:
+				print('Downloading chapter %d/%d' % (i, len(urls)))
 			i = i+1
 			text = self.adapter.getText(u)
 			self.writer.writeChapter(n, text)
 		
 		self.writer.finalise()
+		
+		if self.inmemory:
+			return self.writer.output.getvalue()
 	
 
 if __name__ == '__main__':
diff --git a/ffnet.py b/ffnet.py
index 5b252543..4af36792 100644
--- a/ffnet.py
+++ b/ffnet.py
@@ -26,6 +26,12 @@ except:
 	# tough luck
 	pass
 
+try:
+	from google.appengine.api.urlfetch import fetch as googlefetch
+	appEngine = True
+except:
+	appEngine = False
+
 class FFNet(FanfictionSiteAdapter):
 	def __init__(self, url):
 		self.url = url
@@ -47,7 +53,10 @@ class FFNet(FanfictionSiteAdapter):
 		
 		logging.debug('self.storyId=%s, chapter=%s' % (self.storyId, chapter))
 		
-		self.opener = u2.build_opener(u2.HTTPCookieProcessor())
+		if not appEngine:
+			self.opener = u2.build_opener(u2.HTTPCookieProcessor())
+		else:
+			self.opener = None
 	
 		logging.debug("Created FF.Net: url=%s" % (self.url))
 	
@@ -60,8 +69,14 @@ class FFNet(FanfictionSiteAdapter):
 	def performLogin(self, url = None):
 		return True
 	
+	def _fetchUrl(self, url):
+		if not appEngine:
+			return self.opener.open(url).read().decode('utf-8')
+		else:
+			return googlefetch(url).content
+	
 	def extractIndividualUrls(self):
-		data = self.opener.open(self.url).read().decode('utf-8')
+		data = self._fetchUrl(self.url)
 
 		urls = []
 		lines = data.split('\n')
@@ -88,7 +103,7 @@ class FFNet(FanfictionSiteAdapter):
 		return urls
 	
 	def getText(self, url):
-		data = self.opener.open(url).read().decode('utf-8')
+		data = self._fetchUrl(url)
 		lines = data.split('\n')
 		for l in lines:
 			if l.find('<!-- start story -->') != -1:
diff --git a/output.py b/output.py
index 222618c9..039451f4 100644
--- a/output.py
+++ b/output.py
@@ -11,6 +11,7 @@ import string
 import base64
 import os.path
 import zipfile
+import StringIO
 import urllib as u
 import pprint as pp
 import urllib2 as u2
@@ -37,16 +38,22 @@ class FanficWriter:
 class HTMLWriter(FanficWriter):
 	body = ''
 	
-	def __init__(self, base, name, author):
+	def __init__(self, base, name, author, inmemory=False):
 		self.basePath = base
 		self.name = name.replace(" ", "_")
 		self.storyTitle = name
 		self.fileName = self.basePath + '/' + self.name + '.html'
 		self.authorName = author
 		
-		if os.path.exists(self.fileName):
+		self.inmemory = inmemory
+
+		if not self.inmemory and os.path.exists(self.fileName):
 			os.remove(self.fileName)
 		
+		if self.inmemory:
+			self.output = StringIO.StringIO()
+		else:
+			self.output = open(self.fileName, 'w')
 		
 		self.xhtmlTemplate = string.Template(html_constants.XHTML_START)
 		self.chapterStartTemplate = string.Template(html_constants.XHTML_CHAPTER_START)
@@ -62,14 +69,18 @@ class HTMLWriter(FanficWriter):
 		soup = bs.BeautifulSoup(html)
 		result = soup.prettify()
 		
-		f = open(self.fileName, 'w')
-		f.write(result)
-		f.close()
+#		f = open(self.fileName, 'w')
+#		f.write(result)
+#		f.close()
+
+		self.output.write(result)
+		if not self.inmemory:
+			self.output.close()
 
 class EPubFanficWriter(FanficWriter):
 	chapters = []
 	
-	def __init__(self, base, name, author):
+	def __init__(self, base, name, author, inmemory=False):
 		self.basePath = base
 		self.name = name.replace(" ", "_")
 		self.storyTitle = name

From 33855b787738d97ef6b7e2cecc0a0c0727a07f83 Mon Sep 17 00:00:00 2001
From: sigizmund <sigizmund@gmail.com>
Date: Fri, 18 Dec 2009 11:40:29 +0000
Subject: [PATCH 19/94] zipdir with in-memory stuff added

---
 zipdir.py | 27 +++++++++++++++++++++++++--
 1 file changed, 25 insertions(+), 2 deletions(-)

diff --git a/zipdir.py b/zipdir.py
index e5d596e7..e51b34ff 100644
--- a/zipdir.py
+++ b/zipdir.py
@@ -1,6 +1,8 @@
 import os
 import zipfile
 
+import StringIO
+
 def toZip(filename, directory):
 	zippedHelp = zipfile.ZipFile(filename, "w", compression=zipfile.ZIP_DEFLATED)
 	lst = os.listdir(directory)
@@ -34,6 +36,27 @@ def addFolderToZip(zippedHelp,folder,fpath):
 		elif os.path.isdir(f):
 			addFolderToZip(zippedHelp,f)
 
+def inMemoryZip(files):
+	# files have a structure of {'path/to/file' => content} dictionary
+	io = StringIO.StringIO()
+	memzip = zipfile.ZipFile(io, 'a', compression=zipfile.ZIP_DEFLATED)
+	memzip.debug = 3
+	
+	for path in files:
+		memzip.writestr(path, files[path])
+	
+	for zf in memzip.filelist:
+		zf.create_system = 0
+	
+	memzip.close()
+	
+	return io.getvalue()
+
 if __name__ == '__main__':
-	toZip('sample.epub', "books/A_Time_To_Reflect")
-	z = zipfile.ZipFile('sample.epub', 'r')
\ No newline at end of file
+#	toZip('sample.epub', "books/A_Time_To_Reflect")
+#	z = zipfile.ZipFile('sample.epub', 'r')
+	files = {'test.txt' : 'test', 'data/abc.txt' : 'abc'}
+	data = inMemoryZip(files)
+	f = open('res.zip', 'w')
+	f.write(data)
+	f.close()
\ No newline at end of file

From ef97755ed37f03c1ea5799a29a74d9b24f6c16b3 Mon Sep 17 00:00:00 2001
From: sigizmund <sigizmund@gmail.com>
Date: Fri, 18 Dec 2009 12:26:23 +0000
Subject: [PATCH 20/94] AppEngine version. Not quite clear whether it is
 working or not

---
 downaloder.py |   3 ++
 output.py     | 126 +++++++++++++++++++++++++++++++++++---------------
 zipdir.py     |  11 ++++-
 3 files changed, 102 insertions(+), 38 deletions(-)

diff --git a/downaloder.py b/downaloder.py
index 8c520ce6..34b369db 100644
--- a/downaloder.py
+++ b/downaloder.py
@@ -4,6 +4,7 @@ import sys
 import shutil
 import os.path
 import getpass
+import logging
 import urllib as u
 import pprint as pp
 import urllib2 as u2
@@ -42,10 +43,12 @@ class FanficLoader:
 		self.writer.finalise()
 		
 		if self.inmemory:
+			self.name = self.writer.name
 			return self.writer.output.getvalue()
 	
 
 if __name__ == '__main__':
+	logging.basicConfig(level=logging.DEBUG)
 	(url, format) = sys.argv[1:]
 	
 	if type(url) is unicode:
diff --git a/output.py b/output.py
index 039451f4..3042441d 100644
--- a/output.py
+++ b/output.py
@@ -12,6 +12,7 @@ import base64
 import os.path
 import zipfile
 import StringIO
+import logging
 import urllib as u
 import pprint as pp
 import urllib2 as u2
@@ -80,25 +81,56 @@ class HTMLWriter(FanficWriter):
 class EPubFanficWriter(FanficWriter):
 	chapters = []
 	
+	files = {}
+	
+	def _writeFile(self, fileName, data):
+		if fileName in self.files:
+			self.files[fileName].write(data.decode('utf-8'))
+		else:
+			if self.inmemory:
+				self.files[fileName] = StringIO.StringIO()
+			else:
+				self.files[fileName] = open(self.directory + '/' + fileName, 'w')
+
+			self._writeFile(fileName, data)
+		
+		
+	def _closeFiles(self):
+		if not self.inmemory:
+			for f in self.files:
+				self.files[f].close()
+	
 	def __init__(self, base, name, author, inmemory=False):
 		self.basePath = base
 		self.name = name.replace(" ", "_")
 		self.storyTitle = name
 		self.directory = self.basePath + '/' + self.name
-		
+		self.inmemory = inmemory
 		self.authorName = author
 
-		if os.path.exists(self.directory):
-			shutil.rmtree(self.directory)
+		if not self.inmemory:
+			self.inmemory = True
+			self.writeToFile = True
+		else:
+			self.writeToFile = False
 		
-		os.mkdir(self.directory)
+
+		if not self.inmemory:
+			if os.path.exists(self.directory):
+				shutil.rmtree(self.directory)
 		
-		os.mkdir(self.directory + '/META-INF')
-		os.mkdir(self.directory + '/OEBPS')
+			os.mkdir(self.directory)
 		
-		print >> codecs.open(self.directory + '/mimetype', 'w', 'utf-8'), MIMETYPE
-		print >> codecs.open(self.directory + '/META-INF/container.xml', 'w', 'utf-8'), CONTAINER
-		print >> codecs.open(self.directory + '/OEBPS/stylesheet.css', 'w', 'utf-8'), CSS
+			os.mkdir(self.directory + '/META-INF')
+			os.mkdir(self.directory + '/OEBPS')
+		
+#		print >> codecs.open(self.directory + '/mimetype', 'w', 'utf-8'), MIMETYPE
+#		print >> codecs.open(self.directory + '/META-INF/container.xml', 'w', 'utf-8'), CONTAINER
+#		print >> codecs.open(self.directory + '/OEBPS/stylesheet.css', 'w', 'utf-8'), CSS
+
+		self._writeFile('mimetype', MIMETYPE)
+		self._writeFile('META-INF/container.xml', CONTAINER)
+		self._writeFile('OEBPS/stylesheet.css', CSS)
 
 	def _removeEntities(self, text):
 		for e in entities:
@@ -113,7 +145,9 @@ class EPubFanficWriter(FanficWriter):
 		fileName = base64.b64encode(title).replace('/', '_') + ".xhtml"
 		filePath = self.directory + "/OEBPS/" + fileName
 		
-		f = open(filePath, 'w')
+		fn = 'OEBPS/' + fileName
+		
+#		f = open(filePath, 'w')
 		
 		text = self._removeEntities(text)
 		
@@ -141,55 +175,75 @@ class EPubFanficWriter(FanficWriter):
 		
 		tt = self._removeEntities(title)
 		
-		print >> f, XHTML_START % (tt, tt)
-		f.write(text)
-		print >> f, XHTML_END
+		self._writeFile(fn, XHTML_START % (tt, tt))
+		self._writeFile(fn, text)
+		self._writeFile(fn, XHTML_END)
+#		print >> f, XHTML_START % (tt, tt)
+#		f.write(text)
+#		print >> f, XHTML_END
 		
 		self.chapters.append((title, fileName))
 	
 	def finalise(self):
-		print("Finalising...")
+		logging.debug("Finalising...")
 		### writing table of contents -- ncx file
 		
-		tocFilePath = self.directory + "/OEBPS/toc.ncx"
-		toc = open(tocFilePath, 'w')
-		print >> toc, TOC_START % self.storyTitle
-
-		print("Printing toc and refs")
-
+		tocFilePath = "OEBPS/toc.ncx"
+#		toc = open(tocFilePath, 'w')
+#		print >> toc, TOC_START % self.storyTitle
+		self._writeFile(tocFilePath, TOC_START % self.storyTitle)
 		### writing content -- opf file
-		opfFilePath = self.directory + "/OEBPS/content.opf"
-		opf = open(opfFilePath, 'w')
+		opfFilePath = "OEBPS/content.opf"
 		
-		print >> opf, CONTENT_START % (uuid.uuid4().urn, self.storyTitle, self.authorName)
+#		opf = open(opfFilePath, 'w')
+		self._writeFile(opfFilePath, CONTENT_START % (uuid.uuid4().urn, self.storyTitle, self.authorName))
+#		print >> opf, CONTENT_START % (uuid.uuid4().urn, self.storyTitle, self.authorName)
 
 		ids = []
 		
 		i = 0
 		for t,f in self.chapters:
 			chapterId = base64.b64encode(t)
-			print >> toc, TOC_ITEM % (chapterId, i, cgi.escape(t), f)
-			
-			print >> opf, CONTENT_ITEM % (chapterId, f)
+#			print >> toc, TOC_ITEM % (chapterId, i, cgi.escape(t), f)
+			self._writeFile(tocFilePath, TOC_ITEM % (chapterId, i, cgi.escape(t), f))
+#			print >> opf, CONTENT_ITEM % (chapterId, f)
+			self._writeFile(opfFilePath, CONTENT_ITEM % (chapterId, f))
 			
 			ids.append(chapterId)
 			
 			i = i + 1
 			
-		print('Toc and refs printed, proceesing to ref-ids....')
+#		logging.d('Toc and refs printed, proceesing to ref-ids....')
 		
-		print >> toc, TOC_END
-		print >> opf, CONTENT_END_MANIFEST		
+#		print >> toc, TOC_END
+#		print >> opf, CONTENT_END_MANIFEST		
+
+		self._writeFile(tocFilePath, TOC_END)
+		self._writeFile(opfFilePath, CONTENT_END_MANIFEST)
 		
 		for chapterId in ids:
-			print >> opf, CONTENT_ITEMREF % chapterId
+#			print >> opf, CONTENT_ITEMREF % chapterId
+			self._writeFile(opfFilePath, CONTENT_ITEMREF % chapterId)
 		
-		print >> opf, CONTENT_END
+#		print >> opf, CONTENT_END
+		self._writeFile(opfFilePath, CONTENT_END)
 		
-		opf.close()
-		toc.close()
+#		opf.close()
+#		toc.close()
+		
+#		print('Finished')
+		
+		self._closeFiles()
 		
-		print('Finished')
-
 		filename = self.directory + '.epub'
-		zipdir.toZip(filename, self.directory)
+		
+		zipdata = zipdir.inMemoryZip(self.files)
+		
+		if self.writeToFile:
+			f = open(filename, 'w')
+			f.write(zipdata.getvalue())
+			f.close()
+		else:
+			self.output = zipdata
+			
+#		zipdir.toZip(filename, self.directory)
diff --git a/zipdir.py b/zipdir.py
index e51b34ff..0da2691d 100644
--- a/zipdir.py
+++ b/zipdir.py
@@ -1,5 +1,6 @@
 import os
 import zipfile
+import logging
 
 import StringIO
 
@@ -43,14 +44,20 @@ def inMemoryZip(files):
 	memzip.debug = 3
 	
 	for path in files:
-		memzip.writestr(path, files[path])
+		if type(files[path]) != type('str'):
+			data = files[path].getvalue()
+		else:
+			data = files[path]
+		
+#		logging.debug(data)
+		memzip.writestr(path, data.encode('utf-8'))
 	
 	for zf in memzip.filelist:
 		zf.create_system = 0
 	
 	memzip.close()
 	
-	return io.getvalue()
+	return io
 
 if __name__ == '__main__':
 #	toZip('sample.epub', "books/A_Time_To_Reflect")

From 1f897843e0becfacd5390e71a28a18bda5799754 Mon Sep 17 00:00:00 2001
From: sigizmund <sigizmund@gmail.com>
Date: Fri, 18 Dec 2009 14:51:53 +0000
Subject: [PATCH 21/94] Whole lot of fixes related to appengine

---
 BeautifulSoup.py  | 1711 +++++++++++++++++++++++++++++++++++++++++++++
 __init__.py       |    0
 adapter.py        |   32 +
 constants.py      |  135 ++++
 downaloder.py     |  103 +++
 ffa.py            |  197 ++++++
 ffnet.py          |  162 +++++
 fictionalley.py   |   75 ++
 ficwad.py         |   98 +++
 html_constants.py |   17 +
 output.py         |  252 +++++++
 zipdir.py         |   69 ++
 12 files changed, 2851 insertions(+)
 create mode 100644 BeautifulSoup.py
 create mode 100644 __init__.py
 create mode 100644 adapter.py
 create mode 100644 constants.py
 create mode 100644 downaloder.py
 create mode 100644 ffa.py
 create mode 100644 ffnet.py
 create mode 100644 fictionalley.py
 create mode 100644 ficwad.py
 create mode 100644 html_constants.py
 create mode 100644 output.py
 create mode 100644 zipdir.py

diff --git a/BeautifulSoup.py b/BeautifulSoup.py
new file mode 100644
index 00000000..458f08a1
--- /dev/null
+++ b/BeautifulSoup.py
@@ -0,0 +1,1711 @@
+"""Beautiful Soup
+Elixir and Tonic
+"The Screen-Scraper's Friend"
+v3.0.0
+http://www.crummy.com/software/BeautifulSoup/
+
+Beautiful Soup parses a (possibly invalid) XML or HTML document into a
+tree representation. It provides methods and Pythonic idioms that make
+it easy to navigate, search, and modify the tree.
+
+A well-formed XML/HTML document yields a well-formed data
+structure. An ill-formed XML/HTML document yields a correspondingly
+ill-formed data structure. If your document is only locally
+well-formed, you can use this library to find and process the
+well-formed part of it.
+
+Beautiful Soup works with Python 2.2 and up. It has no external
+dependencies, but you'll have more success at converting data to UTF-8
+if you also install these three packages:
+
+* chardet, for auto-detecting character encodings
+  http://chardet.feedparser.org/
+* cjkcodecs and iconv_codec, which add more encodings to the ones supported
+  by stock Python.
+  http://cjkpython.i18n.org/
+
+Beautiful Soup defines classes for two main parsing strategies:
+    
+ * BeautifulStoneSoup, for parsing XML, SGML, or your domain-specific
+   language that kind of looks like XML.
+
+ * BeautifulSoup, for parsing run-of-the-mill HTML code, be it valid
+   or invalid. This class has web browser-like heuristics for
+   obtaining a sensible parse tree in the face of common HTML errors.
+
+Beautiful Soup also defines a class (UnicodeDammit) for autodetecting
+the encoding of an HTML or XML document, and converting it to
+Unicode. Much of this code is taken from Mark Pilgrim's Universal Feed Parser.
+
+For more than you ever wanted to know about Beautiful Soup, see the
+documentation:
+http://www.crummy.com/software/BeautifulSoup/documentation.html
+
+"""
+from __future__ import generators
+
+__author__ = "Leonard Richardson (leonardr@segfault.org)"
+__version__ = "3.0.0"
+__date__ = "$Date: 2004/10/18 00:14:20 $"
+__copyright__ = "Copyright (c) 2004-2005 Leonard Richardson"
+__license__ = "PSF"
+
+from sgmllib import SGMLParser, SGMLParseError
+import codecs
+import types
+import re
+import sgmllib
+from htmlentitydefs import name2codepoint
+
+#This code makes Beautiful Soup able to parse XML with namespaces
+sgmllib.tagfind = re.compile('[a-zA-Z][-_.:a-zA-Z0-9]*')
+
+DEFAULT_OUTPUT_ENCODING = "utf-8"
+
+# First, the classes that represent markup elements.
+
+class PageElement:
+    """Contains the navigational information for some part of the page
+    (either a tag or a piece of text)"""
+
+    def setup(self, parent=None, previous=None):
+        """Sets up the initial relations between this element and
+        other elements."""        
+        self.parent = parent
+        self.previous = previous
+        self.next = None
+        self.previousSibling = None
+        self.nextSibling = None
+        if self.parent and self.parent.contents:
+            self.previousSibling = self.parent.contents[-1]
+            self.previousSibling.nextSibling = self
+
+    def replaceWith(self, replaceWith):        
+        oldParent = self.parent
+        myIndex = self.parent.contents.index(self)
+        if hasattr(replaceWith, 'parent') and replaceWith.parent == self.parent:
+            # We're replacing this element with one of its siblings.
+            index = self.parent.contents.index(replaceWith)
+            if index and index < myIndex:
+                # Furthermore, it comes before this element. That
+                # means that when we extract it, the index of this
+                # element will change.
+                myIndex = myIndex - 1
+        self.extract()        
+        oldParent.insert(myIndex, replaceWith)
+        
+    def extract(self):
+        """Destructively rips this element out of the tree."""        
+        if self.parent:
+            try:
+                self.parent.contents.remove(self)
+            except ValueError:
+                pass
+
+        #Find the two elements that would be next to each other if
+        #this element (and any children) hadn't been parsed. Connect
+        #the two.        
+        lastChild = self._lastRecursiveChild()
+        nextElement = lastChild.next
+
+        if self.previous:
+            self.previous.next = nextElement
+        if nextElement:
+            nextElement.previous = self.previous
+        self.previous = None
+        lastChild.next = None
+
+        self.parent = None        
+        if self.previousSibling:
+            self.previousSibling.nextSibling = self.nextSibling
+        if self.nextSibling:
+            self.nextSibling.previousSibling = self.previousSibling
+        self.previousSibling = self.nextSibling = None       
+
+    def _lastRecursiveChild(self):
+        "Finds the last element beneath this object to be parsed."
+        lastChild = self
+        while hasattr(lastChild, 'contents') and lastChild.contents:
+            lastChild = lastChild.contents[-1]
+        return lastChild
+
+    def insert(self, position, newChild):
+        if (isinstance(newChild, basestring)
+            or isinstance(newChild, unicode)) \
+            and not isinstance(newChild, NavigableString):
+            newChild = NavigableString(newChild)        
+
+        position =  min(position, len(self.contents))
+        if hasattr(newChild, 'parent') and newChild.parent != None:
+            # We're 'inserting' an element that's already one
+            # of this object's children. 
+            if newChild.parent == self:
+                index = self.find(newChild)
+                if index and index < position:
+                    # Furthermore we're moving it further down the
+                    # list of this object's children. That means that
+                    # when we extract this element, our target index
+                    # will jump down one.
+                    position = position - 1
+            newChild.extract()
+            
+        newChild.parent = self
+        previousChild = None
+        if position == 0:
+            newChild.previousSibling = None
+            newChild.previous = self
+        else:
+            previousChild = self.contents[position-1]
+            newChild.previousSibling = previousChild
+            newChild.previousSibling.nextSibling = newChild
+            newChild.previous = previousChild._lastRecursiveChild()
+        if newChild.previous:
+            newChild.previous.next = newChild        
+
+        newChildsLastElement = newChild._lastRecursiveChild()
+
+        if position >= len(self.contents):
+            newChild.nextSibling = None
+            
+            parent = self
+            parentsNextSibling = None
+            while not parentsNextSibling:
+                parentsNextSibling = parent.nextSibling
+                parent = parent.parent
+                if not parent: # This is the last element in the document.
+                    break
+            if parentsNextSibling:
+                newChildsLastElement.next = parentsNextSibling
+            else:
+                newChildsLastElement.next = None
+        else:
+            nextChild = self.contents[position]            
+            newChild.nextSibling = nextChild            
+            if newChild.nextSibling:
+                newChild.nextSibling.previousSibling = newChild
+            newChildsLastElement.next = nextChild
+
+        if newChildsLastElement.next:
+            newChildsLastElement.next.previous = newChildsLastElement
+        self.contents.insert(position, newChild)
+
+    def findNext(self, name=None, attrs={}, text=None, **kwargs):
+        """Returns the first item that matches the given criteria and
+        appears after this Tag in the document."""
+        return self._findOne(self.findAllNext, name, attrs, text, **kwargs)
+
+    def findAllNext(self, name=None, attrs={}, text=None, limit=None, **kwargs):
+        """Returns all items that match the given criteria and appear
+        after this Tag in the document. Keyword arguments are passed on
+        to the matcher as extra attribute criteria."""
+        return self._findAll(name, attrs, text, limit, self.nextGenerator, **kwargs)
+
+    def findNextSibling(self, name=None, attrs={}, text=None, **kwargs):
+        """Returns the closest sibling to this Tag that matches the
+        given criteria and appears after this Tag in the document."""
+        return self._findOne(self.findNextSiblings, name, attrs, text,
+                             **kwargs)
+
+    def findNextSiblings(self, name=None, attrs={}, text=None, limit=None,
+                         **kwargs):
+        """Returns the siblings of this Tag that match the given
+        criteria and appear after this Tag in the document."""
+        return self._findAll(name, attrs, text, limit,
+                             self.nextSiblingGenerator, **kwargs)
+
+    def findPrevious(self, name=None, attrs={}, text=None, **kwargs):
+        """Returns the first item that matches the given criteria and
+        appears before this Tag in the document."""
+        return self._findOne(self.findAllPrevious, name, attrs, text, **kwargs)
+
+    def findAllPrevious(self, name=None, attrs={}, text=None, limit=None,
+                        **kwargs):
+        """Returns all items that match the given criteria and appear
+        before this Tag in the document."""
+        return self._findAll(name, attrs, text, limit, self.previousGenerator,
+                           **kwargs)
+
+    def findPreviousSibling(self, name=None, attrs={}, text=None, **kwargs):
+        """Returns the closest sibling to this Tag that matches the
+        given criteria and appears before this Tag in the document."""
+        return self._findOne(self.findPreviousSiblings, name, attrs, text,
+                             **kwargs)
+
+    def findPreviousSiblings(self, name=None, attrs={}, text=None,
+                             limit=None, **kwargs):
+        """Returns the siblings of this Tag that match the given
+        criteria and appear before this Tag in the document."""
+        return self._findAll(name, attrs, text, limit,
+                             self.previousSiblingGenerator, **kwargs)
+
+    def findParent(self, name=None, attrs={}, **kwargs):
+        """Returns the closest parent of this Tag that matches the given
+        criteria."""
+        # NOTE: We can't use _findOne because findParents takes a different
+        # set of arguments (no 'text'); keyword criteria are still forwarded.
+        r = None
+        l = self.findParents(name, attrs, 1, **kwargs)
+        if l:
+            r = l[0]
+        return r
+
+    def findParents(self, name=None, attrs={}, limit=None, **kwargs):
+        """Returns the parents of this Tag that match the given
+        criteria."""
+
+        return self._findAll(name, attrs, None, limit, self.parentGenerator,
+                             **kwargs)
+
+    #These methods do the real heavy lifting.
+
+    def _findOne(self, method, name, attrs, text, **kwargs):
+        r = None
+        l = method(name, attrs, text, 1, **kwargs)
+        if l:
+            r = l[0]
+        return r
+    
+    def _findAll(self, name, attrs, text, limit, generator, **kwargs):
+        "Iterates over a generator looking for things that match."
+
+        if isinstance(name, SoupStrainer):
+            strainer = name
+        else:
+            # Build a SoupStrainer
+            strainer = SoupStrainer(name, attrs, text, **kwargs)
+        results = ResultSet(strainer)
+        g = generator()
+        while True:
+            try:
+                i = g.next()
+            except StopIteration:
+                break
+            if i:
+                found = strainer.search(i)
+                if found:
+                    results.append(found)
+                    if limit and len(results) >= limit:
+                        break
+        return results
+
+    #These Generators can be used to navigate starting from both
+    #NavigableStrings and Tags.                
+    def nextGenerator(self):
+        i = self
+        while i:
+            i = i.next
+            yield i
+
+    def nextSiblingGenerator(self):
+        i = self
+        while i:
+            i = i.nextSibling
+            yield i
+
+    def previousGenerator(self):
+        i = self
+        while i:
+            i = i.previous
+            yield i
+
+    def previousSiblingGenerator(self):
+        i = self
+        while i:
+            i = i.previousSibling
+            yield i
+
+    def parentGenerator(self):
+        i = self
+        while i:
+            i = i.parent
+            yield i
+
+    # Utility methods
+    def substituteEncoding(self, str, encoding=None):
+        encoding = encoding or "utf-8"
+        return str.replace("%SOUP-ENCODING%", encoding)    
+
+    def toEncoding(self, s, encoding=None):
+        """Encodes an object to a string in some encoding, or to
+        Unicode if no encoding is given."""
+        if isinstance(s, unicode):
+            if encoding:
+                s = s.encode(encoding)
+        elif isinstance(s, str):
+            if encoding:
+                s = s.encode(encoding)
+            else:
+                s = unicode(s)
+        else:
+            if encoding:
+                s  = self.toEncoding(str(s), encoding)
+            else:
+                s = unicode(s)
+        return s
+
+class NavigableString(unicode, PageElement):
+
+    def __getattr__(self, attr):
+        """text.string gives you text. This is for backwards
+        compatibility for Navigable*String, but for CData* it lets you
+        get the string without the CData wrapper."""
+        if attr == 'string':
+            return self
+        else:
+            raise AttributeError, "'%s' object has no attribute '%s'" % (self.__class__.__name__, attr)
+
+    def __unicode__(self):
+        return self.__str__(None) # encoding=None makes __str__ return the Unicode string itself
+
+    def __str__(self, encoding=DEFAULT_OUTPUT_ENCODING):
+        if encoding:
+            return self.encode(encoding)
+        else:
+            return self
+        
+class CData(NavigableString):
+
+    def __str__(self, encoding=DEFAULT_OUTPUT_ENCODING):
+        return "<![CDATA[%s]]>" % NavigableString.__str__(self, encoding)
+
+class ProcessingInstruction(NavigableString):
+    def __str__(self, encoding=DEFAULT_OUTPUT_ENCODING):
+        output = self
+        if "%SOUP-ENCODING%" in output:
+            output = self.substituteEncoding(output, encoding)
+        return "<?%s?>" % self.toEncoding(output, encoding)
+
+class Comment(NavigableString):
+    def __str__(self, encoding=DEFAULT_OUTPUT_ENCODING):
+        return "<!--%s-->" % NavigableString.__str__(self, encoding)    
+
+class Declaration(NavigableString):
+    def __str__(self, encoding=DEFAULT_OUTPUT_ENCODING):
+        return "<!%s>" % NavigableString.__str__(self, encoding)        
+
+class Tag(PageElement):
+
+    """Represents a found HTML tag with its attributes and contents."""
+
+    def __init__(self, parser, name, attrs=None, parent=None,
+                 previous=None):
+        "Basic constructor."
+
+        # We don't actually store the parser object: that lets extracted
+        # chunks be garbage-collected
+        self.parserClass = parser.__class__
+        self.isSelfClosing = parser.isSelfClosingTag(name)
+        self.name = name
+        if attrs == None:
+            attrs = []
+        self.attrs = attrs
+        self.contents = []
+        self.setup(parent, previous)
+        self.hidden = False
+        self.containsSubstitutions = False
+
+    def get(self, key, default=None):
+        """Returns the value of the 'key' attribute for the tag, or
+        the value given for 'default' if it doesn't have that
+        attribute."""
+        return self._getAttrMap().get(key, default)    
+
+    def has_key(self, key):
+        return self._getAttrMap().has_key(key)
+
+    def __getitem__(self, key):
+        """tag[key] returns the value of the 'key' attribute for the tag,
+        and throws an exception if it's not there."""
+        return self._getAttrMap()[key]
+
+    def __iter__(self):
+        "Iterating over a tag iterates over its contents."
+        return iter(self.contents)
+
+    def __len__(self):
+        "The length of a tag is the length of its list of contents."
+        return len(self.contents)
+
+    def __contains__(self, x):
+        return x in self.contents
+
+    def __nonzero__(self):
+        "A tag is non-None even if it has no contents."
+        return True
+
+    def __setitem__(self, key, value):        
+        """Setting tag[key] sets the value of the 'key' attribute for the
+        tag."""
+        self._getAttrMap()
+        self.attrMap[key] = value
+        found = False
+        for i in range(0, len(self.attrs)):
+            if self.attrs[i][0] == key:
+                self.attrs[i] = (key, value)
+                found = True
+        if not found:
+            self.attrs.append((key, value))
+        self._getAttrMap()[key] = value
+
+    def __delitem__(self, key):
+        "Deleting tag[key] deletes all 'key' attributes for the tag."
+        #Bad HTML can define the same attribute multiple times, so
+        #every matching pair must go. The list is rebuilt instead of
+        #calling remove() while iterating, which skips the entry
+        #that follows each removed one.
+        self.attrs[:] = [item for item in self.attrs if item[0] != key]
+        self._getAttrMap()
+        if self.attrMap.has_key(key):
+            del self.attrMap[key]
+
+    def __call__(self, *args, **kwargs):
+        """Calling a tag like a function is the same as calling its
+        findAll() method. Eg. tag('a') returns a list of all the A tags
+        found within this tag."""
+        return apply(self.findAll, args, kwargs)
+
+    def __getattr__(self, tag):
+        #print "Getattr %s.%s" % (self.__class__, tag)
+        if len(tag) > 3 and tag.rfind('Tag') == len(tag)-3:
+            return self.find(tag[:-3])
+        elif tag.find('__') != 0:
+            return self.find(tag)
+
+    def __eq__(self, other):
+        """Returns true iff this tag has the same name, the same attributes,
+        and the same contents (recursively) as the given tag.
+
+        NOTE: right now this will return false if two tags have the
+        same attributes in a different order. Should this be fixed?"""
+        if not hasattr(other, 'name') or not hasattr(other, 'attrs') or not hasattr(other, 'contents') or self.name != other.name or self.attrs != other.attrs or len(self) != len(other):
+            return False
+        for i in range(0, len(self.contents)):
+            if self.contents[i] != other.contents[i]:
+                return False
+        return True
+
+    def __ne__(self, other):
+        """Returns true iff this tag is not identical to the other tag,
+        as defined in __eq__."""
+        return not self == other
+
+    def __repr__(self, encoding=DEFAULT_OUTPUT_ENCODING):
+        """Renders this tag as a string."""
+        return self.__str__(encoding)
+
+    def __unicode__(self):
+        return self.__str__(None)
+
+    def __str__(self, encoding=DEFAULT_OUTPUT_ENCODING,
+                prettyPrint=False, indentLevel=0):
+        """Returns a string or Unicode representation of this tag and
+        its contents. To get Unicode, pass None for encoding.
+
+        NOTE: since Python's HTML parser consumes whitespace, this
+        method is not certain to reproduce the whitespace present in
+        the original string."""
+
+        encodedName = self.toEncoding(self.name, encoding)
+        
+        attrs = []
+        if self.attrs:
+            for key, val in self.attrs:
+                fmt = '%s="%s"'
+                if isString(val):
+                    if self.containsSubstitutions and '%SOUP-ENCODING%' in val:
+                        val = self.substituteEncoding(val, encoding)
+                    if '"' in val:
+                        fmt = "%s='%s'"
+                        # This can't happen naturally, but it can happen
+                        # if you modify an attribute value and print it out.
+                        if "'" in val:
+                            val = val.replace("'", "&squot;")
+                attrs.append(fmt % (self.toEncoding(key, encoding),
+                                    self.toEncoding(val, encoding)))
+        close = ''
+        closeTag = ''
+        if self.isSelfClosing:
+            close = ' /'
+        else:
+            closeTag = '</%s>' % encodedName
+
+        indentTag, indentContents = 0, 0
+        if prettyPrint:
+            indentTag = indentLevel
+            space = (' ' * (indentTag-1))
+            indentContents = indentTag + 1
+        contents = self.renderContents(encoding, prettyPrint, indentContents)
+        if self.hidden:
+            s = contents
+        else:
+            s = []
+            attributeString = ''
+            if attrs:
+                attributeString = ' ' + ' '.join(attrs)            
+            if prettyPrint:
+                s.append(space)
+            s.append('<%s%s%s>' % (encodedName, attributeString, close))
+            if prettyPrint:
+                s.append("\n")
+            s.append(contents)
+            if prettyPrint and contents and contents[-1] != "\n":
+                s.append("\n")
+            if prettyPrint and closeTag:
+                s.append(space)
+            s.append(closeTag)
+            if prettyPrint and closeTag and self.nextSibling:
+                s.append("\n")
+            s = ''.join(s)
+        return s
+
+    def prettify(self, encoding=DEFAULT_OUTPUT_ENCODING):
+        return self.__str__(encoding, True)
+
+    def renderContents(self, encoding=DEFAULT_OUTPUT_ENCODING,
+                       prettyPrint=False, indentLevel=0):
+        """Renders the contents of this tag as a string in the given
+        encoding. If encoding is None, returns a Unicode string.."""
+        s=[]
+        for c in self:
+            text = None
+            if isinstance(c, NavigableString):
+                text = c.__str__(encoding)
+            elif isinstance(c, Tag):
+                s.append(c.__str__(encoding, prettyPrint, indentLevel))
+            if text and prettyPrint:
+                text = text.strip()              
+            if text:
+                if prettyPrint:
+                    s.append(" " * (indentLevel-1))
+                s.append(text)
+                if prettyPrint:
+                    s.append("\n")
+        return ''.join(s)    
+
+    #Soup methods
+
+    def find(self, name=None, attrs={}, recursive=True, text=None,
+              **kwargs):
+        """Return only the first child of this Tag matching the given
+        criteria. Keyword arguments are forwarded to findAll()."""
+        r = None
+        l = self.findAll(name, attrs, recursive, text, 1, **kwargs)
+        if l:
+            r = l[0]
+        return r
+    findChild = find
+
+    def findAll(self, name=None, attrs={}, recursive=True, text=None,
+                limit=None, **kwargs):
+        """Extracts a list of Tag objects that match the given
+        criteria.  You can specify the name of the Tag and any
+        attributes you want the Tag to have.
+
+        The value of a key-value pair in the 'attrs' map can be a
+        string, a list of strings, a regular expression object, or a
+        callable that takes a string and returns whether or not the
+        string matches for some custom definition of 'matches'. The
+        same is true of the tag name."""
+        generator = self.recursiveChildGenerator
+        if not recursive:
+            generator = self.childGenerator
+        return self._findAll(name, attrs, text, limit, generator, **kwargs)
+    findAllChildren = findAll
+    
+    #Utility methods
+
+    def append(self, tag):
+        """Appends the given tag to the contents of this tag."""
+        self.contents.append(tag)
+
+    #Private methods
+
+    def _getAttrMap(self):
+        """Initializes a map representation of this tag's attributes,
+        if not already initialized."""
+        if not getattr(self, 'attrMap'):
+            self.attrMap = {}
+            for (key, value) in self.attrs:
+                self.attrMap[key] = value 
+        return self.attrMap
+
+    #Generator methods
+    def childGenerator(self):
+        for i in range(0, len(self.contents)):
+            yield self.contents[i]
+        raise StopIteration
+    
+    def recursiveChildGenerator(self):
+        stack = [(self, 0)]
+        while stack:
+            tag, start = stack.pop()
+            if isinstance(tag, Tag):            
+                for i in range(start, len(tag.contents)):
+                    a = tag.contents[i]
+                    yield a
+                    if isinstance(a, Tag) and tag.contents:
+                        if i < len(tag.contents) - 1:
+                            stack.append((tag, i+1))
+                        stack.append((a, 0))
+                        break
+        raise StopIteration
+
+# Next, a couple classes to represent queries and their results.
+class SoupStrainer:
+    """Encapsulates a number of ways of matching a markup element (tag or
+    text)."""
+
+    def __init__(self, name=None, attrs={}, text=None, **kwargs):
+        self.name=name
+        self.attrs=attrs.copy()
+        self.attrs.update(kwargs)
+        self.text = text
+
+    def __str__(self):
+        if self.text:
+            return self.text
+        else:
+            return "%s|%s" % (self.name, self.attrs)
+    
+    def searchTag(self, markupName=None, markupAttrs={}):
+        found = None
+        markup = None
+        if isinstance(markupName, Tag):
+            markup = markupName
+            markupAttrs = markup
+        callFunctionWithTagData = callable(self.name) \
+                                and not isinstance(markupName, Tag)
+
+        if (not self.name) \
+               or callFunctionWithTagData \
+               or (markup and self._matches(markup, self.name)) \
+               or (not markup and self._matches(markupName, self.name)):
+            if callFunctionWithTagData:
+                match = self.name(markupName, markupAttrs)
+            else:
+                match = True            
+                markupAttrMap = None
+                for attr, matchAgainst in self.attrs.items():
+                    if not markupAttrMap:
+                         if hasattr(markupAttrs, 'get'):
+                            markupAttrMap = markupAttrs
+                         else:
+                            markupAttrMap = {}
+                            for k,v in markupAttrs:
+                                markupAttrMap[k] = v
+                    attrValue = markupAttrMap.get(attr)
+                    if not self._matches(attrValue, matchAgainst):
+                        match = False
+                        break
+            if match:
+                if markup:
+                    found = markup
+                else:
+                    found = markupName
+        return found
+
+    def search(self, markup):
+        #print 'looking for %s in %s' % (self, markup)
+        found = None
+        # If given a list of items, scan it for a text element that
+        # matches.        
+        if isList(markup) and not isinstance(markup, Tag):
+            for element in markup:
+                if isinstance(element, NavigableString) \
+                       and self.search(element):
+                    found = element
+                    break
+        # If it's a Tag, make sure its name or attributes match.
+        # Don't bother with Tags if we're searching for text.
+        elif isinstance(markup, Tag):
+            if not self.text:
+                found = self.searchTag(markup)
+        # If it's text, make sure the text matches.
+        elif isinstance(markup, NavigableString) or \
+                 isString(markup):
+            if self._matches(markup, self.text):
+                found = markup
+        else:
+            raise Exception, "I don't know how to match against a %s" \
+                  % markup.__class__
+        return found
+        
+    def _matches(self, markup, matchAgainst):    
+        #print "Matching %s against %s" % (markup, matchAgainst)
+        result = False
+        if matchAgainst == True and type(matchAgainst) == types.BooleanType:
+            result = markup != None
+        elif callable(matchAgainst):
+            result = matchAgainst(markup)
+        else:
+            #Custom match methods take the tag as an argument, but all
+            #other ways of matching match the tag name as a string.
+            if isinstance(markup, Tag):
+                markup = markup.name
+            if markup and not isString(markup):
+                markup = unicode(markup)
+            #Now we know that chunk is either a string, or None.
+            if hasattr(matchAgainst, 'match'):
+                # It's a regexp object.
+                result = markup and matchAgainst.search(markup)
+            elif isList(matchAgainst):
+                result = markup in matchAgainst
+            elif hasattr(matchAgainst, 'items'):
+                result = markup.has_key(matchAgainst)
+            elif matchAgainst and isString(markup):
+                if isinstance(markup, unicode):
+                    matchAgainst = unicode(matchAgainst)
+                else:
+                    matchAgainst = str(matchAgainst)
+
+            if not result:
+                result = matchAgainst == markup
+        return result
+
+class ResultSet(list):
+    """A ResultSet is a list (initially empty) that keeps track, in
+    self.source, of the SoupStrainer that created it."""
+    def __init__(self, source):
+        list.__init__(self)
+        self.source = source
+
+# Now, some helper functions.
+
+def isList(l):
+    """Listlike means: the object exposes __iter__, or its exact type
+    is the built-in list or tuple type."""
+    plainSequences = (types.ListType, types.TupleType)
+    return hasattr(l, '__iter__') or (type(l) in plainSequences)
+
+def isString(s):
+    """Says whether s is stringlike. If the unicode or basestring
+    builtin is missing, the NameError fallback tests for plain str."""
+    try:
+        return isinstance(s, unicode) or isinstance(s, basestring)
+    except NameError:
+        return isinstance(s, str)
+
+def buildTagMap(default, *args):
+    """Folds any number of maps, lists, and scalars into one new map:
+    map entries are copied as-is, while list items and scalars become
+    keys whose value is 'default'. Later arguments win on conflicts."""
+    tagMap = {}
+    for piece in args:
+        if hasattr(piece, 'items'):
+            for key, value in piece.items():
+                tagMap[key] = value
+            continue
+        # Not a map: a list supplies its items as keys, a scalar itself.
+        if isList(piece):
+            keys = piece
+        else:
+            keys = [piece]
+        for key in keys:
+            tagMap[key] = default
+    return tagMap
+
+# Now, the parser classes.
+
+class BeautifulStoneSoup(Tag, SGMLParser):
+
+    """This class contains the basic parser and search code. It defines
+    a parser that knows nothing about tag behavior except for the
+    following:
+   
+      You can't close a tag without closing all the tags it encloses.
+      That is, "<foo><bar></foo>" actually means
+      "<foo><bar></bar></foo>".
+
+    [Another possible explanation is "<foo><bar /></foo>", but since
+    this class defines no SELF_CLOSING_TAGS, it will never use that
+    explanation.]
+
+    This class is useful for parsing XML or made-up markup languages,
+    or when BeautifulSoup makes an assumption counter to what you were
+    expecting."""
+
+    XML_ENTITY_LIST = {}
+    for i in ["quot", "apos", "amp", "lt", "gt"]:
+        XML_ENTITY_LIST[i] = True 
+
+    SELF_CLOSING_TAGS = {}
+    NESTABLE_TAGS = {}
+    RESET_NESTING_TAGS = {}
+    QUOTE_TAGS = {}
+
+    MARKUP_MASSAGE = [(re.compile('(<[^<>]*)/>'),
+                       lambda x: x.group(1) + ' />'),
+                      (re.compile('<!\s+([^<>]*)>'),
+                       lambda x: '<!' + x.group(1) + '>')
+                      ]
+
+    ROOT_TAG_NAME = u'[document]'
+
+    HTML_ENTITIES = "html"
+    XML_ENTITIES = "xml"
+
+    def __init__(self, markup="", parseOnlyThese=None, fromEncoding=None,
+                 markupMassage=True, smartQuotesTo=XML_ENTITIES,
+                 convertEntities=None, selfClosingTags=None):
+        """The Soup object is initialized as the 'root tag', and the
+        provided markup (which can be a string or a file-like object)
+        is fed into the underlying parser. 
+
+        sgmllib will process most bad HTML, and the BeautifulSoup
+        class has some tricks for dealing with some HTML that kills
+        sgmllib, but Beautiful Soup can nonetheless choke or lose data
+        if your data uses self-closing tags or declarations
+        incorrectly.
+
+        By default, Beautiful Soup uses regexes to sanitize input,
+        avoiding the vast majority of these problems. If the problems
+        don't apply to you, pass in False for markupMassage, and
+        you'll get better performance.
+
+        The default parser massage techniques fix the two most common
+        instances of invalid HTML that choke sgmllib:
+
+         <br/> (No space between name of closing tag and tag close)
+         <! --Comment--> (Extraneous whitespace in declaration)
+
+        You can pass in a custom list of (RE object, replace method)
+        tuples to get Beautiful Soup to scrub your input the way you
+        want."""
+
+        self.parseOnlyThese = parseOnlyThese
+        self.fromEncoding = fromEncoding
+        self.smartQuotesTo = smartQuotesTo
+        self.convertEntities = convertEntities
+        if self.convertEntities:
+            # It doesn't make sense to convert encoded characters to
+            # entities even while you're converting entities to Unicode.
+            # Just convert it all to Unicode.
+            self.smartQuotesTo = None
+        self.instanceSelfClosingTags = buildTagMap(None, selfClosingTags)
+        SGMLParser.__init__(self)
+            
+        if hasattr(markup, 'read'):        # It's a file-type object.
+            markup = markup.read()
+        self.markup = markup
+        self.markupMassage = markupMassage
+        try:
+            self._feed()
+        except StopParsing:
+            pass
+        self.markup = None                 # The markup can now be GCed
+        
+    def _feed(self, inDocumentEncoding=None):
+        # Convert the document to Unicode.
+        markup = self.markup
+        if isinstance(markup, unicode):
+            if not hasattr(self, 'originalEncoding'):
+                self.originalEncoding = None
+        else:
+            dammit = UnicodeDammit\
+                     (markup, [self.fromEncoding, inDocumentEncoding],
+                      smartQuotesTo=self.smartQuotesTo)
+            markup = dammit.unicode
+            self.originalEncoding = dammit.originalEncoding
+        if markup:
+            if self.markupMassage:
+                if not isList(self.markupMassage):
+                    self.markupMassage = self.MARKUP_MASSAGE            
+                for fix, m in self.markupMassage:
+                    markup = fix.sub(m, markup)
+        self.reset()
+
+        SGMLParser.feed(self, markup)
+        # Close out any unfinished strings and close all the open tags.
+        self.endData()
+        while self.currentTag.name != self.ROOT_TAG_NAME:
+            self.popTag()
+
+    def __getattr__(self, methodName):
+        """This method routes method call requests to either the SGMLParser
+        superclass or the Tag superclass, depending on the method name."""
+        #print "__getattr__ called on %s.%s" % (self.__class__, methodName)
+
+        if methodName.find('start_') == 0 or methodName.find('end_') == 0 \
+               or methodName.find('do_') == 0:
+            return SGMLParser.__getattr__(self, methodName)
+        elif methodName.find('__') != 0:
+            return Tag.__getattr__(self, methodName)
+        else:
+            raise AttributeError
+
+    def isSelfClosingTag(self, name):
+        """True when name is a key of the class-level SELF_CLOSING_TAGS
+        map or of this instance's instanceSelfClosingTags map."""
+        classWide, perInstance = self.SELF_CLOSING_TAGS, self.instanceSelfClosingTags
+        return classWide.has_key(name) or perInstance.has_key(name)
+            
+    def reset(self):
+        Tag.__init__(self, self, self.ROOT_TAG_NAME)
+        self.hidden = 1
+        SGMLParser.reset(self)
+        self.currentData = []
+        self.currentTag = None
+        self.tagStack = []
+        self.quoteStack = []
+        self.pushTag(self)
+    
+    def popTag(self):
+        tag = self.tagStack.pop()
+        # Tags with just one string-owning child get the child as a
+        # 'string' property, so that soup.tag.string is shorthand for
+        # soup.tag.contents[0]
+        if len(self.currentTag.contents) == 1 and \
+           isinstance(self.currentTag.contents[0], NavigableString):
+            self.currentTag.string = self.currentTag.contents[0]
+
+        #print "Pop", tag.name
+        if self.tagStack:
+            self.currentTag = self.tagStack[-1]
+        return self.currentTag
+
+    def pushTag(self, tag):
+        #print "Push", tag.name
+        if self.currentTag:
+            self.currentTag.append(tag)
+        self.tagStack.append(tag)
+        self.currentTag = self.tagStack[-1]
+
+    def endData(self, containerClass=NavigableString):
+        if self.currentData:
+            currentData = ''.join(self.currentData)
+            if not currentData.strip():
+                if '\n' in currentData:
+                    currentData = '\n'
+                else:
+                    currentData = ' '
+            self.currentData = []
+            if self.parseOnlyThese and len(self.tagStack) <= 1 and \
+                   (not self.parseOnlyThese.text or \
+                    not self.parseOnlyThese.search(currentData)):
+                return
+            o = containerClass(currentData)
+            o.setup(self.currentTag, self.previous)
+            if self.previous:
+                self.previous.next = o
+            self.previous = o
+            self.currentTag.contents.append(o)
+
+
+    def _popToTag(self, name, inclusivePop=True):
+        """Pops the tag stack up to and including the most recent
+        instance of the given tag. If inclusivePop is false, pops the tag
+        stack up to but *not* including the most recent instance of
+        the given tag."""
+        #print "Popping to %s" % name
+        if name == self.ROOT_TAG_NAME:
+            return
+
+        numPops = 0
+        mostRecentTag = None
+        for i in range(len(self.tagStack)-1, 0, -1):
+            if name == self.tagStack[i].name:
+                numPops = len(self.tagStack)-i
+                break
+        if not inclusivePop:
+            numPops = numPops - 1
+
+        for i in range(0, numPops):
+            mostRecentTag = self.popTag()
+        return mostRecentTag
+
+    def _smartPop(self, name):
+
+        """We need to pop up to the previous tag of this type, unless
+        one of this tag's nesting reset triggers comes between this
+        tag and the previous tag of this type, OR unless this tag is a
+        generic nesting trigger and another generic nesting trigger
+        comes between this tag and the previous tag of this type.
+
+        Examples:
+         <p>Foo<b>Bar<p> should pop to 'p', not 'b'.
+         <p>Foo<table>Bar<p> should pop to 'table', not 'p'.
+         <p>Foo<table><tr>Bar<p> should pop to 'tr', not 'p'.
+         <p>Foo<b>Bar<p> should pop to 'p', not 'b'.
+
+         <li><ul><li> *<li>* should pop to 'ul', not the first 'li'.
+         <tr><table><tr> *<tr>* should pop to 'table', not the first 'tr'
+         <td><tr><td> *<td>* should pop to 'tr', not the first 'td'
+        """
+
+        nestingResetTriggers = self.NESTABLE_TAGS.get(name)
+        isNestable = nestingResetTriggers != None
+        isResetNesting = self.RESET_NESTING_TAGS.has_key(name)
+        popTo = None
+        inclusive = True
+        for i in range(len(self.tagStack)-1, 0, -1):
+            p = self.tagStack[i]
+            if (not p or p.name == name) and not isNestable:
+                #Non-nestable tags get popped to the top or to their
+                #last occurance.
+                popTo = name
+                break
+            if (nestingResetTriggers != None
+                and p.name in nestingResetTriggers) \
+                or (nestingResetTriggers == None and isResetNesting
+                    and self.RESET_NESTING_TAGS.has_key(p.name)):
+                
+                #If we encounter one of the nesting reset triggers
+                #peculiar to this tag, or we encounter another tag
+                #that causes nesting to reset, pop up to but not
+                #including that tag.
+                popTo = p.name
+                inclusive = False
+                break
+            p = p.parent
+        if popTo:
+            self._popToTag(popTo, inclusive)
+
+    def unknown_starttag(self, name, attrs, selfClosing=0):
+        #print "Start tag %s" % name
+        if self.quoteStack:
+            #This is not a real tag.
+            #print "<%s> is not real!" % name
+            attrs = ''.join(map(lambda(x, y): ' %s="%s"' % (x, y), attrs))
+            self.handle_data('<%s%s>' % (name, attrs))
+            return        
+        self.endData()
+
+        if not self.isSelfClosingTag(name) and not selfClosing:
+            self._smartPop(name)
+
+        if self.parseOnlyThese and len(self.tagStack) <= 1 \
+               and (self.parseOnlyThese.text or not self.parseOnlyThese.searchTag(name, attrs)):
+            return
+
+        tag = Tag(self, name, attrs, self.currentTag, self.previous)
+        if self.previous:
+            self.previous.next = tag
+        self.previous = tag
+        self.pushTag(tag)
+        if selfClosing or self.isSelfClosingTag(name):
+            self.popTag()                
+        if name in self.QUOTE_TAGS:
+            #print "Beginning quote (%s)" % name
+            self.quoteStack.append(name)
+            self.literal = 1
+        return tag
+
+    def unknown_endtag(self, name):
+        #print "End tag %s" % name
+        if self.quoteStack and self.quoteStack[-1] != name:
+            #This is not a real end tag.
+            #print "</%s> is not real!" % name
+            self.handle_data('</%s>' % name)
+            return
+        self.endData()
+        self._popToTag(name)
+        if self.quoteStack and self.quoteStack[-1] == name:
+            self.quoteStack.pop()
+            self.literal = (len(self.quoteStack) > 0)
+
+    def handle_data(self, data):
+        self.currentData.append(data)
+
+    def _toStringSubclass(self, text, subclass):
+        """Adds a certain piece of text to the tree as a NavigableString
+        subclass."""
+        self.endData()
+        self.handle_data(text)
+        self.endData(subclass)
+
+    def handle_pi(self, text):
+        """Handle a processing instruction as a ProcessingInstruction
+        object, possibly one with a %SOUP-ENCODING% slot into which an
+        encoding will be plugged later."""
+        if text[:3] == "xml":
+            text = "xml version='1.0' encoding='%SOUP-ENCODING%'"
+        self._toStringSubclass(text, ProcessingInstruction)
+
+    def handle_comment(self, text):
+        "Handle comments as Comment objects."
+        self._toStringSubclass(text, Comment)
+
+    def handle_charref(self, ref):
+        "Handle decimal (&#65;) or hex (&#x41;) character references as data."
+        if self.convertEntities not in [self.HTML_ENTITIES, self.XML_ENTITIES]:
+            return self.handle_data('&#%s;' % ref)
+        # A hex reference (leading 'x') cannot be parsed by a plain int(ref).
+        if ref[:1] in ('x', 'X'):
+            return self.handle_data(unichr(int(ref[1:], 16)))
+        self.handle_data(unichr(int(ref)))
+
+    def handle_entityref(self, ref):
+        """Handle entity references as data, possibly converting known
+        HTML entity references to the corresponding Unicode
+        characters."""
+        data = None
+        if self.convertEntities == self.HTML_ENTITIES or \
+               (self.convertEntities == self.XML_ENTITIES and \
+                self.XML_ENTITY_LIST.get(ref)):
+            try:
+                data = unichr(name2codepoint[ref])
+            except KeyError:
+                pass
+        if not data:
+            data = '&%s;' % ref
+        self.handle_data(data)
+        
+    def handle_decl(self, data):
+        "Handle DOCTYPEs and the like as Declaration objects."
+        self._toStringSubclass(data, Declaration)
+
+    def parse_declaration(self, i):
+        """Treat a bogus SGML declaration as raw data. Treat a CDATA
+        declaration as a CData object."""
+        j = None
+        if self.rawdata[i:i+9] == '<![CDATA[':
+             k = self.rawdata.find(']]>', i)
+             if k == -1:
+                 k = len(self.rawdata)
+             data = self.rawdata[i+9:k]
+             j = k+3
+             self._toStringSubclass(data, CData)
+        else:
+            try:
+                j = SGMLParser.parse_declaration(self, i)
+            except SGMLParseError:
+                toHandle = self.rawdata[i:]
+                self.handle_data(toHandle)
+                j = i + len(toHandle)
+        return j
+
+class BeautifulSoup(BeautifulStoneSoup):
+
+    """This parser knows the following facts about HTML:
+
+    * Some tags have no closing tag and should be interpreted as being
+      closed as soon as they are encountered.
+
+    * The text inside some tags (ie. 'script') may contain tags which
+      are not really part of the document and which should be parsed
+      as text, not tags. If you want to parse the text as tags, you can
+      always fetch it and parse it explicitly.
+
+    * Tag nesting rules:
+
+      Most tags can't be nested at all. For instance, the occurance of
+      a <p> tag should implicitly close the previous <p> tag.
+
+       <p>Para1<p>Para2
+        should be transformed into:
+       <p>Para1</p><p>Para2
+
+      Some tags can be nested arbitrarily. For instance, the occurance
+      of a <blockquote> tag should _not_ implicitly close the previous
+      <blockquote> tag.
+
+       Alice said: <blockquote>Bob said: <blockquote>Blah
+        should NOT be transformed into:
+       Alice said: <blockquote>Bob said: </blockquote><blockquote>Blah
+
+      Some tags can be nested, but the nesting is reset by the
+      interposition of other tags. For instance, a <tr> tag should
+      implicitly close the previous <tr> tag within the same <table>,
+      but not close a <tr> tag in another table.
+
+       <table><tr>Blah<tr>Blah
+        should be transformed into:
+       <table><tr>Blah</tr><tr>Blah
+        but,
+       <tr>Blah<table><tr>Blah
+        should NOT be transformed into
+       <tr>Blah<table></tr><tr>Blah
+
+    Differing assumptions about tag nesting rules are a major source
+    of problems with the BeautifulSoup class. If BeautifulSoup is not
+    treating as nestable a tag your page author treats as nestable,
+    try ICantBelieveItsBeautifulSoup, MinimalSoup, or
+    BeautifulStoneSoup before writing your own subclass."""
+
+    def __init__(self, *args, **kwargs):
+        if not kwargs.has_key('smartQuotesTo'):
+            kwargs['smartQuotesTo'] = self.HTML_ENTITIES
+        BeautifulStoneSoup.__init__(self, *args, **kwargs)
+
+    SELF_CLOSING_TAGS = buildTagMap(None,
+                                    ['br' , 'hr', 'input', 'img', 'meta',
+                                    'spacer', 'link', 'frame', 'base'])
+
+    QUOTE_TAGS = {'script': None}
+    
+    #According to the HTML standard, each of these inline tags can
+    #contain another tag of the same type. Furthermore, it's common
+    #to actually use these tags this way.
+    NESTABLE_INLINE_TAGS = ['span', 'font', 'q', 'object', 'bdo', 'sub', 'sup',
+                            'center']
+
+    #According to the HTML standard, these block tags can contain
+    #another tag of the same type. Furthermore, it's common
+    #to actually use these tags this way.
+    NESTABLE_BLOCK_TAGS = ['blockquote', 'div', 'fieldset', 'ins', 'del']
+
+    #Lists can contain other lists, but there are restrictions.    
+    NESTABLE_LIST_TAGS = { 'ol' : [],
+                           'ul' : [],
+                           'li' : ['ul', 'ol'],
+                           'dl' : [],
+                           'dd' : ['dl'],
+                           'dt' : ['dl'] }
+
+    #Tables can contain other tables, but there are restrictions.    
+    NESTABLE_TABLE_TAGS = {'table' : [], 
+                           'tr' : ['table', 'tbody', 'tfoot', 'thead'],
+                           'td' : ['tr'],
+                           'th' : ['tr'],
+                           'thead' : ['table'],
+                           'tbody' : ['table'],
+                           'tfoot' : ['table'],
+                           }
+
+    NON_NESTABLE_BLOCK_TAGS = ['address', 'form', 'p', 'pre']
+
+    #If one of these tags is encountered, all tags up to the next tag of
+    #this type are popped.
+    RESET_NESTING_TAGS = buildTagMap(None, NESTABLE_BLOCK_TAGS, 'noscript',
+                                     NON_NESTABLE_BLOCK_TAGS,
+                                     NESTABLE_LIST_TAGS,
+                                     NESTABLE_TABLE_TAGS)
+
+    NESTABLE_TAGS = buildTagMap([], NESTABLE_INLINE_TAGS, NESTABLE_BLOCK_TAGS,
+                                NESTABLE_LIST_TAGS, NESTABLE_TABLE_TAGS)
+
+    # Used to detect the charset in a META tag; see start_meta
+    CHARSET_RE = re.compile("((^|;)\s*charset=)([^;]*)")
+
+    def start_meta(self, attrs):
+        """Beautiful Soup can detect a charset included in a META tag,
+        try to convert the document to that charset, and re-parse the
+        document from the beginning."""
+        httpEquiv = None
+        contentType = None
+        contentTypeIndex = None
+        tagNeedsEncodingSubstitution = False
+
+        for i in range(0, len(attrs)):
+            key, value = attrs[i]
+            key = key.lower()
+            if key == 'http-equiv':
+                httpEquiv = value
+            elif key == 'content':
+                contentType = value
+                contentTypeIndex = i
+
+        if httpEquiv and contentType: # It's an interesting meta tag.
+            match = self.CHARSET_RE.search(contentType)
+            if match:
+                if getattr(self, 'declaredHTMLEncoding') or \
+                       (self.originalEncoding == self.fromEncoding):
+                    # This is our second pass through the document, or
+                    # else an encoding was specified explicitly and it
+                    # worked. Rewrite the meta tag.
+                    newAttr = self.CHARSET_RE.sub\
+                              (lambda(match):match.group(1) +
+                               "%SOUP-ENCODING%", value)
+                    attrs[contentTypeIndex] = (attrs[contentTypeIndex][0],
+                                               newAttr)
+                    tagNeedsEncodingSubstitution = True
+                else:
+                    # This is our first pass through the document.
+                    # Go through it again with the new information.
+                    newCharset = match.group(3)
+                    if newCharset and newCharset != self.originalEncoding:
+                        self.declaredHTMLEncoding = newCharset
+                        self._feed(self.declaredHTMLEncoding)
+                        raise StopParsing
+        tag = self.unknown_starttag("meta", attrs)
+        if tagNeedsEncodingSubstitution:
+            tag.containsSubstitutions = True
+
+class StopParsing(Exception):
+    pass
+   
+class ICantBelieveItsBeautifulSoup(BeautifulSoup):
+
+    """The BeautifulSoup class is oriented towards skipping over
+    common HTML errors like unclosed tags. However, sometimes it makes
+    errors of its own. For instance, consider this fragment:
+
+     <b>Foo<b>Bar</b></b>
+
+    This is perfectly valid (if bizarre) HTML. However, the
+    BeautifulSoup class will implicitly close the first b tag when it
+    encounters the second 'b'. It will think the author wrote
+    "<b>Foo<b>Bar", and didn't close the first 'b' tag, because
+    there's no real-world reason to bold something that's already
+    bold. When it encounters '</b></b>' it will close two more 'b'
+    tags, for a grand total of three tags closed instead of two. This
+    can throw off the rest of your document structure. The same is
+    true of a number of other tags, listed below.
+
+    It's much more common for someone to forget to close a 'b' tag
+    than to actually use nested 'b' tags, and the BeautifulSoup class
+    handles the common case. This class handles the not-so-common
+    case: where you can't believe someone wrote what they did, but
+    it's valid HTML and BeautifulSoup screwed up by assuming it
+    wouldn't be."""
+
+    I_CANT_BELIEVE_THEYRE_NESTABLE_INLINE_TAGS = \
+     ['em', 'big', 'i', 'small', 'tt', 'abbr', 'acronym', 'strong',
+      'cite', 'code', 'dfn', 'kbd', 'samp', 'strong', 'var', 'b',
+      'big']
+
+    I_CANT_BELIEVE_THEYRE_NESTABLE_BLOCK_TAGS = ['noscript']
+
+    NESTABLE_TAGS = buildTagMap([], BeautifulSoup.NESTABLE_TAGS,
+                                I_CANT_BELIEVE_THEYRE_NESTABLE_BLOCK_TAGS,
+                                I_CANT_BELIEVE_THEYRE_NESTABLE_INLINE_TAGS)
+
+class MinimalSoup(BeautifulSoup):
+    """The MinimalSoup class is for parsing HTML that contains
+    pathologically bad markup. It makes no assumptions about tag
+    nesting, but it does know which tags are self-closing, that
+    <script> tags contain Javascript and should not be parsed, that
+    META tags may contain encoding information, and so on.
+
+    This also makes it better for subclassing than BeautifulStoneSoup
+    or BeautifulSoup."""
+    
+    RESET_NESTING_TAGS = buildTagMap('noscript')
+    NESTABLE_TAGS = {}
+
+class BeautifulSOAP(BeautifulStoneSoup):
+    """This class will push a tag with only a single string child into
+    the tag's parent as an attribute. The attribute's name is the tag
+    name, and the value is the string child. An example should give
+    the flavor of the change:
+
+    <foo><bar>baz</bar></foo>
+     =>
+    <foo bar="baz"><bar>baz</bar></foo>
+
+    You can then access fooTag['bar'] instead of fooTag.barTag.string.
+
+    This is, of course, useful for scraping structures that tend to
+    use subelements instead of attributes, such as SOAP messages. Note
+    that it modifies its input, so don't print the modified version
+    out.
+
+    I'm not sure how many people really want to use this class; let me
+    know if you do. Mainly I like the name."""
+
+    def popTag(self):
+        "Copy a lone string child onto the parent, then do the normal pop."
+        if len(self.tagStack) > 1:
+            parent, tag = self.tagStack[-2:]
+            parent._getAttrMap()
+            if (isinstance(tag, Tag) and len(tag.contents) == 1 and
+                isinstance(tag.contents[0], NavigableString) and
+                not parent.attrMap.has_key(tag.name)):
+                parent[tag.name] = tag.contents[0]
+        return BeautifulStoneSoup.popTag(self)  # _popToTag uses the result
+
+#Enterprise class names! It has come to our attention that some people
+#think the names of the Beautiful Soup parser classes are too silly
+#and "unprofessional" for use in enterprise screen-scraping. We feel
+#your pain! For such-minded folk, the Beautiful Soup Consortium And
+#All-Night Kosher Bakery recommends renaming this file to
+#"RobustParser.py" (or, in cases of extreme enterprisitude,
+#"RobustParserBeanInterface.class") and using the following
+#enterprise-friendly class aliases:
+class RobustXMLParser(BeautifulStoneSoup):
+    pass
+class RobustHTMLParser(BeautifulSoup):
+    pass
+class RobustWackAssHTMLParser(ICantBelieveItsBeautifulSoup):
+    pass
+class RobustInsanelyWackAssHTMLParser(MinimalSoup):
+    pass
+class SimplifyingSOAPParser(BeautifulSOAP):
+    pass
+
+######################################################
+#
+# Bonus library: Unicode, Dammit
+#
+# This class forces XML data into a standard format (usually to UTF-8
+# or Unicode).  It is heavily based on code from Mark Pilgrim's
+# Universal Feed Parser. It does not rewrite the XML or HTML to
+# reflect a new encoding: that happens in BeautifulStoneSoup.handle_pi
+# (XML) and BeautifulSoup.start_meta (HTML).
+
+# Autodetects character encodings.
+# Download from http://chardet.feedparser.org/
+try:
+    import chardet
+#    import chardet.constants
+#    chardet.constants._debug = 1
+except ImportError:
+    # chardet is optional; without it UnicodeDammit skips auto-detection.
+    chardet = None
+
+# cjkcodecs and iconv_codec make Python know about more character encodings.
+# Both are available from http://cjkpython.i18n.org/
+# They're built in if you use Python 2.4.
+try:
+    import cjkcodecs.aliases
+except:
+    pass
+try:
+    import iconv_codec
+except:
+    pass
+
+class UnicodeDammit:
+    """A class for detecting the encoding of a *ML document and
+    converting it to a Unicode string. If the source encoding is
+    windows-1252, can replace MS smart quotes with their HTML or XML
+    equivalents."""
+
+    # This dictionary maps commonly seen values for "charset" in HTML
+    # meta tags to the corresponding Python codec names. It only covers
+    # values that aren't in Python's aliases and can't be determined
+    # by the heuristics in find_codec.
+    CHARSET_ALIASES = { "macintosh" : "mac-roman",
+                        "x-sjis" : "shift-jis" }
+    
+    def __init__(self, markup, overrideEncodings=[],
+                 smartQuotesTo='xml'):
+        """Converts markup to Unicode. Tries the override, declared and
+        sniffed encodings, chardet's guess if any, then two fallbacks."""
+        self.markup, documentEncoding, sniffedEncoding = \
+                     self._detectEncoding(markup)
+        self.smartQuotesTo = smartQuotesTo
+        self.triedEncodings = []
+        if isinstance(markup, unicode):
+            # Already Unicode: nothing to decode. __init__ must return
+            # None (returning the markup raised TypeError), so store it.
+            self.unicode, self.originalEncoding = markup, None
+            return
+
+        u = None
+        for proposedEncoding in (tuple(overrideEncodings) +
+                                 (documentEncoding, sniffedEncoding)):
+            u = self._convertFrom(proposedEncoding)
+            if u: break
+        # If no luck and we have auto-detection library, try that:
+        if not u and chardet and not isinstance(self.markup, unicode):
+            u = self._convertFrom(chardet.detect(self.markup)['encoding'])
+        # As a last resort, try utf-8 and windows-1252:
+        if not u:
+            for proposed_encoding in ("utf-8", "windows-1252"):
+                u = self._convertFrom(proposed_encoding)
+                if u: break
+        self.unicode = u
+        if not u: self.originalEncoding = None
+
+    def _subMSChar(self, orig):
+        """Returns the replacement for one MS smart quote character:
+        an XML or HTML entity, or the plain string MS_CHARS gives."""
+        replacement = self.MS_CHARS.get(orig)
+        if not isinstance(replacement, tuple):
+            return replacement
+        name, hexcode = replacement
+        if self.smartQuotesTo == 'xml':
+            return '&#x%s;' % hexcode
+        return '&%s;' % name
+
+    def _convertFrom(self, proposed):
+        """Tries to decode self.markup using the proposed encoding.
+        Returns the decoded markup (also stored in self.markup), or
+        None if the encoding is empty, was already tried, or fails."""
+        proposed = self.find_codec(proposed)
+        if not proposed or proposed in self.triedEncodings:
+            return None
+        self.triedEncodings.append(proposed)
+        markup = self.markup
+
+        # Convert smart quotes to HTML if coming from an encoding
+        # that might have them. Compare case-insensitively: declared
+        # encodings reach us lowercased by _detectEncoding.
+        if self.smartQuotesTo and proposed.lower() in ("windows-1252",
+                                                       "iso-8859-1",
+                                                       "iso-8859-2"):
+            markup = re.compile("([\x80-\x9f])").sub \
+                     (lambda(x): self._subMSChar(x.group(1)),
+                      markup)
+
+        try:
+            u = self._toUnicode(markup, proposed)
+            self.markup = u
+            self.originalEncoding = proposed
+        except Exception, e:
+            return None
+        return self.markup
+
+    def _toUnicode(self, data, encoding):
+        '''Given a string and its encoding, decodes the string into Unicode.
+        %encoding is a string recognized by encodings.aliases'''
+
+        # strip Byte Order Mark (if present)
+        if (len(data) >= 4) and (data[:2] == '\xfe\xff') \
+               and (data[2:4] != '\x00\x00'):
+            encoding = 'utf-16be'
+            data = data[2:]
+        elif (len(data) >= 4) and (data[:2] == '\xff\xfe') \
+                 and (data[2:4] != '\x00\x00'):
+            encoding = 'utf-16le'
+            data = data[2:]
+        elif data[:3] == '\xef\xbb\xbf':
+            encoding = 'utf-8'
+            data = data[3:]
+        elif data[:4] == '\x00\x00\xfe\xff':
+            encoding = 'utf-32be'
+            data = data[4:]
+        elif data[:4] == '\xff\xfe\x00\x00':
+            encoding = 'utf-32le'
+            data = data[4:]
+        newdata = unicode(data, encoding)
+        return newdata
+    
+    def _detectEncoding(self, xml_data):
+        """Given a document, tries to detect its XML encoding."""
+        xml_encoding = sniffed_xml_encoding = None
+        try:
+            if xml_data[:4] == '\x4c\x6f\xa7\x94':
+                # EBCDIC
+                xml_data = self._ebcdic_to_ascii(xml_data)
+            elif xml_data[:4] == '\x00\x3c\x00\x3f':
+                # UTF-16BE
+                sniffed_xml_encoding = 'utf-16be'
+                xml_data = unicode(xml_data, 'utf-16be').encode('utf-8')
+            elif (len(xml_data) >= 4) and (xml_data[:2] == '\xfe\xff') \
+                     and (xml_data[2:4] != '\x00\x00'):
+                # UTF-16BE with BOM
+                sniffed_xml_encoding = 'utf-16be'
+                xml_data = unicode(xml_data[2:], 'utf-16be').encode('utf-8')
+            elif xml_data[:4] == '\x3c\x00\x3f\x00':
+                # UTF-16LE
+                sniffed_xml_encoding = 'utf-16le'
+                xml_data = unicode(xml_data, 'utf-16le').encode('utf-8')
+            elif (len(xml_data) >= 4) and (xml_data[:2] == '\xff\xfe') and \
+                     (xml_data[2:4] != '\x00\x00'):
+                # UTF-16LE with BOM
+                sniffed_xml_encoding = 'utf-16le'
+                xml_data = unicode(xml_data[2:], 'utf-16le').encode('utf-8')
+            elif xml_data[:4] == '\x00\x00\x00\x3c':
+                # UTF-32BE
+                sniffed_xml_encoding = 'utf-32be'
+                xml_data = unicode(xml_data, 'utf-32be').encode('utf-8')
+            elif xml_data[:4] == '\x3c\x00\x00\x00':
+                # UTF-32LE
+                sniffed_xml_encoding = 'utf-32le'
+                xml_data = unicode(xml_data, 'utf-32le').encode('utf-8')
+            elif xml_data[:4] == '\x00\x00\xfe\xff':
+                # UTF-32BE with BOM
+                sniffed_xml_encoding = 'utf-32be'
+                xml_data = unicode(xml_data[4:], 'utf-32be').encode('utf-8')
+            elif xml_data[:4] == '\xff\xfe\x00\x00':
+                # UTF-32LE with BOM
+                sniffed_xml_encoding = 'utf-32le'
+                xml_data = unicode(xml_data[4:], 'utf-32le').encode('utf-8')
+            elif xml_data[:3] == '\xef\xbb\xbf':
+                # UTF-8 with BOM
+                sniffed_xml_encoding = 'utf-8'
+                xml_data = unicode(xml_data[3:], 'utf-8').encode('utf-8')
+            else:
+                sniffed_xml_encoding = 'ascii'
+                pass
+            xml_encoding_match = re.compile \
+                                 ('^<\?.*encoding=[\'"](.*?)[\'"].*\?>')\
+                                 .match(xml_data)
+        except:
+            xml_encoding_match = None
+        if xml_encoding_match:
+            xml_encoding = xml_encoding_match.groups()[0].lower()
+            if sniffed_xml_encoding and \
+               (xml_encoding in ('iso-10646-ucs-2', 'ucs-2', 'csunicode',
+                                 'iso-10646-ucs-4', 'ucs-4', 'csucs4',
+                                 'utf-16', 'utf-32', 'utf_16', 'utf_32',
+                                 'utf16', 'u16')):
+                xml_encoding = sniffed_xml_encoding
+        return xml_data, xml_encoding, sniffed_xml_encoding
+
+
+    def find_codec(self, charset):
+        return self._codec(self.CHARSET_ALIASES.get(charset, charset)) \
+               or (charset and self._codec(charset.replace("-", ""))) \
+               or (charset and self._codec(charset.replace("-", "_"))) \
+               or charset
+
+    def _codec(self, charset):
+        """Returns charset if Python knows a codec by that name, else None."""
+        if not charset:
+            return charset  # empty/None input is handed back unchanged
+        try:
+            codecs.lookup(charset)
+        except LookupError:
+            return None
+        return charset
+
+    EBCDIC_TO_ASCII_MAP = None
+    def _ebcdic_to_ascii(self, s):
+        c = self.__class__
+        if not c.EBCDIC_TO_ASCII_MAP:
+            emap = (0,1,2,3,156,9,134,127,151,141,142,11,12,13,14,15,
+                    16,17,18,19,157,133,8,135,24,25,146,143,28,29,30,31,
+                    128,129,130,131,132,10,23,27,136,137,138,139,140,5,6,7,
+                    144,145,22,147,148,149,150,4,152,153,154,155,20,21,158,26,
+                    32,160,161,162,163,164,165,166,167,168,91,46,60,40,43,33,
+                    38,169,170,171,172,173,174,175,176,177,93,36,42,41,59,94,
+                    45,47,178,179,180,181,182,183,184,185,124,44,37,95,62,63,
+                    186,187,188,189,190,191,192,193,194,96,58,35,64,39,61,34,
+                    195,97,98,99,100,101,102,103,104,105,196,197,198,199,200,
+                    201,202,106,107,108,109,110,111,112,113,114,203,204,205,
+                    206,207,208,209,126,115,116,117,118,119,120,121,122,210,
+                    211,212,213,214,215,216,217,218,219,220,221,222,223,224,
+                    225,226,227,228,229,230,231,123,65,66,67,68,69,70,71,72,
+                    73,232,233,234,235,236,237,125,74,75,76,77,78,79,80,81,
+                    82,238,239,240,241,242,243,92,159,83,84,85,86,87,88,89,
+                    90,244,245,246,247,248,249,48,49,50,51,52,53,54,55,56,57,
+                    250,251,252,253,254,255)
+            import string
+            c.EBCDIC_TO_ASCII_MAP = string.maketrans( \
+            ''.join(map(chr, range(256))), ''.join(map(chr, emap)))
+        return s.translate(c.EBCDIC_TO_ASCII_MAP)
+
+    MS_CHARS = { '\x80' : ('euro', '20AC'),
+                 '\x81' : ' ',
+                 '\x82' : ('sbquo', '201A'),
+                 '\x83' : ('fnof', '192'),
+                 '\x84' : ('bdquo', '201E'),
+                 '\x85' : ('hellip', '2026'),
+                 '\x86' : ('dagger', '2020'),
+                 '\x87' : ('Dagger', '2021'),
+                 '\x88' : ('circ', '2C6'),
+                 '\x89' : ('permil', '2030'),
+                 '\x8A' : ('Scaron', '160'),
+                 '\x8B' : ('lsaquo', '2039'),
+                 '\x8C' : ('OElig', '152'),
+                 '\x8D' : '?',
+                 '\x8E' : ('#x17D', '17D'),
+                 '\x8F' : '?',
+                 '\x90' : '?',
+                 '\x91' : ('lsquo', '2018'),
+                 '\x92' : ('rsquo', '2019'),
+                 '\x93' : ('ldquo', '201C'),
+                 '\x94' : ('rdquo', '201D'),
+                 '\x95' : ('bull', '2022'),
+                 '\x96' : ('ndash', '2013'),
+                 '\x97' : ('mdash', '2014'),
+                 '\x98' : ('tilde', '2DC'),
+                 '\x99' : ('trade', '2122'),
+                 '\x9a' : ('scaron', '161'),
+                 '\x9b' : ('rsaquo', '203A'),
+                 '\x9c' : ('oelig', '153'),
+                 '\x9d' : '?',
+                 '\x9e' : ('#x17E', '17E'),
+                 '\x9f' : ('Yuml', '178'),}
+
+#######################################################################
+
+
+#By default, act as an HTML pretty-printer: parse stdin as HTML, print it.
+if __name__ == '__main__':
+    import sys
+    soup = BeautifulSoup(sys.stdin.read())
+    print soup.prettify()
diff --git a/__init__.py b/__init__.py
new file mode 100644
index 00000000..e69de29b
diff --git a/adapter.py b/adapter.py
new file mode 100644
index 00000000..ff1cb8ef
--- /dev/null
+++ b/adapter.py
@@ -0,0 +1,32 @@
+class FanfictionSiteAdapter:
+	login = ''
+	password = ''
+	def __init__(self, url):
+		'''Does nothing here; subclasses keep the story url.'''
+	
+	def requiresLogin(self, url = None):
+		'''Stub returning None; subclasses answer True or False.'''
+	
+	def performLogin(self, url = None):
+		'''Stub returning None; subclasses report success as True.'''
+	
+	def extractIndividualUrls(self):
+		'''Stub returning None; subclasses return (url, title) pairs.'''
+		
+	def getText(self, url):
+		'''Stub returning None; subclasses return the chapter text.'''
+
+	def setLogin(self, login):
+		'''Stub that ignores login; subclasses store it on self.'''
+
+	def setPassword(self, password):
+		'''Stub that ignores password; subclasses store it on self.'''
+
+	def getStoryName(self):
+		'''Stub returning None; subclasses return the story name.'''
+
+	def getAuthorName(self):
+		'''Stub returning None; subclasses return the author name.'''
+
+	def getPrintableUrl(self, url):
+		'''Stub returning None; FFA and FicWad return url unchanged.'''
\ No newline at end of file
diff --git a/constants.py b/constants.py
new file mode 100644
index 00000000..27515658
--- /dev/null
+++ b/constants.py
@@ -0,0 +1,135 @@
+CSS = '''body { margin-left: 5%; margin-right: 5%; margin-top: 5%; margin-bottom: 5%; text-align: justify; }
+pre { font-size: x-small; }
+h1 { text-align: center; }
+h2 { text-align: center; }
+h3 { text-align: center; }
+h4 { text-align: center; }
+h5 { text-align: center; }
+h6 { text-align: center; }
+.CI {
+    text-align:center;
+    margin-top:0px;
+    margin-bottom:0px;
+    padding:0px;
+    }
+.center   {text-align: center;}
+.smcap    {font-variant: small-caps;}
+.u        {text-decoration: underline;}
+.bold     {font-weight: bold;}
+'''
+
+MIMETYPE = '''application/epub+zip'''
+
+CONTAINER = '''<?xml version="1.0"?>
+<container version="1.0" xmlns="urn:oasis:names:tc:opendocument:xmlns:container">
+  <rootfiles>
+    <rootfile full-path="OEBPS/content.opf" media-type="application/oebps-package+xml"/>
+  </rootfiles>
+</container>
+'''
+
+CONTENT_START = '''<?xml version="1.0"?>
+<package version="2.0" xmlns="http://www.idpf.org/2007/opf"
+         unique-identifier="BookId-Epub-%s">
+ <metadata xmlns:dc="http://purl.org/dc/elements/1.1/"
+           xmlns:opf="http://www.idpf.org/2007/opf">
+   <dc:title>%s</dc:title> 
+   <dc:creator opf:role="aut">%s</dc:creator>
+   <dc:language>en-GB</dc:language> 
+   <dc:rights></dc:rights> 
+   <dc:publisher>sgzmd</dc:publisher> 
+   <dc:identifier id="BookId">urn:uuid:sigizmund.com062820072147132</dc:identifier>
+ </metadata>
+ <manifest>
+  <item id="ncx" href="toc.ncx" media-type="application/x-dtbncx+xml"/>
+  <item id="style" href="stylesheet.css" media-type="text/css" />
+'''
+
+CONTENT_ITEM = '<item id="%s" href="%s" media-type="application/xhtml+xml" />'
+
+CONTENT_END_MANIFEST = '''</manifest>
+<spine toc="ncx">
+'''
+
+CONTENT_ITEMREF = '''<itemref idref="%s" />'''
+
+CONTENT_END = '''</spine>
+</package>
+'''
+
+TOC_START = '''<?xml version="1.0" encoding="UTF-8"?>
+<ncx xmlns="http://www.daisy.org/z3986/2005/ncx/" version="2005-1">
+  <head>
+    <meta name="dtb:uid" content="sigizmund.com062820072147132"/>
+    <meta name="dtb:depth" content="1"/>
+    <meta name="dtb:totalPageCount" content="0"/>
+    <meta name="dtb:maxPageNumber" content="0"/>
+  </head>
+  <docTitle>
+    <text>%s</text>
+  </docTitle>
+  <navMap>
+'''
+
+TOC_ITEM = '''<navPoint id="%s" playOrder="%d">
+  <navLabel>
+    <text>%s</text>
+  </navLabel>
+  <content src="%s"/>
+</navPoint>
+'''
+
+TOC_END = '''</navMap>
+</ncx>
+'''
+
+XHTML_START = '''<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.1//EN" "http://www.w3.org/TR/xhtml11/DTD/xhtml11.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml">
+<head>
+<title>%s</title>
+<link href="stylesheet.css" type="text/css" rel="stylesheet" />
+</head>
+<body>
+<div>
+<h3>%s</h3>
+'''
+
+XHTML_END = '''</div>
+</body>
+</html>
+'''
+
+acceptable_elements = ['a', 'abbr', 'acronym', 'address', 'area', 'b', 'big',
+      'blockquote', 'br', 'center', 'cite', 'code', 'col',
+      'colgroup', 'dd', 'del', 'dfn', 'dir', 'div', 'dl', 'dt', 'em',
+      'font', 'h1', 'h2', 'h3', 'h4', 'h5', 'h6', 'i', 
+      'ins', 'kbd', 'label', 'li', 'ol', 
+      'p', 'pre', 'q', 's', 'samp', 'small', 'span', 'strike',
+      'strong', 'sub', 'sup', 'u', 'ul']
+
+acceptable_attributes = ['href']
+
+entities = { '&ndash;' : ' - ', '&mdash;' : ' - ', '&rdquo;' : '"', '&ldquo;' : '"', '&rsquo;' : '\'', '&lsquo;' : '\'', '&quot;' : '"' }
+
+FB2_PROLOGUE = '<FictionBook>'
+FB2_DESCRIPTION = '''<description>
+<title-info>
+  <genre>fanfiction</genre>
+  <author>
+  <first-name></first-name>
+  <middle-name></middle-name>
+  <last-name>%s</last-name>
+  </author>
+  <book-title>%s</book-title>
+  <lang>eng</lang>
+</title-info>
+<document-info>
+  <author>
+  <nickname>sgzmd</nickname>
+  </author>
+<date value="%s">%s</date>
+<id>sgzmd_%s</id>
+<version>2.0</version>
+</document-info>
+</description>'''
diff --git a/downaloder.py b/downaloder.py
new file mode 100644
index 00000000..02b8ff32
--- /dev/null
+++ b/downaloder.py
@@ -0,0 +1,103 @@
+import os
+import re
+import sys
+import shutil
+import os.path
+import getpass
+import logging
+import urllib as u
+import pprint as pp
+import urllib2 as u2
+import urlparse as up
+import BeautifulSoup as bs
+import htmlentitydefs as hdefs
+
+import ffa
+import ffnet
+import ficwad
+import output
+import fictionalley
+
+class FanficLoader:
+	'''A controller class which handles the interaction between various specific downloaders and writers'''
+	booksDirectory = "books"
+	
+	def __init__(self, adapter, writerClass, quiet = False, inmemory = False, compress=True):
+		self.adapter = adapter
+		self.writerClass = writerClass
+		self.quiet = quiet
+		self.inmemory = inmemory
+		self.compress = compress
+		self.badLogin = False
+		
+	def download(self):
+		'''Logs in if required, then fetches and writes every chapter. Returns the
+		writer's output when inmemory is set, else None (also on a failed login).'''
+		logging.debug("Trying to download the story")
+		if self.adapter.requiresLogin():
+			logging.debug("Story requires login")
+			if not self.adapter.performLogin():
+				logging.debug("Login/password problem")
+				self.badLogin = True
+				return None
+		
+		urls = self.adapter.extractIndividualUrls()
+		self.writer = self.writerClass(self.booksDirectory, self.adapter.getStoryName(), self.adapter.getAuthorName(), inmemory=self.inmemory, compress=self.compress)
+		
+		for number, (chapterUrl, title) in enumerate(urls):
+			if not self.quiet:
+				print('Downloading chapter %d/%d' % (number + 1, len(urls)))
+			text = self.adapter.getText(chapterUrl)
+			self.writer.writeChapter(title, text)
+		
+		self.writer.finalise()
+		
+		if self.inmemory:
+			self.name = self.writer.name
+			return self.writer.output.getvalue()
+	
+
+if __name__ == '__main__':
+	logging.basicConfig(level=logging.DEBUG)
+	(url, format) = sys.argv[1:]
+	
+	if type(url) is unicode:
+		print('URL is unicode')
+		url = url.encode('latin1')
+	
+	adapter = writerClass = None
+	
+	if url.find('fanficauthors') != -1:
+		adapter = ffa.FFA(url)
+	elif url.find('fictionalley') != -1:
+		# Bail out before building the adapter: FictionAlley() takes no url.
+		print >> sys.stderr, "FictionAlley adapter is broken, try to find this fic on fanfiction.net or fanficauthors"
+		sys.exit(1)
+	elif url.find('ficwad') != -1:
+		adapter = ficwad.FicWad(url)
+	elif url.find('fanfiction.net') != -1:
+		adapter = ffnet.FFNet(url)
+	else:
+		print >> sys.stderr, "Oi! I can haz not appropriate adapter for URL %s!" % url
+		sys.exit(1)
+
+	if format == 'epub':
+		writerClass = output.EPubFanficWriter
+	elif format == 'html':
+		writerClass = output.HTMLWriter
+	else:
+		print >> sys.stderr, "Unknown output format %s, use epub or html" % format
+		sys.exit(1)
+	
+	if adapter.requiresLogin(url):
+		print("Meow, URL %s requires you to haz been logged in! Please can I haz this datas?" % url)
+		sys.stdout.write("Can I haz ur login? ")
+		login = sys.stdin.readline().strip()
+		# The password is deliberately never echoed back to the terminal.
+		password = getpass.getpass(prompt='Can I haz ur password? ')
+		adapter.setLogin(login)
+		adapter.setPassword(password)
+	
+	loader = FanficLoader(adapter, writerClass)
+	loader.download()
+	
\ No newline at end of file
diff --git a/ffa.py b/ffa.py
new file mode 100644
index 00000000..b8c307ec
--- /dev/null
+++ b/ffa.py
@@ -0,0 +1,197 @@
+# -*- coding: utf-8 -*-
+
+import os
+import re
+import sys
+import cgi
+import uuid
+import shutil
+import base64
+import os.path
+import logging
+import unittest
+import urllib as u
+import pprint as pp
+import urllib2 as u2
+import urlparse as up
+import BeautifulSoup as bs
+import htmlentitydefs as hdefs
+
+from constants import *
+from adapter import *
+
+try:
+	import login_password
+except ImportError:
+	# Optional local credentials module; the tests below check for None.
+	login_password = None
+
+class FFA(FanfictionSiteAdapter):
+	def __init__(self, url):
+		self.url = url
+		parsedUrl = up.urlparse(url)
+		self.host = parsedUrl.netloc
+		self.path = parsedUrl.path
+		self.opener = u2.build_opener(u2.HTTPCookieProcessor())
+	
+		logging.debug("Created FFA: url=%s" % (self.url))
+	
+	def _getLoginScript(self):
+		return self.path
+
+	def requiresLogin(self, url = None):
+		resp = self.opener.open(self.url)
+		data = resp.read()
+		if data.find('<legend>Please login to continue</legend>') != -1:
+			return True
+		else:
+			return False
+ 
+	def performLogin(self, url = None):
+		if url == None:
+			url = self.url
+		
+		data = {}
+		
+		data['username'] = self.login
+		data['password'] = self.password
+		data['submit'] = 'Submit'
+		
+		urlvals = u.urlencode(data)
+		loginUrl = 'http://' + self.host + self._getLoginScript()
+		logging.debug("Will now login to URL %s" % loginUrl)
+		
+		req = self.opener.open(loginUrl, urlvals)
+		
+		if self.requiresLogin():
+			return False
+		else:
+			return True
+	
+	def extractIndividualUrls(self):
+		data = self.opener.open(self.url).read()
+		soup = bs.BeautifulStoneSoup(data)
+
+		self.author = soup.find('a', {'href' : '/contact/'}).string
+		self.storyName = str(soup.find('h1', {'class' : 'textCenter'}).contents[0]).strip()
+		
+		logging.debug("Story `%s` by `%s`" % (self.storyName, self.author))
+		
+		selector = soup.find('select', {'class' : 'tinput'})
+		options = selector.findAll('option')
+		
+		urls = []
+		
+		for o in options:
+			title = o.string
+			url = o['value']
+			
+			urls.append((url,title))
+		
+		return urls
+
+	def getText(self, url):
+		if url.find('http://') == -1:
+			url = 'http://' + self.host + '/' + url
+		
+		logging.info('Downloading: %s' % url)
+		data = self.opener.open(url).read()
+		
+		lines = data.split('\n')
+		
+		emit = False
+		
+		post = ''
+		
+		for l in lines:
+			if l.find('</div></form>') != -1:
+				logging.debug('emit = True')
+				emit = True
+				continue
+			elif l.find('<form action="#">') != -1:
+				logging.debug('emit = False')
+				if emit:
+					break
+				else:
+					emit = False
+			
+			if emit:
+				post = post + l + '\n'
+		
+		return post
+
+	def setLogin(self, login):
+		self.login = login
+
+	def setPassword(self, password):
+		self.password = password
+	
+	def getStoryName(self):
+		return self.storyName
+		
+	def getAuthorName(self):
+		return self.author
+
+	def getPrintableUrl(self, url):
+		return url
+
+class FFA_UnitTests(unittest.TestCase):
+	def setUp(self):
+		logging.basicConfig(level=logging.DEBUG)
+		pass
+	
+	def testRequiresLoginNeg(self):
+		f = FFA('http://jeconais.fanficauthors.net/Happily_Ever_After/Introduction/')
+		self.assertFalse(f.requiresLogin())
+	
+	def testRequiresLogin(self):
+		f = FFA('http://jeconais.fanficauthors.net/Rons_Harem/Rons_Harem/')
+		self.assertTrue(f.requiresLogin())
+	
+	def testPerformLogin(self):
+		f = FFA('http://jeconais.fanficauthors.net/Rons_Harem/Rons_Harem/')
+		
+		if login_password != None:
+			f.setLogin(login_password.login)
+			f.setPassword(login_password.password)
+		
+		self.assertTrue(f.performLogin(None))
+		
+	def testExtractURLsAuthorStoryName(self):
+		f = FFA('http://draco664.fanficauthors.net/Apprentice_Potter/Prologue/')
+		f.extractIndividualUrls()
+		
+		self.assertEquals('Draco664', f.getAuthorName())
+		self.assertEquals('Apprentice Potter', f.getStoryName())
+	
+	def testExtractUrls(self):
+		f = FFA('http://draco664.fanficauthors.net/Apprentice_Potter/Prologue/')
+		urls = f.extractIndividualUrls()
+		self.assertEquals(25, len(urls))
+		
+		self.assertEquals('Grievances', urls[2][1])
+		self.assertEquals('/Apprentice_Potter/Prologue/', urls[0][0])
+	
+	def testGetText(self):
+		f = FFA('http://jeconais.fanficauthors.net/Happily_Ever_After/Introduction/')
+		data = f.getText('http://jeconais.fanficauthors.net/Happily_Ever_After/Introduction/')
+		
+		self.assertTrue(data.find('smiled slightly, and settled back in her rocking chair') != -1)
+		
+	def testGetTextLogin(self):
+		url = 'http://viridian.fanficauthors.net/Out_of_the_Darkness_A_Jinchuurikis_Tale/A_Harrowing_Escape/'
+		f = FFA(url)
+		
+		if login_password != None:
+			f.setLogin(login_password.login)
+			f.setPassword(login_password.password)
+		
+		if f.requiresLogin():
+			f.performLogin()
+		
+		data = f.getText(url)
+		seek = 'So Hokage-sama” I said, “this is how we came'
+		self.assertTrue(data.find(seek) != -1)
+		
+if __name__ == '__main__':
+	unittest.main()
\ No newline at end of file
diff --git a/ffnet.py b/ffnet.py
new file mode 100644
index 00000000..1d358e0f
--- /dev/null
+++ b/ffnet.py
@@ -0,0 +1,162 @@
+# -*- coding: utf-8 -*-
+
+import os
+import re
+import sys
+import cgi
+import uuid
+import shutil
+import base64
+import os.path
+import logging
+import unittest
+import urllib as u
+import pprint as pp
+import urllib2 as u2
+import urlparse as up
+import BeautifulSoup as bs
+import htmlentitydefs as hdefs
+
+from constants import *
+from adapter import *
+
+try:
+	import login_password
+except:
+	# tough luck
+	pass
+
+try:
+	from google.appengine.api.urlfetch import fetch as googlefetch
+	appEngine = True
+except:
+	appEngine = False
+
+class FFNet(FanfictionSiteAdapter):
+	def __init__(self, url):
+		self.url = url
+		parsedUrl = up.urlparse(url)
+		self.host = parsedUrl.netloc
+		self.path = parsedUrl.path
+		# Placeholders, replaced by extractIndividualUrls() when it finds them.
+		self.storyName = 'FF.Net story'
+		self.authorName = 'FF.Net author'
+		# Drop a trailing title segment, e.g. /s/1527263/30/Some_Story_Title
+		spl = self.path.split('/')
+		if len(spl) == 5:
+			self.path = "/".join(spl[1:-1])
+		
+		if self.path.startswith('/'):
+			self.path = self.path[1:]
+		
+		if self.path.endswith('/'):
+			self.path = self.path[:-1]
+		
+		(s, self.storyId, chapter) = self.path.split('/')
+		
+		logging.debug('self.storyId=%s, chapter=%s' % (self.storyId, chapter))
+		
+		if not appEngine:
+			self.opener = u2.build_opener(u2.HTTPCookieProcessor())
+		else:
+			self.opener = None
+	
+		logging.debug("Created FF.Net: url=%s" % (self.url))
+	
+	def _getLoginScript(self):
+		return self.path
+
+	def requiresLogin(self, url = None):
+		return False
+
+	def performLogin(self, url = None):
+		return True
+	
+	def _fetchUrl(self, url):
+		if not appEngine:
+			return self.opener.open(url).read().decode('utf-8')
+		else:
+			return googlefetch(url).content
+	
+	def extractIndividualUrls(self):
+		'''Scans the story page for its title, author and chapter list.
+		Returns a list of (chapter url, chapter title) pairs.'''
+		data = self._fetchUrl(self.url)
+		urls = []
+		for l in data.split('\n'):
+			if l.find("<img src='http://c.fanfiction.net/static/ficons/script.png' width=16 height=16  border=0  align=absmiddle>") != -1:
+				s2 = bs.BeautifulStoneSoup(l)
+				self.storyName = s2.find('b').string
+			elif l.find("<a href='/u/") != -1:
+				s2 = bs.BeautifulStoneSoup(l)
+				self.authorName = s2.a.string
+			elif not urls and l.find("<SELECT title='chapter navigation'") != -1:
+				# _fetchUrl already decodes outside App Engine; decoding unicode
+				# a second time would fail on non-ASCII chapter titles.
+				chapters = l if isinstance(l, unicode) else l.decode('utf-8')
+				chapters = re.sub('&\#[0-9]+;', ' ', chapters)
+				s2 = bs.BeautifulSoup(chapters)
+				options = s2.findAll('option')
+				for o in options:
+					url = 'http://fanfiction.net/s/' + self.storyId + '/' + o['value']
+					title = o.string
+					logging.debug('URL = `%s`, Title = `%s`' % (url, title))
+					urls.append((url,title))
+		
+		return urls
+	
+	def getText(self, url):
+		for l in self._fetchUrl(url).split('\n'):
+			if l.find('<!-- start story -->') != -1:
+				div = bs.BeautifulStoneSoup(l).div
+				if div is not None:
+					return div.prettify()
+		# No story markup found: same placeholder FicWad.getText returns.
+		return '<html/>'
+		
+	def setLogin(self, login):
+		self.login = login
+
+	def setPassword(self, password):
+		self.password = password
+
+	def getStoryName(self):
+		return self.storyName
+
+	def getAuthorName(self):
+		return self.authorName
+
+class FFA_UnitTests(unittest.TestCase):
+	def setUp(self):
+		logging.basicConfig(level=logging.DEBUG)
+		pass
+	
+	def testChaptersAuthStory(self):
+		f = FFNet('http://www.fanfiction.net/s/5257563/1')
+		f.extractIndividualUrls()
+		
+		self.assertEquals('Beka0502', f.getAuthorName())
+		self.assertEquals("Draco's Redemption", f.getStoryName())
+
+	def testChaptersCountNames(self):
+		f = FFNet('http://www.fanfiction.net/s/5257563/1')
+		urls = f.extractIndividualUrls()
+		
+		self.assertEquals(8, len(urls))
+	
+	def testGetText(self):
+		url = 'http://www.fanfiction.net/s/5257563/1'
+		f = FFNet(url)
+		text = f.getText(url)
+		self.assertTrue(text.find('He was just about to look at some photos when he heard a crack') != -1)
+	
+	def testBrokenWands(self):
+		url = 'http://www.fanfiction.net/s/1527263/30/Harry_Potter_and_Broken_Wands'
+		f = FFNet(url)
+		text = f.getText(url)
+		
+		urls = f.extractIndividualUrls()
+		
+	
+if __name__ == '__main__':
+	unittest.main()
\ No newline at end of file
diff --git a/fictionalley.py b/fictionalley.py
new file mode 100644
index 00000000..6ccc5ad8
--- /dev/null
+++ b/fictionalley.py
@@ -0,0 +1,75 @@
+import os
+import re
+import sys
+import shutil
+import os.path
+import urllib as u
+import pprint as pp
+import urllib2 as u2
+import urlparse as up
+import BeautifulSoup as bs
+import htmlentitydefs as hdefs
+
+class FictionAlley:
+	def __init__(self):
+		pass
+	
+	def extractIndividualUrls(self, data, host, contents):
+		soup = bs.BeautifulStoneSoup(data)
+		
+		title = soup.find('title').string
+		self.storyName = "-".join(title.split('-')[1:]).strip()
+		
+		authors = soup.findAll('a')
+		
+		print('Story "%s" by %s' % (self.storyName, self.authorName))
+		
+		links = soup.findAll('a', { 'class' : 'chapterlink' } )
+
+		result = []
+		for a in links:
+			url = a['href']
+			title = a.string
+			result.append((url,title))
+			
+		return result
+	
+	def getStoryName(self):
+		return self.storyName
+
+	def getAuthorName(self):
+		return self.authorName
+	
+
+	def getText(self, data, fetch = False):
+		soup = bs.BeautifulStoneSoup(data)
+		div = soup.find('div', {'id' : 'storytext'})
+		if None == div:
+			return '<html/>'
+		
+		return div.prettify()
+	
+	def getPrintableUrl(self, url):
+		return url
+	
+	def getPasswordLine(self):
+		return 'opaopapassword'
+
+	def getLoginScript(self):
+		return 'opaopaloginscript'
+
+	def getLoginPasswordOthers(self):
+		login = dict(login = 'name', password = 'pass')
+		other = dict(submit = 'Log In', remember='yes')
+		return (login, other)
+
+		
+if __name__ == '__main__':
+	url = 'http://www.fictionalley.org/authors/drt/DA.html'
+	data = u2.urlopen(url).read()
+	host = up.urlparse(url).netloc
+	fw = FictionAlley()
+	fw.authorName = 'DrT'
+	urls = fw.extractIndividualUrls(data, host, url)
+	pp.pprint(urls)
+	print(fw.getText(data))
\ No newline at end of file
diff --git a/ficwad.py b/ficwad.py
new file mode 100644
index 00000000..35b3b76e
--- /dev/null
+++ b/ficwad.py
@@ -0,0 +1,98 @@
+import os
+import re
+import sys
+import shutil
+import os.path
+import urllib as u
+import pprint as pp
+import urllib2 as u2
+import urlparse as up
+import BeautifulSoup as bs
+import htmlentitydefs as hdefs
+
+from adapter import *
+
+class FicWad(FanfictionSiteAdapter):
+	def __init__(self, url):
+		self.url = url
+		self.host = up.urlparse(url).netloc
+	
+	def requiresLogin(self, url):
+		return False
+	
+	def performLogin(self, url):
+		pass
+		
+	def setLogin(self, login):
+		self.login = login
+	
+	def setPassword(self, password):
+		self.password = password
+	
+	def extractIndividualUrls(self):
+		data = u2.urlopen(self.url).read()
+		soup = bs.BeautifulStoneSoup(data)
+		
+		title = soup.find('title').string
+		self.storyName = title.split('::')[0].strip()
+		
+		author = soup.find('span', {'class' : 'author'})
+		self.authorName = author.a.string
+		
+		print('Story "%s" by %s' % (self.storyName, self.authorName))
+		
+		select = soup.find('select', { 'name' : 'goto' } )
+		
+		allOptions = select.findAll('option')
+		result = []
+		for o in allOptions:
+			url = o['value']
+#			if type(url) is unicode:
+#				url = url.encode('utf-8')
+			title = o.string
+			result.append((url,title))
+			
+		return result
+	
+	def getStoryName(self):
+		return self.storyName
+
+	def getAuthorName(self):
+		return self.authorName
+	
+	def getText(self, url):
+		if url.find('http://') == -1:
+			url = 'http://' + self.host + '/' + url
+		
+		data = u2.urlopen(url).read()
+		
+		soup = bs.BeautifulStoneSoup(data)
+		div = soup.find('div', {'id' : 'storytext'})
+		if None == div:
+			return '<html/>'
+		
+		return div.prettify()
+	
+	def getPrintableUrl(self, url):
+		return url
+	
+	def getPasswordLine(self):
+		return 'opaopapassword'
+
+	def getLoginScript(self):
+		return 'opaopaloginscript'
+
+	def getLoginPasswordOthers(self):
+		login = dict(login = 'name', password = 'pass')
+		other = dict(submit = 'Log In', remember='yes')
+		return (login, other)
+
+		
+if __name__ == '__main__':
+	url = 'http://www.ficwad.com/story/14536'
+	data = u2.urlopen(url).read()
+	host = up.urlparse(url).netloc
+	fw = FicWad(url)
+	urls = fw.extractIndividualUrls()
+	pp.pprint(urls)
+	print(fw.getText(data))
\ No newline at end of file
diff --git a/html_constants.py b/html_constants.py
new file mode 100644
index 00000000..c698e8f4
--- /dev/null
+++ b/html_constants.py
@@ -0,0 +1,17 @@
+# Whole-document template used by HTMLWriter; ${title}, ${author} and ${body} are string.Template placeholders.
+XHTML_START = '''<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.1//EN" "http://www.w3.org/TR/xhtml11/DTD/xhtml11.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml">
+<head>
+<title>${title} by ${author}</title>
+<link href="stylesheet.css" type="text/css" rel="stylesheet" />
+</head>
+<body>
+<div>
+<h1>${title} by ${author}</h1>
+${body}
+</div></body></html>
+'''
+XHTML_CHAPTER_START = '''<h2>${chapter}</h2>'''
+
+XHTML_END = ''''''
diff --git a/output.py b/output.py
new file mode 100644
index 00000000..d03a7c53
--- /dev/null
+++ b/output.py
@@ -0,0 +1,252 @@
+# -*- coding: utf-8 -*-
+
+import os
+import re
+import sys
+import cgi
+import uuid
+import codecs
+import shutil
+import string
+import base64
+import os.path
+import zipfile
+import StringIO
+import logging
+import urllib as u
+import pprint as pp
+import urllib2 as u2
+import urlparse as up
+import BeautifulSoup as bs
+import htmlentitydefs as hdefs
+
+import zipdir
+import html_constants
+from constants import *
+
+
+
+class FanficWriter:
+	def __init__(self):
+		pass
+		
+	def writeChapter(self, title, text):
+		pass
+	
+	def finalise(self):
+		pass
+
+class HTMLWriter(FanficWriter):
+	body = ''
+	
+	def __init__(self, base, name, author, inmemory=False, compress=False):
+		self.basePath = base
+		self.name = name.replace(" ", "_")
+		self.storyTitle = name
+		self.fileName = self.basePath + '/' + self.name + '.html'
+		self.authorName = author
+		
+		self.inmemory = inmemory
+
+		if not self.inmemory and os.path.exists(self.fileName):
+			os.remove(self.fileName)
+		
+		if self.inmemory:
+			self.output = StringIO.StringIO()
+		else:
+			self.output = open(self.fileName, 'w')
+		
+		self.xhtmlTemplate = string.Template(html_constants.XHTML_START)
+		self.chapterStartTemplate = string.Template(html_constants.XHTML_CHAPTER_START)
+		
+	def writeChapter(self, title, text):
+		title = title.decode('utf-8')
+		text = text.decode('utf-8')
+		self.body = self.body + '\n' + self.chapterStartTemplate.substitute({'chapter' : title})
+		self.body = self.body + '\n' + text
+	
+	def finalise(self):
+		html = self.xhtmlTemplate.substitute({'title' : self.storyTitle, 'author' : self.authorName, 'body' : self.body})
+		soup = bs.BeautifulSoup(html)
+		result = soup.prettify()
+		
+#		f = open(self.fileName, 'w')
+#		f.write(result)
+#		f.close()
+
+		self.output.write(result)
+		if not self.inmemory:
+			self.output.close()
+
+class EPubFanficWriter(FanficWriter):
+	chapters = []
+	
+	files = {}
+	
+	def _writeFile(self, fileName, data):
+		if fileName in self.files:
+			self.files[fileName].write(data.decode('utf-8'))
+		else:
+			if self.inmemory:
+				self.files[fileName] = StringIO.StringIO()
+			else:
+				self.files[fileName] = open(self.directory + '/' + fileName, 'w')
+
+			self._writeFile(fileName, data)
+		
+		
+	def _closeFiles(self):
+		if not self.inmemory:
+			for f in self.files:
+				self.files[f].close()
+	
+	def __init__(self, base, name, author, inmemory=False, compress=True):
+		self.basePath = base
+		self.name = name.replace(" ", "_")
+		self.storyTitle = name
+		self.directory = self.basePath + '/' + self.name
+		self.inmemory = inmemory
+		self.authorName = author
+		
+		self.files = {}
+		self.chapters = []
+		
+		if not self.inmemory:
+			self.inmemory = True
+			self.writeToFile = True
+		else:
+			self.writeToFile = False
+		
+
+		if not self.inmemory:
+			if os.path.exists(self.directory):
+				shutil.rmtree(self.directory)
+		
+			os.mkdir(self.directory)
+		
+			os.mkdir(self.directory + '/META-INF')
+			os.mkdir(self.directory + '/OEBPS')
+		
+#		print >> codecs.open(self.directory + '/mimetype', 'w', 'utf-8'), MIMETYPE
+#		print >> codecs.open(self.directory + '/META-INF/container.xml', 'w', 'utf-8'), CONTAINER
+#		print >> codecs.open(self.directory + '/OEBPS/stylesheet.css', 'w', 'utf-8'), CSS
+
+		self._writeFile('mimetype', MIMETYPE)
+		self._writeFile('META-INF/container.xml', CONTAINER)
+		self._writeFile('OEBPS/stylesheet.css', CSS)
+
+	def _removeEntities(self, text):
+		for e in entities:
+			v = entities[e]
+			text = text.replace(e, v)
+		
+		text = text.replace('&', '&amp;')
+		
+		return text
+	
+	def writeChapter(self, title, text):
+		fileName = base64.b64encode(title).replace('/', '_') + ".xhtml"
+		filePath = self.directory + "/OEBPS/" + fileName
+		
+		fn = 'OEBPS/' + fileName
+		
+#		f = open(filePath, 'w')
+		
+		text = self._removeEntities(text)
+		
+		self.soup = bs.BeautifulStoneSoup(text)
+
+		allTags = self.soup.findAll(recursive=True)
+		for t in allTags:
+			for attr in t._getAttrMap().keys():
+				if attr not in acceptable_attributes:
+					del t[attr]
+	    
+		allPs = self.soup.findAll(recursive=True)
+		for p in allPs:
+			if p.string != None and (len(p.string.strip()) == 0 or p.string.strip() == '&nbsp;' ) :
+				p.extract()
+				
+		allBrs = self.soup.findAll(recursive=True, name = ["br", "hr"])
+		for br in allBrs:
+			if (br.string != None and len(br.string.strip()) != 0) or (br.contents != None):
+				br.name = 'p'
+
+#		cleanup(self.soup )
+		
+		text = self.soup.prettify()
+		
+		tt = self._removeEntities(title)
+		
+		self._writeFile(fn, XHTML_START % (tt, tt))
+		self._writeFile(fn, text)
+		self._writeFile(fn, XHTML_END)
+#		print >> f, XHTML_START % (tt, tt)
+#		f.write(text)
+#		print >> f, XHTML_END
+		
+		self.chapters.append((title, fileName))
+	
+	def finalise(self):
+		logging.debug("Finalising...")
+		### writing table of contents -- ncx file
+		
+		tocFilePath = "OEBPS/toc.ncx"
+#		toc = open(tocFilePath, 'w')
+#		print >> toc, TOC_START % self.storyTitle
+		self._writeFile(tocFilePath, TOC_START % self.storyTitle)
+		### writing content -- opf file
+		opfFilePath = "OEBPS/content.opf"
+		
+#		opf = open(opfFilePath, 'w')
+		self._writeFile(opfFilePath, CONTENT_START % (uuid.uuid4().urn, self.storyTitle, self.authorName))
+#		print >> opf, CONTENT_START % (uuid.uuid4().urn, self.storyTitle, self.authorName)
+
+		ids = []
+		
+		i = 0
+		for t,f in self.chapters:
+			chapterId = base64.b64encode(t)
+#			print >> toc, TOC_ITEM % (chapterId, i, cgi.escape(t), f)
+			self._writeFile(tocFilePath, TOC_ITEM % (chapterId, i, cgi.escape(t), f))
+#			print >> opf, CONTENT_ITEM % (chapterId, f)
+			self._writeFile(opfFilePath, CONTENT_ITEM % (chapterId, f))
+			
+			ids.append(chapterId)
+			
+			i = i + 1
+			
+#		logging.d('Toc and refs printed, proceesing to ref-ids....')
+		
+#		print >> toc, TOC_END
+#		print >> opf, CONTENT_END_MANIFEST		
+
+		self._writeFile(tocFilePath, TOC_END)
+		self._writeFile(opfFilePath, CONTENT_END_MANIFEST)
+		
+		for chapterId in ids:
+#			print >> opf, CONTENT_ITEMREF % chapterId
+			self._writeFile(opfFilePath, CONTENT_ITEMREF % chapterId)
+		
+#		print >> opf, CONTENT_END
+		self._writeFile(opfFilePath, CONTENT_END)
+		
+#		opf.close()
+#		toc.close()
+		
+#		print('Finished')
+		
+		self._closeFiles()
+		
+		filename = self.directory + '.epub'
+		
+		zipdata = zipdir.inMemoryZip(self.files)
+		
+		if self.writeToFile:
+			f = open(filename, 'w')
+			f.write(zipdata.getvalue())
+			f.close()
+		else:
+			self.output = zipdata
+			
+#		zipdir.toZip(filename, self.directory)
diff --git a/zipdir.py b/zipdir.py
new file mode 100644
index 00000000..0da2691d
--- /dev/null
+++ b/zipdir.py
@@ -0,0 +1,69 @@
+import os
+import zipfile
+import logging
+
+import StringIO
+
+def toZip(filename, directory):
+	zippedHelp = zipfile.ZipFile(filename, "w", compression=zipfile.ZIP_DEFLATED)
+	lst = os.listdir(directory)
+	
+	for entity in lst:
+		if entity.startswith('.'):
+			continue
+
+		each = os.path.join(directory,entity)
+		print(each)
+
+		if os.path.isfile(each):
+			print(each)
+			zippedHelp.write(each, arcname=entity)
+		else:
+			addFolderToZip(zippedHelp,entity, each)
+ 	
+	zippedHelp.close()
+
+def addFolderToZip(zippedHelp,folder,fpath):
+	# Recursively add the files under directory `fpath` to `zippedHelp`, stored under archive path `folder`.
+	
+	if folder == '.' or folder == '..':
+		return
+	
+	folderFiles = os.listdir(fpath)
+	for f in folderFiles:
+		if os.path.isfile(fpath + '/' + f):
+			# second argument is the name inside the archive, not the path on disk
+			zippedHelp.write(fpath + '/' + f, folder + '/' + f, zipfile.ZIP_DEFLATED)
+		elif os.path.isdir(fpath + '/' + f):
+			addFolderToZip(zippedHelp, folder + '/' + f, fpath + '/' + f)
+
+def inMemoryZip(files):
+	# files have a structure of {'path/to/file' => content} dictionary
+	io = StringIO.StringIO()
+	memzip = zipfile.ZipFile(io, 'a', compression=zipfile.ZIP_DEFLATED)
+	memzip.debug = 3
+	
+	for path in files:
+		if type(files[path]) != type('str'):
+			data = files[path].getvalue()
+		else:
+			data = files[path]
+		
+#		logging.debug(data)
+		memzip.writestr(path, data.encode('utf-8'))
+	
+	for zf in memzip.filelist:
+		zf.create_system = 0
+	
+	memzip.close()
+	
+	return io
+
+if __name__ == '__main__':
+	# Smoke test: zip two in-memory files and dump the archive to res.zip.
+	# inMemoryZip returns the StringIO buffer, so write its contents, in binary mode.
+	files = {'test.txt' : 'test', 'data/abc.txt' : 'abc'}
+	data = inMemoryZip(files)
+	f = open('res.zip', 'wb')
+	f.write(data.getvalue())
+	f.close()
\ No newline at end of file

From 5143a2187a08d3481d4e7132c33d2a66020d03b9 Mon Sep 17 00:00:00 2001
From: sigizmund <sigizmund@gmail.com>
Date: Fri, 18 Dec 2009 18:55:57 +0000
Subject: [PATCH 22/94] fictionpress.com support added

---
 constants.py  |  4 ++--
 downaloder.py |  5 ++++-
 ffnet.py      | 21 ++++++++++++++++++---
 output.py     |  2 +-
 4 files changed, 25 insertions(+), 7 deletions(-)

diff --git a/constants.py b/constants.py
index 27515658..6af00eb6 100644
--- a/constants.py
+++ b/constants.py
@@ -102,7 +102,7 @@ XHTML_END = '''</div>
 
 acceptable_elements = ['a', 'abbr', 'acronym', 'address', 'area', 'b', 'big',
       'blockquote', 'br', 'center', 'cite', 'code', 'col',
-      'colgroup', 'dd', 'del', 'dfn', 'dir', 'div', 'dl', 'dt', 'em',
+      'colgroup', 'dd', 'del', 'dfn', 'dir', 'dl', 'dt', 'em',
       'font', 'h1', 'h2', 'h3', 'h4', 'h5', 'h6', 'i', 
       'ins', 'kbd', 'label', 'li', 'ol', 
       'p', 'pre', 'q', 's', 'samp', 'small', 'span', 'strike',
@@ -110,7 +110,7 @@ acceptable_elements = ['a', 'abbr', 'acronym', 'address', 'area', 'b', 'big',
 
 acceptable_attributes = ['href']
 
-entities = { '&ndash;' : ' - ', '&mdash;' : ' - ', '&rdquo;' : '"', '&ldquo;' : '"', '&rsquo;' : '\'', '&lsquo;' : '\'', '&quot;' : '"' }
+entities = { '&ndash;' : ' - ', '&mdash;' : ' - ', '&rdquo;' : '"', '&ldquo;' : '"', '&rsquo;' : '\'', '&lsquo;' : '\'', '&quot;' : '"', '&hellip;' : '...' }
 
 FB2_PROLOGUE = '<FictionBook>'
 FB2_DESCRIPTION = '''<description>
diff --git a/downaloder.py b/downaloder.py
index 34b369db..fa9d1466 100644
--- a/downaloder.py
+++ b/downaloder.py
@@ -17,6 +17,7 @@ import ffnet
 import ficwad
 import output
 import fictionalley
+import hpfiction
 
 class FanficLoader:
 	'''A controller class which handles the interaction between various specific downloaders and writers'''
@@ -66,8 +67,10 @@ if __name__ == '__main__':
 		sys.exit(0)
 	elif url.find('ficwad') != -1:
 		adapter = ficwad.FicWad(url)
-	elif url.find('fanfiction.net') != -1:
+	elif url.find('fanfiction.net') != -1 or url.find('fictionpress.com') != -1:
 		adapter = ffnet.FFNet(url)
+	elif url.find('harrypotterfanfiction.com') != -1:
+		adapter = hpfiction.HPFiction(url)
 	else:
 		print >> sys.stderr, "Oi! I can haz not appropriate adapter for URL %s!" % url
 		sys.exit(1)
diff --git a/ffnet.py b/ffnet.py
index 4af36792..ddb7e53b 100644
--- a/ffnet.py
+++ b/ffnet.py
@@ -77,11 +77,17 @@ class FFNet(FanfictionSiteAdapter):
 	
 	def extractIndividualUrls(self):
 		data = self._fetchUrl(self.url)
+		d2 = re.sub('&\#[0-9]+;', ' ', data)
+		soup = bs.BeautifulStoneSoup(d2)
+		allA = soup.findAll('a')
+		for a in allA:
+			if 'href' in a._getAttrMap() and a['href'].find('/u/') != -1:
+				self.authorName = a.string
 
 		urls = []
 		lines = data.split('\n')
 		for l in lines:
-			if l.find("<img src='http://c.fanfiction.net/static/ficons/script.png' width=16 height=16  border=0  align=absmiddle>") != -1:
+			if l.find("&#187;") != -1 and l.find('<b>') != -1:
 				s2 = bs.BeautifulStoneSoup(l)
 				self.storyName = s2.find('b').string
 			elif l.find("<a href='/u/") != -1:
@@ -95,7 +101,7 @@ class FFNet(FanfictionSiteAdapter):
 				s2 = bs.BeautifulSoup(u)
 				options = s2.findAll('option')
 				for o in options:
-					url = 'http://fanfiction.net/s/' + self.storyId + '/' + o['value']
+					url = 'http://' + self.host + '/s/' + self.storyId + '/' + o['value']
 					title = o.string
 					logging.debug('URL = `%s`, Title = `%s`' % (url, title))
 					urls.append((url,title))
@@ -153,7 +159,16 @@ class FFA_UnitTests(unittest.TestCase):
 		text = f.getText(url)
 		
 		urls = f.extractIndividualUrls()
-		
 	
+	def testFictionPress(self):
+		url = 'http://www.fictionpress.com/s/2725180/1/Behind_This_Facade'
+		f = FFNet(url)
+		urls = f.extractIndividualUrls()
+		
+		self.assertEquals('Behind This Facade', f.getStoryName())
+		self.assertEquals('IntoxicatingMelody', f.getAuthorName())
+	
+		text = f.getText(url)
+		self.assertTrue(text.find('Kale Resgerald at your service" He answered, "So, can we go now? Or do you want to') != -1)
 if __name__ == '__main__':
 	unittest.main()
\ No newline at end of file
diff --git a/output.py b/output.py
index 3042441d..138c268e 100644
--- a/output.py
+++ b/output.py
@@ -164,7 +164,7 @@ class EPubFanficWriter(FanficWriter):
 			if p.string != None and (len(p.string.strip()) == 0 or p.string.strip() == '&nbsp;' ) :
 				p.extract()
 				
-		allBrs = self.soup.findAll(recursive=True, name = ["br", "hr"])
+		allBrs = self.soup.findAll(recursive=True, name = ["br", "hr", 'div'])
 		for br in allBrs:
 			if (br.string != None and len(br.string.strip()) != 0) or (br.contents != None):
 				br.name = 'p'

From ed9e2992c00afafb4f88461bbf93a9ec1c5cfec1 Mon Sep 17 00:00:00 2001
From: sigizmund <sigizmund@gmail.com>
Date: Fri, 18 Dec 2009 18:57:53 +0000
Subject: [PATCH 23/94] hpfiction added - not yet working

---
 hpfiction.py | 106 +++++++++++++++++++++++++++++++++++++++++++++++++++
 1 file changed, 106 insertions(+)
 create mode 100644 hpfiction.py

diff --git a/hpfiction.py b/hpfiction.py
new file mode 100644
index 00000000..f33849a7
--- /dev/null
+++ b/hpfiction.py
@@ -0,0 +1,106 @@
+# -*- coding: utf-8 -*-
+
+import os
+import re
+import sys
+import cgi
+import uuid
+import shutil
+import base64
+import os.path
+import logging
+import unittest
+import urllib as u
+import pprint as pp
+import urllib2 as u2
+import urlparse as up
+import BeautifulSoup as bs
+import htmlentitydefs as hdefs
+
+from constants import *
+from adapter import *
+
+try:
+	import login_password
+except:
+	# tough luck
+	pass
+
+class HPFiction(FanfictionSiteAdapter):
+	# Adapter for harrypotterfanfiction.com; all requests go through one cookie-aware opener.
+	def __init__(self, url):
+		self.url = url
+		parsedUrl = up.urlparse(url)
+		self.host = parsedUrl.netloc
+		self.path = parsedUrl.path
+		
+		self.opener = u2.build_opener(u2.HTTPCookieProcessor())
+		logging.debug("Created HPFiction: url=%s" % (self.url))
+	
+	def _getLoginScript(self):
+		return self.path
+
+	def requiresLogin(self, url = None):
+		return False
+
+	def performLogin(self, url = None):
+		return True
+	
+	def extractIndividualUrls(self):
+		# Fetches self.url, records story/author names and returns [(url, title)] per chapter option.
+		data = self.opener.open(self.url).read()
+		soup = bs.BeautifulSoup(data)
+		for a in soup.findAll('a'):
+			# Anchors without an href (e.g. <a name=...>) would raise KeyError on a['href'].
+			href = a._getAttrMap().get('href', '')
+			if href.find('psid') != -1:
+				self.storyName = a.string
+			elif href.find('viewuser.php') != -1:
+				self.authorName = a.string
+		select = soup.find('select', {'name' : 'chapterid'})
+		urls = []
+		for o in select.findAll('option'):
+			if 'value' in o._getAttrMap():
+				url = 'http://' + self.host + '/' + self.path + o['value']
+				title = o.string
+				urls.append((url,title))
+		return urls
+
+	def getStoryName(self):
+		return self.storyName
+
+	def getAuthorName(self):
+		return self.authorName
+	
+	def getText(self, url):
+		# Returns the prettified <div id="fluidtext"> of the chapter page at `url`.
+		logging.debug('Downloading from URL: %s' % url)
+		data = self.opener.open(url).read()
+		soup = bs.BeautifulSoup(data)
+		divtext = soup.find('div', {'id' : 'fluidtext'})
+		return divtext.prettify()
+
+class FF_UnitTests(unittest.TestCase):
+	def setUp(self):
+		logging.basicConfig(level=logging.DEBUG)
+		pass
+
+	def testChaptersAuthStory(self):
+		f = HPFiction('http://www.harrypotterfanfiction.com/viewstory.php?chapterid=80123')
+		urls = f.extractIndividualUrls()
+		
+		self.assertEquals(49, len(urls))
+		self.assertEquals('Elisha', f.getAuthorName())
+		self.assertEquals('A Secret Thought', f.getStoryName())
+	
+	def testGetText(self):
+		url = 'http://www.harrypotterfanfiction.com/viewstory.php?chapterid=80123'
+		f = HPFiction(url)
+		#urls = f.extractIndividualUrls()
+		text = f.getText(url)
+		self.assertTrue(text.find('She pulled out of his arms and felt the subtle regret') != -1)
+
+if __name__ == '__main__':
+	unittest.main()
+
+	
\ No newline at end of file

From 1740e0da48e4e147583e6cf3a69ae25d49fa78eb Mon Sep 17 00:00:00 2001
From: sigizmund <sigizmund@gmail.com>
Date: Mon, 21 Dec 2009 13:12:47 +0000
Subject: [PATCH 24/94] Changes while moving to AJAX service

---
 adapter.py    |  7 +++++++
 downaloder.py | 13 ++++++++++---
 ffa.py        | 50 ++++++++++++++++++++++++++++++++++++++++++++------
 ffnet.py      |  4 ++--
 output.py     | 45 ++++++++++++++++++++++++---------------------
 zipdir.py     |  6 +++++-
 6 files changed, 92 insertions(+), 33 deletions(-)

diff --git a/adapter.py b/adapter.py
index ff1cb8ef..bf37a017 100644
--- a/adapter.py
+++ b/adapter.py
@@ -1,3 +1,10 @@
+class LoginRequiredException(Exception):
+	def __init__(self, url):
+		self.url = url
+	
+	def __str__(self):
+		return repr(self.url + ' requires user to be logged in')
+
 class FanfictionSiteAdapter:
 	login = ''
 	password = ''
diff --git a/downaloder.py b/downaloder.py
index e119f810..dee7a30d 100644
--- a/downaloder.py
+++ b/downaloder.py
@@ -12,13 +12,17 @@ import urlparse as up
 import BeautifulSoup as bs
 import htmlentitydefs as hdefs
 
+
 import ffa
 import ffnet
 import ficwad
 import output
+import adapter
 import fictionalley
 import hpfiction
 
+import time
+
 class FanficLoader:
 	'''A controller class which handles the interaction between various specific downloaders and writers'''
 	booksDirectory = "books"
@@ -30,7 +34,10 @@ class FanficLoader:
 		self.inmemory = inmemory
 		self.compress = compress
 		self.badLogin = False
-		
+	
+	def getAdapter(self):
+		return self.adapter  # accessor for the adapter this loader drives in download()
+	
 	def download(self):
 		logging.debug("Trying to download the story")
 		if self.adapter.requiresLogin():
@@ -38,7 +45,7 @@ class FanficLoader:
 			if not self.adapter.performLogin():
 				logging.debug("Login/password problem")
 				self.badLogin = True
-				return None
+				raise adapter.LoginRequiredException(self.adapter.url)
 		
 		urls = self.adapter.extractIndividualUrls()
 		self.writer = self.writerClass(self.booksDirectory, self.adapter.getStoryName(), self.adapter.getAuthorName(), inmemory=self.inmemory, compress=self.compress)
@@ -50,7 +57,7 @@ class FanficLoader:
 			i = i+1
 			text = self.adapter.getText(u)
 			self.writer.writeChapter(n, text)
-		
+			
 		self.writer.finalise()
 		
 		if self.inmemory:
diff --git a/ffa.py b/ffa.py
index b8c307ec..ca81c6d5 100644
--- a/ffa.py
+++ b/ffa.py
@@ -39,13 +39,21 @@ class FFA(FanfictionSiteAdapter):
 	def _getLoginScript(self):
 		return self.path
 
-	def requiresLogin(self, url = None):
-		resp = self.opener.open(self.url)
-		data = resp.read()
-		if data.find('<legend>Please login to continue</legend>') != -1:
+	def reqLoginData(self, data):
+		if data.find('<legend>Please login to continue</legend>') != -1 or data.find('<h4>Username or password not found.  Please') != -1 or data.find("This story is rated Mature, you must be logged in to view it") != -1:
 			return True
 		else:
 			return False
+
+	def requiresLogin(self, url = None):
+		if url == None:
+			u = self.url
+		else:
+			u = url
+
+		resp = self.opener.open(u)
+		data = resp.read()
+		return self.reqLoginData(data)
  
 	def performLogin(self, url = None):
 		if url == None:
@@ -63,7 +71,9 @@ class FFA(FanfictionSiteAdapter):
 		
 		req = self.opener.open(loginUrl, urlvals)
 		
-		if self.requiresLogin():
+		d = req.read()
+
+		if self.reqLoginData(d) :
 			return False
 		else:
 			return True
@@ -72,7 +82,16 @@ class FFA(FanfictionSiteAdapter):
 		data = self.opener.open(self.url).read()
 		soup = bs.BeautifulStoneSoup(data)
 
-		self.author = soup.find('a', {'href' : '/contact/'}).string
+		if self.reqLoginData(data):
+			logging.debug('Data requires login, trying to login')
+			if not self.performLogin(url):
+				logging.error('Cannot login, raising exception ... ')
+				raise LoginRequiredException(url)
+			else:
+				data = self.opener.open(url).read()
+			
+
+		self.author = str(soup.find('a', {'href' : '/contact/'}).string)
 		self.storyName = str(soup.find('h1', {'class' : 'textCenter'}).contents[0]).strip()
 		
 		logging.debug("Story `%s` by `%s`" % (self.storyName, self.author))
@@ -97,6 +116,14 @@ class FFA(FanfictionSiteAdapter):
 		logging.info('Downloading: %s' % url)
 		data = self.opener.open(url).read()
 		
+		if self.reqLoginData(data):
+			logging.debug('Data requires login, trying to login')
+			if not self.performLogin(url):
+				logging.error('Cannot login, raising exception ... ')
+				raise LoginRequiredException(url)
+			else:
+				data = self.opener.open(url).read()
+		
 		lines = data.split('\n')
 		
 		emit = False
@@ -192,6 +219,17 @@ class FFA_UnitTests(unittest.TestCase):
 		data = f.getText(url)
 		seek = 'So Hokage-sama” I said, “this is how we came'
 		self.assertTrue(data.find(seek) != -1)
+	
+	def testSemiLoginRequired(self):
+		f = FFA('http://viridian.fanficauthors.net/Harry_Potter_and_the_Nightmares_of_Futures_Past/The_End_of_Days/')
+		
+		urls = f.extractIndividualUrls()
+		
+		try:
+			data = f.getText('http://viridian.fanficauthors.net/Harry_Potter_and_the_Nightmares_of_Futures_Past/Doing_the_Mungo_Shuffle/')
+			self.assertTrue(False)
+		except LoginRequiredException, e:
+			self.assertTrue(True)
 		
 if __name__ == '__main__':
 	unittest.main()
\ No newline at end of file
diff --git a/ffnet.py b/ffnet.py
index ada03a25..852c6097 100644
--- a/ffnet.py
+++ b/ffnet.py
@@ -92,10 +92,10 @@ class FFNet(FanfictionSiteAdapter):
 		for l in lines:
 			if l.find("&#187;") != -1 and l.find('<b>') != -1:
 				s2 = bs.BeautifulStoneSoup(l)
-				self.storyName = s2.find('b').string
+				self.storyName = str(s2.find('b').string)
 			elif l.find("<a href='/u/") != -1:
 				s2 = bs.BeautifulStoneSoup(l)
-				self.authorName = s2.a.string
+				self.authorName = str(s2.a.string)
 			elif l.find("<SELECT title='chapter navigation'") != -1:
 				if len(urls) > 0:
 					continue
diff --git a/output.py b/output.py
index 36961468..aeea8cda 100644
--- a/output.py
+++ b/output.py
@@ -13,6 +13,7 @@ import os.path
 import zipfile
 import StringIO
 import logging
+import hashlib
 import urllib as u
 import pprint as pp
 import urllib2 as u2
@@ -84,14 +85,20 @@ class EPubFanficWriter(FanficWriter):
 	files = {}
 	
 	def _writeFile(self, fileName, data):
+		logging.debug('_writeFile(`%s`, data)' % fileName)
 		if fileName in self.files:
-			self.files[fileName].write(data.decode('utf-8'))
+			try:
+				d = data.decode('utf-8')
+			except UnicodeEncodeError, e:
+				d = data
+			
+			self.files[fileName].write(d)
 		else:
 			if self.inmemory:
 				self.files[fileName] = StringIO.StringIO()
 			else:
 				self.files[fileName] = open(self.directory + '/' + fileName, 'w')
-
+			
 			self._writeFile(fileName, data)
 		
 		
@@ -127,10 +134,6 @@ class EPubFanficWriter(FanficWriter):
 			os.mkdir(self.directory + '/META-INF')
 			os.mkdir(self.directory + '/OEBPS')
 		
-#		print >> codecs.open(self.directory + '/mimetype', 'w', 'utf-8'), MIMETYPE
-#		print >> codecs.open(self.directory + '/META-INF/container.xml', 'w', 'utf-8'), CONTAINER
-#		print >> codecs.open(self.directory + '/OEBPS/stylesheet.css', 'w', 'utf-8'), CSS
-
 		self._writeFile('mimetype', MIMETYPE)
 		self._writeFile('META-INF/container.xml', CONTAINER)
 		self._writeFile('OEBPS/stylesheet.css', CSS)
@@ -145,7 +148,15 @@ class EPubFanficWriter(FanficWriter):
 		return text
 	
 	def writeChapter(self, title, text):
-		fileName = base64.b64encode(title).replace('/', '_') + ".xhtml"
+		logging.debug("Writing chapter: %s" % title)
+		try:
+			fileName = base64.b64encode(title).replace('/', '_') + ".xhtml"
+		except UnicodeEncodeError, e:
+			fileName = base64.b64encode(title.encode('utf-8')).replace('/', '_') + ".xhtml"
+#		title = cgi.esca#title.decode('utf-8')
+#		sha = hashlib.sha224(title)
+#		fileName = sha.hexdigest() + ".xhtml"
+		#fileName = cgi.escape(title) + '.xhtml'
 		filePath = self.directory + "/OEBPS/" + fileName
 		
 		fn = 'OEBPS/' + fileName
@@ -154,7 +165,7 @@ class EPubFanficWriter(FanficWriter):
 		
 		text = self._removeEntities(text)
 		
-		self.soup = bs.BeautifulStoneSoup(text)
+		self.soup = bs.BeautifulStoneSoup(text.decode('utf-8'))
 
 		allTags = self.soup.findAll(recursive=True)
 		for t in allTags:
@@ -206,10 +217,12 @@ class EPubFanficWriter(FanficWriter):
 		
 		i = 0
 		for t,f in self.chapters:
-			chapterId = base64.b64encode(t)
-#			print >> toc, TOC_ITEM % (chapterId, i, cgi.escape(t), f)
+			try:
+				chapterId = base64.b64encode(t)
+			except UnicodeEncodeError, e:
+				chapterId = base64.b64encode(t.encode('utf-8'))
+			
 			self._writeFile(tocFilePath, TOC_ITEM % (chapterId, i, cgi.escape(t), f))
-#			print >> opf, CONTENT_ITEM % (chapterId, f)
 			self._writeFile(opfFilePath, CONTENT_ITEM % (chapterId, f))
 			
 			ids.append(chapterId)
@@ -218,24 +231,14 @@ class EPubFanficWriter(FanficWriter):
 			
 #		logging.d('Toc and refs printed, proceesing to ref-ids....')
 		
-#		print >> toc, TOC_END
-#		print >> opf, CONTENT_END_MANIFEST		
-
 		self._writeFile(tocFilePath, TOC_END)
 		self._writeFile(opfFilePath, CONTENT_END_MANIFEST)
 		
 		for chapterId in ids:
-#			print >> opf, CONTENT_ITEMREF % chapterId
 			self._writeFile(opfFilePath, CONTENT_ITEMREF % chapterId)
 		
-#		print >> opf, CONTENT_END
 		self._writeFile(opfFilePath, CONTENT_END)
 		
-#		opf.close()
-#		toc.close()
-		
-#		print('Finished')
-		
 		self._closeFiles()
 		
 		filename = self.directory + '.epub'
diff --git a/zipdir.py b/zipdir.py
index 0da2691d..a0a568e6 100644
--- a/zipdir.py
+++ b/zipdir.py
@@ -50,7 +50,11 @@ def inMemoryZip(files):
 			data = files[path]
 		
 #		logging.debug(data)
-		memzip.writestr(path, data.encode('utf-8'))
+		logging.debug("Writing ZIP path %s" % path)
+		try:
+			memzip.writestr(path, data.encode('utf-8'))
+		except UnicodeDecodeError, e:
+			memzip.writestr(path.encode('utf-8'), data.encode('utf-8'))
 	
 	for zf in memzip.filelist:
 		zf.create_system = 0

From 48d561de1af562f092b70628b79bd7c9cfbc8079 Mon Sep 17 00:00:00 2001
From: sigizmund <sigizmund@gmail.com>
Date: Mon, 21 Dec 2009 13:40:11 +0000
Subject: [PATCH 25/94] Fixed multiline ff.net

---
 ffnet.py | 18 ++++++++++++++++--
 1 file changed, 16 insertions(+), 2 deletions(-)

diff --git a/ffnet.py b/ffnet.py
index 852c6097..0816bf81 100644
--- a/ffnet.py
+++ b/ffnet.py
@@ -114,10 +114,24 @@ class FFNet(FanfictionSiteAdapter):
 	def getText(self, url):
 		data = self._fetchUrl(url)
 		lines = data.split('\n')
+		
+		textbuf = ''
+		emit = False
+		
 		for l in lines:
 			if l.find('<!-- start story -->') != -1:
-				s2 = bs.BeautifulStoneSoup(l)
-				return s2.div.prettify()
+				#s2 = bs.BeautifulStoneSoup(l)
+				#return s2.div.prettify()
+				emit = True
+			
+			if emit:
+				textbuf = textbuf + "\n" + l
+			
+			if l.find('<!-- end story -->') != -1:
+				emit = False
+		
+		s2 = bs.BeautifulStoneSoup(textbuf)
+		return s2.div.prettify()
 		
 		
 	def setLogin(self, login):

From 2b2e7d52ec2e88ab97742d17bf1e6857fa994827 Mon Sep 17 00:00:00 2001
From: sigizmund <sigizmund@gmail.com>
Date: Sat, 17 Jul 2010 14:44:14 +0100
Subject: [PATCH 26/94] Starting to use source control again after a long break
 :-)

---
 BeautifulSoup.py | 747 +++++++++++++++++++++++++++++++++--------------
 constants.py     |   3 +-
 ffnet.py         |  47 ++-
 ficwad.py        |   6 +-
 html2text.py     | 450 ++++++++++++++++++++++++++++
 output.py        |  30 +-
 twilighted.py    | 134 +++++++++
 7 files changed, 1173 insertions(+), 244 deletions(-)
 create mode 100644 html2text.py
 create mode 100644 twilighted.py

diff --git a/BeautifulSoup.py b/BeautifulSoup.py
index 458f08a1..748e6fe4 100644
--- a/BeautifulSoup.py
+++ b/BeautifulSoup.py
@@ -1,7 +1,6 @@
 """Beautiful Soup
 Elixir and Tonic
 "The Screen-Scraper's Friend"
-v3.0.0
 http://www.crummy.com/software/BeautifulSoup/
 
 Beautiful Soup parses a (possibly invalid) XML or HTML document into a
@@ -25,7 +24,7 @@ if you also install these three packages:
   http://cjkpython.i18n.org/
 
 Beautiful Soup defines classes for two main parsing strategies:
-    
+
  * BeautifulStoneSoup, for parsing XML, SGML, or your domain-specific
    language that kind of looks like XML.
 
@@ -41,36 +40,83 @@ For more than you ever wanted to know about Beautiful Soup, see the
 documentation:
 http://www.crummy.com/software/BeautifulSoup/documentation.html
 
+Here, have some legalese:
+
+Copyright (c) 2004-2010, Leonard Richardson
+
+All rights reserved.
+
+Redistribution and use in source and binary forms, with or without
+modification, are permitted provided that the following conditions are
+met:
+
+  * Redistributions of source code must retain the above copyright
+    notice, this list of conditions and the following disclaimer.
+
+  * Redistributions in binary form must reproduce the above
+    copyright notice, this list of conditions and the following
+    disclaimer in the documentation and/or other materials provided
+    with the distribution.
+
+  * Neither the name of the the Beautiful Soup Consortium and All
+    Night Kosher Bakery nor the names of its contributors may be
+    used to endorse or promote products derived from this software
+    without specific prior written permission.
+
+THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
+"AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
+LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
+A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
+CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
+EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
+PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
+PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
+LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
+NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
+SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE, DAMMIT.
+
 """
 from __future__ import generators
 
 __author__ = "Leonard Richardson (leonardr@segfault.org)"
-__version__ = "3.0.0"
-__date__ = "$Date: 2004/10/18 00:14:20 $"
-__copyright__ = "Copyright (c) 2004-2005 Leonard Richardson"
-__license__ = "PSF"
+__version__ = "3.0.8.1"
+__copyright__ = "Copyright (c) 2004-2010 Leonard Richardson"
+__license__ = "New-style BSD"
 
 from sgmllib import SGMLParser, SGMLParseError
 import codecs
+import markupbase
 import types
 import re
 import sgmllib
-from htmlentitydefs import name2codepoint
+try:
+  from htmlentitydefs import name2codepoint
+except ImportError:
+  name2codepoint = {}
+try:
+    set
+except NameError:
+    from sets import Set as set
 
-#This code makes Beautiful Soup able to parse XML with namespaces
+#These hacks make Beautiful Soup able to parse XML with namespaces
 sgmllib.tagfind = re.compile('[a-zA-Z][-_.:a-zA-Z0-9]*')
+markupbase._declname_match = re.compile(r'[a-zA-Z][-_.:a-zA-Z0-9]*\s*').match
 
 DEFAULT_OUTPUT_ENCODING = "utf-8"
 
+def _match_css_class(str):
+    """Build a RE to match the given CSS class."""
+    return re.compile(r"(^|.*\s)%s($|\s)" % str)
+
 # First, the classes that represent markup elements.
 
-class PageElement:
+class PageElement(object):
     """Contains the navigational information for some part of the page
     (either a tag or a piece of text)"""
 
     def setup(self, parent=None, previous=None):
         """Sets up the initial relations between this element and
-        other elements."""        
+        other elements."""
         self.parent = parent
         self.previous = previous
         self.next = None
@@ -80,31 +126,41 @@ class PageElement:
             self.previousSibling = self.parent.contents[-1]
             self.previousSibling.nextSibling = self
 
-    def replaceWith(self, replaceWith):        
+    def replaceWith(self, replaceWith):
         oldParent = self.parent
-        myIndex = self.parent.contents.index(self)
-        if hasattr(replaceWith, 'parent') and replaceWith.parent == self.parent:
+        myIndex = self.parent.index(self)
+        if hasattr(replaceWith, "parent")\
+                  and replaceWith.parent is self.parent:
             # We're replacing this element with one of its siblings.
-            index = self.parent.contents.index(replaceWith)
+            index = replaceWith.parent.index(replaceWith)
             if index and index < myIndex:
                 # Furthermore, it comes before this element. That
                 # means that when we extract it, the index of this
                 # element will change.
                 myIndex = myIndex - 1
-        self.extract()        
+        self.extract()
         oldParent.insert(myIndex, replaceWith)
-        
+
+    def replaceWithChildren(self):
+        myParent = self.parent
+        myIndex = self.parent.index(self)
+        self.extract()
+        reversedChildren = list(self.contents)
+        reversedChildren.reverse()
+        for child in reversedChildren:
+            myParent.insert(myIndex, child)
+
     def extract(self):
-        """Destructively rips this element out of the tree."""        
+        """Destructively rips this element out of the tree."""
         if self.parent:
             try:
-                self.parent.contents.remove(self)
+                del self.parent.contents[self.parent.index(self)]
             except ValueError:
                 pass
 
         #Find the two elements that would be next to each other if
         #this element (and any children) hadn't been parsed. Connect
-        #the two.        
+        #the two.
         lastChild = self._lastRecursiveChild()
         nextElement = lastChild.next
 
@@ -115,12 +171,13 @@ class PageElement:
         self.previous = None
         lastChild.next = None
 
-        self.parent = None        
+        self.parent = None
         if self.previousSibling:
             self.previousSibling.nextSibling = self.nextSibling
         if self.nextSibling:
             self.nextSibling.previousSibling = self.previousSibling
-        self.previousSibling = self.nextSibling = None       
+        self.previousSibling = self.nextSibling = None
+        return self
 
     def _lastRecursiveChild(self):
         "Finds the last element beneath this object to be parsed."
@@ -130,25 +187,24 @@ class PageElement:
         return lastChild
 
     def insert(self, position, newChild):
-        if (isinstance(newChild, basestring)
-            or isinstance(newChild, unicode)) \
+        if isinstance(newChild, basestring) \
             and not isinstance(newChild, NavigableString):
-            newChild = NavigableString(newChild)        
+            newChild = NavigableString(newChild)
 
         position =  min(position, len(self.contents))
-        if hasattr(newChild, 'parent') and newChild.parent != None:
+        if hasattr(newChild, 'parent') and newChild.parent is not None:
             # We're 'inserting' an element that's already one
-            # of this object's children. 
-            if newChild.parent == self:
-                index = self.find(newChild)
-                if index and index < position:
+            # of this object's children.
+            if newChild.parent is self:
+                index = self.index(newChild)
+                if index > position:
                     # Furthermore we're moving it further down the
                     # list of this object's children. That means that
                     # when we extract this element, our target index
                     # will jump down one.
                     position = position - 1
             newChild.extract()
-            
+
         newChild.parent = self
         previousChild = None
         if position == 0:
@@ -160,13 +216,13 @@ class PageElement:
             newChild.previousSibling.nextSibling = newChild
             newChild.previous = previousChild._lastRecursiveChild()
         if newChild.previous:
-            newChild.previous.next = newChild        
+            newChild.previous.next = newChild
 
         newChildsLastElement = newChild._lastRecursiveChild()
 
         if position >= len(self.contents):
             newChild.nextSibling = None
-            
+
             parent = self
             parentsNextSibling = None
             while not parentsNextSibling:
@@ -179,8 +235,8 @@ class PageElement:
             else:
                 newChildsLastElement.next = None
         else:
-            nextChild = self.contents[position]            
-            newChild.nextSibling = nextChild            
+            nextChild = self.contents[position]
+            newChild.nextSibling = nextChild
             if newChild.nextSibling:
                 newChild.nextSibling.previousSibling = newChild
             newChildsLastElement.next = nextChild
@@ -189,6 +245,10 @@ class PageElement:
             newChildsLastElement.next.previous = newChildsLastElement
         self.contents.insert(position, newChild)
 
+    def append(self, tag):
+        """Appends the given tag to the contents of this tag."""
+        self.insert(len(self.contents), tag)
+
     def findNext(self, name=None, attrs={}, text=None, **kwargs):
         """Returns the first item that matches the given criteria and
         appears after this Tag in the document."""
@@ -197,8 +257,9 @@ class PageElement:
     def findAllNext(self, name=None, attrs={}, text=None, limit=None,
                     **kwargs):
         """Returns all items that match the given criteria and appear
-        before after Tag in the document."""
-        return self._findAll(name, attrs, text, limit, self.nextGenerator)
+        after this Tag in the document."""
+        return self._findAll(name, attrs, text, limit, self.nextGenerator,
+                             **kwargs)
 
     def findNextSibling(self, name=None, attrs={}, text=None, **kwargs):
         """Returns the closest sibling to this Tag that matches the
@@ -212,6 +273,7 @@ class PageElement:
         criteria and appear after this Tag in the document."""
         return self._findAll(name, attrs, text, limit,
                              self.nextSiblingGenerator, **kwargs)
+    fetchNextSiblings = findNextSiblings # Compatibility with pre-3.x
 
     def findPrevious(self, name=None, attrs={}, text=None, **kwargs):
         """Returns the first item that matches the given criteria and
@@ -224,6 +286,7 @@ class PageElement:
         before this Tag in the document."""
         return self._findAll(name, attrs, text, limit, self.previousGenerator,
                            **kwargs)
+    fetchPrevious = findAllPrevious # Compatibility with pre-3.x
 
     def findPreviousSibling(self, name=None, attrs={}, text=None, **kwargs):
         """Returns the closest sibling to this Tag that matches the
@@ -237,6 +300,7 @@ class PageElement:
         criteria and appear before this Tag in the document."""
         return self._findAll(name, attrs, text, limit,
                              self.previousSiblingGenerator, **kwargs)
+    fetchPreviousSiblings = findPreviousSiblings # Compatibility with pre-3.x
 
     def findParent(self, name=None, attrs={}, **kwargs):
         """Returns the closest parent of this Tag that matches the given
@@ -255,6 +319,7 @@ class PageElement:
 
         return self._findAll(name, attrs, None, limit, self.parentGenerator,
                              **kwargs)
+    fetchParents = findParents # Compatibility with pre-3.x
 
     #These methods do the real heavy lifting.
 
@@ -264,14 +329,27 @@ class PageElement:
         if l:
             r = l[0]
         return r
-    
+
     def _findAll(self, name, attrs, text, limit, generator, **kwargs):
         "Iterates over a generator looking for things that match."
 
         if isinstance(name, SoupStrainer):
             strainer = name
+        # (Possibly) special case some findAll*(...) searches
+        elif text is None and not limit and not attrs and not kwargs:
+            # findAll*(True)
+            if name is True:
+                return [element for element in generator()
+                        if isinstance(element, Tag)]
+            # findAll*('tag-name')
+            elif isinstance(name, basestring):
+                return [element for element in generator()
+                        if isinstance(element, Tag) and
+                        element.name == name]
+            else:
+                strainer = SoupStrainer(name, attrs, text, **kwargs)
+        # Build a SoupStrainer
         else:
-            # Build a SoupStrainer
             strainer = SoupStrainer(name, attrs, text, **kwargs)
         results = ResultSet(strainer)
         g = generator()
@@ -289,41 +367,41 @@ class PageElement:
         return results
 
     #These Generators can be used to navigate starting from both
-    #NavigableStrings and Tags.                
+    #NavigableStrings and Tags.
     def nextGenerator(self):
         i = self
-        while i:
+        while i is not None:
             i = i.next
             yield i
 
     def nextSiblingGenerator(self):
         i = self
-        while i:
+        while i is not None:
             i = i.nextSibling
             yield i
 
     def previousGenerator(self):
         i = self
-        while i:
+        while i is not None:
             i = i.previous
             yield i
 
     def previousSiblingGenerator(self):
         i = self
-        while i:
+        while i is not None:
             i = i.previousSibling
             yield i
 
     def parentGenerator(self):
         i = self
-        while i:
+        while i is not None:
             i = i.parent
             yield i
 
     # Utility methods
     def substituteEncoding(self, str, encoding=None):
         encoding = encoding or "utf-8"
-        return str.replace("%SOUP-ENCODING%", encoding)    
+        return str.replace("%SOUP-ENCODING%", encoding)
 
     def toEncoding(self, s, encoding=None):
         """Encodes an object to a string in some encoding, or to Unicode.
@@ -345,6 +423,21 @@ class PageElement:
 
 class NavigableString(unicode, PageElement):
 
+    def __new__(cls, value):
+        """Create a new NavigableString.
+
+        When unpickling a NavigableString, this method is called with
+        the string in DEFAULT_OUTPUT_ENCODING. That encoding needs to be
+        passed in to the superclass's __new__ or the superclass won't know
+        how to handle non-ASCII characters.
+        """
+        if isinstance(value, unicode):
+            return unicode.__new__(cls, value)
+        return unicode.__new__(cls, value, DEFAULT_OUTPUT_ENCODING)
+
+    def __getnewargs__(self):
+        return (NavigableString.__str__(self),)
+
     def __getattr__(self, attr):
         """text.string gives you text. This is for backwards
         compatibility for Navigable*String, but for CData* it lets you
@@ -355,14 +448,14 @@ class NavigableString(unicode, PageElement):
             raise AttributeError, "'%s' object has no attribute '%s'" % (self.__class__.__name__, attr)
 
     def __unicode__(self):
-        return __str__(self, None)
+        return str(self).decode(DEFAULT_OUTPUT_ENCODING)
 
     def __str__(self, encoding=DEFAULT_OUTPUT_ENCODING):
         if encoding:
             return self.encode(encoding)
         else:
             return self
-        
+
 class CData(NavigableString):
 
     def __str__(self, encoding=DEFAULT_OUTPUT_ENCODING):
@@ -377,16 +470,56 @@ class ProcessingInstruction(NavigableString):
 
 class Comment(NavigableString):
     def __str__(self, encoding=DEFAULT_OUTPUT_ENCODING):
-        return "<!--%s-->" % NavigableString.__str__(self, encoding)    
+        return "<!--%s-->" % NavigableString.__str__(self, encoding)
 
 class Declaration(NavigableString):
     def __str__(self, encoding=DEFAULT_OUTPUT_ENCODING):
-        return "<!%s>" % NavigableString.__str__(self, encoding)        
+        return "<!%s>" % NavigableString.__str__(self, encoding)
 
 class Tag(PageElement):
 
     """Represents a found HTML tag with its attributes and contents."""
 
+    def _invert(h):
+        "Cheap function to invert a hash."
+        i = {}
+        for k,v in h.items():
+            i[v] = k
+        return i
+
+    XML_ENTITIES_TO_SPECIAL_CHARS = { "apos" : "'",
+                                      "quot" : '"',
+                                      "amp" : "&",
+                                      "lt" : "<",
+                                      "gt" : ">" }
+
+    XML_SPECIAL_CHARS_TO_ENTITIES = _invert(XML_ENTITIES_TO_SPECIAL_CHARS)
+
+    def _convertEntities(self, match):
+        """Used in a call to re.sub to replace HTML, XML, and numeric
+        entities with the appropriate Unicode characters. If HTML
+        entities are being converted, any unrecognized entities are
+        escaped."""
+        x = match.group(1)
+        if self.convertHTMLEntities and x in name2codepoint:
+            return unichr(name2codepoint[x])
+        elif x in self.XML_ENTITIES_TO_SPECIAL_CHARS:
+            if self.convertXMLEntities:
+                return self.XML_ENTITIES_TO_SPECIAL_CHARS[x]
+            else:
+                return u'&%s;' % x
+        elif len(x) > 0 and x[0] == '#':
+            # Handle numeric entities
+            if len(x) > 1 and x[1] == 'x':
+                return unichr(int(x[2:], 16))
+            else:
+                return unichr(int(x[1:]))
+
+        elif self.escapeUnrecognizedEntities:
+            return u'&amp;%s;' % x
+        else:
+            return u'&%s;' % x
+
     def __init__(self, parser, name, attrs=None, parent=None,
                  previous=None):
         "Basic constructor."
@@ -396,19 +529,66 @@ class Tag(PageElement):
         self.parserClass = parser.__class__
         self.isSelfClosing = parser.isSelfClosingTag(name)
         self.name = name
-        if attrs == None:
+        if attrs is None:
             attrs = []
         self.attrs = attrs
         self.contents = []
         self.setup(parent, previous)
         self.hidden = False
         self.containsSubstitutions = False
+        self.convertHTMLEntities = parser.convertHTMLEntities
+        self.convertXMLEntities = parser.convertXMLEntities
+        self.escapeUnrecognizedEntities = parser.escapeUnrecognizedEntities
+
+        # Convert any HTML, XML, or numeric entities in the attribute values.
+        convert = lambda(k, val): (k,
+                                   re.sub("&(#\d+|#x[0-9a-fA-F]+|\w+);",
+                                          self._convertEntities,
+                                          val))
+        self.attrs = map(convert, self.attrs)
+
+    def getString(self):
+        if (len(self.contents) == 1
+            and isinstance(self.contents[0], NavigableString)):
+            return self.contents[0]
+
+    def setString(self, string):
+        """Replace the contents of the tag with a string"""
+        self.clear()
+        self.append(string)
+
+    string = property(getString, setString)
+
+    def getText(self, separator=u""):
+        if not len(self.contents):
+            return u""
+        stopNode = self._lastRecursiveChild().next
+        strings = []
+        current = self.contents[0]
+        while current is not stopNode:
+            if isinstance(current, NavigableString):
+                strings.append(current.strip())
+            current = current.next
+        return separator.join(strings)
+
+    text = property(getText)
 
     def get(self, key, default=None):
         """Returns the value of the 'key' attribute for the tag, or
         the value given for 'default' if it doesn't have that
         attribute."""
-        return self._getAttrMap().get(key, default)    
+        return self._getAttrMap().get(key, default)
+
+    def clear(self):
+        """Extract all children."""
+        for child in self.contents[:]:
+            child.extract()
+
+    def index(self, element):
+        for i, child in enumerate(self.contents):
+            if child is element:
+                return i
+        raise ValueError("Tag.index: element not in tag")
 
     def has_key(self, key):
         return self._getAttrMap().has_key(key)
@@ -433,7 +613,7 @@ class Tag(PageElement):
         "A tag is non-None even if it has no contents."
         return True
 
-    def __setitem__(self, key, value):        
+    def __setitem__(self, key, value):
         """Setting tag[key] sets the value of the 'key' attribute for the
         tag."""
         self._getAttrMap()
@@ -470,6 +650,7 @@ class Tag(PageElement):
             return self.find(tag[:-3])
         elif tag.find('__') != 0:
             return self.find(tag)
+        raise AttributeError, "'%s' object has no attribute '%s'" % (self.__class__, tag)
 
     def __eq__(self, other):
         """Returns true iff this tag has the same name, the same attributes,
@@ -477,6 +658,8 @@ class Tag(PageElement):
 
         NOTE: right now this will return false if two tags have the
         same attributes in a different order. Should this be fixed?"""
+        if other is self:
+            return True
         if not hasattr(other, 'name') or not hasattr(other, 'attrs') or not hasattr(other, 'contents') or self.name != other.name or self.attrs != other.attrs or len(self) != len(other):
             return False
         for i in range(0, len(self.contents)):
@@ -496,6 +679,15 @@ class Tag(PageElement):
     def __unicode__(self):
         return self.__str__(None)
 
+    BARE_AMPERSAND_OR_BRACKET = re.compile("([<>]|"
+                                           + "&(?!#\d+;|#x[0-9a-fA-F]+;|\w+;)"
+                                           + ")")
+
+    def _sub_entity(self, x):
+        """Used with a regular expression to substitute the
+        appropriate XML entity for an XML special character."""
+        return "&" + self.XML_SPECIAL_CHARS_TO_ENTITIES[x.group(0)[0]] + ";"
+
     def __str__(self, encoding=DEFAULT_OUTPUT_ENCODING,
                 prettyPrint=False, indentLevel=0):
         """Returns a string or Unicode representation of this tag and
@@ -506,20 +698,43 @@ class Tag(PageElement):
         the original string."""
 
         encodedName = self.toEncoding(self.name, encoding)
-        
+
         attrs = []
         if self.attrs:
             for key, val in self.attrs:
                 fmt = '%s="%s"'
-                if isString(val):
+                if isinstance(val, basestring):
                     if self.containsSubstitutions and '%SOUP-ENCODING%' in val:
                         val = self.substituteEncoding(val, encoding)
+
+                    # The attribute value either:
+                    #
+                    # * Contains no embedded double quotes or single quotes.
+                    #   No problem: we enclose it in double quotes.
+                    # * Contains embedded single quotes. No problem:
+                    #   double quotes work here too.
+                    # * Contains embedded double quotes. No problem:
+                    #   we enclose it in single quotes.
+                    # * Embeds both single _and_ double quotes. This
+                    #   can't happen naturally, but it can happen if
+                    #   you modify an attribute value after parsing
+                    #   the document. Now we have a bit of a
+                    #   problem. We solve it by enclosing the
+                    #   attribute in single quotes, and escaping any
+                    #   embedded single quotes to XML entities.
                     if '"' in val:
                         fmt = "%s='%s'"
-                        # This can't happen naturally, but it can happen
-                        # if you modify an attribute value and print it out.
                         if "'" in val:
+                            # TODO: replace with apos when
+                            # appropriate.
                             val = val.replace("'", "&squot;")
+
+                    # Now we're okay w/r/t quotes. But the attribute
+                    # value might also contain angle brackets, or
+                    # ampersands that aren't part of entities. We need
+                    # to escape those to XML entities too.
+                    val = self.BARE_AMPERSAND_OR_BRACKET.sub(self._sub_entity, val)
+
                 attrs.append(fmt % (self.toEncoding(key, encoding),
                                     self.toEncoding(val, encoding)))
         close = ''
@@ -541,7 +756,7 @@ class Tag(PageElement):
             s = []
             attributeString = ''
             if attrs:
-                attributeString = ' ' + ' '.join(attrs)            
+                attributeString = ' ' + ' '.join(attrs)
             if prettyPrint:
                 s.append(space)
             s.append('<%s%s%s>' % (encodedName, attributeString, close))
@@ -558,6 +773,23 @@ class Tag(PageElement):
             s = ''.join(s)
         return s
 
+    def decompose(self):
+        """Recursively destroys the contents of this tree."""
+        self.extract()
+        if len(self.contents) == 0:
+            return
+        current = self.contents[0]
+        while current is not None:
+            next = current.next
+            if isinstance(current, Tag):
+                del current.contents[:]
+            current.parent = None
+            current.previous = None
+            current.previousSibling = None
+            current.next = None
+            current.nextSibling = None
+            current = next
+
     def prettify(self, encoding=DEFAULT_OUTPUT_ENCODING):
         return self.__str__(encoding, True)
 
@@ -573,23 +805,23 @@ class Tag(PageElement):
             elif isinstance(c, Tag):
                 s.append(c.__str__(encoding, prettyPrint, indentLevel))
             if text and prettyPrint:
-                text = text.strip()              
+                text = text.strip()
             if text:
                 if prettyPrint:
                     s.append(" " * (indentLevel-1))
                 s.append(text)
                 if prettyPrint:
                     s.append("\n")
-        return ''.join(s)    
+        return ''.join(s)
 
     #Soup methods
 
     def find(self, name=None, attrs={}, recursive=True, text=None,
-              **kwargs):
-        """Return only the first child of this
-        Tag matching the given criteria."""
+             **kwargs):
+        """Return only the first child of this Tag matching the given
+        criteria."""
         r = None
-        l = self.findAll(name, attrs, recursive, text, 1)
+        l = self.findAll(name, attrs, recursive, text, 1, **kwargs)
         if l:
             r = l[0]
         return r
@@ -610,13 +842,17 @@ class Tag(PageElement):
         if not recursive:
             generator = self.childGenerator
         return self._findAll(name, attrs, text, limit, generator, **kwargs)
-    findAllChildren = findAll
-    
-    #Utility methods
+    findChildren = findAll
 
-    def append(self, tag):
-        """Appends the given tag to the contents of this tag."""
-        self.contents.append(tag)
+    # Pre-3.x compatibility methods
+    first = find
+    fetch = findAll
+
+    def fetchText(self, text=None, recursive=True, limit=None):
+        return self.findAll(text=text, recursive=recursive, limit=limit)
+
+    def firstText(self, text=None, recursive=True):
+        return self.find(text=text, recursive=recursive)
 
     #Private methods
 
@@ -626,29 +862,23 @@ class Tag(PageElement):
         if not getattr(self, 'attrMap'):
             self.attrMap = {}
             for (key, value) in self.attrs:
-                self.attrMap[key] = value 
+                self.attrMap[key] = value
         return self.attrMap
 
     #Generator methods
     def childGenerator(self):
-        for i in range(0, len(self.contents)):
-            yield self.contents[i]
-        raise StopIteration
-    
+        # Just use the iterator from the contents
+        return iter(self.contents)
+
     def recursiveChildGenerator(self):
-        stack = [(self, 0)]
-        while stack:
-            tag, start = stack.pop()
-            if isinstance(tag, Tag):            
-                for i in range(start, len(tag.contents)):
-                    a = tag.contents[i]
-                    yield a
-                    if isinstance(a, Tag) and tag.contents:
-                        if i < len(tag.contents) - 1:
-                            stack.append((tag, i+1))
-                        stack.append((a, 0))
-                        break
-        raise StopIteration
+        if not len(self.contents):
+            raise StopIteration
+        stopNode = self._lastRecursiveChild().next
+        current = self.contents[0]
+        while current is not stopNode:
+            yield current
+            current = current.next
+
 
 # Next, a couple classes to represent queries and their results.
 class SoupStrainer:
@@ -656,9 +886,17 @@ class SoupStrainer:
     text)."""
 
     def __init__(self, name=None, attrs={}, text=None, **kwargs):
-        self.name=name
-        self.attrs=attrs.copy()
-        self.attrs.update(kwargs)
+        self.name = name
+        if isinstance(attrs, basestring):
+            kwargs['class'] = _match_css_class(attrs)
+            attrs = None
+        if kwargs:
+            if attrs:
+                attrs = attrs.copy()
+                attrs.update(kwargs)
+            else:
+                attrs = kwargs
+        self.attrs = attrs
         self.text = text
 
     def __str__(self):
@@ -666,7 +904,7 @@ class SoupStrainer:
             return self.text
         else:
             return "%s|%s" % (self.name, self.attrs)
-    
+
     def searchTag(self, markupName=None, markupAttrs={}):
         found = None
         markup = None
@@ -683,7 +921,7 @@ class SoupStrainer:
             if callFunctionWithTagData:
                 match = self.name(markupName, markupAttrs)
             else:
-                match = True            
+                match = True
                 markupAttrMap = None
                 for attr, matchAgainst in self.attrs.items():
                     if not markupAttrMap:
@@ -708,8 +946,9 @@ class SoupStrainer:
         #print 'looking for %s in %s' % (self, markup)
         found = None
         # If given a list of items, scan it for a text element that
-        # matches.        
-        if isList(markup) and not isinstance(markup, Tag):
+        # matches.
+        if hasattr(markup, "__iter__") \
+                and not isinstance(markup, Tag):
             for element in markup:
                 if isinstance(element, NavigableString) \
                        and self.search(element):
@@ -722,19 +961,19 @@ class SoupStrainer:
                 found = self.searchTag(markup)
         # If it's text, make sure the text matches.
         elif isinstance(markup, NavigableString) or \
-                 isString(markup):
+                 isinstance(markup, basestring):
             if self._matches(markup, self.text):
                 found = markup
         else:
             raise Exception, "I don't know how to match against a %s" \
                   % markup.__class__
         return found
-        
-    def _matches(self, markup, matchAgainst):    
+
+    def _matches(self, markup, matchAgainst):
         #print "Matching %s against %s" % (markup, matchAgainst)
         result = False
-        if matchAgainst == True and type(matchAgainst) == types.BooleanType:
-            result = markup != None
+        if matchAgainst is True:
+            result = markup is not None
         elif callable(matchAgainst):
             result = matchAgainst(markup)
         else:
@@ -742,17 +981,17 @@ class SoupStrainer:
             #other ways of matching match the tag name as a string.
             if isinstance(markup, Tag):
                 markup = markup.name
-            if markup and not isString(markup):
+            if markup and not isinstance(markup, basestring):
                 markup = unicode(markup)
             #Now we know that chunk is either a string, or None.
             if hasattr(matchAgainst, 'match'):
                 # It's a regexp object.
                 result = markup and matchAgainst.search(markup)
-            elif isList(matchAgainst):
+            elif hasattr(matchAgainst, '__iter__'): # list-like
                 result = markup in matchAgainst
             elif hasattr(matchAgainst, 'items'):
                 result = markup.has_key(matchAgainst)
-            elif matchAgainst and isString(markup):
+            elif matchAgainst and isinstance(markup, basestring):
                 if isinstance(markup, unicode):
                     matchAgainst = unicode(matchAgainst)
                 else:
@@ -771,20 +1010,6 @@ class ResultSet(list):
 
 # Now, some helper functions.
 
-def isList(l):
-    """Convenience method that works with all 2.x versions of Python
-    to determine whether or not something is listlike."""
-    return hasattr(l, '__iter__') \
-           or (type(l) in (types.ListType, types.TupleType))
-
-def isString(s):
-    """Convenience method that works with all 2.x versions of Python
-    to determine whether or not something is stringlike."""
-    try:
-        return isinstance(s, unicode) or isintance(s, basestring) 
-    except NameError:
-        return isinstance(s, str)
-
 def buildTagMap(default, *args):
     """Turns a list of maps, lists, or scalars into a single map.
     Used to build the SELF_CLOSING_TAGS, NESTABLE_TAGS, and
@@ -795,7 +1020,7 @@ def buildTagMap(default, *args):
             #It's a map. Merge it.
             for k,v in portion.items():
                 built[k] = v
-        elif isList(portion):
+        elif hasattr(portion, '__iter__'): # is a list
             #It's a list. Map each item to the default.
             for k in portion:
                 built[k] = default
@@ -811,7 +1036,7 @@ class BeautifulStoneSoup(Tag, SGMLParser):
     """This class contains the basic parser and search code. It defines
     a parser that knows nothing about tag behavior except for the
     following:
-   
+
       You can't close a tag without closing all the tags it encloses.
       That is, "<foo><bar></foo>" actually means
       "<foo><bar></bar></foo>".
@@ -824,14 +1049,11 @@ class BeautifulStoneSoup(Tag, SGMLParser):
     or when BeautifulSoup makes an assumption counter to what you were
     expecting."""
 
-    XML_ENTITY_LIST = {}
-    for i in ["quot", "apos", "amp", "lt", "gt"]:
-        XML_ENTITY_LIST[i] = True 
-
     SELF_CLOSING_TAGS = {}
     NESTABLE_TAGS = {}
     RESET_NESTING_TAGS = {}
     QUOTE_TAGS = {}
+    PRESERVE_WHITESPACE_TAGS = []
 
     MARKUP_MASSAGE = [(re.compile('(<[^<>]*)/>'),
                        lambda x: x.group(1) + ' />'),
@@ -843,13 +1065,22 @@ class BeautifulStoneSoup(Tag, SGMLParser):
 
     HTML_ENTITIES = "html"
     XML_ENTITIES = "xml"
+    XHTML_ENTITIES = "xhtml"
+    # TODO: This only exists for backwards-compatibility
+    ALL_ENTITIES = XHTML_ENTITIES
+
+    # Used when determining whether a text node is all whitespace and
+    # can be replaced with a single space. A text node that contains
+    # fancy Unicode spaces (usually non-breaking) should be left
+    # alone.
+    STRIP_ASCII_SPACES = { 9: None, 10: None, 12: None, 13: None, 32: None, }
 
     def __init__(self, markup="", parseOnlyThese=None, fromEncoding=None,
                  markupMassage=True, smartQuotesTo=XML_ENTITIES,
-                 convertEntities=None, selfClosingTags=None):
+                 convertEntities=None, selfClosingTags=None, isHTML=False):
         """The Soup object is initialized as the 'root tag', and the
         provided markup (which can be a string or a file-like object)
-        is fed into the underlying parser. 
+        is fed into the underlying parser.
 
         sgmllib will process most bad HTML, and the BeautifulSoup
         class has some tricks for dealing with some HTML that kills
@@ -876,25 +1107,54 @@ class BeautifulStoneSoup(Tag, SGMLParser):
         self.fromEncoding = fromEncoding
         self.smartQuotesTo = smartQuotesTo
         self.convertEntities = convertEntities
+        # Set the rules for how we'll deal with the entities we
+        # encounter
         if self.convertEntities:
             # It doesn't make sense to convert encoded characters to
             # entities even while you're converting entities to Unicode.
             # Just convert it all to Unicode.
             self.smartQuotesTo = None
+            if convertEntities == self.HTML_ENTITIES:
+                self.convertXMLEntities = False
+                self.convertHTMLEntities = True
+                self.escapeUnrecognizedEntities = True
+            elif convertEntities == self.XHTML_ENTITIES:
+                self.convertXMLEntities = True
+                self.convertHTMLEntities = True
+                self.escapeUnrecognizedEntities = False
+            elif convertEntities == self.XML_ENTITIES:
+                self.convertXMLEntities = True
+                self.convertHTMLEntities = False
+                self.escapeUnrecognizedEntities = False
+        else:
+            self.convertXMLEntities = False
+            self.convertHTMLEntities = False
+            self.escapeUnrecognizedEntities = False
+
         self.instanceSelfClosingTags = buildTagMap(None, selfClosingTags)
         SGMLParser.__init__(self)
-            
+
         if hasattr(markup, 'read'):        # It's a file-type object.
             markup = markup.read()
         self.markup = markup
         self.markupMassage = markupMassage
         try:
-            self._feed()
+            self._feed(isHTML=isHTML)
         except StopParsing:
             pass
         self.markup = None                 # The markup can now be GCed
-        
-    def _feed(self, inDocumentEncoding=None):
+
+    def convert_charref(self, name):
+        """Convert a decimal charref, ASCII (0-127) only; fixes an SGMLParser bug."""
+        try:
+            n = int(name)
+        except ValueError:
+            return
+        if not 0 <= n <= 127 : # ASCII ends at 127, not 255
+            return
+        return self.convert_codepoint(n)
+
+    def _feed(self, inDocumentEncoding=None, isHTML=False):
         # Convert the document to Unicode.
         markup = self.markup
         if isinstance(markup, unicode):
@@ -903,15 +1163,22 @@ class BeautifulStoneSoup(Tag, SGMLParser):
         else:
             dammit = UnicodeDammit\
                      (markup, [self.fromEncoding, inDocumentEncoding],
-                      smartQuotesTo=self.smartQuotesTo)
+                      smartQuotesTo=self.smartQuotesTo, isHTML=isHTML)
             markup = dammit.unicode
             self.originalEncoding = dammit.originalEncoding
+            self.declaredHTMLEncoding = dammit.declaredHTMLEncoding
         if markup:
             if self.markupMassage:
-                if not isList(self.markupMassage):
-                    self.markupMassage = self.MARKUP_MASSAGE            
+                if not hasattr(self.markupMassage, "__iter__"):
+                    self.markupMassage = self.MARKUP_MASSAGE
                 for fix, m in self.markupMassage:
                     markup = fix.sub(m, markup)
+                # TODO: We get rid of markupMassage so that the
+                # soup object can be deepcopied later on. Some
+                # Python installations can't copy regexes. If anyone
+                # was relying on the existence of markupMassage, this
+                # might cause problems.
+                del(self.markupMassage)
         self.reset()
 
         SGMLParser.feed(self, markup)
@@ -925,10 +1192,10 @@ class BeautifulStoneSoup(Tag, SGMLParser):
         superclass or the Tag superclass, depending on the method name."""
         #print "__getattr__ called on %s.%s" % (self.__class__, methodName)
 
-        if methodName.find('start_') == 0 or methodName.find('end_') == 0 \
-               or methodName.find('do_') == 0:
+        if methodName.startswith('start_') or methodName.startswith('end_') \
+               or methodName.startswith('do_'):
             return SGMLParser.__getattr__(self, methodName)
-        elif methodName.find('__') != 0:
+        elif not methodName.startswith('__'):
             return Tag.__getattr__(self, methodName)
         else:
             raise AttributeError
@@ -938,7 +1205,7 @@ class BeautifulStoneSoup(Tag, SGMLParser):
         self-closing tag according to this parser."""
         return self.SELF_CLOSING_TAGS.has_key(name) \
                or self.instanceSelfClosingTags.has_key(name)
-            
+
     def reset(self):
         Tag.__init__(self, self, self.ROOT_TAG_NAME)
         self.hidden = 1
@@ -948,15 +1215,9 @@ class BeautifulStoneSoup(Tag, SGMLParser):
         self.tagStack = []
         self.quoteStack = []
         self.pushTag(self)
-    
+
     def popTag(self):
         tag = self.tagStack.pop()
-        # Tags with just one string-owning child get the child as a
-        # 'string' property, so that soup.tag.string is shorthand for
-        # soup.tag.contents[0]
-        if len(self.currentTag.contents) == 1 and \
-           isinstance(self.currentTag.contents[0], NavigableString):
-            self.currentTag.string = self.currentTag.contents[0]
 
         #print "Pop", tag.name
         if self.tagStack:
@@ -966,14 +1227,16 @@ class BeautifulStoneSoup(Tag, SGMLParser):
     def pushTag(self, tag):
         #print "Push", tag.name
         if self.currentTag:
-            self.currentTag.append(tag)
+            self.currentTag.contents.append(tag)
         self.tagStack.append(tag)
         self.currentTag = self.tagStack[-1]
 
     def endData(self, containerClass=NavigableString):
         if self.currentData:
-            currentData = ''.join(self.currentData)
-            if not currentData.strip():
+            currentData = u''.join(self.currentData)
+            if (currentData.translate(self.STRIP_ASCII_SPACES) == '' and
+                not set([tag.name for tag in self.tagStack]).intersection(
+                    self.PRESERVE_WHITESPACE_TAGS)):
                 if '\n' in currentData:
                     currentData = '\n'
                 else:
@@ -998,7 +1261,7 @@ class BeautifulStoneSoup(Tag, SGMLParser):
         the given tag."""
         #print "Popping to %s" % name
         if name == self.ROOT_TAG_NAME:
-            return            
+            return
 
         numPops = 0
         mostRecentTag = None
@@ -1011,7 +1274,7 @@ class BeautifulStoneSoup(Tag, SGMLParser):
 
         for i in range(0, numPops):
             mostRecentTag = self.popTag()
-        return mostRecentTag    
+        return mostRecentTag
 
     def _smartPop(self, name):
 
@@ -1022,10 +1285,9 @@ class BeautifulStoneSoup(Tag, SGMLParser):
         comes between this tag and the previous tag of this type.
 
         Examples:
-         <p>Foo<b>Bar<p> should pop to 'p', not 'b'.
-         <p>Foo<table>Bar<p> should pop to 'table', not 'p'.
-         <p>Foo<table><tr>Bar<p> should pop to 'tr', not 'p'.
-         <p>Foo<b>Bar<p> should pop to 'p', not 'b'.
+         <p>Foo<b>Bar *<p>* should pop to 'p', not 'b'.
+         <p>Foo<table>Bar *<p>* should pop to 'table', not 'p'.
+         <p>Foo<table><tr>Bar *<p>* should pop to 'tr', not 'p'.
 
          <li><ul><li> *<li>* should pop to 'ul', not the first 'li'.
          <tr><table><tr> *<tr>* should pop to 'table', not the first 'tr'
@@ -1044,11 +1306,11 @@ class BeautifulStoneSoup(Tag, SGMLParser):
                 #last occurance.
                 popTo = name
                 break
-            if (nestingResetTriggers != None
+            if (nestingResetTriggers is not None
                 and p.name in nestingResetTriggers) \
-                or (nestingResetTriggers == None and isResetNesting
+                or (nestingResetTriggers is None and isResetNesting
                     and self.RESET_NESTING_TAGS.has_key(p.name)):
-                
+
                 #If we encounter one of the nesting reset triggers
                 #peculiar to this tag, or we encounter another tag
                 #that causes nesting to reset, pop up to but not
@@ -1061,13 +1323,13 @@ class BeautifulStoneSoup(Tag, SGMLParser):
             self._popToTag(popTo, inclusive)
 
     def unknown_starttag(self, name, attrs, selfClosing=0):
-        #print "Start tag %s" % name
+        #print "Start tag %s: %s" % (name, attrs)
         if self.quoteStack:
             #This is not a real tag.
             #print "<%s> is not real!" % name
-            attrs = ''.join(map(lambda(x, y): ' %s="%s"' % (x, y), attrs))
+            attrs = ''.join([' %s="%s"' % (x, y) for x, y in attrs])
             self.handle_data('<%s%s>' % (name, attrs))
-            return        
+            return
         self.endData()
 
         if not self.isSelfClosingTag(name) and not selfClosing:
@@ -1083,7 +1345,7 @@ class BeautifulStoneSoup(Tag, SGMLParser):
         self.previous = tag
         self.pushTag(tag)
         if selfClosing or self.isSelfClosingTag(name):
-            self.popTag()                
+            self.popTag()
         if name in self.QUOTE_TAGS:
             #print "Beginning quote (%s)" % name
             self.quoteStack.append(name)
@@ -1118,7 +1380,7 @@ class BeautifulStoneSoup(Tag, SGMLParser):
         object, possibly one with a %SOUP-ENCODING% slot into which an
         encoding will be plugged later."""
         if text[:3] == "xml":
-            text = "xml version='1.0' encoding='%SOUP-ENCODING%'"
+            text = u"xml version='1.0' encoding='%SOUP-ENCODING%'"
         self._toStringSubclass(text, ProcessingInstruction)
 
     def handle_comment(self, text):
@@ -1127,8 +1389,7 @@ class BeautifulStoneSoup(Tag, SGMLParser):
 
     def handle_charref(self, ref):
         "Handle character references as data."
-        if self.convertEntities in [self.HTML_ENTITIES,
-                                    self.XML_ENTITIES]:
+        if self.convertEntities:
             data = unichr(int(ref))
         else:
             data = '&#%s;' % ref
@@ -1136,20 +1397,47 @@ class BeautifulStoneSoup(Tag, SGMLParser):
 
     def handle_entityref(self, ref):
         """Handle entity references as data, possibly converting known
-        HTML entity references to the corresponding Unicode
+        HTML and/or XML entity references to the corresponding Unicode
         characters."""
         data = None
-        if self.convertEntities == self.HTML_ENTITIES or \
-               (self.convertEntities == self.XML_ENTITIES and \
-                self.XML_ENTITY_LIST.get(ref)):
+        if self.convertHTMLEntities:
             try:
                 data = unichr(name2codepoint[ref])
             except KeyError:
                 pass
+
+        if not data and self.convertXMLEntities:
+                data = self.XML_ENTITIES_TO_SPECIAL_CHARS.get(ref)
+
+        if not data and self.convertHTMLEntities and \
+            not self.XML_ENTITIES_TO_SPECIAL_CHARS.get(ref):
+                # TODO: We've got a problem here. We're told this is
+                # an entity reference, but it's not an XML entity
+                # reference or an HTML entity reference. Nonetheless,
+                # the logical thing to do is to pass it through as an
+                # unrecognized entity reference.
+                #
+                # Except: when the input is "&carol;" this function
+                # will be called with input "carol". When the input is
+                # "AT&T", this function will be called with input
+                # "T". We have no way of knowing whether a semicolon
+                # was present originally, so we don't know whether
+                # this is an unknown entity or just a misplaced
+                # ampersand.
+                #
+                # The more common case is a misplaced ampersand, so I
+                # escape the ampersand and omit the trailing semicolon.
+                data = "&amp;%s" % ref
         if not data:
-            data = '&%s;' % ref
+            # This case is different from the one above, because we
+            # haven't already gone through a supposedly comprehensive
+            # mapping of entities to Unicode characters. We might not
+            # have gone through any mapping at all. So the chances are
+            # very high that this is a real entity, and not a
+            # misplaced ampersand.
+            data = "&%s;" % ref
         self.handle_data(data)
-        
+
     def handle_decl(self, data):
         "Handle DOCTYPEs and the like as Declaration objects."
         self._toStringSubclass(data, Declaration)
@@ -1225,26 +1513,29 @@ class BeautifulSoup(BeautifulStoneSoup):
     def __init__(self, *args, **kwargs):
         if not kwargs.has_key('smartQuotesTo'):
             kwargs['smartQuotesTo'] = self.HTML_ENTITIES
+        kwargs['isHTML'] = True
         BeautifulStoneSoup.__init__(self, *args, **kwargs)
 
     SELF_CLOSING_TAGS = buildTagMap(None,
-                                    ['br' , 'hr', 'input', 'img', 'meta',
-                                    'spacer', 'link', 'frame', 'base'])
+                                    ('br' , 'hr', 'input', 'img', 'meta',
+                                    'spacer', 'link', 'frame', 'base', 'col'))
+
+    PRESERVE_WHITESPACE_TAGS = set(['pre', 'textarea'])
+
+    QUOTE_TAGS = {'script' : None, 'textarea' : None}
 
-    QUOTE_TAGS = {'script': None}
-    
     #According to the HTML standard, each of these inline tags can
     #contain another tag of the same type. Furthermore, it's common
     #to actually use these tags this way.
-    NESTABLE_INLINE_TAGS = ['span', 'font', 'q', 'object', 'bdo', 'sub', 'sup',
-                            'center']
+    NESTABLE_INLINE_TAGS = ('span', 'font', 'q', 'object', 'bdo', 'sub', 'sup',
+                            'center')
 
     #According to the HTML standard, these block tags can contain
     #another tag of the same type. Furthermore, it's common
     #to actually use these tags this way.
-    NESTABLE_BLOCK_TAGS = ['blockquote', 'div', 'fieldset', 'ins', 'del']
+    NESTABLE_BLOCK_TAGS = ('blockquote', 'div', 'fieldset', 'ins', 'del')
 
-    #Lists can contain other lists, but there are restrictions.    
+    #Lists can contain other lists, but there are restrictions.
     NESTABLE_LIST_TAGS = { 'ol' : [],
                            'ul' : [],
                            'li' : ['ul', 'ol'],
@@ -1252,8 +1543,8 @@ class BeautifulSoup(BeautifulStoneSoup):
                            'dd' : ['dl'],
                            'dt' : ['dl'] }
 
-    #Tables can contain other tables, but there are restrictions.    
-    NESTABLE_TABLE_TAGS = {'table' : [], 
+    #Tables can contain other tables, but there are restrictions.
+    NESTABLE_TABLE_TAGS = {'table' : [],
                            'tr' : ['table', 'tbody', 'tfoot', 'thead'],
                            'td' : ['tr'],
                            'th' : ['tr'],
@@ -1262,7 +1553,7 @@ class BeautifulSoup(BeautifulStoneSoup):
                            'tfoot' : ['table'],
                            }
 
-    NON_NESTABLE_BLOCK_TAGS = ['address', 'form', 'p', 'pre']
+    NON_NESTABLE_BLOCK_TAGS = ('address', 'form', 'p', 'pre')
 
     #If one of these tags is encountered, all tags up to the next tag of
     #this type are popped.
@@ -1275,7 +1566,7 @@ class BeautifulSoup(BeautifulStoneSoup):
                                 NESTABLE_LIST_TAGS, NESTABLE_TABLE_TAGS)
 
     # Used to detect the charset in a META tag; see start_meta
-    CHARSET_RE = re.compile("((^|;)\s*charset=)([^;]*)")
+    CHARSET_RE = re.compile("((^|;)\s*charset=)([^;]*)", re.M)
 
     def start_meta(self, attrs):
         """Beautiful Soup can detect a charset included in a META tag,
@@ -1298,32 +1589,35 @@ class BeautifulSoup(BeautifulStoneSoup):
         if httpEquiv and contentType: # It's an interesting meta tag.
             match = self.CHARSET_RE.search(contentType)
             if match:
-                if getattr(self, 'declaredHTMLEncoding') or \
-                       (self.originalEncoding == self.fromEncoding):
-                    # This is our second pass through the document, or
-                    # else an encoding was specified explicitly and it
-                    # worked. Rewrite the meta tag.
-                    newAttr = self.CHARSET_RE.sub\
-                              (lambda(match):match.group(1) +
-                               "%SOUP-ENCODING%", value)
+                if (self.declaredHTMLEncoding is not None or
+                    self.originalEncoding == self.fromEncoding):
+                    # An HTML encoding was sniffed while converting
+                    # the document to Unicode, or an HTML encoding was
+                    # sniffed during a previous pass through the
+                    # document, or an encoding was specified
+                    # explicitly and it worked. Rewrite the meta tag.
+                    def rewrite(match):
+                        return match.group(1) + "%SOUP-ENCODING%"
+                    newAttr = self.CHARSET_RE.sub(rewrite, contentType)
                     attrs[contentTypeIndex] = (attrs[contentTypeIndex][0],
                                                newAttr)
                     tagNeedsEncodingSubstitution = True
                 else:
                     # This is our first pass through the document.
-                    # Go through it again with the new information.
+                    # Go through it again with the encoding information.
                     newCharset = match.group(3)
                     if newCharset and newCharset != self.originalEncoding:
                         self.declaredHTMLEncoding = newCharset
                         self._feed(self.declaredHTMLEncoding)
                         raise StopParsing
+                    pass
         tag = self.unknown_starttag("meta", attrs)
-        if tagNeedsEncodingSubstitution:
+        if tag and tagNeedsEncodingSubstitution:
             tag.containsSubstitutions = True
 
 class StopParsing(Exception):
     pass
-   
+
 class ICantBelieveItsBeautifulSoup(BeautifulSoup):
 
     """The BeautifulSoup class is oriented towards skipping over
@@ -1350,11 +1644,11 @@ class ICantBelieveItsBeautifulSoup(BeautifulSoup):
     wouldn't be."""
 
     I_CANT_BELIEVE_THEYRE_NESTABLE_INLINE_TAGS = \
-     ['em', 'big', 'i', 'small', 'tt', 'abbr', 'acronym', 'strong',
+     ('em', 'big', 'i', 'small', 'tt', 'abbr', 'acronym', 'strong',
       'cite', 'code', 'dfn', 'kbd', 'samp', 'strong', 'var', 'b',
-      'big']
+      'big')
 
-    I_CANT_BELIEVE_THEYRE_NESTABLE_BLOCK_TAGS = ['noscript']
+    I_CANT_BELIEVE_THEYRE_NESTABLE_BLOCK_TAGS = ('noscript',)
 
     NESTABLE_TAGS = buildTagMap([], BeautifulSoup.NESTABLE_TAGS,
                                 I_CANT_BELIEVE_THEYRE_NESTABLE_BLOCK_TAGS,
@@ -1369,7 +1663,7 @@ class MinimalSoup(BeautifulSoup):
 
     This also makes it better for subclassing than BeautifulStoneSoup
     or BeautifulSoup."""
-    
+
     RESET_NESTING_TAGS = buildTagMap('noscript')
     NESTABLE_TAGS = {}
 
@@ -1399,7 +1693,7 @@ class BeautifulSOAP(BeautifulStoneSoup):
             parent = self.tagStack[-2]
             parent._getAttrMap()
             if (isinstance(tag, Tag) and len(tag.contents) == 1 and
-                isinstance(tag.contents[0], NavigableString) and 
+                isinstance(tag.contents[0], NavigableString) and
                 not parent.attrMap.has_key(tag.name)):
                 parent[tag.name] = tag.contents[0]
         BeautifulStoneSoup.popTag(self)
@@ -1409,7 +1703,7 @@ class BeautifulSOAP(BeautifulStoneSoup):
 #and "unprofessional" for use in enterprise screen-scraping. We feel
 #your pain! For such-minded folk, the Beautiful Soup Consortium And
 #All-Night Kosher Bakery recommends renaming this file to
-#"RobustParser.py" (or, in cases of extreme enterprisitude,
+#"RobustParser.py" (or, in cases of extreme enterprisiness,
 #"RobustParserBeanInterface.class") and using the following
 #enterprise-friendly class aliases:
 class RobustXMLParser(BeautifulStoneSoup):
@@ -1439,20 +1733,19 @@ try:
     import chardet
 #    import chardet.constants
 #    chardet.constants._debug = 1
-except:
+except ImportError:
     chardet = None
-chardet = None
 
 # cjkcodecs and iconv_codec make Python know about more character encodings.
 # Both are available from http://cjkpython.i18n.org/
 # They're built in if you use Python 2.4.
 try:
     import cjkcodecs.aliases
-except:
+except ImportError:
     pass
 try:
     import iconv_codec
-except:
+except ImportError:
     pass
 
 class UnicodeDammit:
@@ -1467,15 +1760,18 @@ class UnicodeDammit:
     # by the heuristics in find_codec.
     CHARSET_ALIASES = { "macintosh" : "mac-roman",
                         "x-sjis" : "shift-jis" }
-    
+
     def __init__(self, markup, overrideEncodings=[],
-                 smartQuotesTo='xml'):
+                 smartQuotesTo='xml', isHTML=False):
+        self.declaredHTMLEncoding = None
         self.markup, documentEncoding, sniffedEncoding = \
-                     self._detectEncoding(markup)
+                     self._detectEncoding(markup, isHTML)
         self.smartQuotesTo = smartQuotesTo
         self.triedEncodings = []
-        if isinstance(markup, unicode):
-            return markup
+        if markup == '' or isinstance(markup, unicode):
+            self.originalEncoding = None
+            self.unicode = unicode(markup)
+            return
 
         u = None
         for proposedEncoding in overrideEncodings:
@@ -1485,7 +1781,7 @@ class UnicodeDammit:
             for proposedEncoding in (documentEncoding, sniffedEncoding):
                 u = self._convertFrom(proposedEncoding)
                 if u: break
-                
+
         # If no luck and we have auto-detection library, try that:
         if not u and chardet and not isinstance(self.markup, unicode):
             u = self._convertFrom(chardet.detect(self.markup)['encoding'])
@@ -1495,6 +1791,7 @@ class UnicodeDammit:
             for proposed_encoding in ("utf-8", "windows-1252"):
                 u = self._convertFrom(proposed_encoding)
                 if u: break
+
         self.unicode = u
         if not u: self.originalEncoding = None
 
@@ -1502,14 +1799,14 @@ class UnicodeDammit:
         """Changes a MS smart quote character to an XML or HTML
         entity."""
         sub = self.MS_CHARS.get(orig)
-        if type(sub) == types.TupleType:
+        if isinstance(sub, tuple):
             if self.smartQuotesTo == 'xml':
                 sub = '&#x%s;' % sub[1]
             else:
                 sub = '&%s;' % sub[0]
-        return sub            
+        return sub
 
-    def _convertFrom(self, proposed):        
+    def _convertFrom(self, proposed):
         proposed = self.find_codec(proposed)
         if not proposed or proposed in self.triedEncodings:
             return None
@@ -1518,9 +1815,9 @@ class UnicodeDammit:
 
         # Convert smart quotes to HTML if coming from an encoding
         # that might have them.
-        if self.smartQuotesTo and proposed in("windows-1252",
-                                              "ISO-8859-1",
-                                              "ISO-8859-2"):
+        if self.smartQuotesTo and proposed.lower() in("windows-1252",
+                                                      "iso-8859-1",
+                                                      "iso-8859-2"):
             markup = re.compile("([\x80-\x9f])").sub \
                      (lambda(x): self._subMSChar(x.group(1)),
                       markup)
@@ -1528,12 +1825,12 @@ class UnicodeDammit:
         try:
             # print "Trying to convert document to %s" % proposed
             u = self._toUnicode(markup, proposed)
-            self.markup = u       
+            self.markup = u
             self.originalEncoding = proposed
         except Exception, e:
             # print "That didn't work!"
             # print e
-            return None        
+            return None
         #print "Correct encoding: %s" % proposed
         return self.markup
 
@@ -1561,8 +1858,8 @@ class UnicodeDammit:
             data = data[4:]
         newdata = unicode(data, encoding)
         return newdata
-    
-    def _detectEncoding(self, xml_data):
+
+    def _detectEncoding(self, xml_data, isHTML=False):
         """Given a document, tries to detect its XML encoding."""
         xml_encoding = sniffed_xml_encoding = None
         try:
@@ -1610,13 +1907,17 @@ class UnicodeDammit:
             else:
                 sniffed_xml_encoding = 'ascii'
                 pass
-            xml_encoding_match = re.compile \
-                                 ('^<\?.*encoding=[\'"](.*?)[\'"].*\?>')\
-                                 .match(xml_data)
         except:
             xml_encoding_match = None
-        if xml_encoding_match:
+        xml_encoding_match = re.compile(
+            '^<\?.*encoding=[\'"](.*?)[\'"].*\?>').match(xml_data)
+        if not xml_encoding_match and isHTML:
+            regexp = re.compile('<\s*meta[^>]+charset=([^>]*?)[;\'">]', re.I)
+            xml_encoding_match = regexp.search(xml_data)
+        if xml_encoding_match is not None:
             xml_encoding = xml_encoding_match.groups()[0].lower()
+            if isHTML:
+                self.declaredHTMLEncoding = xml_encoding
             if sniffed_xml_encoding and \
                (xml_encoding in ('iso-10646-ucs-2', 'ucs-2', 'csunicode',
                                  'iso-10646-ucs-4', 'ucs-4', 'csucs4',
@@ -1633,12 +1934,12 @@ class UnicodeDammit:
                or charset
 
     def _codec(self, charset):
-        if not charset: return charset 
+        if not charset: return charset
         codec = None
         try:
             codecs.lookup(charset)
             codec = charset
-        except LookupError:
+        except (LookupError, ValueError):
             pass
         return codec
 
@@ -1707,5 +2008,5 @@ class UnicodeDammit:
 #By default, act as an HTML pretty-printer.
 if __name__ == '__main__':
     import sys
-    soup = BeautifulStoneSoup(sys.stdin.read())
+    soup = BeautifulSoup(sys.stdin)
     print soup.prettify()
diff --git a/constants.py b/constants.py
index 6af00eb6..a8691435 100644
--- a/constants.py
+++ b/constants.py
@@ -36,7 +36,8 @@ CONTENT_START = '''<?xml version="1.0"?>
    <dc:title>%s</dc:title> 
    <dc:creator opf:role="aut">%s</dc:creator>
    <dc:language>en-UK</dc:language> 
-   <dc:rights></dc:rights> 
+   <dc:rights></dc:rights>
+   <dc:subject>fanfiction</dc:subject> 
    <dc:publisher>sgzmd</dc:publisher> 
    <dc:identifier id="BookId">urn:uuid:sigizmund.com062820072147132</dc:identifier>
  </metadata>
diff --git a/ffnet.py b/ffnet.py
index 0816bf81..d576ce64 100644
--- a/ffnet.py
+++ b/ffnet.py
@@ -118,20 +118,39 @@ class FFNet(FanfictionSiteAdapter):
 		textbuf = ''
 		emit = False
 		
-		for l in lines:
-			if l.find('<!-- start story -->') != -1:
-				#s2 = bs.BeautifulStoneSoup(l)
-				#return s2.div.prettify()
-				emit = True
-			
-			if emit:
-				textbuf = textbuf + "\n" + l
-			
-			if l.find('<!-- end story -->') != -1:
-				emit = False
+		olddata = data
+		try:
+			data = data.decode('utf8')
+		except:
+			data = olddata
 		
-		s2 = bs.BeautifulStoneSoup(textbuf)
-		return s2.div.prettify()
+		try:
+			soup = bs.BeautifulStoneSoup(data)
+		except Exception:
+			logging.info("Failed to decode: <%s>" % data)
+			# No parse tree to search (soup.find on None would raise): use the fallback.
+			return '<html/>'
+		div = soup.find('div', {'id' : 'storytext'})
+		if div is None:
+			return '<html/>'
+		return div.prettify()
+		
+		# 
+		# for l in lines:
+		# 	if l.find("<div id=storytextp class=storytextp") != -1 or l.find('<!-- start story -->') != -1 or l.find('<div id="storytextp"') != -1:
+		# 		logging.debug("starting at line: %s" % l)
+		# 		#s2 = bs.BeautifulStoneSoup(l)
+		# 		#return s2.div.prettify()
+		# 		emit = True
+		# 	
+		# 	if emit:
+		# 		textbuf = textbuf + "\n" + l
+		# 	
+		# 	if l.find("</div><div style='height:10px'></div> ") != -1 or l.find('<!-- end story -->') != -1:
+		# 		emit = False
+		# 
+		# s2 = bs.BeautifulStoneSoup(textbuf)
+		# return s2.div.prettify()
 		
 		
 	def setLogin(self, login):
@@ -162,7 +181,7 @@ class FFA_UnitTests(unittest.TestCase):
 		f = FFNet('http://www.fanfiction.net/s/5257563/1')
 		urls = f.extractIndividualUrls()
 		
-		self.assertEquals(8, len(urls))
+		self.assertEquals(10, len(urls))
 	
 	def testGetText(self):
 		url = 'http://www.fanfiction.net/s/5257563/1'
diff --git a/ficwad.py b/ficwad.py
index 35b3b76e..26be350f 100644
--- a/ficwad.py
+++ b/ficwad.py
@@ -17,10 +17,10 @@ class FicWad(FanfictionSiteAdapter):
 		self.url = url
 		self.host = up.urlparse(url).netloc
 	
-	def requiresLogin(self, url):
+	def requiresLogin(self, url = None):
 		return False
 	
-	def performLogin(self, url):
+	def performLogin(self, url = None):
 		pass
 		
 	def setLogin(self, login):
@@ -37,7 +37,7 @@ class FicWad(FanfictionSiteAdapter):
 		self.storyName = title.split('::')[0].strip()
 		
 		author = soup.find('span', {'class' : 'author'})
-		self.authorName = author.a.string
+		self.authorName = str(author.a.string)
 		
 		print('Story "%s" by %s' % (self.storyName, self.authorName))
 		
diff --git a/html2text.py b/html2text.py
new file mode 100644
index 00000000..5d61b9a4
--- /dev/null
+++ b/html2text.py
@@ -0,0 +1,450 @@
+#!/usr/bin/env python
+"""html2text: Turn HTML into equivalent Markdown-structured text."""
+__version__ = "2.37"
+__author__ = "Aaron Swartz (me@aaronsw.com)"
+__copyright__ = "(C) 2004-2008 Aaron Swartz. GNU GPL 3."
+__contributors__ = ["Martin 'Joey' Schulze", "Ricardo Reyes", "Kevin Jay North"]
+
+# TODO:
+#   Support decoded entities with unifiable.
+
+if not hasattr(__builtins__, 'True'): True, False = 1, 0
+import re, sys, urllib, htmlentitydefs, codecs, StringIO, types
+import sgmllib
+import urlparse
+sgmllib.charref = re.compile('&#([xX]?[0-9a-fA-F]+)[^0-9a-fA-F]')
+
+try: from textwrap import wrap
+except: pass
+
+# Use Unicode characters instead of their ASCII pseudo-replacements
+UNICODE_SNOB = 0
+
+# Put the links after each paragraph instead of at the end.
+LINKS_EACH_PARAGRAPH = 0
+
+# Wrap long lines at position. 0 for no wrapping. (Requires Python 2.3.)
+BODY_WIDTH = 78
+
+# Don't show internal links (href="#local-anchor") -- corresponding link targets
+# won't be visible in the plain text file anyway.
+SKIP_INTERNAL_LINKS = False
+
+### Entity Nonsense ###
+
+def name2cp(k):
+    if k == 'apos': return ord("'")
+    if hasattr(htmlentitydefs, "name2codepoint"): # requires Python 2.3
+        return htmlentitydefs.name2codepoint[k]
+    else:
+        k = htmlentitydefs.entitydefs[k]
+        if k.startswith("&#") and k.endswith(";"): return int(k[2:-1]) # not in latin-1
+        return ord(codecs.latin_1_decode(k)[0])
+
+unifiable = {'rsquo':"'", 'lsquo':"'", 'rdquo':'"', 'ldquo':'"', 
+'copy':'(C)', 'mdash':'--', 'nbsp':' ', 'rarr':'->', 'larr':'<-', 'middot':'*',
+'ndash':'-', 'oelig':'oe', 'aelig':'ae',
+'agrave':'a', 'aacute':'a', 'acirc':'a', 'atilde':'a', 'auml':'a', 'aring':'a', 
+'egrave':'e', 'eacute':'e', 'ecirc':'e', 'euml':'e', 
+'igrave':'i', 'iacute':'i', 'icirc':'i', 'iuml':'i',
+'ograve':'o', 'oacute':'o', 'ocirc':'o', 'otilde':'o', 'ouml':'o', 
+'ugrave':'u', 'uacute':'u', 'ucirc':'u', 'uuml':'u'}
+
+unifiable_n = {}
+
+for k in unifiable.keys():
+    unifiable_n[name2cp(k)] = unifiable[k]
+
+def charref(name):
+    if name[0] in ['x','X']:
+        c = int(name[1:], 16)
+    else:
+        c = int(name)
+    
+    if not UNICODE_SNOB and c in unifiable_n.keys():
+        return unifiable_n[c]
+    else:
+        return unichr(c)
+
+def entityref(c):
+    if not UNICODE_SNOB and c in unifiable.keys():
+        return unifiable[c]
+    else:
+        try: name2cp(c)
+        except KeyError: return "&" + c
+        else: return unichr(name2cp(c))
+
+def replaceEntities(s):
+    s = s.group(1)
+    if s[0] == "#": 
+        return charref(s[1:])
+    else: return entityref(s)
+
+r_unescape = re.compile(r"&(#?[xX]?(?:[0-9a-fA-F]+|\w{1,8}));")
+def unescape(s):
+    return r_unescape.sub(replaceEntities, s)
+    
+def fixattrs(attrs):
+    # Fix bug in sgmllib.py
+    if not attrs: return attrs
+    newattrs = []
+    for attr in attrs:
+        newattrs.append((attr[0], unescape(attr[1])))
+    return newattrs
+
+### End Entity Nonsense ###
+
+def onlywhite(line):
+    """Return true if the line does only consist of whitespace characters."""
+    for c in line:
+        if c is not ' ' and c is not '  ':
+            return c is ' '
+    return line
+
+def optwrap(text):
+    """Wrap all paragraphs in the provided text."""
+    if not BODY_WIDTH:
+        return text
+    
+    assert wrap, "Requires Python 2.3."
+    result = ''
+    newlines = 0
+    for para in text.split("\n"):
+        if len(para) > 0:
+            if para[0] is not ' ' and para[0] is not '-' and para[0] is not '*':
+                for line in wrap(para, BODY_WIDTH):
+                    result += line + "\n"
+                result += "\n"
+                newlines = 2
+            else:
+                if not onlywhite(para):
+                    result += para + "\n"
+                    newlines = 1
+        else:
+            if newlines < 2:
+                result += "\n"
+                newlines += 1
+    return result
+
+def hn(tag):
+    if tag[0] == 'h' and len(tag) == 2:
+        try:
+            n = int(tag[1])
+            if n in range(1, 10): return n
+        except ValueError: return 0
+
+class _html2text(sgmllib.SGMLParser):
+    def __init__(self, out=None, baseurl=''):
+        sgmllib.SGMLParser.__init__(self)
+        
+        if out is None: self.out = self.outtextf
+        else: self.out = out
+        self.outtext = u''
+        self.quiet = 0
+        self.p_p = 0
+        self.outcount = 0
+        self.start = 1
+        self.space = 0
+        self.a = []
+        self.astack = []
+        self.acount = 0
+        self.list = []
+        self.blockquote = 0
+        self.pre = 0
+        self.startpre = 0
+        self.lastWasNL = 0
+        self.abbr_title = None # current abbreviation definition
+        self.abbr_data = None # last inner HTML (for abbr being defined)
+        self.abbr_list = {} # stack of abbreviations to write later
+        self.baseurl = baseurl
+    
+    def outtextf(self, s): 
+        self.outtext += s
+    
+    def close(self):
+        sgmllib.SGMLParser.close(self)
+        
+        self.pbr()
+        self.o('', 0, 'end')
+        
+        return self.outtext
+        
+    def handle_charref(self, c):
+        self.o(charref(c))
+
+    def handle_entityref(self, c):
+        self.o(entityref(c))
+            
+    def unknown_starttag(self, tag, attrs):
+        self.handle_tag(tag, attrs, 1)
+    
+    def unknown_endtag(self, tag):
+        self.handle_tag(tag, None, 0)
+        
+    def previousIndex(self, attrs):
+        """ returns the index of certain set of attributes (of a link) in the
+            self.a list
+ 
+            If the set of attributes is not found, returns None
+        """
+        if not attrs.has_key('href'): return None
+        
+        i = -1
+        for a in self.a:
+            i += 1
+            match = 0
+            
+            if a.has_key('href') and a['href'] == attrs['href']:
+                if a.has_key('title') or attrs.has_key('title'):
+                        if (a.has_key('title') and attrs.has_key('title') and
+                            a['title'] == attrs['title']):
+                            match = True
+                else:
+                    match = True
+
+            if match: return i
+
+    def handle_tag(self, tag, attrs, start):
+        attrs = fixattrs(attrs)
+    
+        if hn(tag):
+            self.p()
+            if start: self.o(hn(tag)*"#" + ' ')
+
+        if tag in ['p', 'div']: self.p()
+        
+        if tag == "br" and start: self.o("  \n")
+
+        if tag == "hr" and start:
+            self.p()
+            self.o("* * *")
+            self.p()
+
+        if tag in ["head", "style", 'script']: 
+            if start: self.quiet += 1
+            else: self.quiet -= 1
+
+        if tag in ["body"]:
+            self.quiet = 0 # sites like 9rules.com never close <head>
+        
+        if tag == "blockquote":
+            if start: 
+                self.p(); self.o('> ', 0, 1); self.start = 1
+                self.blockquote += 1
+            else:
+                self.blockquote -= 1
+                self.p()
+        
+        if tag in ['em', 'i', 'u']: self.o("_")
+        if tag in ['strong', 'b']: self.o("**")
+        if tag == "code" and not self.pre: self.o('`') #TODO: `` `this` ``
+        if tag == "abbr":
+            if start:
+                attrsD = {}
+                for (x, y) in attrs: attrsD[x] = y
+                attrs = attrsD
+                
+                self.abbr_title = None
+                self.abbr_data = ''
+                if attrs.has_key('title'):
+                    self.abbr_title = attrs['title']
+            else:
+                if self.abbr_title != None:
+                    self.abbr_list[self.abbr_data] = self.abbr_title
+                    self.abbr_title = None
+                self.abbr_data = ''
+        
+        if tag == "a":
+            if start:
+                attrsD = {}
+                for (x, y) in attrs: attrsD[x] = y
+                attrs = attrsD
+                if attrs.has_key('href') and not (SKIP_INTERNAL_LINKS and attrs['href'].startswith('#')): 
+                    self.astack.append(attrs)
+                    self.o("[")
+                else:
+                    self.astack.append(None)
+            else:
+                if self.astack:
+                    a = self.astack.pop()
+                    if a:
+                        i = self.previousIndex(a)
+                        if i is not None:
+                            a = self.a[i]
+                        else:
+                            self.acount += 1
+                            a['count'] = self.acount
+                            a['outcount'] = self.outcount
+                            self.a.append(a)
+                        self.o("][" + `a['count']` + "]")
+        
+        if tag == "img" and start:
+            attrsD = {}
+            for (x, y) in attrs: attrsD[x] = y
+            attrs = attrsD
+            if attrs.has_key('src'):
+                attrs['href'] = attrs['src']
+                alt = attrs.get('alt', '')
+                i = self.previousIndex(attrs)
+                if i is not None:
+                    attrs = self.a[i]
+                else:
+                    self.acount += 1
+                    attrs['count'] = self.acount
+                    attrs['outcount'] = self.outcount
+                    self.a.append(attrs)
+                self.o("![")
+                self.o(alt)
+                self.o("]["+`attrs['count']`+"]")
+        
+        if tag == 'dl' and start: self.p()
+        if tag == 'dt' and not start: self.pbr()
+        if tag == 'dd' and start: self.o('    ')
+        if tag == 'dd' and not start: self.pbr()
+        
+        if tag in ["ol", "ul"]:
+            if start:
+                self.list.append({'name':tag, 'num':0})
+            else:
+                if self.list: self.list.pop()
+            
+            self.p()
+        
+        if tag == 'li':
+            if start:
+                self.pbr()
+                if self.list: li = self.list[-1]
+                else: li = {'name':'ul', 'num':0}
+                self.o("  "*len(self.list)) #TODO: line up <ol><li>s > 9 correctly.
+                if li['name'] == "ul": self.o("* ")
+                elif li['name'] == "ol":
+                    li['num'] += 1
+                    self.o(`li['num']`+". ")
+                self.start = 1
+            else:
+                self.pbr()
+        
+        if tag in ["table", "tr"] and start: self.p()
+        if tag == 'td': self.pbr()
+        
+        if tag == "pre":
+            if start:
+                self.startpre = 1
+                self.pre = 1
+            else:
+                self.pre = 0
+            self.p()
+            
+    def pbr(self):
+        if self.p_p == 0: self.p_p = 1
+
+    def p(self): self.p_p = 2
+    
+    def o(self, data, puredata=0, force=0):
+        if self.abbr_data is not None: self.abbr_data += data
+        
+        if not self.quiet: 
+            if puredata and not self.pre:
+                data = re.sub('\s+', ' ', data)
+                if data and data[0] == ' ':
+                    self.space = 1
+                    data = data[1:]
+            if not data and not force: return
+            
+            if self.startpre:
+                #self.out(" :") #TODO: not output when already one there
+                self.startpre = 0
+            
+            bq = (">" * self.blockquote)
+            if not (force and data and data[0] == ">") and self.blockquote: bq += " "
+            
+            if self.pre:
+                bq += "    "
+                data = data.replace("\n", "\n"+bq)
+            
+            if self.start:
+                self.space = 0
+                self.p_p = 0
+                self.start = 0
+
+            if force == 'end':
+                # It's the end.
+                self.p_p = 0
+                self.out("\n")
+                self.space = 0
+
+
+            if self.p_p:
+                self.out(('\n'+bq)*self.p_p)
+                self.space = 0
+                
+            if self.space:
+                if not self.lastWasNL: self.out(' ')
+                self.space = 0
+
+            if self.a and ((self.p_p == 2 and LINKS_EACH_PARAGRAPH) or force == "end"):
+                if force == "end": self.out("\n")
+
+                newa = []
+                for link in self.a:
+                    if self.outcount > link['outcount']:
+                        self.out("   ["+`link['count']`+"]: " + urlparse.urljoin(self.baseurl, link['href'])) 
+                        if link.has_key('title'): self.out(" ("+link['title']+")")
+                        self.out("\n")
+                    else:
+                        newa.append(link)
+
+                if self.a != newa: self.out("\n") # Don't need an extra line when nothing was done.
+
+                self.a = newa
+            
+            if self.abbr_list and force == "end":
+                for abbr, definition in self.abbr_list.items():
+                    self.out("  *[" + abbr + "]: " + definition + "\n")
+
+            self.p_p = 0
+            self.out(data)
+            self.lastWasNL = data and data[-1] == '\n'
+            self.outcount += 1
+
+    def handle_data(self, data):
+        if r'\/script>' in data: self.quiet -= 1
+        self.o(data, 1)
+    
+    def unknown_decl(self, data): pass
+
+def wrapwrite(text): sys.stdout.write(text.encode('utf8'))
+
+def html2text_file(html, out=wrapwrite, baseurl=''):
+    h = _html2text(out, baseurl)
+    h.feed(html)
+    h.feed("")
+    return h.close()
+
+def html2text(html, baseurl=''):
+    return optwrap(html2text_file(html, None, baseurl))
+
+if __name__ == "__main__":
+    baseurl = ''
+    if sys.argv[1:]:
+        arg = sys.argv[1]
+        if arg.startswith('http://'):
+            baseurl = arg
+            j = urllib.urlopen(baseurl)
+            try:
+                from feedparser import _getCharacterEncoding as enc
+            except ImportError:
+                   enc = lambda x, y: ('utf-8', 1)
+            text = j.read()
+            encoding = enc(j.headers, text)[0]
+            if encoding == 'us-ascii': encoding = 'utf-8'
+            data = text.decode(encoding)
+
+        else:
+            encoding = 'utf8'
+            if len(sys.argv) > 2:
+                encoding = sys.argv[2]
+            data = open(arg, 'r').read().decode(encoding)
+    else:
+        data = sys.stdin.read().decode('utf8')
+    wrapwrite(html2text(data, baseurl))
diff --git a/output.py b/output.py
index aeea8cda..79870c08 100644
--- a/output.py
+++ b/output.py
@@ -25,6 +25,7 @@ import zipdir
 import html_constants
 from constants import *
 
+import html2text
 
 
 class FanficWriter:
@@ -37,6 +38,22 @@ class FanficWriter:
 	def finalise(self):
 		pass
 
+class TextWriter(FanficWriter):
+	htmlWriter = None
+	
+	def __init__(self, base, name, author, inmemory=False, compress=False):
+		self.htmlWriter = HTMLWriter(base, name, author, True, False)
+	
+	def writeChapter(self, title, text):
+		self.htmlWriter.writeChapter(title, text)
+	
+	def finalise(self):
+		self.htmlWriter.finalise()
+		self.output = StringIO.StringIO()
+		self.output.write(html2text.html2text(self.htmlWriter.output.getvalue().decode('utf-8')).encode('utf-8'))
+		self.name = self.htmlWriter.name
+		
+
 class HTMLWriter(FanficWriter):
 	body = ''
 	
@@ -59,10 +76,17 @@ class HTMLWriter(FanficWriter):
 		
 		self.xhtmlTemplate = string.Template(html_constants.XHTML_START)
 		self.chapterStartTemplate = string.Template(html_constants.XHTML_CHAPTER_START)
-		
+	
+	def _printableVersion(self, text):
+		try:
+			d = text.decode('utf-8')
+			return d
+		except:
+			return text
+	
 	def writeChapter(self, title, text):
-		title = title.decode('utf-8')
-		text = text.decode('utf-8')
+		title = self._printableVersion(title) #title.decode('utf-8')
+		text = self._printableVersion(text) #text.decode('utf-8')
 		self.body = self.body + '\n' + self.chapterStartTemplate.substitute({'chapter' : title})
 		self.body = self.body + '\n' + text
 	
diff --git a/twilighted.py b/twilighted.py
new file mode 100644
index 00000000..54ff35d9
--- /dev/null
+++ b/twilighted.py
@@ -0,0 +1,134 @@
+import os
+import re
+import sys
+import shutil
+import os.path
+import urllib as u
+import logging
+import pprint as pp
+import unittest
+import urllib2 as u2
+import urlparse as up
+import BeautifulSoup as bs
+import htmlentitydefs as hdefs
+
+from adapter import *
+import twipassword
+
+class Twilighted(FanfictionSiteAdapter):
+  def __init__(self, url):
+    self.url = url
+    parsedUrl = up.urlparse(url)
+    self.host = parsedUrl.netloc
+    self.path = parsedUrl.path
+    self.opener = u2.build_opener(u2.HTTPCookieProcessor())
+    self.password=twipassword.password
+    self.login='sigizmund'
+    logging.debug("Created Twilighted: url=%s" % (self.url))
+
+
+  def requiresLogin(self, url = None):
+    return True
+
+  def performLogin(self, url = None):
+    data = {}
+
+    data['penname'] = self.login
+    data['password'] = self.password
+    data['cookiecheck'] = '1'
+    data['submit'] = 'Submit'
+
+    urlvals = u.urlencode(data)
+    loginUrl = 'http://' + self.host + self._getLoginScript()
+    logging.debug("Will now login to URL %s" % loginUrl)
+
+    req = self.opener.open(loginUrl, urlvals)
+
+    d = req.read().decode('utf-8')
+
+    if self.reqLoginData(d) :
+      return False
+    else:
+      return True
+
+
+  def setLogin(self, login):
+    self.login = login
+
+  def setPassword(self, password):
+    self.password = password
+
+  def extractIndividualUrls(self):
+    data = self.opener.open(self.url).read()
+    
+    if self.reqLoginData(data):
+      self.performLogin()
+      data = self.opener.open(self.url).read()
+      if self.reqLoginData(data):
+        return None
+    
+    soup = bs.BeautifulStoneSoup(data)
+
+    title = soup.find('title').string
+    self.storyName = title.split(' by ')[0].strip()
+    self.authorName = title.split(' by ')[1].strip()
+
+    select = soup.find('select', { 'name' : 'chapter' } )
+
+    allOptions = select.findAll('option')
+    result = []
+    for o in allOptions:
+      url = self.url + "&chapter=%s" % o['value']
+      title = o.string
+      result.append((url,title))
+
+    return result
+
+  def getStoryName(self):
+    return self.storyName
+
+  def getAuthorName(self):
+    return self.authorName
+
+  def getText(self, url):
+    if url.find('http://') == -1:
+      url = 'http://' + self.host + '/' + url
+
+    logging.debug('Getting data from: %s' % url)
+
+    data = self.opener.open(url).read()
+    
+    soup = bs.BeautifulStoneSoup(data, convertEntities=bs.BeautifulStoneSoup.HTML_ENTITIES)
+
+    div = soup.find('div', {'id' : 'story'})
+
+    if None == div:
+      return '<html/>'
+
+    return div.prettify()
+
+  def _getLoginScript(self):
+    return '/user.php?action=login'
+
+  def reqLoginData(self, data):
+    if data.find('Registered Users Only. Please click OK to login or register.') != -1 or data.find('There is no such account on our website') != -1:
+      return True
+    else:
+      return False
+
+
+class Twilighted_UnitTests(unittest.TestCase):
+  def setUp(self):
+    logging.basicConfig(level=logging.DEBUG)
+    pass
+  
+  def testLoginWorks(self):
+    url = 'http://www.twilighted.net/viewstory.php?sid=10004'
+    self.assertTrue(Twilighted(url).performLogin())
+  
+  def testGetUrlsWorks(self):
+    url = 'http://www.twilighted.net/viewstory.php?sid=10004'
+    self.assertEquals(32, len(Twilighted(url).extractIndividualUrls()))
+
+if __name__ == '__main__':
+  unittest.main()
\ No newline at end of file

From b22d961e738602ff217371fc56fb5bf70d22dd74 Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Fri, 24 Sep 2010 23:36:05 -0500
Subject: [PATCH 27/94] Allow one-shot fics for ffnet. Write epub files as mode
 'b' binary so it works on Windows. Allow hr tags in epub output. Don't
 compress file mimetype in epub file--required by standard.

---
 books/place holder.txt |  0
 ffnet.py               |  6 ++++--
 output.py              | 12 +++++++-----
 zipdir.py              | 15 ++++++++++++---
 4 files changed, 23 insertions(+), 10 deletions(-)
 create mode 100644 books/place holder.txt

diff --git a/books/place holder.txt b/books/place holder.txt
new file mode 100644
index 00000000..e69de29b
diff --git a/ffnet.py b/ffnet.py
index d576ce64..fb1ff29e 100644
--- a/ffnet.py
+++ b/ffnet.py
@@ -40,7 +40,7 @@ class FFNet(FanfictionSiteAdapter):
 		self.path = parsedUrl.path
 		
 		self.storyName = 'FF.Net story'
-		self.storyName = 'FF.Net author'
+		self.authorName = 'FF.Net author'
 		
 		spl = self.path.split('/')
 		if len(spl) == 5:
@@ -108,7 +108,9 @@ class FFNet(FanfictionSiteAdapter):
 					title = o.string
 					logging.debug('URL = `%s`, Title = `%s`' % (url, title))
 					urls.append((url,title))
-		
+		if len(urls) == 0:
+			# no chapters found, try url by itself.
+			urls.append((self.url,self.storyName))
 		return urls
 	
 	def getText(self, url):
diff --git a/output.py b/output.py
index 79870c08..012b071a 100644
--- a/output.py
+++ b/output.py
@@ -109,7 +109,7 @@ class EPubFanficWriter(FanficWriter):
 	files = {}
 	
 	def _writeFile(self, fileName, data):
-		logging.debug('_writeFile(`%s`, data)' % fileName)
+		#logging.debug('_writeFile(`%s`, data)' % fileName)
 		if fileName in self.files:
 			try:
 				d = data.decode('utf-8')
@@ -189,20 +189,22 @@ class EPubFanficWriter(FanficWriter):
 		
 		text = self._removeEntities(text)
 		
-		self.soup = bs.BeautifulStoneSoup(text.decode('utf-8'))
+		# BeautifulStoneSoup doesn't have any selfClosingTags by default.  
+		# hr needs to be if it's going to work.
+		self.soup = bs.BeautifulStoneSoup(text.decode('utf-8'), selfClosingTags=('hr'))
 
 		allTags = self.soup.findAll(recursive=True)
 		for t in allTags:
 			for attr in t._getAttrMap().keys():
 				if attr not in acceptable_attributes:
 					del t[attr]
-	    
+
 		allPs = self.soup.findAll(recursive=True)
 		for p in allPs:
 			if p.string != None and (len(p.string.strip()) == 0 or p.string.strip() == '&nbsp;' ) :
 				p.extract()
 				
-		allBrs = self.soup.findAll(recursive=True, name = ["br", "hr", 'div'])
+		allBrs = self.soup.findAll(recursive=True, name = ["br", 'div'])
 		for br in allBrs:
 			if (br.string != None and len(br.string.strip()) != 0) or (br.contents != None):
 				br.name = 'p'
@@ -270,7 +272,7 @@ class EPubFanficWriter(FanficWriter):
 		zipdata = zipdir.inMemoryZip(self.files)
 		
 		if self.writeToFile:
-			f = open(filename, 'w')
+			f = open(filename, 'wb')
 			f.write(zipdata.getvalue())
 			f.close()
 		else:
diff --git a/zipdir.py b/zipdir.py
index a0a568e6..ddaeb2f7 100644
--- a/zipdir.py
+++ b/zipdir.py
@@ -17,7 +17,11 @@ def toZip(filename, directory):
 
 		if os.path.isfile(each):
 			print(each)
-			zippedHelp.write(each, arcname=entity)
+			# epub standard requires mimetype to be uncompressed and first file.
+			if entity == 'mimetype':
+				zippedHelp.write(each, arcname=entity, compress_type=zipfile.ZIP_STORED)
+			else:
+				zippedHelp.write(each, arcname=entity)
 		else:
 			addFolderToZip(zippedHelp,entity, each)
  	
@@ -51,10 +55,15 @@ def inMemoryZip(files):
 		
 #		logging.debug(data)
 		logging.debug("Writing ZIP path %s" % path)
+		# epub standard requires mimetype to be uncompressed and first file.
+		if path == 'mimetype':
+			compress=zipfile.ZIP_STORED
+		else:
+			compress=zipfile.ZIP_DEFLATED
 		try:
-			memzip.writestr(path, data.encode('utf-8'))
+			memzip.writestr(path, data.encode('utf-8'), compress_type=compress)
 		except UnicodeDecodeError, e:
-			memzip.writestr(path.encode('utf-8'), data.encode('utf-8'))
+			memzip.writestr(path.encode('utf-8'), data.encode('utf-8'), compress_type=compress)
 	
 	for zf in memzip.filelist:
 		zf.create_system = 0

From 950807747c02269d739c404bb3bee868197e1251 Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Sat, 25 Sep 2010 00:44:56 -0500
Subject: [PATCH 28/94] Replace ':' in filename with '_' for Windoze.  appspot
 version appears to already do this.

---
 output.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/output.py b/output.py
index 012b071a..9c004c73 100644
--- a/output.py
+++ b/output.py
@@ -133,7 +133,7 @@ class EPubFanficWriter(FanficWriter):
 	
 	def __init__(self, base, name, author, inmemory=False, compress=True):
 		self.basePath = base
-		self.name = name.replace(" ", "_")
+		self.name = name.replace(" ", "_").replace(":","_")
 		self.storyTitle = name
 		self.directory = self.basePath + '/' + self.name
 		self.inmemory = inmemory

From 31c68ff796936761de13ba684a559caa15b6c766 Mon Sep 17 00:00:00 2001
From: Jimm <retiefjimm@gmail.com>
Date: Sat, 25 Sep 2010 11:55:31 -0500
Subject: [PATCH 29/94] Exit on ff.net error downloading chapter.  Replace ':'
 with '_' in file name for html output, too.

---
 ffnet.py  | 2 ++
 output.py | 2 +-
 2 files changed, 3 insertions(+), 1 deletion(-)

diff --git a/ffnet.py b/ffnet.py
index fb1ff29e..373c6ea0 100644
--- a/ffnet.py
+++ b/ffnet.py
@@ -133,6 +133,8 @@ class FFNet(FanfictionSiteAdapter):
 			soup = None
 		div = soup.find('div', {'id' : 'storytext'})
 		if None == div:
+			logging.error("Error downloading Chapter: %s" % url)
+			exit(1)
 			return '<html/>'
 		
 		return div.prettify()
diff --git a/output.py b/output.py
index 9c004c73..a0784c25 100644
--- a/output.py
+++ b/output.py
@@ -59,7 +59,7 @@ class HTMLWriter(FanficWriter):
 	
 	def __init__(self, base, name, author, inmemory=False, compress=False):
 		self.basePath = base
-		self.name = name.replace(" ", "_")
+		self.name = name.replace(" ", "_").replace(":","_")
 		self.storyTitle = name
 		self.fileName = self.basePath + '/' + self.name + '.html'
 		self.authorName = author

From ccb3fb36c5c9fb1664f95e04ca8602173da2c500 Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Sun, 26 Sep 2010 19:08:49 -0500
Subject: [PATCH 30/94] Allow '&amp;' and '&pound;'.  Allow single
 chapter/one-shot stories from FicWad.  Correct story names from FicWad.  Stop
 creating empty 'Story Index' chapter in stories from FicWad.  Exit on chapter
 d/l error from FicWad.

---
 constants.py |  5 ++++-
 ficwad.py    | 37 +++++++++++++++++++++++++------------
 output.py    |  6 +++++-
 3 files changed, 34 insertions(+), 14 deletions(-)

diff --git a/constants.py b/constants.py
index a8691435..8d389e32 100644
--- a/constants.py
+++ b/constants.py
@@ -1,3 +1,5 @@
+﻿# -*- coding: utf-8 -*-
+
 CSS = '''body { margin-left: 5%; margin-right: 5%; margin-top: 5%; margin-bottom: 5%; text-align: justify; }
 pre { font-size: x-small; }
 h1 { text-align: center; }
@@ -111,7 +113,8 @@ acceptable_elements = ['a', 'abbr', 'acronym', 'address', 'area', 'b', 'big',
 
 acceptable_attributes = ['href']
 
-entities = { '&ndash;' : ' - ', '&mdash;' : ' - ', '&rdquo;' : '"', '&ldquo;' : '"', '&rsquo;' : '\'', '&lsquo;' : '\'', '&quot;' : '"', '&hellip;' : '...' }
+entities = { '&ndash;' : ' - ', '&mdash;' : ' - ', '&rdquo;' : '"', '&ldquo;' : '"', '&rsquo;' : '\'', 
+		'&lsquo;' : '\'', '&quot;' : '"', '&hellip;' : '...', '&amp;' : '&', '&pound;' : '£' }
 
 FB2_PROLOGUE = '<FictionBook>'
 FB2_DESCRIPTION = '''<description>
diff --git a/ficwad.py b/ficwad.py
index 26be350f..1e769a00 100644
--- a/ficwad.py
+++ b/ficwad.py
@@ -33,25 +33,37 @@ class FicWad(FanfictionSiteAdapter):
 		data = u2.urlopen(self.url).read()
 		soup = bs.BeautifulStoneSoup(data)
 		
-		title = soup.find('title').string
-		self.storyName = title.split('::')[0].strip()
+		story = soup.find('div', {'id' : 'story'})
+		crumbtrail = story.find('h3') # the only h3 ficwad uses.
+		allAhrefs = crumbtrail.findAll('a')
+		# last of crumbtrail
+		self.storyName = allAhrefs[-1].string.strip()
+		# save chapter name from header in case of one-shot.
+		chaptername = story.find('h4').find('a').string.strip()
 		
 		author = soup.find('span', {'class' : 'author'})
 		self.authorName = str(author.a.string)
 		
-		print('Story "%s" by %s' % (self.storyName, self.authorName))
-		
 		select = soup.find('select', { 'name' : 'goto' } )
 		
-		allOptions = select.findAll('option')
 		result = []
-		for o in allOptions:
-			url = o['value']
-#			if type(url) is unicode:
-#				url = url.encode('utf-8')
-			title = o.string
-			result.append((url,title))
+		if select is None:
+			# Single chapter storys don't have title in crumbtrail, just 'chapter' title in h4.
+			self.storyName = chaptername
+			# no chapters found, try url by itself.
+			result.append((self.url,self.storyName))
+		else:
+			allOptions = select.findAll('option')
+			for o in allOptions:
+				url = o['value']
+				title = o.string
+				# ficwad includes 'Story Index' in the dropdown of chapters, 
+				# but it's not a real chapter.
+				if title != "Story Index":
+					result.append((url,title))
 			
+		print('Story "%s" by %s' % (self.storyName, self.authorName))
+		
 		return result
 	
 	def getStoryName(self):
@@ -69,8 +81,9 @@ class FicWad(FanfictionSiteAdapter):
 		soup = bs.BeautifulStoneSoup(data)
 		div = soup.find('div', {'id' : 'storytext'})
 		if None == div:
+			logging.error("Error downloading Chapter: %s" % url)
+			exit(1)
 			return '<html/>'
-		
 		return div.prettify()
 	
 	def getPrintableUrl(self, url):
diff --git a/output.py b/output.py
index a0784c25..bd17b02a 100644
--- a/output.py
+++ b/output.py
@@ -165,7 +165,11 @@ class EPubFanficWriter(FanficWriter):
 	def _removeEntities(self, text):
 		for e in entities:
 			v = entities[e]
-			text = text.replace(e, v)
+			try:
+				text = text.replace(e, v)
+			except UnicodeDecodeError, ex:
+				# for the pound symbol in constants.py
+				text = text.replace(e, v.decode('utf-8'))
 		
 		text = text.replace('&', '&amp;')
 		

From fe67201f953323fb68d838361560282a5799405e Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Tue, 28 Sep 2010 13:26:49 -0500
Subject: [PATCH 31/94] Fix up code for harrypotterfanfiction.com so it works
 and add one-shot support.  Add &nbsp; &lt; and &gt; to entities list.

---
 constants.py |  3 ++-
 hpfiction.py | 22 +++++++++++++++-------
 2 files changed, 17 insertions(+), 8 deletions(-)

diff --git a/constants.py b/constants.py
index 8d389e32..f9f4a366 100644
--- a/constants.py
+++ b/constants.py
@@ -114,7 +114,8 @@ acceptable_elements = ['a', 'abbr', 'acronym', 'address', 'area', 'b', 'big',
 acceptable_attributes = ['href']
 
 entities = { '&ndash;' : ' - ', '&mdash;' : ' - ', '&rdquo;' : '"', '&ldquo;' : '"', '&rsquo;' : '\'', 
-		'&lsquo;' : '\'', '&quot;' : '"', '&hellip;' : '...', '&amp;' : '&', '&pound;' : '£' }
+		'&lsquo;' : '\'', '&quot;' : '"', '&hellip;' : '...', '&amp;' : '&', '&pound;' : '£', '&nbsp;' : ' ',
+		'&lt;' : '<', '&gt;' : '>' }
 
 FB2_PROLOGUE = '<FictionBook>'
 FB2_DESCRIPTION = '''<description>
diff --git a/hpfiction.py b/hpfiction.py
index f33849a7..36e8fff1 100644
--- a/hpfiction.py
+++ b/hpfiction.py
@@ -58,13 +58,18 @@ class HPFiction(FanfictionSiteAdapter):
 			elif a['href'].find('viewuser.php') != -1:
 				self.authorName = a.string
 		
-		select = soup.find('select', {'name' : 'chapterid'})
 		urls = []
-		for o in select.findAll('option'):
-			if 'value' in o._getAttrMap():
-				url = 'http://' + self.host + '/' + self.path + o['value']
-				title = o.string
-				urls.append((url,title))
+		select = soup.find('select', {'name' : 'chapterid'})
+		if select is None:
+			# no chapters found, try url by itself.
+			urls.append((self.url,self.storyName))
+		else:
+			for o in select.findAll('option'):
+				if 'value' in o._getAttrMap():
+					url = 'http://' + self.host + '/' + self.path + o['value']
+					title = o.string
+					if title != "Story Index":
+						urls.append((url,title))
 		return urls
 
 	def getStoryName(self):
@@ -75,9 +80,12 @@ class HPFiction(FanfictionSiteAdapter):
 	
 	def getText(self, url):
 		logging.debug('Downloading from URL: %s' % url)
-		data = self.opener.open(self.url).read()
+		data = self.opener.open(url).read()
 		soup = bs.BeautifulSoup(data)
 		divtext = soup.find('div', {'id' : 'fluidtext'})
+		if None == divtext:
+			logging.error("Error downloading Chapter: %s" % url)
+			exit(1)
 		return divtext.prettify()
 
 class FF_UnitTests(unittest.TestCase):

From 84fea5b8969a545cc6f593e91920428e687a6008 Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Tue, 28 Sep 2010 19:26:06 -0500
Subject: [PATCH 32/94] Fictionalley.com working, also add twilighted.com to
 downaloder.py.

---
 downaloder.py   |  6 ++--
 fictionalley.py | 90 ++++++++++++++++++++++++++++++++++++++-----------
 2 files changed, 74 insertions(+), 22 deletions(-)

diff --git a/downaloder.py b/downaloder.py
index dee7a30d..de93c790 100644
--- a/downaloder.py
+++ b/downaloder.py
@@ -80,14 +80,16 @@ if __name__ == '__main__':
 		adapter = ffa.FFA(url)
 	elif url.find('fictionalley') != -1:
 		adapter = fictionalley.FictionAlley(url)
-		print >> sys.stderr, "FictionAlley adapter is broken, try to find this fic on fanfiction.net or fanficauthors"
-		sys.exit(0)
+		#print >> sys.stderr, "FictionAlley adapter is broken, try to find this fic on fanfiction.net or fanficauthors"
+		#sys.exit(0)
 	elif url.find('ficwad') != -1:
 		adapter = ficwad.FicWad(url)
 	elif url.find('fanfiction.net') != -1 or url.find('fictionpress.com') != -1:
 		adapter = ffnet.FFNet(url)
 	elif url.find('harrypotterfanfiction.com') != -1:
 		adapter = hpfiction.HPFiction(url)
+	elif url.find('twilighted.com') != -1:
+		adapter = twilighted.Twilighted(url)
 	else:
 		print >> sys.stderr, "Oi! I can haz not appropriate adapter for URL %s!" % url
 		sys.exit(1)
diff --git a/fictionalley.py b/fictionalley.py
index 6ccc5ad8..59a0b7d6 100644
--- a/fictionalley.py
+++ b/fictionalley.py
@@ -2,36 +2,78 @@ import os
 import re
 import sys
 import shutil
+import logging
 import os.path
 import urllib as u
 import pprint as pp
 import urllib2 as u2
+import cookielib as cl
 import urlparse as up
 import BeautifulSoup as bs
 import htmlentitydefs as hdefs
+import time as time
+from adapter import *
 
-class FictionAlley:
-	def __init__(self):
-		pass
+
+class FictionAlley(FanfictionSiteAdapter):
+	def __init__(self, url):
+		self.url = url
+		self.host = up.urlparse(url).netloc
+		cookieproc = u2.HTTPCookieProcessor()
+
+		# FictionAlley wants a cookie to prove you're old enough to read R+ rated stuff.
+		cookie = cl.Cookie(version=0, name='fauser', value='wizard',
+                 port=None, port_specified=False,
+                  domain='www.fictionalley.org', domain_specified=False, domain_initial_dot=False,
+                 path='/authors', path_specified=True,
+                 secure=False,
+                 expires=time.time()+100,
+                 discard=False,
+                 comment=None,
+                 comment_url=None,
+                 rest={'HttpOnly': None},
+					  rfc2109=False)
+		cookieproc.cookiejar.set_cookie(cookie)
+		self.opener = u2.build_opener(cookieproc)
+		
+	def requiresLogin(self, url = None):
+		return False
 	
-	def extractIndividualUrls(self, data, host, contents):
+	def performLogin(self, url = None):
+		pass
+		
+	def setLogin(self, login):
+		self.login = login
+	
+	def setPassword(self, password):
+		self.password = password
+	
+	def extractIndividualUrls(self):
+		data = self.opener.open(self.url).read()		
 		soup = bs.BeautifulStoneSoup(data)
-		
+				
+		# Get title from <title>, remove before '-'.
 		title = soup.find('title').string
-		self.storyName = "-".join(title.split('-')[1:]).strip()
-		
-		authors = soup.findAll('a')
-		
-		print('Story "%s" by %s' % (self.storyName, self.authorName))
+		self.storyName = "-".join(title.split('-')[1:]).strip().replace(" (Story Text)","")
 		
 		links = soup.findAll('a', { 'class' : 'chapterlink' } )
 
 		result = []
-		for a in links:
-			url = a['href']
-			title = a.string
-			result.append((url,title))
+		if len(links) == 0:
+			breadcrumbs = soup.find('div', {'class': 'breadcrumbs'})
+			self.authorName = breadcrumbs.a.string.replace("'s Fics","")
+			result.append((self.url,self.storyName))
+		else:
+			author = soup.find('h1', {'class' : 'title'})
+			self.authorName = author.a.string
 			
+			for a in links:
+				url = a['href']
+				title = a.string
+				result.append((url,title))
+					
+		print('Story "%s" by %s' % (self.storyName, self.authorName))
+		
 		return result
 	
 	def getStoryName(self):
@@ -40,11 +82,20 @@ class FictionAlley:
 	def getAuthorName(self):
 		return self.authorName
 	
-
-	def getText(self, data, fetch = False):
+	def getText(self, url):
+		# fictionalley uses full URLs in chapter list.
+		data = self.opener.open(url).read()
+		
+		# find <!-- headerend --> & <!-- footerstart -->
+		# and replaced with matching div pair for easier parsing.
+		# Yes, it's an evil kludge, but what can ya do?
+		data = data.replace('<!-- headerend -->','<div id="storytext">').replace('<!-- footerstart -->','</div>')
 		soup = bs.BeautifulStoneSoup(data)
+		
 		div = soup.find('div', {'id' : 'storytext'})
 		if None == div:
+			logging.error("Error downloading Chapter: %s" % url)
+			exit(1)
 			return '<html/>'
 		
 		return div.prettify()
@@ -62,14 +113,13 @@ class FictionAlley:
 		login = dict(login = 'name', password = 'pass')
 		other = dict(submit = 'Log In', remember='yes')
 		return (login, other)
-
+	
 		
 if __name__ == '__main__':
 	url = 'http://www.fictionalley.org/authors/drt/DA.html'
-	data = u2.urlopen(url).read()
+	data = self.opener.open(url).read()
 	host = up.urlparse(url).netloc
-	fw = FictionAlley()
-	fw.authorName = 'DrT'
+	fw = FictionAlley(url)
 	urls = fw.extractIndividualUrls(data, host, url)
 	pp.pprint(urls)
 	print(fw.getText(data))
\ No newline at end of file

From 3be9b3331e902a080904868d9f76804331d490af Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Tue, 28 Sep 2010 19:26:19 -0500
Subject: [PATCH 33/94] Replace &#XXX; entities in file names, allow BR
 tags--some stories use multiple BRs as section breaks.

---
 output.py | 13 ++++++++-----
 1 file changed, 8 insertions(+), 5 deletions(-)

diff --git a/output.py b/output.py
index bd17b02a..9aca5eab 100644
--- a/output.py
+++ b/output.py
@@ -25,6 +25,7 @@ import zipdir
 import html_constants
 from constants import *
 
+
 import html2text
 
 
@@ -59,7 +60,7 @@ class HTMLWriter(FanficWriter):
 	
 	def __init__(self, base, name, author, inmemory=False, compress=False):
 		self.basePath = base
-		self.name = name.replace(" ", "_").replace(":","_")
+		self.name = re.sub('&\#[0-9]+;', '_', name.replace(" ", "_").replace(":","_"))
 		self.storyTitle = name
 		self.fileName = self.basePath + '/' + self.name + '.html'
 		self.authorName = author
@@ -133,7 +134,7 @@ class EPubFanficWriter(FanficWriter):
 	
 	def __init__(self, base, name, author, inmemory=False, compress=True):
 		self.basePath = base
-		self.name = name.replace(" ", "_").replace(":","_")
+		self.name = re.sub('&\#[0-9]+;', '_', name.replace(" ", "_").replace(":","_"))
 		self.storyTitle = name
 		self.directory = self.basePath + '/' + self.name
 		self.inmemory = inmemory
@@ -149,6 +150,7 @@ class EPubFanficWriter(FanficWriter):
 			self.writeToFile = False
 		
 
+
 		if not self.inmemory:
 			if os.path.exists(self.directory):
 				shutil.rmtree(self.directory)
@@ -194,8 +196,9 @@ class EPubFanficWriter(FanficWriter):
 		text = self._removeEntities(text)
 		
 		# BeautifulStoneSoup doesn't have any selfClosingTags by default.  
-		# hr needs to be if it's going to work.
-		self.soup = bs.BeautifulStoneSoup(text.decode('utf-8'), selfClosingTags=('hr'))
+		# hr & br needs to be if they're going to work.
+		# Some stories do use multiple br tags as their section breaks...
+		self.soup = bs.BeautifulStoneSoup(text.decode('utf-8'), selfClosingTags=('br','hr'))
 
 		allTags = self.soup.findAll(recursive=True)
 		for t in allTags:
@@ -208,7 +211,7 @@ class EPubFanficWriter(FanficWriter):
 			if p.string != None and (len(p.string.strip()) == 0 or p.string.strip() == '&nbsp;' ) :
 				p.extract()
 				
-		allBrs = self.soup.findAll(recursive=True, name = ["br", 'div'])
+		allBrs = self.soup.findAll(recursive=True, name = ['div'])
 		for br in allBrs:
 			if (br.string != None and len(br.string.strip()) != 0) or (br.contents != None):
 				br.name = 'p'

From 9434431c7b847020c4c2bd875be9424c3d911e2e Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Tue, 28 Sep 2010 19:52:30 -0500
Subject: [PATCH 34/94] Add twilighted.net(not com) to downaloder.py so it
 actually *works*.  Add one-shot support for twilighted.net.

---
 downaloder.py |  3 ++-
 twilighted.py | 16 ++++++++++------
 2 files changed, 12 insertions(+), 7 deletions(-)

diff --git a/downaloder.py b/downaloder.py
index de93c790..e16dab4d 100644
--- a/downaloder.py
+++ b/downaloder.py
@@ -20,6 +20,7 @@ import output
 import adapter
 import fictionalley
 import hpfiction
+import twilighted
 
 import time
 
@@ -88,7 +89,7 @@ if __name__ == '__main__':
 		adapter = ffnet.FFNet(url)
 	elif url.find('harrypotterfanfiction.com') != -1:
 		adapter = hpfiction.HPFiction(url)
-	elif url.find('twilighted.com') != -1:
+	elif url.find('twilighted.net') != -1:
 		adapter = twilighted.Twilighted(url)
 	else:
 		print >> sys.stderr, "Oi! I can haz not appropriate adapter for URL %s!" % url
diff --git a/twilighted.py b/twilighted.py
index 54ff35d9..03bb08cf 100644
--- a/twilighted.py
+++ b/twilighted.py
@@ -74,13 +74,17 @@ class Twilighted(FanfictionSiteAdapter):
     self.authorName = title.split(' by ')[1].strip()
 
     select = soup.find('select', { 'name' : 'chapter' } )
-
-    allOptions = select.findAll('option')
+	 
     result = []
-    for o in allOptions:
-      url = self.url + "&chapter=%s" % o['value']
-      title = o.string
-      result.append((url,title))
+    if select is None:
+	   # no chapters found, try url by itself.
+	   result.append((self.url,self.storyName))
+    else:
+	   allOptions = select.findAll('option')
+	   for o in allOptions:
+	     url = self.url + "&chapter=%s" % o['value']
+	     title = o.string
+	     result.append((url,title))
 
     return result
 

From 773ff3c03c55ebf3ce9d52321554be83c724dcf2 Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Wed, 29 Sep 2010 21:32:04 -0500
Subject: [PATCH 35/94] Improved metadata for epubcheck, fixed a problem I
 introduced with &gt;/&lt;.

---
 constants.py |  7 +++----
 output.py    | 37 ++++++++++++++++++++++---------------
 2 files changed, 25 insertions(+), 19 deletions(-)

diff --git a/constants.py b/constants.py
index f9f4a366..6bb75c1c 100644
--- a/constants.py
+++ b/constants.py
@@ -32,7 +32,7 @@ CONTAINER = '''<?xml version="1.0"?>
 
 CONTENT_START = '''<?xml version="1.0"?>
 <package version="2.0" xmlns="http://www.idpf.org/2007/opf"
-         unique-identifier="BookId-Epub-%s">
+         unique-identifier="BookID">
  <metadata xmlns:dc="http://purl.org/dc/elements/1.1/"
            xmlns:opf="http://www.idpf.org/2007/opf">
    <dc:title>%s</dc:title> 
@@ -41,7 +41,7 @@ CONTENT_START = '''<?xml version="1.0"?>
    <dc:rights></dc:rights>
    <dc:subject>fanfiction</dc:subject> 
    <dc:publisher>sgzmd</dc:publisher> 
-   <dc:identifier id="BookId">urn:uuid:sigizmund.com062820072147132</dc:identifier>
+   <dc:identifier id="BookID">%s</dc:identifier>
  </metadata>
  <manifest>
   <item id="ncx" href="toc.ncx" media-type="application/x-dtbncx+xml"/>
@@ -114,8 +114,7 @@ acceptable_elements = ['a', 'abbr', 'acronym', 'address', 'area', 'b', 'big',
 acceptable_attributes = ['href']
 
 entities = { '&ndash;' : ' - ', '&mdash;' : ' - ', '&rdquo;' : '"', '&ldquo;' : '"', '&rsquo;' : '\'', 
-		'&lsquo;' : '\'', '&quot;' : '"', '&hellip;' : '...', '&amp;' : '&', '&pound;' : '£', '&nbsp;' : ' ',
-		'&lt;' : '<', '&gt;' : '>' }
+		'&lsquo;' : '\'', '&quot;' : '"', '&hellip;' : '...', '&amp;' : '&', '&pound;' : '£', '&nbsp;' : ' ' }
 
 FB2_PROLOGUE = '<FictionBook>'
 FB2_DESCRIPTION = '''<description>
diff --git a/output.py b/output.py
index 9aca5eab..37165eea 100644
--- a/output.py
+++ b/output.py
@@ -173,20 +173,22 @@ class EPubFanficWriter(FanficWriter):
 				# for the pound symbol in constants.py
 				text = text.replace(e, v.decode('utf-8'))
 		
-		text = text.replace('&', '&amp;')
+		# &lt; &lt; and &amp; are the only html entities allowed in xhtml.
+		text = text.replace('&', '&amp;').replace('&amp;lt;', '&lt;').replace('&amp;gt;', '&gt;')
 		
 		return text
 	
 	def writeChapter(self, title, text):
 		logging.debug("Writing chapter: %s" % title)
 		try:
-			fileName = base64.b64encode(title).replace('/', '_') + ".xhtml"
+			fileName = base64.b64encode(title) + ".xhtml"
 		except UnicodeEncodeError, e:
-			fileName = base64.b64encode(title.encode('utf-8')).replace('/', '_') + ".xhtml"
-#		title = cgi.esca#title.decode('utf-8')
-#		sha = hashlib.sha224(title)
-#		fileName = sha.hexdigest() + ".xhtml"
-		#fileName = cgi.escape(title) + '.xhtml'
+			fileName = base64.b64encode(title.encode('utf-8')) + ".xhtml"
+		# Base64 can include +, / and =, which XML technically doesn't like
+		# in it's id attributes.  _ and - are okay and not otherwise used in Base64.
+		# The = for padding is superfluous
+		fileName = fileName.replace('/', '_').replace('+', '-').replace('=','')
+
 		filePath = self.directory + "/OEBPS/" + fileName
 		
 		fn = 'OEBPS/' + fileName
@@ -208,13 +210,14 @@ class EPubFanficWriter(FanficWriter):
 
 		allPs = self.soup.findAll(recursive=True)
 		for p in allPs:
-			if p.string != None and (len(p.string.strip()) == 0 or p.string.strip() == '&nbsp;' ) :
+			if p.string != None and len(p.string.strip()) == 0 :
 				p.extract()
-				
-		allBrs = self.soup.findAll(recursive=True, name = ['div'])
-		for br in allBrs:
-			if (br.string != None and len(br.string.strip()) != 0) or (br.contents != None):
-				br.name = 'p'
+
+		# xhtml doesn't like <p> nesting in <p>, so leave divs.
+		# allBrs = self.soup.findAll(recursive=True, name = ['div'])
+		# for br in allBrs:
+			# if (br.string != None and len(br.string.strip()) != 0) or (br.contents != None):
+				# br.name = 'p'
 
 #		cleanup(self.soup )
 		
@@ -243,17 +246,21 @@ class EPubFanficWriter(FanficWriter):
 		opfFilePath = "OEBPS/content.opf"
 		
 #		opf = open(opfFilePath, 'w')
-		self._writeFile(opfFilePath, CONTENT_START % (uuid.uuid4().urn, self.storyTitle, self.authorName))
+		self._writeFile(opfFilePath, CONTENT_START % (self.storyTitle, self.authorName, uuid.uuid4().urn))
 #		print >> opf, CONTENT_START % (uuid.uuid4().urn, self.storyTitle, self.authorName)
 
 		ids = []
 		
-		i = 0
+		i = 1
 		for t,f in self.chapters:
 			try:
 				chapterId = base64.b64encode(t)
 			except UnicodeEncodeError, e:
 				chapterId = base64.b64encode(t.encode('utf-8'))
+			# Base64 can include +, / and =, which XML technically doesn't like
+			# in it's id attributes.  _ and - are okay and not otherwise used in Base64.
+			# The = for padding is superfluous
+			chapterId = chapterId.replace('/', '_').replace('+', '-').replace('=','')
 			
 			self._writeFile(tocFilePath, TOC_ITEM % (chapterId, i, cgi.escape(t), f))
 			self._writeFile(opfFilePath, CONTENT_ITEM % (chapterId, f))

From f75910ce7d8f80c404ba014adf36d0e32f1ae758 Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Thu, 30 Sep 2010 21:33:58 -0500
Subject: [PATCH 36/94] Stop doing prettify on the HTML, it sometimes
 introduces extraneous white space.  Change the chapter file names and ids
 inside the metadata to sequential chapter0001 rather than base64 of the
 chapter title.  Replace invalid center & u tags with div styled centered and
 span styled underlined.  Remove dead ffa.py file.  Change downaloder.py to not
 call ffa.py, but do call fictionalley.

---
 constants.py    |   6 +-
 downaloder.py   |  12 ++-
 ffa.py          | 235 ------------------------------------------------
 ffnet.py        |  23 +----
 fictionalley.py |   2 +-
 ficwad.py       |   2 +-
 hpfiction.py    |   3 +-
 output.py       |  49 ++++------
 twilighted.py   |   2 +-
 9 files changed, 32 insertions(+), 302 deletions(-)
 delete mode 100644 ffa.py

diff --git a/constants.py b/constants.py
index 6bb75c1c..437fe5a1 100644
--- a/constants.py
+++ b/constants.py
@@ -48,13 +48,15 @@ CONTENT_START = '''<?xml version="1.0"?>
   <item id="style" href="stylesheet.css" media-type="text/css" />
 '''
 
-CONTENT_ITEM = '<item id="%s" href="%s" media-type="application/xhtml+xml" />'
+CONTENT_ITEM = '''<item id="%s" href="%s" media-type="application/xhtml+xml" />
+'''
 
 CONTENT_END_MANIFEST = '''</manifest>
 <spine toc="ncx">
 '''
 
-CONTENT_ITEMREF = '''<itemref idref="%s" />'''
+CONTENT_ITEMREF = '''<itemref idref="%s" />
+'''
 
 CONTENT_END = '''</spine>
 </package>
diff --git a/downaloder.py b/downaloder.py
index e16dab4d..b90408f5 100644
--- a/downaloder.py
+++ b/downaloder.py
@@ -13,7 +13,6 @@ import BeautifulSoup as bs
 import htmlentitydefs as hdefs
 
 
-import ffa
 import ffnet
 import ficwad
 import output
@@ -51,13 +50,13 @@ class FanficLoader:
 		urls = self.adapter.extractIndividualUrls()
 		self.writer = self.writerClass(self.booksDirectory, self.adapter.getStoryName(), self.adapter.getAuthorName(), inmemory=self.inmemory, compress=self.compress)
 		
-		i = 0
+		i = 1
 		for u,n in urls:
 			if not self.quiet:
 				print('Downloading chapter %d/%d' % (i, len(urls)))
-			i = i+1
 			text = self.adapter.getText(u)
-			self.writer.writeChapter(n, text)
+			self.writer.writeChapter(i, n, text)
+			i = i+1
 			
 		self.writer.finalise()
 		
@@ -78,11 +77,10 @@ if __name__ == '__main__':
 	writerClass = None
 	
 	if url.find('fanficauthors') != -1:
-		adapter = ffa.FFA(url)
+		print >> sys.stderr, "fanficauthors.net already provides ebooks"
+		sys.exit(0)
 	elif url.find('fictionalley') != -1:
 		adapter = fictionalley.FictionAlley(url)
-		#print >> sys.stderr, "FictionAlley adapter is broken, try to find this fic on fanfiction.net or fanficauthors"
-		#sys.exit(0)
 	elif url.find('ficwad') != -1:
 		adapter = ficwad.FicWad(url)
 	elif url.find('fanfiction.net') != -1 or url.find('fictionpress.com') != -1:
diff --git a/ffa.py b/ffa.py
deleted file mode 100644
index ca81c6d5..00000000
--- a/ffa.py
+++ /dev/null
@@ -1,235 +0,0 @@
-# -*- coding: utf-8 -*-
-
-import os
-import re
-import sys
-import cgi
-import uuid
-import shutil
-import base64
-import os.path
-import logging
-import unittest
-import urllib as u
-import pprint as pp
-import urllib2 as u2
-import urlparse as up
-import BeautifulSoup as bs
-import htmlentitydefs as hdefs
-
-from constants import *
-from adapter import *
-
-try:
-	import login_password
-except:
-	# tough luck
-	pass
-
-class FFA(FanfictionSiteAdapter):
-	def __init__(self, url):
-		self.url = url
-		parsedUrl = up.urlparse(url)
-		self.host = parsedUrl.netloc
-		self.path = parsedUrl.path
-		self.opener = u2.build_opener(u2.HTTPCookieProcessor())
-	
-		logging.debug("Created FFA: url=%s" % (self.url))
-	
-	def _getLoginScript(self):
-		return self.path
-
-	def reqLoginData(self, data):
-		if data.find('<legend>Please login to continue</legend>') != -1 or data.find('<h4>Username or password not found.  Please') != -1 or data.find("This story is rated Mature, you must be logged in to view it") != -1:
-			return True
-		else:
-			return False
-
-	def requiresLogin(self, url = None):
-		if url == None:
-			u = self.url
-		else:
-			u = url
-
-		resp = self.opener.open(u)
-		data = resp.read()
-		return self.reqLoginData(data)
- 
-	def performLogin(self, url = None):
-		if url == None:
-			url = self.url
-		
-		data = {}
-		
-		data['username'] = self.login
-		data['password'] = self.password
-		data['submit'] = 'Submit'
-		
-		urlvals = u.urlencode(data)
-		loginUrl = 'http://' + self.host + self._getLoginScript()
-		logging.debug("Will now login to URL %s" % loginUrl)
-		
-		req = self.opener.open(loginUrl, urlvals)
-		
-		d = req.read()
-
-		if self.reqLoginData(d) :
-			return False
-		else:
-			return True
-	
-	def extractIndividualUrls(self):
-		data = self.opener.open(self.url).read()
-		soup = bs.BeautifulStoneSoup(data)
-
-		if self.reqLoginData(data):
-			logging.debug('Data requires login, trying to login')
-			if not self.performLogin(url):
-				logging.error('Cannot login, raising exception ... ')
-				raise LoginRequiredException(url)
-			else:
-				data = self.opener.open(url).read()
-			
-
-		self.author = str(soup.find('a', {'href' : '/contact/'}).string)
-		self.storyName = str(soup.find('h1', {'class' : 'textCenter'}).contents[0]).strip()
-		
-		logging.debug("Story `%s` by `%s`" % (self.storyName, self.author))
-		
-		selector = soup.find('select', {'class' : 'tinput'})
-		options = selector.findAll('option')
-		
-		urls = []
-		
-		for o in options:
-			title = o.string
-			url = o['value']
-			
-			urls.append((url,title))
-		
-		return urls
-
-	def getText(self, url):
-		if url.find('http://') == -1:
-			url = 'http://' + self.host + '/' + url
-		
-		logging.info('Downloading: %s' % url)
-		data = self.opener.open(url).read()
-		
-		if self.reqLoginData(data):
-			logging.debug('Data requires login, trying to login')
-			if not self.performLogin(url):
-				logging.error('Cannot login, raising exception ... ')
-				raise LoginRequiredException(url)
-			else:
-				data = self.opener.open(url).read()
-		
-		lines = data.split('\n')
-		
-		emit = False
-		
-		post = ''
-		
-		for l in lines:
-			if l.find('</div></form>') != -1:
-				logging.debug('emit = True')
-				emit = True
-				continue
-			elif l.find('<form action="#">') != -1:
-				logging.debug('emit = False')
-				if emit:
-					break
-				else:
-					emit = False
-			
-			if emit:
-				post = post + l + '\n'
-		
-		return post
-
-	def setLogin(self, login):
-		self.login = login
-
-	def setPassword(self, password):
-		self.password = password
-	
-	def getStoryName(self):
-		return self.storyName
-		
-	def getAuthorName(self):
-		return self.author
-
-	def getPrintableUrl(self, url):
-		return url
-
-class FFA_UnitTests(unittest.TestCase):
-	def setUp(self):
-		logging.basicConfig(level=logging.DEBUG)
-		pass
-	
-	def testRequiresLoginNeg(self):
-		f = FFA('http://jeconais.fanficauthors.net/Happily_Ever_After/Introduction/')
-		self.assertFalse(f.requiresLogin())
-	
-	def testRequiresLogin(self):
-		f = FFA('http://jeconais.fanficauthors.net/Rons_Harem/Rons_Harem/')
-		self.assertTrue(f.requiresLogin())
-	
-	def testPerformLogin(self):
-		f = FFA('http://jeconais.fanficauthors.net/Rons_Harem/Rons_Harem/')
-		
-		if login_password != None:
-			f.setLogin(login_password.login)
-			f.setPassword(login_password.password)
-		
-		self.assertTrue(f.performLogin(None))
-		
-	def testExtractURLsAuthorStoryName(self):
-		f = FFA('http://draco664.fanficauthors.net/Apprentice_Potter/Prologue/')
-		f.extractIndividualUrls()
-		
-		self.assertEquals('Draco664', f.getAuthorName())
-		self.assertEquals('Apprentice Potter', f.getStoryName())
-	
-	def testExtractUrls(self):
-		f = FFA('http://draco664.fanficauthors.net/Apprentice_Potter/Prologue/')
-		urls = f.extractIndividualUrls()
-		self.assertEquals(25, len(urls))
-		
-		self.assertEquals('Grievances', urls[2][1])
-		self.assertEquals('/Apprentice_Potter/Prologue/', urls[0][0])
-	
-	def testGetText(self):
-		f = FFA('http://jeconais.fanficauthors.net/Happily_Ever_After/Introduction/')
-		data = f.getText('http://jeconais.fanficauthors.net/Happily_Ever_After/Introduction/')
-		
-		self.assertTrue(data.find('smiled slightly, and settled back in her rocking chair') != -1)
-		
-	def testGetTextLogin(self):
-		url = 'http://viridian.fanficauthors.net/Out_of_the_Darkness_A_Jinchuurikis_Tale/A_Harrowing_Escape/'
-		f = FFA(url)
-		
-		if login_password != None:
-			f.setLogin(login_password.login)
-			f.setPassword(login_password.password)
-		
-		if f.requiresLogin():
-			f.performLogin()
-		
-		data = f.getText(url)
-		seek = 'So Hokage-sama” I said, “this is how we came'
-		self.assertTrue(data.find(seek) != -1)
-	
-	def testSemiLoginRequired(self):
-		f = FFA('http://viridian.fanficauthors.net/Harry_Potter_and_the_Nightmares_of_Futures_Past/The_End_of_Days/')
-		
-		urls = f.extractIndividualUrls()
-		
-		try:
-			data = f.getText('http://viridian.fanficauthors.net/Harry_Potter_and_the_Nightmares_of_Futures_Past/Doing_the_Mungo_Shuffle/')
-			self.assertTrue(False)
-		except LoginRequiredException, e:
-			self.assertTrue(True)
-		
-if __name__ == '__main__':
-	unittest.main()
\ No newline at end of file
diff --git a/ffnet.py b/ffnet.py
index 373c6ea0..00e0fb55 100644
--- a/ffnet.py
+++ b/ffnet.py
@@ -6,7 +6,6 @@ import sys
 import cgi
 import uuid
 import shutil
-import base64
 import os.path
 import logging
 import unittest
@@ -136,26 +135,8 @@ class FFNet(FanfictionSiteAdapter):
 			logging.error("Error downloading Chapter: %s" % url)
 			exit(1)
 			return '<html/>'
-		
-		return div.prettify()
-		
-		# 
-		# for l in lines:
-		# 	if l.find("<div id=storytextp class=storytextp") != -1 or l.find('<!-- start story -->') != -1 or l.find('<div id="storytextp"') != -1:
-		# 		logging.debug("starting at line: %s" % l)
-		# 		#s2 = bs.BeautifulStoneSoup(l)
-		# 		#return s2.div.prettify()
-		# 		emit = True
-		# 	
-		# 	if emit:
-		# 		textbuf = textbuf + "\n" + l
-		# 	
-		# 	if l.find("</div><div style='height:10px'></div> ") != -1 or l.find('<!-- end story -->') != -1:
-		# 		emit = False
-		# 
-		# s2 = bs.BeautifulStoneSoup(textbuf)
-		# return s2.div.prettify()
-		
+			
+		return div.__str__('utf8')
 		
 	def setLogin(self, login):
 		self.login = login
diff --git a/fictionalley.py b/fictionalley.py
index 59a0b7d6..2ab11167 100644
--- a/fictionalley.py
+++ b/fictionalley.py
@@ -98,7 +98,7 @@ class FictionAlley(FanfictionSiteAdapter):
 			exit(1)
 			return '<html/>'
 		
-		return div.prettify()
+		return div.__str__('utf8')
 	
 	def getPrintableUrl(self, url):
 		return url
diff --git a/ficwad.py b/ficwad.py
index 1e769a00..de2137b2 100644
--- a/ficwad.py
+++ b/ficwad.py
@@ -84,7 +84,7 @@ class FicWad(FanfictionSiteAdapter):
 			logging.error("Error downloading Chapter: %s" % url)
 			exit(1)
 			return '<html/>'
-		return div.prettify()
+		return div.__str__('utf8')
 	
 	def getPrintableUrl(self, url):
 		return url
diff --git a/hpfiction.py b/hpfiction.py
index 36e8fff1..1108cf22 100644
--- a/hpfiction.py
+++ b/hpfiction.py
@@ -6,7 +6,6 @@ import sys
 import cgi
 import uuid
 import shutil
-import base64
 import os.path
 import logging
 import unittest
@@ -86,7 +85,7 @@ class HPFiction(FanfictionSiteAdapter):
 		if None == divtext:
 			logging.error("Error downloading Chapter: %s" % url)
 			exit(1)
-		return divtext.prettify()
+		return divtext.__str__('utf8')
 
 class FF_UnitTests(unittest.TestCase):
 	def setUp(self):
diff --git a/output.py b/output.py
index 37165eea..866005b2 100644
--- a/output.py
+++ b/output.py
@@ -8,7 +8,6 @@ import uuid
 import codecs
 import shutil
 import string
-import base64
 import os.path
 import zipfile
 import StringIO
@@ -33,7 +32,7 @@ class FanficWriter:
 	def __init__(self):
 		pass
 		
-	def writeChapter(self, title, text):
+	def writeChapter(self, index, title, text):
 		pass
 	
 	def finalise(self):
@@ -45,8 +44,8 @@ class TextWriter(FanficWriter):
 	def __init__(self, base, name, author, inmemory=False, compress=False):
 		self.htmlWriter = HTMLWriter(base, name, author, True, False)
 	
-	def writeChapter(self, title, text):
-		self.htmlWriter.writeChapter(title, text)
+	def writeChapter(self, index, title, text):
+		self.htmlWriter.writeChapter(index, title, text)
 	
 	def finalise(self):
 		self.htmlWriter.finalise()
@@ -85,7 +84,7 @@ class HTMLWriter(FanficWriter):
 		except:
 			return text
 	
-	def writeChapter(self, title, text):
+	def writeChapter(self, index, title, text):
 		title = self._printableVersion(title) #title.decode('utf-8')
 		text = self._printableVersion(text) #text.decode('utf-8')
 		self.body = self.body + '\n' + self.chapterStartTemplate.substitute({'chapter' : title})
@@ -94,7 +93,7 @@ class HTMLWriter(FanficWriter):
 	def finalise(self):
 		html = self.xhtmlTemplate.substitute({'title' : self.storyTitle, 'author' : self.authorName, 'body' : self.body})
 		soup = bs.BeautifulSoup(html)
-		result = soup.prettify()
+		result = soup.__str__('utf8')
 		
 #		f = open(self.fileName, 'w')
 #		f.write(result)
@@ -178,16 +177,9 @@ class EPubFanficWriter(FanficWriter):
 		
 		return text
 	
-	def writeChapter(self, title, text):
+	def writeChapter(self, index, title, text):
 		logging.debug("Writing chapter: %s" % title)
-		try:
-			fileName = base64.b64encode(title) + ".xhtml"
-		except UnicodeEncodeError, e:
-			fileName = base64.b64encode(title.encode('utf-8')) + ".xhtml"
-		# Base64 can include +, / and =, which XML technically doesn't like
-		# in it's id attributes.  _ and - are okay and not otherwise used in Base64.
-		# The = for padding is superfluous
-		fileName = fileName.replace('/', '_').replace('+', '-').replace('=','')
+		fileName="chapter%04d.xhtml" % index
 
 		filePath = self.directory + "/OEBPS/" + fileName
 		
@@ -207,21 +199,21 @@ class EPubFanficWriter(FanficWriter):
 			for attr in t._getAttrMap().keys():
 				if attr not in acceptable_attributes:
 					del t[attr]
+			# these are not acceptable strict XHTML.  But we do already have 
+			# CSS classes of the same names defined in constants.py
+			if t.name in ('u'):
+				t['class']=t.name
+				t.name='span'
+			if t.name in ('center'):
+				t['class']=t.name
+				t.name='div'
 
 		allPs = self.soup.findAll(recursive=True)
 		for p in allPs:
 			if p.string != None and len(p.string.strip()) == 0 :
 				p.extract()
 
-		# xhtml doesn't like <p> nesting in <p>, so leave divs.
-		# allBrs = self.soup.findAll(recursive=True, name = ['div'])
-		# for br in allBrs:
-			# if (br.string != None and len(br.string.strip()) != 0) or (br.contents != None):
-				# br.name = 'p'
-
-#		cleanup(self.soup )
-		
-		text = self.soup.prettify()
+		text = self.soup.__str__('utf8')
 		
 		tt = self._removeEntities(title)
 		
@@ -253,14 +245,7 @@ class EPubFanficWriter(FanficWriter):
 		
 		i = 1
 		for t,f in self.chapters:
-			try:
-				chapterId = base64.b64encode(t)
-			except UnicodeEncodeError, e:
-				chapterId = base64.b64encode(t.encode('utf-8'))
-			# Base64 can include +, / and =, which XML technically doesn't like
-			# in it's id attributes.  _ and - are okay and not otherwise used in Base64.
-			# The = for padding is superfluous
-			chapterId = chapterId.replace('/', '_').replace('+', '-').replace('=','')
+			chapterId = "chapter%04d" % i
 			
 			self._writeFile(tocFilePath, TOC_ITEM % (chapterId, i, cgi.escape(t), f))
 			self._writeFile(opfFilePath, CONTENT_ITEM % (chapterId, f))
diff --git a/twilighted.py b/twilighted.py
index 03bb08cf..e351c0e8 100644
--- a/twilighted.py
+++ b/twilighted.py
@@ -109,7 +109,7 @@ class Twilighted(FanfictionSiteAdapter):
     if None == div:
       return '<html/>'
 
-    return div.prettify()
+    return div.__str__('utf8')
 
   def _getLoginScript(self):
     return '/user.php?action=login'

From ca4b09d69dd3b1e226c824987ba4a7daa36945a1 Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Sun, 3 Oct 2010 19:23:39 -0500
Subject: [PATCH 37/94] Fixes for some obscure encoding errors.  UTF8 versions
 of apostrophe and dash in story titles & chapter titles could cause problems
 in a few places.

---
 ffnet.py  | 5 ++++-
 ficwad.py | 5 +++--
 output.py | 5 +++--
 3 files changed, 10 insertions(+), 5 deletions(-)

diff --git a/ffnet.py b/ffnet.py
index 00e0fb55..94fd9954 100644
--- a/ffnet.py
+++ b/ffnet.py
@@ -98,7 +98,10 @@ class FFNet(FanfictionSiteAdapter):
 			elif l.find("<SELECT title='chapter navigation'") != -1:
 				if len(urls) > 0:
 					continue
-				u = l.decode('utf-8')
+				try:
+					u = l.decode('utf-8')
+				except UnicodeEncodeError, e:
+					u = l
 				u = re.sub('&\#[0-9]+;', ' ', u)
 				s2 = bs.BeautifulSoup(u)
 				options = s2.findAll('option')
diff --git a/ficwad.py b/ficwad.py
index de2137b2..dab4fe0d 100644
--- a/ficwad.py
+++ b/ficwad.py
@@ -1,3 +1,5 @@
+# -*- coding: utf-8 -*-
+
 import os
 import re
 import sys
@@ -9,6 +11,7 @@ import urllib2 as u2
 import urlparse as up
 import BeautifulSoup as bs
 import htmlentitydefs as hdefs
+import logging
 
 from adapter import *
 
@@ -62,8 +65,6 @@ class FicWad(FanfictionSiteAdapter):
 				if title != "Story Index":
 					result.append((url,title))
 			
-		print('Story "%s" by %s' % (self.storyName, self.authorName))
-		
 		return result
 	
 	def getStoryName(self):
diff --git a/output.py b/output.py
index 866005b2..95656e4a 100644
--- a/output.py
+++ b/output.py
@@ -61,7 +61,7 @@ class HTMLWriter(FanficWriter):
 		self.basePath = base
 		self.name = re.sub('&\#[0-9]+;', '_', name.replace(" ", "_").replace(":","_"))
 		self.storyTitle = name
-		self.fileName = self.basePath + '/' + self.name + '.html'
+		self.fileName = self.basePath + '/' + re.sub('[^a-zA-Z0-9_\'-]+','',self.name) + '.html'
 		self.authorName = author
 		
 		self.inmemory = inmemory
@@ -135,7 +135,8 @@ class EPubFanficWriter(FanficWriter):
 		self.basePath = base
 		self.name = re.sub('&\#[0-9]+;', '_', name.replace(" ", "_").replace(":","_"))
 		self.storyTitle = name
-		self.directory = self.basePath + '/' + self.name
+		self.directory = self.basePath + '/' + re.sub('[^a-zA-Z0-9_\'-]+','',self.name)
+
 		self.inmemory = inmemory
 		self.authorName = author
 		

From 466d5f4ee3e04433bb5504337c55f3bf4bc8c0a3 Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Wed, 6 Oct 2010 14:31:21 -0500
Subject: [PATCH 38/94] Remove Entities, fix bare ampersands in story & author
 names.

---
 output.py | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/output.py b/output.py
index 95656e4a..70a4cf01 100644
--- a/output.py
+++ b/output.py
@@ -134,11 +134,11 @@ class EPubFanficWriter(FanficWriter):
 	def __init__(self, base, name, author, inmemory=False, compress=True):
 		self.basePath = base
 		self.name = re.sub('&\#[0-9]+;', '_', name.replace(" ", "_").replace(":","_"))
-		self.storyTitle = name
+		self.storyTitle = self._removeEntities(name)
 		self.directory = self.basePath + '/' + re.sub('[^a-zA-Z0-9_\'-]+','',self.name)
 
 		self.inmemory = inmemory
-		self.authorName = author
+		self.authorName = self._removeEntities(author)
 		
 		self.files = {}
 		self.chapters = []

From f8701a9e8d8dac505d6c021eb34ebdcfe9afcf0b Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Fri, 8 Oct 2010 18:46:03 -0500
Subject: [PATCH 39/94] Fix to force mimetype file to be uncompressed and first
 in epub.  Tested on Python 2.5.2.

---
 zipdir.py | 40 +++++++++++++++++++++++++++++++---------
 1 file changed, 31 insertions(+), 9 deletions(-)

diff --git a/zipdir.py b/zipdir.py
index ddaeb2f7..49810ed5 100644
--- a/zipdir.py
+++ b/zipdir.py
@@ -44,6 +44,32 @@ def addFolderToZip(zippedHelp,folder,fpath):
 def inMemoryZip(files):
 	# files have a structure of {'path/to/file' => content} dictionary
 	io = StringIO.StringIO()
+
+	# This fixes the uncompressed mimetype-first issue by opening
+	# the in memory file as STORE, putting in the mimetype, then
+	# closing and re-opening with DEFLATED.  while it is often
+	# true that mimetype is the first file, we can't assume it,
+	# because the dict object is defined as unordered.
+	path='mimetype'
+	memzip = zipfile.ZipFile(io, 'a', compression=zipfile.ZIP_STORED)
+	memzip.debug = 3
+	if type(files[path]) != type('str'):
+		data = files[path].getvalue()
+	else:
+		data = files[path]
+		
+	logging.debug("Writing ZIP path %s" % path)
+	try:
+		memzip.writestr(path, data.encode('utf-8'))
+	except UnicodeDecodeError, e:
+		memzip.writestr(path.encode('utf-8'), data.encode('utf-8'))
+		
+	memzip.close()
+
+	# remove it from the files dict.
+	del(files['mimetype'])
+	
+	# open in 'a' append mode.
 	memzip = zipfile.ZipFile(io, 'a', compression=zipfile.ZIP_DEFLATED)
 	memzip.debug = 3
 	
@@ -55,16 +81,12 @@ def inMemoryZip(files):
 		
 #		logging.debug(data)
 		logging.debug("Writing ZIP path %s" % path)
-		# epub standard requires mimetype to be uncompressed and first file.
-		if path == 'mimetype':
-			compress=zipfile.ZIP_STORED
-		else:
-			compress=zipfile.ZIP_DEFLATED
 		try:
-			memzip.writestr(path, data.encode('utf-8'), compress_type=compress)
+			memzip.writestr(path, data.encode('utf-8'))
 		except UnicodeDecodeError, e:
-			memzip.writestr(path.encode('utf-8'), data.encode('utf-8'), compress_type=compress)
-	
+			memzip.writestr(path.encode('utf-8'), data.encode('utf-8'))
+
+	# declares all the files created by Windows.  
 	for zf in memzip.filelist:
 		zf.create_system = 0
 	
@@ -79,4 +101,4 @@ if __name__ == '__main__':
 	data = inMemoryZip(files)
 	f = open('res.zip', 'w')
 	f.write(data)
-	f.close()
\ No newline at end of file
+	f.close()

From 275a1dd6ad84dc6ddf603f2df5f09c77d36fe642 Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Fri, 8 Oct 2010 21:54:35 -0500
Subject: [PATCH 40/94] Add &#039;->'\'' to entity translation list.

---
 constants.py | 6 +++---
 1 file changed, 3 insertions(+), 3 deletions(-)

diff --git a/constants.py b/constants.py
index 437fe5a1..5da65e78 100644
--- a/constants.py
+++ b/constants.py
@@ -1,4 +1,4 @@
-﻿# -*- coding: utf-8 -*-
+# -*- coding: utf-8 -*-
 
 CSS = '''body { margin-left: 5%; margin-right: 5%; margin-top: 5%; margin-bottom: 5%; text-align: justify; }
 pre { font-size: x-small; }
@@ -115,8 +115,8 @@ acceptable_elements = ['a', 'abbr', 'acronym', 'address', 'area', 'b', 'big',
 
 acceptable_attributes = ['href']
 
-entities = { '&ndash;' : ' - ', '&mdash;' : ' - ', '&rdquo;' : '"', '&ldquo;' : '"', '&rsquo;' : '\'', 
-		'&lsquo;' : '\'', '&quot;' : '"', '&hellip;' : '...', '&amp;' : '&', '&pound;' : '£', '&nbsp;' : ' ' }
+entities = { '&ndash;' : ' - ', '&mdash;' : ' - ', '&rdquo;' : '"', '&ldquo;' : '"', '&rsquo;' : '\'', '&#039;' : '\'',
+             '&lsquo;' : '\'', '&quot;' : '"', '&hellip;' : '...', '&amp;' : '&', '&pound;' : '£', '&nbsp;' : ' ' }
 
 FB2_PROLOGUE = '<FictionBook>'
 FB2_DESCRIPTION = '''<description>

From dafa33c64ee984aa4a257653b19dc6cfe34254f7 Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Sun, 10 Oct 2010 12:54:41 -0500
Subject: [PATCH 41/94] Generalize handling of &#<number>; entities. 
 Generalize method to create a valid filename. Remove print from
 fictionalley.py that was causing the output-before-302-header issue. Some
 changes to chapter URL formation due to apparent differences in handling '//'
 in URLs in appengine vs downaloder.py in 2.5.2.

---
 constants.py    |  2 +-
 fictionalley.py |  4 +--
 ficwad.py       |  7 ++---
 hpfiction.py    |  4 +--
 output.py       | 78 +++++++++++++++++++++++++++++++------------------
 5 files changed, 57 insertions(+), 38 deletions(-)

diff --git a/constants.py b/constants.py
index 5da65e78..2bcc1a67 100644
--- a/constants.py
+++ b/constants.py
@@ -115,7 +115,7 @@ acceptable_elements = ['a', 'abbr', 'acronym', 'address', 'area', 'b', 'big',
 
 acceptable_attributes = ['href']
 
-entities = { '&ndash;' : ' - ', '&mdash;' : ' - ', '&rdquo;' : '"', '&ldquo;' : '"', '&rsquo;' : '\'', '&#039;' : '\'',
+entities = { '&ndash;' : ' - ', '&mdash;' : ' - ', '&rdquo;' : '"', '&ldquo;' : '"', '&rsquo;' : '\'', 
              '&lsquo;' : '\'', '&quot;' : '"', '&hellip;' : '...', '&amp;' : '&', '&pound;' : '£', '&nbsp;' : ' ' }
 
 FB2_PROLOGUE = '<FictionBook>'
diff --git a/fictionalley.py b/fictionalley.py
index 2ab11167..35ae71e2 100644
--- a/fictionalley.py
+++ b/fictionalley.py
@@ -72,7 +72,7 @@ class FictionAlley(FanfictionSiteAdapter):
 				title = a.string
 				result.append((url,title))
 					
-		print('Story "%s" by %s' % (self.storyName, self.authorName))
+		#print('Story "%s" by %s' % (self.storyName, self.authorName))
 		
 		return result
 	
@@ -122,4 +122,4 @@ if __name__ == '__main__':
 	fw = FictionAlley(url)
 	urls = fw.extractIndividualUrls(data, host, url)
 	pp.pprint(urls)
-	print(fw.getText(data))
\ No newline at end of file
+	print(fw.getText(data))
diff --git a/ficwad.py b/ficwad.py
index dab4fe0d..28b71584 100644
--- a/ficwad.py
+++ b/ficwad.py
@@ -58,7 +58,7 @@ class FicWad(FanfictionSiteAdapter):
 		else:
 			allOptions = select.findAll('option')
 			for o in allOptions:
-				url = o['value']
+				url = 'http://' + self.host + o['value']
 				title = o.string
 				# ficwad includes 'Story Index' in the dropdown of chapters, 
 				# but it's not a real chapter.
@@ -74,9 +74,6 @@ class FicWad(FanfictionSiteAdapter):
 		return self.authorName
 	
 	def getText(self, url):
-		if url.find('http://') == -1:
-			url = 'http://' + self.host + '/' + url
-		
 		data = u2.urlopen(url).read()
 		
 		soup = bs.BeautifulStoneSoup(data)
@@ -109,4 +106,4 @@ if __name__ == '__main__':
 	fw = FicWad(url)
 	urls = fw.extractIndividualUrls()
 	pp.pprint(urls)
-	print(fw.getText(data))
\ No newline at end of file
+	print(fw.getText(data))
diff --git a/hpfiction.py b/hpfiction.py
index 1108cf22..75cb4597 100644
--- a/hpfiction.py
+++ b/hpfiction.py
@@ -65,7 +65,7 @@ class HPFiction(FanfictionSiteAdapter):
 		else:
 			for o in select.findAll('option'):
 				if 'value' in o._getAttrMap():
-					url = 'http://' + self.host + '/' + self.path + o['value']
+					url = 'http://' + self.host + self.path + o['value']
 					title = o.string
 					if title != "Story Index":
 						urls.append((url,title))
@@ -110,4 +110,4 @@ class FF_UnitTests(unittest.TestCase):
 if __name__ == '__main__':
 	unittest.main()
 
-	
\ No newline at end of file
+	
diff --git a/output.py b/output.py
index 70a4cf01..4a5387c6 100644
--- a/output.py
+++ b/output.py
@@ -59,10 +59,10 @@ class HTMLWriter(FanficWriter):
 	
 	def __init__(self, base, name, author, inmemory=False, compress=False):
 		self.basePath = base
-		self.name = re.sub('&\#[0-9]+;', '_', name.replace(" ", "_").replace(":","_"))
-		self.storyTitle = name
-		self.fileName = self.basePath + '/' + re.sub('[^a-zA-Z0-9_\'-]+','',self.name) + '.html'
-		self.authorName = author
+		self.storyTitle = removeEntities(name)
+		self.name = makeAcceptableFilename(name)
+		self.fileName =  self.basePath + '/' + self.name + '.html'
+		self.authorName = removeEntities(author)
 		
 		self.inmemory = inmemory
 
@@ -133,12 +133,12 @@ class EPubFanficWriter(FanficWriter):
 	
 	def __init__(self, base, name, author, inmemory=False, compress=True):
 		self.basePath = base
-		self.name = re.sub('&\#[0-9]+;', '_', name.replace(" ", "_").replace(":","_"))
-		self.storyTitle = self._removeEntities(name)
-		self.directory = self.basePath + '/' + re.sub('[^a-zA-Z0-9_\'-]+','',self.name)
+		self.storyTitle = removeEntities(name)
+		self.name = makeAcceptableFilename(name)
+		self.directory = self.basePath + '/' + self.name
+		self.authorName = removeEntities(author)
 
 		self.inmemory = inmemory
-		self.authorName = self._removeEntities(author)
 		
 		self.files = {}
 		self.chapters = []
@@ -164,21 +164,8 @@ class EPubFanficWriter(FanficWriter):
 		self._writeFile('META-INF/container.xml', CONTAINER)
 		self._writeFile('OEBPS/stylesheet.css', CSS)
 
-	def _removeEntities(self, text):
-		for e in entities:
-			v = entities[e]
-			try:
-				text = text.replace(e, v)
-			except UnicodeDecodeError, ex:
-				# for the pound symbol in constants.py
-				text = text.replace(e, v.decode('utf-8'))
-		
-		# &lt; &lt; and &amp; are the only html entities allowed in xhtml.
-		text = text.replace('&', '&amp;').replace('&amp;lt;', '&lt;').replace('&amp;gt;', '&gt;')
-		
-		return text
-	
 	def writeChapter(self, index, title, text):
+		title = removeEntities(title)
 		logging.debug("Writing chapter: %s" % title)
 		fileName="chapter%04d.xhtml" % index
 
@@ -188,7 +175,7 @@ class EPubFanficWriter(FanficWriter):
 		
 #		f = open(filePath, 'w')
 		
-		text = self._removeEntities(text)
+		text = removeEntities(text)
 		
 		# BeautifulStoneSoup doesn't have any selfClosingTags by default.  
 		# hr & br needs to be if they're going to work.
@@ -216,12 +203,10 @@ class EPubFanficWriter(FanficWriter):
 
 		text = self.soup.__str__('utf8')
 		
-		tt = self._removeEntities(title)
-		
-		self._writeFile(fn, XHTML_START % (tt, tt))
+		self._writeFile(fn, XHTML_START % (title, title))
 		self._writeFile(fn, text)
 		self._writeFile(fn, XHTML_END)
-#		print >> f, XHTML_START % (tt, tt)
+#		print >> f, XHTML_START % (title, title)
 #		f.write(text)
 #		print >> f, XHTML_END
 		
@@ -248,7 +233,7 @@ class EPubFanficWriter(FanficWriter):
 		for t,f in self.chapters:
 			chapterId = "chapter%04d" % i
 			
-			self._writeFile(tocFilePath, TOC_ITEM % (chapterId, i, cgi.escape(t), f))
+			self._writeFile(tocFilePath, TOC_ITEM % (chapterId, i, t, f))
 			self._writeFile(opfFilePath, CONTENT_ITEM % (chapterId, f))
 			
 			ids.append(chapterId)
@@ -279,3 +264,40 @@ class EPubFanficWriter(FanficWriter):
 			self.output = zipdata
 			
 #		zipdir.toZip(filename, self.directory)
+
+def unirepl(match):
+	"Return the unicode string for a decimal number"
+	s = match.group()
+	value = int(s[2:-1])
+	return unichr(value)
+
+def replaceNumberEntities(data):
+	p = re.compile(r'&#(\d+);')
+	return p.sub(unirepl, data)
+
+def removeEntities(text):
+	# replace numeric versions of [&<>] with named versions.
+	text = re.sub(r'&#0*38;','&amp;',text)
+	text = re.sub(r'&#0*60;','&lt;',text)
+	text = re.sub(r'&#0*62;','&gt;',text)
+	
+	# replace remaining &#000; entities with unicode value, such as &#039; -> '
+	text = replaceNumberEntities(text)
+
+	# replace several named entities with character, such as &mdash; -> -
+	# see constants.py for the list.
+	for e in entities:
+		v = entities[e]
+		try:
+			text = text.replace(e, v)
+		except UnicodeDecodeError, ex:
+			# for the pound symbol in constants.py
+			text = text.replace(e, v.decode('utf-8'))
+	
+	# &lt; &lt; and &amp; are the only html entities allowed in xhtml, put those back.
+	text = text.replace('&', '&amp;').replace('&amp;lt;', '&lt;').replace('&amp;gt;', '&gt;')
+		
+	return text
+	
+def makeAcceptableFilename(text):
+	return re.sub('[^a-zA-Z0-9_\'-]+','',removeEntities(text).replace(" ", "_").replace(":","_"))	

From 7f8d7a7dbb8b3f47f3578fd2883baa4a3b89da78 Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Mon, 11 Oct 2010 14:05:57 -0500
Subject: [PATCH 42/94] Add '\n' after each </p> and <br /> tag.  Extremely
 long (200k+) single-line chapters (like ffnet gives) cause problems for nook.
 Also removed a little dead code from ffnet.py.

---
 ffnet.py  |  9 ++-------
 output.py | 19 +++++++++++++------
 2 files changed, 15 insertions(+), 13 deletions(-)

diff --git a/ffnet.py b/ffnet.py
index 94fd9954..f3e101fc 100644
--- a/ffnet.py
+++ b/ffnet.py
@@ -117,17 +117,12 @@ class FFNet(FanfictionSiteAdapter):
 	
 	def getText(self, url):
 		data = self._fetchUrl(url)
-		lines = data.split('\n')
-		
-		textbuf = ''
-		emit = False
-		
 		olddata = data
 		try:
 			data = data.decode('utf8')
 		except:
 			data = olddata
-		
+
 		try:
 			soup = bs.BeautifulStoneSoup(data)
 		except:
@@ -195,4 +190,4 @@ class FFA_UnitTests(unittest.TestCase):
 		text = f.getText(url)
 		self.assertTrue(text.find('Kale Resgerald at your service" He answered, "So, can we go now? Or do you want to') != -1)
 if __name__ == '__main__':
-	unittest.main()
\ No newline at end of file
+	unittest.main()
diff --git a/output.py b/output.py
index 4a5387c6..8b412a97 100644
--- a/output.py
+++ b/output.py
@@ -136,7 +136,7 @@ class EPubFanficWriter(FanficWriter):
 		self.storyTitle = removeEntities(name)
 		self.name = makeAcceptableFilename(name)
 		self.directory = self.basePath + '/' + self.name
-		self.authorName = removeEntities(author)
+		self.authorName = removeEntities(author+" aa")
 
 		self.inmemory = inmemory
 		
@@ -195,14 +195,21 @@ class EPubFanficWriter(FanficWriter):
 			if t.name in ('center'):
 				t['class']=t.name
 				t.name='div'
-
-		allPs = self.soup.findAll(recursive=True)
-		for p in allPs:
-			if p.string != None and len(p.string.strip()) == 0 :
-				p.extract()
+			# removes paired, but empty tags.
+			if t.string != None and len(t.string.strip()) == 0 :
+				t.extract()
 
 		text = self.soup.__str__('utf8')
 		
+		# ffnet(& maybe others) gives the whole chapter text
+		# as one line.  This causes problems for nook(at
+		# least) when the chapter size starts getting big
+		# (200k+) Using Soup's prettify() messes up italics
+		# and such.  Done after soup extract so <p> and <br>
+		# tags are normalized.  Doing it here seems less evil
+		# than hacking BeautifulSoup, but it's debatable.
+		text = text.replace('</p>','</p>\n').replace('<br />','<br />\n')
+		
 		self._writeFile(fn, XHTML_START % (title, title))
 		self._writeFile(fn, text)
 		self._writeFile(fn, XHTML_END)

From b9a72d372d7081e4d549203d8d40f41922cad469 Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Mon, 11 Oct 2010 20:44:19 -0500
Subject: [PATCH 43/94] Add &#x0000; entity support, fix "<authorname> aa" from
 testing, add potionsandsnitches.net.

---
 downaloder.py |  7 +++++--
 output.py     | 10 +++++++---
 2 files changed, 12 insertions(+), 5 deletions(-)

diff --git a/downaloder.py b/downaloder.py
index b90408f5..b8af3abe 100644
--- a/downaloder.py
+++ b/downaloder.py
@@ -57,6 +57,7 @@ class FanficLoader:
 			text = self.adapter.getText(u)
 			self.writer.writeChapter(i, n, text)
 			i = i+1
+			# time.sleep(2)
 			
 		self.writer.finalise()
 		
@@ -68,6 +69,8 @@ class FanficLoader:
 if __name__ == '__main__':
 	logging.basicConfig(level=logging.DEBUG)
 	(url, format) = sys.argv[1:]
+	# (url) = sys.argv[1]
+	# format = 'epub'
 	
 	if type(url) is unicode:
 		print('URL is unicode')
@@ -87,7 +90,7 @@ if __name__ == '__main__':
 		adapter = ffnet.FFNet(url)
 	elif url.find('harrypotterfanfiction.com') != -1:
 		adapter = hpfiction.HPFiction(url)
-	elif url.find('twilighted.net') != -1:
+	elif url.find('twilighted.net') != -1 or url.find('potionsandsnitches.net') != -1:
 		adapter = twilighted.Twilighted(url)
 	else:
 		print >> sys.stderr, "Oi! I can haz not appropriate adapter for URL %s!" % url
@@ -111,4 +114,4 @@ if __name__ == '__main__':
 	
 	loader = FanficLoader(adapter, writerClass)
 	loader.download()
-	
\ No newline at end of file
+	
diff --git a/output.py b/output.py
index 8b412a97..1700bfe7 100644
--- a/output.py
+++ b/output.py
@@ -136,7 +136,7 @@ class EPubFanficWriter(FanficWriter):
 		self.storyTitle = removeEntities(name)
 		self.name = makeAcceptableFilename(name)
 		self.directory = self.basePath + '/' + self.name
-		self.authorName = removeEntities(author+" aa")
+		self.authorName = removeEntities(author)
 
 		self.inmemory = inmemory
 		
@@ -275,11 +275,15 @@ class EPubFanficWriter(FanficWriter):
 def unirepl(match):
 	"Return the unicode string for a decimal number"
 	s = match.group()
-	value = int(s[2:-1])
+	if s[2].lower()=='x':
+		radix=16
+	else:
+		radix=10
+	value = int(s[3:-1], radix )
 	return unichr(value)
 
 def replaceNumberEntities(data):
-	p = re.compile(r'&#(\d+);')
+	p = re.compile(r'&#(x?)(\d+);')
 	return p.sub(unirepl, data)
 
 def removeEntities(text):

From 4e53481d7d71efffe77ed20c81913126ff4289b1 Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Wed, 13 Oct 2010 00:01:24 -0500
Subject: [PATCH 44/94] Somewhat kludgey fix for the kludgey way we extract the
 story text from fictionalley for stories with poor html.

---
 fictionalley.py | 15 ++++++++-------
 1 file changed, 8 insertions(+), 7 deletions(-)

diff --git a/fictionalley.py b/fictionalley.py
index 35ae71e2..884720fd 100644
--- a/fictionalley.py
+++ b/fictionalley.py
@@ -86,19 +86,20 @@ class FictionAlley(FanfictionSiteAdapter):
 		# fictionalley uses full URLs in chapter list.
 		data = self.opener.open(url).read()
 		
-		# find <!-- headerend --> & <!-- footerstart -->
-		# and replaced with matching div pair for easier parsing.
-		# Yes, it's an evil kludge, but what can ya do?
-		data = data.replace('<!-- headerend -->','<div id="storytext">').replace('<!-- footerstart -->','</div>')
+		# find <!-- headerend --> & <!-- footerstart --> and
+		# replaced with matching div pair for easier parsing.
+		# Yes, it's an evil kludge, but what can ya do?  Using
+		# something other than div prevents soup from pairing
+		# our div with poor html inside the story text.
+		data = data.replace('<!-- headerend -->','<crazytagstringnobodywouldstumbleonaccidently id="storytext">').replace('<!-- footerstart -->','</crazytagstringnobodywouldstumbleonaccidently>')
 		soup = bs.BeautifulStoneSoup(data)
 		
-		div = soup.find('div', {'id' : 'storytext'})
+		div = soup.find('crazytagstringnobodywouldstumbleonaccidently', {'id' : 'storytext'})
 		if None == div:
 			logging.error("Error downloading Chapter: %s" % url)
 			exit(1)
 			return '<html/>'
-		
-		return div.__str__('utf8')
+		return div.__str__('utf8').replace('crazytagstringnobodywouldstumbleonaccidently','div')
 	
 	def getPrintableUrl(self, url):
 		return url

From 25cbab225ce4e3126e0e03463aa7f3464a4a01ed Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Thu, 14 Oct 2010 12:42:29 -0500
Subject: [PATCH 45/94] potionsandsnitches.net doesn't require login.  Indeed,
 it doesn't even have the same login URL.

---
 twilighted.py | 8 ++++++--
 1 file changed, 6 insertions(+), 2 deletions(-)

diff --git a/twilighted.py b/twilighted.py
index e351c0e8..a7e77a53 100644
--- a/twilighted.py
+++ b/twilighted.py
@@ -28,7 +28,11 @@ class Twilighted(FanfictionSiteAdapter):
 
 
   def requiresLogin(self, url = None):
-    return True
+    # potionsandsnitches.net doesn't require login.
+    if self.host == 'potionsandsnitches.net':
+      return False
+    else:
+      return True
 
   def performLogin(self, url = None):
     data = {}
@@ -135,4 +139,4 @@ class Twilighted_UnitTests(unittest.TestCase):
     self.assertEquals(32, len(Twilighted(url).extractIndividualUrls()))
 
 if __name__ == '__main__':
-  unittest.main()
\ No newline at end of file
+  unittest.main()

From c056ed0740c8b481cf4b65dfa1144f1367450e84 Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Sat, 16 Oct 2010 11:30:09 -0500
Subject: [PATCH 46/94] Fix zip routine so it checks for the mimetype file
 rather than just assuming it exists.

---
 zipdir.py | 41 +++++++++++++++++++++--------------------
 1 file changed, 21 insertions(+), 20 deletions(-)

diff --git a/zipdir.py b/zipdir.py
index 49810ed5..f9a79acf 100644
--- a/zipdir.py
+++ b/zipdir.py
@@ -45,29 +45,30 @@ def inMemoryZip(files):
 	# files have a structure of {'path/to/file' => content} dictionary
 	io = StringIO.StringIO()
 
-	# This fixes the uncompressed mimetype-first issue by opening
-	# the in memory file as STORE, putting in the mimetype, then
-	# closing and re-opening with DEFLATED.  while it is often
-	# true that mimetype is the first file, we can't assume it,
-	# because the dict object is defined as unordered.
-	path='mimetype'
-	memzip = zipfile.ZipFile(io, 'a', compression=zipfile.ZIP_STORED)
-	memzip.debug = 3
-	if type(files[path]) != type('str'):
-		data = files[path].getvalue()
-	else:
-		data = files[path]
+	if 'mimetype' in files:
+		# This fixes the uncompressed mimetype-first issue by opening
+		# the in memory file as STORE, putting in the mimetype, then
+		# closing and re-opening with DEFLATED.  while it is often
+		# true that mimetype is the first file, we can't assume it,
+		# because the dict object is defined as unordered.
+		path='mimetype'
+		memzip = zipfile.ZipFile(io, 'a', compression=zipfile.ZIP_STORED)
+		memzip.debug = 3
+		if type(files[path]) != type('str'):
+			data = files[path].getvalue()
+		else:
+			data = files[path]
 		
-	logging.debug("Writing ZIP path %s" % path)
-	try:
-		memzip.writestr(path, data.encode('utf-8'))
-	except UnicodeDecodeError, e:
-		memzip.writestr(path.encode('utf-8'), data.encode('utf-8'))
+		logging.debug("Writing ZIP path %s" % path)
+		try:
+			memzip.writestr(path, data.encode('utf-8'))
+		except UnicodeDecodeError, e:
+			memzip.writestr(path.encode('utf-8'), data.encode('utf-8'))
 		
-	memzip.close()
+		memzip.close()
 
-	# remove it from the files dict.
-	del(files['mimetype'])
+		# remove it from the files dict.
+		del(files['mimetype'])
 	
 	# open in 'a' append mode.
 	memzip = zipfile.ZipFile(io, 'a', compression=zipfile.ZIP_DEFLATED)

From 5bca3106dfef0d6a91aec40a65d45c765ad8d755 Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Wed, 20 Oct 2010 14:58:48 -0500
Subject: [PATCH 47/94] Adding a twipassword.py and a quick readme.txt.

---
 readme.txt     | 10 ++++++++++
 twipassword.py |  2 ++
 2 files changed, 12 insertions(+)
 create mode 100644 readme.txt
 create mode 100644 twipassword.py

diff --git a/readme.txt b/readme.txt
new file mode 100644
index 00000000..996efe64
--- /dev/null
+++ b/readme.txt
@@ -0,0 +1,10 @@
+To use, do:
+
+python downaloder.py <url> (epub|html)
+
+Eg:
+
+python downaloder.py http://www.fanfiction.net/s/5192986/1/A_Fox_in_Tokyo epub
+
+This tool uses Python 2.5.2, but should work with newer versions.
+
diff --git a/twipassword.py b/twipassword.py
new file mode 100644
index 00000000..466686ff
--- /dev/null
+++ b/twipassword.py
@@ -0,0 +1,2 @@
+# This is really for the web version.  downalod.py will ask.
+password='somepass'

From 33c3f0b4fd0611df7a9a128c74c4ddda05c40b9a Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Wed, 20 Oct 2010 15:02:11 -0500
Subject: [PATCH 48/94] Added tag fanficdownloader-0.2 for changeset
 3eff15bceebe


From 778deaea00bdf06bf0d616b4c37f0cc235c92f1e Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Thu, 28 Oct 2010 17:29:00 -0500
Subject: [PATCH 49/94] Replace the haphazardly collected set of html entities
 with a list of known (browser) supported entities.  Will now preserve
 right/left quotes.

---
 constants.py | 367 ++++++++++++++++++++++++++++++++++++++++++++++++++-
 1 file changed, 365 insertions(+), 2 deletions(-)

diff --git a/constants.py b/constants.py
index 2bcc1a67..e01342d9 100644
--- a/constants.py
+++ b/constants.py
@@ -115,8 +115,371 @@ acceptable_elements = ['a', 'abbr', 'acronym', 'address', 'area', 'b', 'big',
 
 acceptable_attributes = ['href']
 
-entities = { '&ndash;' : ' - ', '&mdash;' : ' - ', '&rdquo;' : '"', '&ldquo;' : '"', '&rsquo;' : '\'', 
-             '&lsquo;' : '\'', '&quot;' : '"', '&hellip;' : '...', '&amp;' : '&', '&pound;' : '£', '&nbsp;' : ' ' }
+# entity list from http://code.google.com/p/doctype/wiki/CharacterEntitiesConsistent
+# when a version without ';' is also allowed, make sure to put the version with ';' first.
+entities = { '&aacute;' : 'á',
+             '&Aacute;' : 'Á',
+             '&Aacute' : 'Á',
+             '&aacute' : 'á',
+             '&acirc;' : 'â',
+             '&Acirc;' : 'Â',
+             '&Acirc' : 'Â',
+             '&acirc' : 'â',
+             '&acute;' : '´',
+             '&acute' : '´',
+             '&AElig;' : 'Æ',
+             '&aelig;' : 'æ',
+             '&AElig' : 'Æ',
+             '&aelig' : 'æ',
+             '&agrave;' : 'à',
+             '&Agrave;' : 'À',
+             '&Agrave' : 'À',
+             '&agrave' : 'à',
+             '&alefsym;' : 'ℵ',
+             '&alpha;' : 'α',
+             '&Alpha;' : 'Α',
+             '&amp;' : '&',
+             '&AMP;' : '&',
+             '&AMP' : '&',
+             '&amp' : '&',
+             '&and;' : '∧',
+             '&ang;' : '∠',
+             '&aring;' : 'å',
+             '&Aring;' : 'Å',
+             '&Aring' : 'Å',
+             '&aring' : 'å',
+             '&asymp;' : '≈',
+             '&atilde;' : 'ã',
+             '&Atilde;' : 'Ã',
+             '&Atilde' : 'Ã',
+             '&atilde' : 'ã',
+             '&auml;' : 'ä',
+             '&Auml;' : 'Ä',
+             '&Auml' : 'Ä',
+             '&auml' : 'ä',
+             '&bdquo;' : '„',
+             '&beta;' : 'β',
+             '&Beta;' : 'Β',
+             '&brvbar;' : '¦',
+             '&brvbar' : '¦',
+             '&bull;' : '•',
+             '&cap;' : '∩',
+             '&ccedil;' : 'ç',
+             '&Ccedil;' : 'Ç',
+             '&Ccedil' : 'Ç',
+             '&ccedil' : 'ç',
+             '&cedil;' : '¸',
+             '&cedil' : '¸',
+             '&cent;' : '¢',
+             '&cent' : '¢',
+             '&chi;' : 'χ',
+             '&Chi;' : 'Χ',
+             '&circ;' : 'ˆ',
+             '&clubs;' : '♣',
+             '&cong;' : '≅',
+             '&copy;' : '©',
+             '&COPY;' : '©',
+             '&COPY' : '©',
+             '&copy' : '©',
+             '&crarr;' : '↵',
+             '&cup;' : '∪',
+             '&curren;' : '¤',
+             '&curren' : '¤',
+             '&dagger;' : '†',
+             '&Dagger;' : '‡',
+             '&darr;' : '↓',
+             '&dArr;' : '⇓',
+             '&deg;' : '°',
+             '&deg' : '°',
+             '&delta;' : 'δ',
+             '&Delta;' : 'Δ',
+             '&diams;' : '♦',
+             '&divide;' : '÷',
+             '&divide' : '÷',
+             '&eacute;' : 'é',
+             '&Eacute;' : 'É',
+             '&Eacute' : 'É',
+             '&eacute' : 'é',
+             '&ecirc;' : 'ê',
+             '&Ecirc;' : 'Ê',
+             '&Ecirc' : 'Ê',
+             '&ecirc' : 'ê',
+             '&egrave;' : 'è',
+             '&Egrave;' : 'È',
+             '&Egrave' : 'È',
+             '&egrave' : 'è',
+             '&empty;' : '∅',
+             '&emsp;' : ' ',
+             '&ensp;' : ' ',
+             '&epsilon;' : 'ε',
+             '&Epsilon;' : 'Ε',
+             '&equiv;' : '≡',
+             '&eta;' : 'η',
+             '&Eta;' : 'Η',
+             '&eth;' : 'ð',
+             '&ETH;' : 'Ð',
+             '&ETH' : 'Ð',
+             '&eth' : 'ð',
+             '&euml;' : 'ë',
+             '&Euml;' : 'Ë',
+             '&Euml' : 'Ë',
+             '&euml' : 'ë',
+             '&euro;' : '€',
+             '&exist;' : '∃',
+             '&fnof;' : 'ƒ',
+             '&forall;' : '∀',
+             '&frac12;' : '½',
+             '&frac12' : '½',
+             '&frac14;' : '¼',
+             '&frac14' : '¼',
+             '&frac34;' : '¾',
+             '&frac34' : '¾',
+             '&frasl;' : '⁄',
+             '&gamma;' : 'γ',
+             '&Gamma;' : 'Γ',
+             '&ge;' : '≥',
+             '&gt;' : '>',
+             '&GT;' : '>',
+             '&GT' : '>',
+             '&gt' : '>',
+             '&harr;' : '↔',
+             '&hArr;' : '⇔',
+             '&hearts;' : '♥',
+             '&hellip;' : '…',
+             '&iacute;' : 'í',
+             '&Iacute;' : 'Í',
+             '&Iacute' : 'Í',
+             '&iacute' : 'í',
+             '&icirc;' : 'î',
+             '&Icirc;' : 'Î',
+             '&Icirc' : 'Î',
+             '&icirc' : 'î',
+             '&iexcl;' : '¡',
+             '&iexcl' : '¡',
+             '&igrave;' : 'ì',
+             '&Igrave;' : 'Ì',
+             '&Igrave' : 'Ì',
+             '&igrave' : 'ì',
+             '&image;' : 'ℑ',
+             '&infin;' : '∞',
+             '&int;' : '∫',
+             '&iota;' : 'ι',
+             '&Iota;' : 'Ι',
+             '&iquest;' : '¿',
+             '&iquest' : '¿',
+             '&isin;' : '∈',
+             '&iuml;' : 'ï',
+             '&Iuml;' : 'Ï',
+             '&Iuml' : 'Ï',
+             '&iuml' : 'ï',
+             '&kappa;' : 'κ',
+             '&Kappa;' : 'Κ',
+             '&lambda;' : 'λ',
+             '&Lambda;' : 'Λ',
+             '&laquo;' : '«',
+             '&laquo' : '«',
+             '&larr;' : '←',
+             '&lArr;' : '⇐',
+             '&lceil;' : '⌈',
+             '&ldquo;' : '“',
+             '&le;' : '≤',
+             '&lfloor;' : '⌊',
+             '&lowast;' : '∗',
+             '&loz;' : '◊',
+             '&lrm;' : '‎',
+             '&lsaquo;' : '‹',
+             '&lsquo;' : '‘',
+             '&lt;' : '<',
+             '&LT;' : '<',
+             '&LT' : '<',
+             '&lt' : '<',
+             '&macr;' : '¯',
+             '&macr' : '¯',
+             '&mdash;' : '—',
+             '&micro;' : 'µ',
+             '&micro' : 'µ',
+             '&middot;' : '·',
+             '&middot' : '·',
+             '&minus;' : '−',
+             '&mu;' : 'μ',
+             '&Mu;' : 'Μ',
+             '&nabla;' : '∇',
+             '&nbsp;' : ' ',
+             '&nbsp' : ' ',
+             '&ndash;' : '–',
+             '&ne;' : '≠',
+             '&ni;' : '∋',
+             '&not;' : '¬',
+             '&not' : '¬',
+             '&notin;' : '∉',
+             '&nsub;' : '⊄',
+             '&ntilde;' : 'ñ',
+             '&Ntilde;' : 'Ñ',
+             '&Ntilde' : 'Ñ',
+             '&ntilde' : 'ñ',
+             '&nu;' : 'ν',
+             '&Nu;' : 'Ν',
+             '&oacute;' : 'ó',
+             '&Oacute;' : 'Ó',
+             '&Oacute' : 'Ó',
+             '&oacute' : 'ó',
+             '&ocirc;' : 'ô',
+             '&Ocirc;' : 'Ô',
+             '&Ocirc' : 'Ô',
+             '&ocirc' : 'ô',
+             '&OElig;' : 'Œ',
+             '&oelig;' : 'œ',
+             '&ograve;' : 'ò',
+             '&Ograve;' : 'Ò',
+             '&Ograve' : 'Ò',
+             '&ograve' : 'ò',
+             '&oline;' : '‾',
+             '&omega;' : 'ω',
+             '&Omega;' : 'Ω',
+             '&omicron;' : 'ο',
+             '&Omicron;' : 'Ο',
+             '&oplus;' : '⊕',
+             '&or;' : '∨',
+             '&ordf;' : 'ª',
+             '&ordf' : 'ª',
+             '&ordm;' : 'º',
+             '&ordm' : 'º',
+             '&oslash;' : 'ø',
+             '&Oslash;' : 'Ø',
+             '&Oslash' : 'Ø',
+             '&oslash' : 'ø',
+             '&otilde;' : 'õ',
+             '&Otilde;' : 'Õ',
+             '&Otilde' : 'Õ',
+             '&otilde' : 'õ',
+             '&otimes;' : '⊗',
+             '&ouml;' : 'ö',
+             '&Ouml;' : 'Ö',
+             '&Ouml' : 'Ö',
+             '&ouml' : 'ö',
+             '&para;' : '¶',
+             '&para' : '¶',
+             '&part;' : '∂',
+             '&permil;' : '‰',
+             '&perp;' : '⊥',
+             '&phi;' : 'φ',
+             '&Phi;' : 'Φ',
+             '&pi;' : 'π',
+             '&Pi;' : 'Π',
+             '&piv;' : 'ϖ',
+             '&plusmn;' : '±',
+             '&plusmn' : '±',
+             '&pound;' : '£',
+             '&pound' : '£',
+             '&prime;' : '′',
+             '&Prime;' : '″',
+             '&prod;' : '∏',
+             '&prop;' : '∝',
+             '&psi;' : 'ψ',
+             '&Psi;' : 'Ψ',
+             '&quot;' : '"',
+             '&QUOT;' : '"',
+             '&QUOT' : '"',
+             '&quot' : '"',
+             '&radic;' : '√',
+             '&raquo;' : '»',
+             '&raquo' : '»',
+             '&rarr;' : '→',
+             '&rArr;' : '⇒',
+             '&rceil;' : '⌉',
+             '&rdquo;' : '”',
+             '&real;' : 'ℜ',
+             '&reg;' : '®',
+             '&REG;' : '®',
+             '&REG' : '®',
+             '&reg' : '®',
+             '&rfloor;' : '⌋',
+             '&rho;' : 'ρ',
+             '&Rho;' : 'Ρ',
+             '&rlm;' : '‏',
+             '&rsaquo;' : '›',
+             '&rsquo;' : '’',
+             '&sbquo;' : '‚',
+             '&scaron;' : 'š',
+             '&Scaron;' : 'Š',
+             '&sdot;' : '⋅',
+             '&sect;' : '§',
+             '&sect' : '§',
+             '&shy;' : '­', # strange optional hyphenation control character, not just a dash
+             '&shy' : '­',
+             '&sigma;' : 'σ',
+             '&Sigma;' : 'Σ',
+             '&sigmaf;' : 'ς',
+             '&sim;' : '∼',
+             '&spades;' : '♠',
+             '&sub;' : '⊂',
+             '&sube;' : '⊆',
+             '&sum;' : '∑',
+             '&sup1;' : '¹',
+             '&sup1' : '¹',
+             '&sup2;' : '²',
+             '&sup2' : '²',
+             '&sup3;' : '³',
+             '&sup3' : '³',
+             '&sup;' : '⊃',
+             '&supe;' : '⊇',
+             '&szlig;' : 'ß',
+             '&szlig' : 'ß',
+             '&tau;' : 'τ',
+             '&Tau;' : 'Τ',
+             '&there4;' : '∴',
+             '&theta;' : 'θ',
+             '&Theta;' : 'Θ',
+             '&thetasym;' : 'ϑ',
+             '&thinsp;' : ' ',
+             '&thorn;' : 'þ',
+             '&THORN;' : 'Þ',
+             '&THORN' : 'Þ',
+             '&thorn' : 'þ',
+             '&tilde;' : '˜',
+             '&times;' : '×',
+             '&times' : '×',
+             '&trade;' : '™',
+             '&uacute;' : 'ú',
+             '&Uacute;' : 'Ú',
+             '&Uacute' : 'Ú',
+             '&uacute' : 'ú',
+             '&uarr;' : '↑',
+             '&uArr;' : '⇑',
+             '&ucirc;' : 'û',
+             '&Ucirc;' : 'Û',
+             '&Ucirc' : 'Û',
+             '&ucirc' : 'û',
+             '&ugrave;' : 'ù',
+             '&Ugrave;' : 'Ù',
+             '&Ugrave' : 'Ù',
+             '&ugrave' : 'ù',
+             '&uml;' : '¨',
+             '&uml' : '¨',
+             '&upsih;' : 'ϒ',
+             '&upsilon;' : 'υ',
+             '&Upsilon;' : 'Υ',
+             '&uuml;' : 'ü',
+             '&Uuml;' : 'Ü',
+             '&Uuml' : 'Ü',
+             '&uuml' : 'ü',
+             '&weierp;' : '℘',
+             '&xi;' : 'ξ',
+             '&Xi;' : 'Ξ',
+             '&yacute;' : 'ý',
+             '&Yacute;' : 'Ý',
+             '&Yacute' : 'Ý',
+             '&yacute' : 'ý',
+             '&yen;' : '¥',
+             '&yen' : '¥',
+             '&yuml;' : 'ÿ',
+             '&Yuml;' : 'Ÿ',
+             '&yuml' : 'ÿ',
+             '&zeta;' : 'ζ',
+             '&Zeta;' : 'Ζ',
+             '&zwj;' : '‍',  # strange spacing control character, not just a space
+             '&zwnj;' : '‌',  # strange spacing control character, not just a space
+             }
 
 FB2_PROLOGUE = '<FictionBook>'
 FB2_DESCRIPTION = '''<description>

From 379efc34f17acbd75b05c6ebc8516d295a6e941e Mon Sep 17 00:00:00 2001
From: wsuetholz <wsuetholz@localhost>
Date: Tue, 9 Nov 2010 16:35:46 -0600
Subject: [PATCH 50/94] Add a title page to the resulting EPUB file.  This
 required scraping more information from the web pages in order to populate
 the new fields.  This change includes a change to the way that the output.py
 uses the adapters.  It now gets passed in the adapter and then calls
 functions from the adapter in order to retrieve the scraped information. 
 This will make it easier down the road when adding more information, or even
 pictures.

---
 adapter.py                     |  73 +++++-
 constants.py                   |  82 ++++--
 downaloder.py => downloader.py |   9 +-
 ffnet.py                       | 293 +++++++++++++++++++++-
 fictionalley.py                | 269 +++++++++++++++++++-
 ficwad.py                      | 288 +++++++++++++++++++--
 hpfiction.py                   | 226 ++++++++++++++++-
 output.py                      |  67 +++--
 twilighted.py                  | 439 +++++++++++++++++++++++++--------
 9 files changed, 1577 insertions(+), 169 deletions(-)
 rename downaloder.py => downloader.py (91%)

diff --git a/adapter.py b/adapter.py
index bf37a017..246f4177 100644
--- a/adapter.py
+++ b/adapter.py
@@ -29,11 +29,80 @@ class FanfictionSiteAdapter:
 	def setPassword(self, password):
 		pass
 
-	def getStoryName(self):
+	def getStoryURL(self):
+		pass
+
+	def getUUID(self):
+		pass
+
+	def getOutputName(self):
+		pass
+
+	def getAuthorURL(self):
+		pass
+
+	def getAuthorId(self):
 		pass
 
 	def getAuthorName(self):
 		pass
 
+	def getStoryId(self):
+		pass
+
+	def getStoryName(self):
+		pass
+
+	def getStoryDescription(self):
+		pass
+
+	def getStoryCreated(self):
+		pass
+
+	def getStoryPublished(self):
+		pass
+
+	def getStoryUpdated(self):
+		pass
+
+	def getStorySeries(self):
+		pass
+
+	def getLanguage(self):
+		pass
+
+	def getLanguageId(self):
+		pass
+
+	def getSubjects(self):
+		pass
+
+	def getCharacters(self):
+		pass
+
+	def getPublisher(self):
+		pass
+
+	def getNumChapters(self):
+		pass
+
+	def getNumWords(self):
+		pass
+
+	def getCategory(self):
+		pass
+
+	def getGenre(self):
+		pass
+
+	def getStoryStatus(self):
+		pass
+
+	def getStoryRating(self):
+		pass
+
+	def getStoryUserRating(self):
+		pass
+
 	def getPrintableUrl(self, url):
-		pass
\ No newline at end of file
+		pass
diff --git a/constants.py b/constants.py
index e01342d9..6ea1f086 100644
--- a/constants.py
+++ b/constants.py
@@ -15,6 +15,9 @@ h6 { text-align: center; }
     padding:0px;
     }
 .center   {text-align: center;}
+.cover    {text-align: center;}
+.full     {width: 100%; }
+.quarter  {width: 25%; }
 .smcap    {font-variant: small-caps;}
 .u        {text-decoration: underline;}
 .bold     {font-weight: bold;}
@@ -22,6 +25,37 @@ h6 { text-align: center; }
 
 MIMETYPE = '''application/epub+zip'''
 
+TITLE_PAGE = '''<html xmlns="http://www.w3.org/1999/xhtml" xmlns:xlink="http://www.w3.org/1999/xlink"><head><meta http-equiv="Content-Type" content="text/html; charset=utf-8"/>
+<title>%s - %s</title><link href="stylesheet.css" type="text/css" charset="UTF-8" rel="stylesheet"/></head>
+<body><div class="cover">
+<h1 id="cfs_0"><a id="StoryLink" href="%s">%s</a></h1>
+<h2 id="cfs_1">by <a id="AuthorLink" href="%s">%s</a></h2>
+</div><div style="text-align:center">
+<table class="full">
+<colgroup span="2"></colgroup>
+<tr><td> </td>
+<td> </td>
+</tr><tr><td> </td>
+<td> </td>
+</tr><tr><td><b>Category:</b></td><td>%s</td>
+</tr><tr><td><b>Genre:</b></td><td>%s</td>
+</tr><tr><td><b>Status:</b></td><td>%s</td>
+</tr><tr><td><b>Published:</b></td><td>%s</td>
+</tr><tr><td><b>Updated:</b></td><td>%s</td>
+</tr><tr><td><b>Packaged:</b></td><td>%s</td>
+</tr><tr><td><b>Rating Age/User:</b></td><td>%s / %s</td>
+</tr><tr><td><b>Chapters/Words:</b></td><td>%s / %s</td>
+</tr><tr><td><b>URL:</b></td><td><h3 id="url0"><a id="StoryURL" href="%s">%s</a></h3></td>
+</tr><tr><td><b>Summary:</b></td>
+</tr><tr><td colspan="2">%s</td>
+</tr><tr><td> </td>
+<td> </td>
+</tr><tr><td> </td>
+<td> </td>
+</tr></table></div>
+<div class="full" id="pb_0"/></body></html>
+'''
+
 CONTAINER = '''<?xml version="1.0"?>
 <container version="1.0" xmlns="urn:oasis:names:tc:opendocument:xmlns:container">
   <rootfiles>
@@ -30,42 +64,60 @@ CONTAINER = '''<?xml version="1.0"?>
 </container>
 '''
 
-CONTENT_START = '''<?xml version="1.0"?>
+CONTENT_START = '''<?xml version="1.0" encoding="utf-8"?>
 <package version="2.0" xmlns="http://www.idpf.org/2007/opf"
-         unique-identifier="BookID">
- <metadata xmlns:dc="http://purl.org/dc/elements/1.1/"
-           xmlns:opf="http://www.idpf.org/2007/opf">
+         unique-identifier="fanficdownloader-uuid">
+ <metadata xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+           xmlns:dc="http://purl.org/dc/elements/1.1/"
+           xmlns:dcterms="http://purl.org/dc/terms/"
+           xmlns:opf="http://www.idpf.org/2007/opf"
+           xmlns:calibre="http://calibre.kovidgoyal.net/2009/metadata">
+   <dc:identifier id="fanficdownloader-uuid">BookID-Epub-%s</dc:identifier>
    <dc:title>%s</dc:title> 
    <dc:creator opf:role="aut">%s</dc:creator>
-   <dc:language>en-UK</dc:language> 
+   <dc:contributor opf:role="bkp">fanficdownloader [http://fanficdownloader.googlecode.com]</dc:contributor>
+   <dc:language>%s</dc:language> 
    <dc:rights></dc:rights>
-   <dc:subject>fanfiction</dc:subject> 
-   <dc:publisher>sgzmd</dc:publisher> 
-   <dc:identifier id="BookID">%s</dc:identifier>
+   <dc:date opf:event="publication">%s</dc:date>
+   <dc:date opf:event="creation">%s</dc:date>
+   <dc:date opf:event="modification">%s</dc:date>
+   <meta name="calibre:timestamp" content="%s"/>
+   <dc:description>%s</dc:description>
+'''
+
+CONTENT_END_METADATA = '''   <dc:publisher>%s</dc:publisher> 
+   <dc:identifier id="BookId">%s</dc:identifier>
+   <dc:identifier opf:scheme="URL">%s</dc:identifier>
+   <dc:source>%s</dc:source>
+   <dc:type>FanFiction</dc:type>
+   <meta name="calibre:rating" content="%s"/>
  </metadata>
  <manifest>
   <item id="ncx" href="toc.ncx" media-type="application/x-dtbncx+xml"/>
   <item id="style" href="stylesheet.css" media-type="text/css" />
 '''
 
-CONTENT_ITEM = '''<item id="%s" href="%s" media-type="application/xhtml+xml" />
+CONTENT_SUBJECT = '''   <dc:subject>%s</dc:subject> 
 '''
 
-CONTENT_END_MANIFEST = '''</manifest>
-<spine toc="ncx">
+CONTENT_ITEM = '''  <item id="%s" href="%s" media-type="application/xhtml+xml" />
 '''
 
-CONTENT_ITEMREF = '''<itemref idref="%s" />
+CONTENT_END_MANIFEST = ''' </manifest>
+ <spine toc="ncx">
 '''
 
-CONTENT_END = '''</spine>
+CONTENT_ITEMREF = '''  <itemref idref="%s" />
+'''
+
+CONTENT_END = ''' </spine>
 </package>
 '''
 
 TOC_START = '''<?xml version="1.0" encoding="UTF-8"?>
 <ncx xmlns="http://www.daisy.org/z3986/2005/ncx/" version="2005-1">
   <head>
-    <meta name="dtb:uid" content="sigizmund.com062820072147132"/>
+    <meta name="dtb:uid" content="%s"/>
     <meta name="dtb:depth" content="1"/>
     <meta name="dtb:totalPageCount" content="0"/>
     <meta name="dtb:maxPageNumber" content="0"/>
@@ -502,3 +554,5 @@ FB2_DESCRIPTION = '''<description>
 <version>2.0</version>
 </document-info>
 </description>'''
+
+HTML_ESC_Definitions = 'HTML_Escape.def'
diff --git a/downaloder.py b/downloader.py
similarity index 91%
rename from downaloder.py
rename to downloader.py
index b8af3abe..f8ca80c6 100644
--- a/downaloder.py
+++ b/downloader.py
@@ -34,6 +34,7 @@ class FanficLoader:
 		self.inmemory = inmemory
 		self.compress = compress
 		self.badLogin = False
+		self.overWrite = True
 	
 	def getAdapter():
 		return self.adapter
@@ -48,7 +49,13 @@ class FanficLoader:
 				raise adapter.LoginRequiredException(self.adapter.url)
 		
 		urls = self.adapter.extractIndividualUrls()
-		self.writer = self.writerClass(self.booksDirectory, self.adapter.getStoryName(), self.adapter.getAuthorName(), inmemory=self.inmemory, compress=self.compress)
+
+		s = self.booksDirectory + "/" + self.adapter.getOutputName() + "." + format
+		if not self.overWrite and os.path.isfile(s):
+			print >> sys.stderr, "File " + s + " already exists!  Skipping!"
+			exit(10)
+
+		self.writer = self.writerClass(self.booksDirectory, self.adapter, inmemory=self.inmemory, compress=self.compress)
 		
 		i = 1
 		for u,n in urls:
diff --git a/ffnet.py b/ffnet.py
index f3e101fc..7320ec5a 100644
--- a/ffnet.py
+++ b/ffnet.py
@@ -15,6 +15,8 @@ import urllib2 as u2
 import urlparse as up
 import BeautifulSoup as bs
 import htmlentitydefs as hdefs
+import time
+import datetime
 
 from constants import *
 from adapter import *
@@ -40,10 +42,37 @@ class FFNet(FanfictionSiteAdapter):
 		
 		self.storyName = 'FF.Net story'
 		self.authorName = 'FF.Net author'
+		self.outputName = 'FF.Net_story'
+		self.storyDescription = 'Fanfiction Story'
+		self.storyCharacters = []
+		self.storySeries = ''
+		self.authorId = '0'
+		self.authorURL = self.path
+		self.storyId = '0'
+		self.storyPublished = datetime.date(1970, 01, 31)
+		self.storyCreated = datetime.datetime.now()
+		self.storyUpdated = datetime.date(1970, 01, 31)
+		self.languageId = 'en-UK'
+		self.language = 'English'
+		self.subjects = []
+		self.subjects.append ('FanFiction')
+		logging.debug('self.subjects=%s' % self.subjects)
+		self.publisher = self.host
+		self.numChapters = 0
+		self.numWords = 0
+		self.genre = 'FanFiction'
+		self.category = 'FF.Net Category'
+		self.storyStatus = 'In-Progress'
+		self.storyRating = 'K'
+		self.storyUserRating = '0'
 		
+		logging.debug('self.path=%s' % self.path)
+
 		spl = self.path.split('/')
+		logging.debug('spl=%s' % spl)
 		if len(spl) == 5:
 			self.path = "/".join(spl[1:-1])
+			self.outputName = spl[4] + '-ffnet_' + spl[2]
 		
 		if self.path.startswith('/'):
 			self.path = self.path[1:]
@@ -51,10 +80,14 @@ class FFNet(FanfictionSiteAdapter):
 		if self.path.endswith('/'):
 			self.path = self.path[:-1]
 		
+		logging.debug('self.path=%s' % self.path)
+
 		(s, self.storyId, chapter) = self.path.split('/')
 		
-		logging.debug('self.storyId=%s, chapter=%s' % (self.storyId, chapter))
-		
+		self.uuid = 'urn:uuid:' + self.host + '-u.' + self.authorId + '-s.' + self.storyId
+		logging.debug('self.uuid=%s' % self.uuid)
+
+		logging.debug('self.storyId=%s, chapter=%s, self.outputName=%s' % (self.storyId, chapter, self.outputName))
 		if not appEngine:
 			self.opener = u2.build_opener(u2.HTTPCookieProcessor())
 		else:
@@ -70,7 +103,70 @@ class FFNet(FanfictionSiteAdapter):
 
 	def performLogin(self, url = None):
 		return True
+
+	def _getVarValue(self, varstr):
+		# Return the right-hand side of a "var name = value;" line as a string.
+		vals = varstr.split('=')
+		# Re-join on '=' so a value that itself contains '=' is returned intact.
+		retstr = "=".join(vals[1:])
+		# Drop the single leading space and trailing ';' left from the statement.
+		if retstr.startswith(' '):
+			retstr = retstr[1:]
+		if retstr.endswith(';'):
+			retstr = retstr[:-1]
+		return retstr
 	
+	def _splitCrossover(self, subject):
+		# Record a category: "A and B Crossover" adds "Crossover", "A" and "B"; others are added as-is.
+		if "Crossover" in subject:
+			self._addSubject ("Crossover")
+			logging.debug('Crossover=%s' % subject)
+			if subject.find(' and ') != -1:
+				words = subject.split(' ')
+				logging.debug('words=%s' % words)
+				subj = ''
+				for s in words:
+					# Compare whole words; a substring test would also swallow e.g. "Cross" or "a".
+					if s in ("and", "Crossover"):
+						if len(subj) > 0:
+							self._addSubject(subj)
+						subj = ''
+					else:
+						if len(subj) > 0:
+							subj = subj + ' '
+						subj = subj + s
+				if len(subj) > 0:
+					self._addSubject(subj)
+				return True
+		self._addSubject(subject)
+		return True
+
+	def _splitGenre(self, subject):
+		# Add each non-empty '/'-separated part of subject (e.g. "Humor/Drama") as a subject.
+		if len(subject) > 0:
+			words = subject.split('/')
+			logging.debug('words=%s' % words)
+			for subj in [w for w in words if len(w) > 0]:
+				self._addSubject(subj)
+		return True
+
+	def _addSubject(self, subject):
+		# Append subject unless an entry that is equal ignoring case is already
+		# present. Returns True when appended, False for a duplicate.
+		wanted = subject.upper()
+		if any(existing.upper() == wanted for existing in self.subjects):
+			return False
+		self.subjects.append(subject)
+		return True
+
+	def _addCharacter(self, character):
+		# Append character unless already listed (ignoring case); True when appended.
+		wanted = character.upper()
+		if any(known.upper() == wanted for known in self.storyCharacters):
+			return False
+		self.storyCharacters.append(character)
+		return True
+
 	def _fetchUrl(self, url):
 		if not appEngine:
 			return self.opener.open(url).read().decode('utf-8')
@@ -85,6 +181,8 @@ class FFNet(FanfictionSiteAdapter):
 		for a in allA:
 			if 'href' in a._getAttrMap() and a['href'].find('/u/') != -1:
 				self.authorName = a.string
+				(u1, u2, self.authorId, u3) = a['href'].split('/')
+				logging.debug('self.authorId=%s self.authorName=%s' % (self.authorId, self.authorName))
 
 		urls = []
 		lines = data.split('\n')
@@ -92,9 +190,38 @@ class FFNet(FanfictionSiteAdapter):
 			if l.find("&#187;") != -1 and l.find('<b>') != -1:
 				s2 = bs.BeautifulStoneSoup(l)
 				self.storyName = str(s2.find('b').string)
+				logging.debug('self.storyId=%s self.storyName=%s' % (self.storyId, self.storyName))
 			elif l.find("<a href='/u/") != -1:
 				s2 = bs.BeautifulStoneSoup(l)
 				self.authorName = str(s2.a.string)
+				(u1, u2, self.authorId, u3) = s2.a['href'].split('/')
+				logging.debug('self.authorId=%s self.authorName=%s' % (self.authorId, self.authorName))
+			elif l.find("Rated: <a href=") != -1:
+				s2 = bs.BeautifulStoneSoup(l)
+				self.storyRating = str(s2.a.string).strip()
+				logging.debug('self.storyRating=%s' % self.storyRating)
+				logging.debug('s2.a=%s' % s2.a)
+				s3 = l.split('-')
+				logging.debug('s3=%s' % s3)
+				if len(s3) > 0:
+					if s3[1].find("Reviews: <a href=") != -1:
+						continue
+					self.language = s3[1].strip()
+					logging.debug('self.language=%s' % self.language)
+					if len(s3) > 1:
+						if s3[2].find("Reviews: <a href=") != -1:
+							continue
+						self.genre = s3[2].strip()
+						if "&" in self.genre:
+							self.genre = ''
+							continue
+						logging.debug('self.genre=%s' % self.genre)
+						self._splitGenre(self.genre)
+						logging.debug('self.subjects=%s' % self.subjects)
+				if "Complete" in l:
+					self.storyStatus = 'Completed'
+				else:
+					self.storyStatus = 'In-Progress'
 			elif l.find("<SELECT title='chapter navigation'") != -1:
 				if len(urls) > 0:
 					continue
@@ -102,6 +229,8 @@ class FFNet(FanfictionSiteAdapter):
 					u = l.decode('utf-8')
 				except UnicodeEncodeError, e:
 					u = l
+				except:
+					u = l.encode('ascii', 'xmlcharrefreplace')
 				u = re.sub('&\#[0-9]+;', ' ', u)
 				s2 = bs.BeautifulSoup(u)
 				options = s2.findAll('option')
@@ -110,19 +239,69 @@ class FFNet(FanfictionSiteAdapter):
 					title = o.string
 					logging.debug('URL = `%s`, Title = `%s`' % (url, title))
 					urls.append((url,title))
-		if len(urls) == 0:
+			elif l.find("var chapters") != -1:
+				self.numChapters = self._getVarValue (l)
+				logging.debug('self.numChapters=%s' % self.numChapters)
+			elif l.find("var words") != -1:
+				self.numWords = self._getVarValue (l)
+				logging.debug('self.numWords=%s' % self.numWords)
+			elif l.find("var categoryid") != -1:
+				categoryid = self._getVarValue (l)
+				logging.debug('categoryid=%s' % categoryid)
+			elif l.find("var cat_title") != -1:
+				self.category = self._getVarValue (l).strip("'")
+				logging.debug('self.category=%s' % self.category)
+				self._splitCrossover(self.category)
+				logging.debug('self.subjects=%s' % self.subjects)
+			elif l.find("var summary") != -1:
+				self.storyDescription = self._getVarValue (l).strip("'")
+				if '&' in self.storyDescription:
+					s = self.storyDescription.split('&')
+					logging.debug('s=%s' % s)
+					self.storyDescription = ''
+					for ss in s:
+						if len(self.storyDescription) > 0:
+							if len(ss) > 4 and 'amp;' in ss[1:4]:
+								self.storyDescription = self.storyDescription + '&' + ss
+							else:
+								self.storyDescription = self.storyDescription + '&amp;' + ss
+						else:
+							self.storyDescription = ss
+				logging.debug('self.storyDescription=%s' % self.storyDescription)
+			elif l.find("var datep") != -1:
+				dateps = self._getVarValue (l)
+				self.storyPublished = datetime.datetime(*time.strptime ( dateps, "'%m-%d-%y'" )[0:5])
+				logging.debug('self.storyPublished=%s' % self.storyPublished.strftime("%Y-%m-%dT%I:%M:%S"))
+			elif l.find("var dateu") != -1:
+				dateus = self._getVarValue (l)
+				self.storyUpdated = datetime.datetime(*time.strptime ( dateus, "'%m-%d-%y'" )[0:5])
+				logging.debug('self.storyUpdated=%s' % self.storyUpdated.strftime("%Y-%m-%dT%I:%M:%S"))
+		
+		if len(urls) <= 0:
 			# no chapters found, try url by itself.
 			urls.append((self.url,self.storyName))
+
+		self.uuid = 'urn:uuid:' + self.host + '-a.' + self.authorId + '-s.' + self.storyId
+		self.authorURL = 'http://' + self.host + '/u/' + self.authorId
+		logging.debug('self.uuid=%s' % self.uuid)
+
+		#logging.debug('urls=%s' % urls)
 		return urls
 	
 	def getText(self, url):
+		time.sleep( 2.0 )
 		data = self._fetchUrl(url)
+		lines = data.split('\n')
+		
+		textbuf = ''
+		emit = False
+		
 		olddata = data
 		try:
 			data = data.decode('utf8')
 		except:
 			data = olddata
-
+		
 		try:
 			soup = bs.BeautifulStoneSoup(data)
 		except:
@@ -131,23 +310,121 @@ class FFNet(FanfictionSiteAdapter):
 		div = soup.find('div', {'id' : 'storytext'})
 		if None == div:
 			logging.error("Error downloading Chapter: %s" % url)
-			exit(1)
+			exit (20)
 			return '<html/>'
 			
 		return div.__str__('utf8')
-		
+					
 	def setLogin(self, login):
 		self.login = login
 
 	def setPassword(self, password):
 		self.password = password
 
-	def getStoryName(self):
-		return self.storyName
+	def getStoryURL(self):
+		logging.debug('self.url=%s' % self.url)
+		return self.url
+
+	def getUUID(self):
+		logging.debug('self.uuid=%s' % self.uuid)
+		return self.uuid
+
+	def getOutputName(self):
+		logging.debug('self.storyId=%s, self.storyName=%s self.outputName=%s' % (self.storyId, self.storyName, self.outputName))
+		return self.outputName
 
 	def getAuthorName(self):
+		logging.debug('self.authorName=%s' % self.authorName)
 		return self.authorName
 
+	def getAuthorId(self):
+		logging.debug('self.authorId=%s' % self.authorId)
+		return self.authorId
+
+	def getAuthorURL(self):
+		logging.debug('self.authorURL=%s' % self.authorURL)
+		return self.authorURL
+
+	def getStoryId(self):
+		logging.debug('self.storyId=%s' % self.storyId)
+		return self.storyId
+
+	def getStoryName(self):
+		logging.debug('self.storyName=%s' % self.storyName)
+		return self.storyName
+
+	def getStoryDescription(self):
+		logging.debug('self.storyDescription=%s' % self.storyDescription)
+		return self.storyDescription
+
+	def getStoryPublished(self):
+		logging.debug('self.storyPublished=%s' % self.storyPublished)
+		return self.storyPublished
+
+	def getStoryCreated(self):
+		self.storyCreated = datetime.datetime.now()  # overwritten on every call with the current time
+		logging.debug('self.storyCreated=%s' % self.storyCreated)
+		return self.storyCreated
+
+	def getStoryUpdated(self):
+		logging.debug('self.storyUpdated=%s' % self.storyUpdated)
+		return self.storyUpdated
+
+	def getLanguage(self):
+		logging.debug('self.language=%s' % self.language)
+		return self.language
+
+	def getLanguageId(self):
+		logging.debug('self.languageId=%s' % self.languageId)
+		return self.languageId
+
+	def getSubjects(self):  # Return the list of subjects collected for the story.
+		logging.debug('self.subjects=%s' % self.subjects)  # log the value that is actually returned
+		return self.subjects
+
+	def getPublisher(self):
+		logging.debug('self.publisher=%s' % self.publisher)
+		return self.publisher
+
+	def getNumChapters(self):
+		logging.debug('self.numChapters=%s' % self.numChapters)
+		return self.numChapters
+
+	def getNumWords(self):
+		logging.debug('self.numWords=%s' % self.numWords)
+		return self.numWords
+
+	def getCategory(self):
+		logging.debug('self.category=%s' % self.category)
+		return self.category
+
+	def getGenre(self):
+		logging.debug('self.genre=%s' % self.genre)
+		return self.genre
+
+	def getStoryStatus(self):
+		logging.debug('self.storyStatus=%s' % self.storyStatus)
+		return self.storyStatus
+
+	def getStoryRating(self):
+		logging.debug('self.storyRating=%s' % self.storyRating)
+		return self.storyRating
+
+	def getStoryUserRating(self):
+		logging.debug('self.storyUserRating=%s' % self.storyUserRating)
+		return self.storyUserRating
+
+	def getPrintableUrl(self, url):
+		pass
+
+	def getStoryCharacters(self):
+		logging.debug('self.storyCharacters=%s' % self.storyCharacters)
+		return self.storyCharacters
+	
+	def getStorySeries(self):
+		logging.debug('self.storySeries=%s' % self.storySeries)
+		return self.storySeries
+		
 class FFA_UnitTests(unittest.TestCase):
 	def setUp(self):
 		logging.basicConfig(level=logging.DEBUG)
diff --git a/fictionalley.py b/fictionalley.py
index 884720fd..20763bf9 100644
--- a/fictionalley.py
+++ b/fictionalley.py
@@ -12,13 +12,20 @@ import urlparse as up
 import BeautifulSoup as bs
 import htmlentitydefs as hdefs
 import time as time
+import datetime
 from adapter import *
 
 
 class FictionAlley(FanfictionSiteAdapter):
 	def __init__(self, url):
 		self.url = url
-		self.host = up.urlparse(url).netloc
+		parsedUrl = up.urlparse(url)
+		self.host = parsedUrl.netloc
+		self.path = parsedUrl.path
+		
+		logging.debug('self.host=%s' % self.host)
+		logging.debug('self.path=%s' % self.path)
+
 		cookieproc = u2.HTTPCookieProcessor()
 
 		# FictionAlley wants a cookie to prove you're old enough to read R+ rated stuff.
@@ -35,6 +42,36 @@ class FictionAlley(FanfictionSiteAdapter):
 					  rfc2109=False)
 		cookieproc.cookiejar.set_cookie(cookie)
 		self.opener = u2.build_opener(cookieproc)
+
+		ss = self.path.split('/')
+		
+		self.storyDescription = 'Fanfiction Story'
+		self.authorId = ''
+		self.authorURL = ''
+		self.storyId = ''
+		if len(ss) > 2 and ss[1] == 'authors':
+			self.authorId = ss[2]
+			self.authorURL = 'http://' + self.host + '/authors/' + self.authorId
+			if len(ss) > 3:
+				self.storyId = ss[3].replace ('.html','')
+		self.storyPublished = datetime.date(1970, 01, 31)
+		self.storyCreated = datetime.datetime.now()
+		self.storyUpdated = datetime.date(1970, 01, 31)
+		self.languageId = 'en-UK'
+		self.language = 'English'
+		self.subjects = []
+		self.subjects.append ('fanfiction')
+		self.publisher = self.host
+		self.numChapters = 0
+		self.numWords = 0
+		self.genre = 'FanFiction'
+		self.category = 'Category'
+		self.storyStatus = 'In-Progress'
+		self.storyRating = 'K'
+		self.storyUserRating = '0'
+		self.storyCharacters = []
+		self.storySeries = ''
+	
 		
 	def requiresLogin(self, url = None):
 		return False
@@ -48,31 +85,147 @@ class FictionAlley(FanfictionSiteAdapter):
 	def setPassword(self, password):
 		self.password = password
 	
+	def _addSubject(self, subject):
+		# Case-insensitive de-duplicating append; returns True only when added.
+		wanted = subject.upper()
+		if any(known.upper() == wanted for known in self.subjects):
+			return False
+		self.subjects.append(subject)
+		return True
+
+	def _addCharacter(self, character):
+		# Case-insensitive de-duplicating append; returns True only when added.
+		wanted = character.upper()
+		if any(known.upper() == wanted for known in self.storyCharacters):
+			return False
+		self.storyCharacters.append(character)
+		return True
+
+	def _processChapterHeaders(self, div):  # Copy Rating / Genre / Main Character(s) / Summary values found under `div` onto self.
+		brs = div.findAll ('br')
+		for br in brs:
+			keystr=''
+			valstr=''
+			if len(br.contents) > 2:  # needs at least three child nodes: [1] is read as the key, [2] as the value
+				keystr = br.contents[1]
+				if keystr is not None:
+					strs = re.split ("<[^>]+>", str(keystr))  # drop markup, keeping only the text between tags
+					keystr=''
+					for s in strs:
+						keystr = keystr + s					
+				valstr = br.contents[2].strip(' ')  # NOTE(review): assumes contents[2] is a text node - confirm
+			if keystr is not None:
+				if keystr == 'Rating:':
+					self.storyRating = valstr
+					logging.debug('self.storyRating=%s' % self.storyRating)
+				elif keystr == 'Genre:':
+					self.genre = valstr
+					logging.debug('self.genre=%s' % self.genre)
+					s2 = valstr.split(', ')  # each comma-separated genre is also recorded as a subject
+					for ss2 in s2:
+						self._addSubject(ss2)
+					logging.debug('self.subjects=%s' % self.subjects)
+				elif keystr == 'Main Character(s):':
+					s2 = valstr.split(', ')  # comma-separated character names, de-duplicated by _addCharacter
+					for ss2 in s2:
+						self._addCharacter(ss2)
+					logging.debug('self.storyCharacters=%s' % self.storyCharacters)
+				elif keystr == 'Summary:':
+					self.storyDescription = valstr
+					logging.debug('self.storyDescription=%s' % self.storyDescription)
+	
+		
 	def extractIndividualUrls(self):
 		data = self.opener.open(self.url).read()		
+		
+		# There is some useful information in the headers of the first chapter page.
+		data = data.replace('<!-- headerstart -->','<crazytagstringnobodywouldstumbleonaccidently id="storyheaders">').replace('<!-- headerend -->','</crazytagstringnobodywouldstumbleonaccidently>')
 		soup = bs.BeautifulStoneSoup(data)
 				
 		# Get title from <title>, remove before '-'.
 		title = soup.find('title').string
 		self.storyName = "-".join(title.split('-')[1:]).strip().replace(" (Story Text)","")
+		self.outputName = self.storyName.replace(" ", "_") + '-fa_' + self.storyId
 		
-		links = soup.findAll('a', { 'class' : 'chapterlink' } )
+		links = soup.findAll('li')
 
+		# If it is decided that we really do care about number of words..  It's only available on the author's page..
+		#d0 = self.opener.open(self.authorURL).read()
+		#soupA = bs.BeautifulStoneSoup(d0)
+		#dls = soupA.findAll('dl')
+		#logging.debug('dls=%s' % dls)
+		
+		self.numChapters = 0;
 		result = []
 		if len(links) == 0:
+			# Be aware that this means the user has entered the {STORY}01.html URL.
+			# We will not have valid Published and Updated dates.  The user should enter
+			# the {STORY}.html URL instead.  We should force that instead of this.
 			breadcrumbs = soup.find('div', {'class': 'breadcrumbs'})
 			self.authorName = breadcrumbs.a.string.replace("'s Fics","")
 			result.append((self.url,self.storyName))
+			#logging.debug('chapter[%s]=%s, %s' % (self.numChapters+1,self.url,self.storyName))
+			self.numChapters = self.numChapters + 1;
+			div = soup.find('crazytagstringnobodywouldstumbleonaccidently', {'id' : 'storyheaders'})
+			if div is not None:
+				self._processChapterHeaders(div)
 		else:
 			author = soup.find('h1', {'class' : 'title'})
 			self.authorName = author.a.string
 			
-			for a in links:
-				url = a['href']
-				title = a.string
-				result.append((url,title))
+			summary = soup.find('div', {'class' : 'summary'})
+			ss = summary.contents
+			if len(ss) > 1:
+				ss1 = ss[0].split(': ')
+				if len(ss1) > 1 and ss1[0] == 'Rating':
+					self.storyRating = ss1[1]
+					logging.debug('self.storyRating=%s' % self.storyRating)
+				self.storyDescription = str(ss[1]).replace("<br>","").replace("</br>","").replace('\n','')
+				logging.debug('self.storyDescription=%s' % self.storyDescription)
+			
+			for li in links:
+				a = li.find('a', {'class' : 'chapterlink'})
+				s = li.contents
+				if a is not None:
+					url = a['href']
+					title = a.string
+					result.append((url,title))
+					#logging.debug('chapter[%s]=%s, %s' % (self.numChapters+1,url,title))
+					if self.numChapters == 0:
+						# fictionalley uses full URLs in chapter list.
+						d1 = self.opener.open(url).read()
+						
+						# find <!-- headerstart --> & <!-- headerend --> and
+						# replaced with matching div pair for easier parsing.
+						# Yes, it's an evil kludge, but what can ya do?  Using
+						# something other than div prevents soup from pairing
+						# our div with poor html inside the story text.
+						d1 = d1.replace('<!-- headerstart -->','<crazytagstringnobodywouldstumbleonaccidently id="storyheaders">').replace('<!-- headerend -->','</crazytagstringnobodywouldstumbleonaccidently>')
+						sop = bs.BeautifulStoneSoup(d1)
+						
+						div = sop.find('crazytagstringnobodywouldstumbleonaccidently', {'id' : 'storyheaders'})
+						if div is not None:
+							self._processChapterHeaders(div)
+							
+					self.numChapters = self.numChapters + 1
+					if len(s) > 1:
+						datestr=''
+						ss2 = s[1].replace('\n','').replace('(','').split(' ')
+						if len(ss2) > 2 and ss2[0] == 'Posted:':
+							datestr = ss2[1] + ' ' + ss2[2]
+							tmpdate = datetime.datetime.fromtimestamp(time.mktime(time.strptime(datestr.strip(' '), "%Y-%m-%d %H:%M:%S")))
+							if self.numChapters == 1:
+								self.storyPublished = tmpdate
+							self.storyUpdated = tmpdate
+						logging.debug('self.storyPublished=%s, self.storyUpdated=%s' % (self.storyPublished, self.storyUpdated))
+				else:
+					logging.debug('li chapterlink not found!  li=%s' % li)
 					
-		#print('Story "%s" by %s' % (self.storyName, self.authorName))
+
+		print('Story "%s" by %s' % (self.storyName, self.authorName))
+		
+		self.uuid = 'urn:uuid:' + self.host + '-u.' + self.authorId + '-s.' + self.storyId
+		logging.debug('self.uuid=%s' % self.uuid)
 		
 		return result
 	
@@ -82,6 +235,9 @@ class FictionAlley(FanfictionSiteAdapter):
 	def getAuthorName(self):
 		return self.authorName
 	
+	def getOutputName(self):
+		return self.outputName
+
 	def getText(self, url):
 		# fictionalley uses full URLs in chapter list.
 		data = self.opener.open(url).read()
@@ -97,10 +253,96 @@ class FictionAlley(FanfictionSiteAdapter):
 		div = soup.find('crazytagstringnobodywouldstumbleonaccidently', {'id' : 'storytext'})
 		if None == div:
 			logging.error("Error downloading Chapter: %s" % url)
-			exit(1)
+			exit(20)
 			return '<html/>'
-		return div.__str__('utf8').replace('crazytagstringnobodywouldstumbleonaccidently','div')
+
+		html = soup.findAll('html')
+		if len(html) > 1:
+			return html[1].__str__('utf8')
+		else:
+			return div.__str__('utf8').replace('crazytagstringnobodywouldstumbleonaccidently','div')
 	
+	def getStoryURL(self):
+		logging.debug('self.url=%s' % self.url)
+		return self.url
+
+	def getAuthorURL(self):
+		logging.debug('self.authorURL=%s' % self.authorURL)
+		return self.authorURL
+
+	def getUUID(self):
+		logging.debug('self.uuid=%s' % self.uuid)
+		return self.uuid
+
+	def getAuthorId(self):
+		logging.debug('self.authorId=%s' % self.authorId)
+		return self.authorId
+
+	def getStoryId(self):
+		logging.debug('self.storyId=%s' % self.storyId)
+		return self.storyId
+
+	def getStoryDescription(self):
+		logging.debug('self.storyDescription=%s' % self.storyDescription)
+		return self.storyDescription
+
+	def getStoryPublished(self):
+		logging.debug('self.storyPublished=%s' % self.storyPublished)
+		return self.storyPublished
+
+	def getStoryCreated(self):
+		self.storyCreated = datetime.datetime.now()
+		logging.debug('self.storyCreated=%s' % self.storyCreated)
+		return self.storyCreated
+
+	def getStoryUpdated(self):
+		logging.debug('self.storyUpdated=%s' % self.storyUpdated)
+		return self.storyUpdated
+
+	def getLanguage(self):
+		logging.debug('self.language=%s' % self.language)
+		return self.language
+
+	def getLanguageId(self):
+		logging.debug('self.languageId=%s' % self.languageId)
+		return self.languageId
+
+	def getSubjects(self):  # Return the story's list of subject tags after logging it at DEBUG level.
+		logging.debug('self.subjects=%s' % self.subjects)  # log the subjects themselves, not the author name
+		return self.subjects
+
+	def getPublisher(self):
+		logging.debug('self.publisher=%s' % self.publisher)
+		return self.publisher
+
+	def getNumChapters(self):
+		logging.debug('self.numChapters=%s' % self.numChapters)
+		return self.numChapters
+
+	def getNumWords(self):
+		logging.debug('self.numWords=%s' % self.numWords)
+		return self.numWords
+
+	def getCategory(self):
+		logging.debug('self.category=%s' % self.category)
+		return self.category
+
+	def getGenre(self):
+		logging.debug('self.genre=%s' % self.genre)
+		return self.genre
+
+	def getStoryStatus(self):
+		logging.debug('self.storyStatus=%s' % self.storyStatus)
+		return self.storyStatus
+
+	def getStoryRating(self):
+		logging.debug('self.storyRating=%s' % self.storyRating)
+		return self.storyRating
+
+	def getStoryUserRating(self):
+		logging.debug('self.storyUserRating=%s' % self.storyUserRating)
+		return self.storyUserRating
+
 	def getPrintableUrl(self, url):
 		return url
 	
@@ -114,6 +356,15 @@ class FictionAlley(FanfictionSiteAdapter):
 		login = dict(login = 'name', password = 'pass')
 		other = dict(submit = 'Log In', remember='yes')
 		return (login, other)
+
+	def getStoryCharacters(self):
+		logging.debug('self.storyCharacters=%s' % self.storyCharacters)
+		return self.storyCharacters
+	
+	def getStorySeries(self):
+		logging.debug('self.storySeries=%s' % self.storySeries)
+		return self.storySeries
+		
 	
 		
 if __name__ == '__main__':
diff --git a/ficwad.py b/ficwad.py
index 28b71584..133d424a 100644
--- a/ficwad.py
+++ b/ficwad.py
@@ -12,6 +12,8 @@ import urlparse as up
 import BeautifulSoup as bs
 import htmlentitydefs as hdefs
 import logging
+import time
+import datetime
 
 from adapter import *
 
@@ -32,7 +34,44 @@ class FicWad(FanfictionSiteAdapter):
 	def setPassword(self, password):
 		self.password = password
 	
+	def _addSubject(self, subject):
+		# Case-insensitive de-duplicating append; returns True only when added.
+		wanted = subject.upper()
+		if any(known.upper() == wanted for known in self.subjects):
+			return False
+		self.subjects.append(subject)
+		return True
+
+	def _addCharacter(self, character):
+		# Case-insensitive de-duplicating append; returns True only when added.
+		wanted = character.upper()
+		if any(known.upper() == wanted for known in self.storyCharacters):
+			return False
+		self.storyCharacters.append(character)
+		return True
+
 	def extractIndividualUrls(self):
+		self.storyDescription = 'Fanfiction Story'
+		self.authorId = '0'
+		self.storyId = '0'
+		self.storyPublished = datetime.date(1970, 01, 31)
+		self.storyCreated = datetime.datetime.now()
+		self.storyUpdated = datetime.date(1970, 01, 31)
+		self.languageId = 'en-UK'
+		self.language = 'English'
+		self.subjects = []
+		self.subjects.append ('fanfiction')
+		self.publisher = self.host
+		self.numChapters = 0
+		self.numWords = 0
+		self.genre = 'FanFiction'
+		self.category = 'Category'
+		self.storyStatus = 'In-Progress'
+		self.storyRating = 'PG'
+		self.storyUserRating = '0'
+		self.storyCharacters = []
+		self.storySeries = ''
+		
 		data = u2.urlopen(self.url).read()
 		soup = bs.BeautifulStoneSoup(data)
 		
@@ -40,50 +79,254 @@ class FicWad(FanfictionSiteAdapter):
 		crumbtrail = story.find('h3') # the only h3 ficwad uses.
 		allAhrefs = crumbtrail.findAll('a')
 		# last of crumbtrail
-		self.storyName = allAhrefs[-1].string.strip()
+		storyinfo = allAhrefs[-1]
+		(u0, u1, storyid) = storyinfo['href'].split('/')
+		if u1 == "story":
+			# This page does not have the correct information on it..  Need to get the Story Title Page
+			logging.debug('URL %s is a chapter URL.  Getting Title Page http://%s/%s/%s.' % (self.url, self.host, u1, storyid))
+			self.url = 'http://' + self.host + '/' + u1 + '/' + storyid
+			data = u2.urlopen(self.url).read()
+			soup = bs.BeautifulStoneSoup(data)
+			
+			story = soup.find('div', {'id' : 'story'})
+			crumbtrail = story.find('h3') # the only h3 ficwad uses.
+			allAhrefs = crumbtrail.findAll('a')
+		
 		# save chapter name from header in case of one-shot.
-		chaptername = story.find('h4').find('a').string.strip()
+		storyinfo = story.find('h4').find('a')
+		(u0, u1, self.storyId) = storyinfo['href'].split('/')
+		self.storyName = storyinfo.string.strip()
+		self.outputName = self.storyName.replace(" ", "_") + '-fw_' + self.storyId
+
+		logging.debug('self.storyName=%s, self.storyId=%s, self.outputName=%s' % (self.storyName, self.storyId, self.outputName))
 		
 		author = soup.find('span', {'class' : 'author'})
 		self.authorName = str(author.a.string)
+		(u0, u1,self.authorId) = author.a['href'].split('/')
+		self.authorURL = 'http://' + self.host + author.a['href']
+		logging.debug('self.authorName=%s self.authorId=%s' % (self.authorName, self.authorId))
 		
-		select = soup.find('select', { 'name' : 'goto' } )
+		description = soup.find('blockquote', {'class' : 'summary'})
+		if description is not None:
+			self.storyDescription = str(description.p.string)
+		logging.debug('self.storyDescription=%s' % self.storyDescription)
+		
+		meta = soup.find('p', {'class' : 'meta'})
+		if meta is not None:
+			s = str(meta).replace('\n',' ').replace('\t','').split(' - ')
+			logging.debug('meta.s=%s' % s)
+			for ss in s:
+				s1 = ss.replace('&nbsp;','').split(':')
+				#logging.debug('meta.s.s1=%s' % s1)
+				if len(s1) > 1:
+					s2 = re.split ('<[^>]+>', s1[0])
+					#logging.debug('meta.s.s1.s2=%s' % s2)
+					if len(s2) > 1:
+						s1[0] = s2[1]
+					skey = s1[0].strip()
+					#logging.debug('Checking = %s' % skey)
+					if skey == 'Category':
+						soup1 = bs.BeautifulStoneSoup(s1[1])
+						allAs = soup1.findAll('a')
+						for a in allAs:
+							if self.category == 'Category':
+								self.category = str(a.string)
+								logging.debug('self.category=%s' % self.category)
+							self._addSubject(self.category)
+						logging.debug('self.subjects=%s' % self.subjects)
+					elif skey == 'Rating':
+						self.storyRating = s1[1]
+						logging.debug('self.storyRating=%s' % self.storyRating)
+					elif skey == 'Genres':
+						self.genre = s1[1]
+						logging.debug('self.genre=%s' % self.genre)
+						s2 = s1[1].split(', ')
+						for ss2 in s2:
+							self._addSubject(ss2)
+						logging.debug('self.subjects=%s' % self.subjects)
+					elif skey == 'Characters':
+						s2 = s1[1].split(', ')
+						for ss2 in s2:
+							self._addCharacter(ss2)
+						logging.debug('self.storyCharacters=%s' % self.storyCharacters)
+					elif skey == 'Chapters':
+						self.numChapters = s1[1]
+						logging.debug('self.numChapters=%s' % self.numChapters)
+					elif skey == 'Warnings':
+						logging.debug('Warnings=%s' % s1[1])
+					elif skey == 'Published':
+						self.storyPublished = datetime.datetime.fromtimestamp(time.mktime(time.strptime(s1[1].strip(' '), "%Y/%m/%d")))
+						logging.debug('self.storyPublished=%s' % self.storyPublished)
+					elif skey == 'Updated':
+						self.storyUpdated = datetime.datetime.fromtimestamp(time.mktime(time.strptime(s1[1].strip(' '), "%Y/%m/%d")))
+						logging.debug('self.storyUpdated=%s' % self.storyUpdated)
+				else:
+					s3 = re.split ('<[^>]+>', s1[0])
+					#logging.debug('meta.s.s1.s3=%s' % s3)
+					if len(s3) > 1:
+						s1[0] = s3[0]
+					s4 = s1[0].split('w')
+					#logging.debug('meta.s.s1.s4=%s' % s4)
+					if len(s4) > 1 and s4[1] == 'ords':
+						self.numWords = s4[0]
+						logging.debug('self.numWords=%s' % self.numWords)
+					
+		
+		print('Story "%s" by %s' % (self.storyName, self.authorName))
 		
 		result = []
-		if select is None:
-			# Single chapter storys don't have title in crumbtrail, just 'chapter' title in h4.
-			self.storyName = chaptername
-			# no chapters found, try url by itself.
-			result.append((self.url,self.storyName))
-		else:
-			allOptions = select.findAll('option')
-			for o in allOptions:
-				url = 'http://' + self.host + o['value']
-				title = o.string
-				# ficwad includes 'Story Index' in the dropdown of chapters, 
-				# but it's not a real chapter.
-				if title != "Story Index":
-					result.append((url,title))
+		ii = 1
+
+		storylist = soup.find('ul', {'id' : 'storylist'})
+		if storylist is not None:
+			allH4s = storylist.findAll('h4')
+			#logging.debug('allH4s=%s' % allH4s)
+	
+			if allH4s is not None:
+				for h4 in allH4s:
+					chapterinfo = h4.find('a')
+					#logging.debug('Chapter1=%s' % chapterinfo)
+					url = 'http://' + self.host + chapterinfo['href']
+					title = chapterinfo.string.strip()
+					#logging.debug('Chapter=%s, %s' % (url, title))
+					# ficwad includes 'Story Index' in the dropdown of chapters, 
+					# but it's not a real chapter.
+					if title != "Story Index":
+						logging.debug('Chapter[%s]=%s, %s' % (ii, url, title))
+						result.append((url,title))
+						ii = ii+1
+					else:
+						logging.debug('Skipping Story Index.  URL %s' % url)
+				
+		if ii == 1:
+			select = soup.find('select', { 'name' : 'goto' } )
+
+			if select is None:
+				result.append((self.url,self.storyName))
+				logging.debug('Chapter[%s]=%s %s' % (ii, self.url, self.storyName))
+			else:
+				allOptions = select.findAll('option')
+				for o in allOptions:
+					url = 'http://' + self.host + o['value']
+					title = o.string
+					# ficwad includes 'Story Index' in the dropdown of chapters, 
+					# but it's not a real chapter.
+					if title != "Story Index":
+						logging.debug('Chapter[%s]=%s, %s' % (ii, url, title))
+						result.append((url,title))
+						ii = ii+1
+					else:
+						logging.debug('Skipping Story Index.  URL %s' % url)
 			
+		self.uuid = 'urn:uuid:' + self.host + '-u.' + self.authorId + '-s.' + self.storyId
+		logging.debug('self.uuid=%s' % self.uuid)
+		
 		return result
 	
 	def getStoryName(self):
 		return self.storyName
 
+	def getOutputName(self):
+		return self.outputName
+		
 	def getAuthorName(self):
 		return self.authorName
 	
 	def getText(self, url):
+		if url.find('http://') == -1:
+			url = 'http://' + self.host + '/' + url
+		
 		data = u2.urlopen(url).read()
 		
 		soup = bs.BeautifulStoneSoup(data)
 		div = soup.find('div', {'id' : 'storytext'})
 		if None == div:
 			logging.error("Error downloading Chapter: %s" % url)
-			exit(1)
+			exit(20)
 			return '<html/>'
 		return div.__str__('utf8')
 	
+	def getStoryURL(self):
+		logging.debug('self.url=%s' % self.url)
+		return self.url
+
+	def getAuthorURL(self):
+		logging.debug('self.authorURL=%s' % self.authorURL)
+		return self.authorURL
+
+	def getUUID(self):
+		logging.debug('self.uuid=%s' % self.uuid)
+		return self.uuid
+
+	def getAuthorId(self):
+		logging.debug('self.authorId=%s' % self.authorId)
+		return self.authorId
+
+	def getStoryId(self):
+		logging.debug('self.storyId=%s' % self.storyId)
+		return self.storyId
+
+	def getStoryDescription(self):
+		logging.debug('self.storyDescription=%s' % self.storyDescription)
+		return self.storyDescription
+
+	def getStoryPublished(self):
+		logging.debug('self.storyPublished=%s' % self.storyPublished)
+		return self.storyPublished
+
+	def getStoryCreated(self):
+		self.storyCreated = datetime.datetime.now()
+		logging.debug('self.storyCreated=%s' % self.storyCreated)
+		return self.storyCreated
+
+	def getStoryUpdated(self):
+		logging.debug('self.storyUpdated=%s' % self.storyUpdated)
+		return self.storyUpdated
+
+	def getLanguage(self):
+		logging.debug('self.language=%s' % self.language)
+		return self.language
+
+	def getLanguageId(self):
+		logging.debug('self.languageId=%s' % self.languageId)
+		return self.languageId
+
+	def getSubjects(self):  # Return the story's list of subject tags after logging it at DEBUG level.
+		logging.debug('self.subjects=%s' % self.subjects)  # log the subjects themselves, not the author name
+		return self.subjects
+
+	def getPublisher(self):
+		logging.debug('self.publisher=%s' % self.publisher)
+		return self.publisher
+
+	def getNumChapters(self):
+		logging.debug('self.numChapters=%s' % self.numChapters)
+		return self.numChapters
+
+	def getNumWords(self):
+		logging.debug('self.numWords=%s' % self.numWords)
+		return self.numWords
+
+	def getCategory(self):
+		logging.debug('self.category=%s' % self.category)
+		return self.category
+
+	def getGenre(self):
+		logging.debug('self.genre=%s' % self.genre)
+		return self.genre
+
+	def getStoryStatus(self):
+		logging.debug('self.storyStatus=%s' % self.storyStatus)
+		return self.storyStatus
+
+	def getStoryRating(self):
+		logging.debug('self.storyRating=%s' % self.storyRating)
+		return self.storyRating
+
+	def getStoryUserRating(self):
+		logging.debug('self.storyUserRating=%s' % self.storyUserRating)
+		return self.storyUserRating
+
 	def getPrintableUrl(self, url):
 		return url
 	
@@ -98,6 +341,15 @@ class FicWad(FanfictionSiteAdapter):
 		other = dict(submit = 'Log In', remember='yes')
 		return (login, other)
 
+	def getStoryCharacters(self):
+		logging.debug('self.storyCharacters=%s' % self.storyCharacters)
+		return self.storyCharacters
+	
+	def getStorySeries(self):
+		logging.debug('self.storySeries=%s' % self.storySeries)
+		return self.storySeries
+		
+
 		
 if __name__ == '__main__':
 	url = 'http://www.ficwad.com/story/14536'
diff --git a/hpfiction.py b/hpfiction.py
index 75cb4597..9f6cd467 100644
--- a/hpfiction.py
+++ b/hpfiction.py
@@ -15,6 +15,8 @@ import urllib2 as u2
 import urlparse as up
 import BeautifulSoup as bs
 import htmlentitydefs as hdefs
+import time
+import datetime
 
 from constants import *
 from adapter import *
@@ -32,8 +34,37 @@ class HPFiction(FanfictionSiteAdapter):
 		self.host = parsedUrl.netloc
 		self.path = parsedUrl.path
 		
+		logging.debug('self.url=%s' % self.url)
+		logging.debug('self.host=%s' % self.host)
+		logging.debug('self.path=%s' % self.path)
+	
 		self.opener = u2.build_opener(u2.HTTPCookieProcessor())
 	
+		self.storyDescription = 'Fanfiction Story'
+		self.authorId = '0'
+		self.authorURL = ''
+		(u1, self.storyId) = self.url.split('=')
+		self.storyPublished = datetime.date(1970, 01, 31)
+		self.storyCreated = datetime.datetime.now()
+		self.storyUpdated = datetime.date(1970, 01, 31)
+		self.languageId = 'en-UK'
+		self.language = 'English'
+		self.subjects = []
+		self.subjects.append ('fanfiction')
+		self.subjects.append ('Harry Potter')
+		self.publisher = self.host
+		self.numChapters = 0
+		self.numWords = 0
+		self.genre = 'FanFiction'
+		self.category = 'Category'
+		self.storyStatus = 'In-Progress'
+		self.storyRating = 'K'
+		self.storyUserRating = '0'
+		self.storyCharacters = []
+		self.storySeries = ''
+		self.uuid = 'urn:uuid:' + self.host + '-u.' + self.authorId + '-s.' + self.storyId
+		logging.debug('self.uuid=%s' % self.uuid)
+		
 		logging.debug("Created HPFiction: url=%s" % (self.url))
 	
 	def _getLoginScript(self):
@@ -45,23 +76,116 @@ class HPFiction(FanfictionSiteAdapter):
 	def performLogin(self, url = None):
 		return True
 	
+	def _addSubject(self, subject):
+		# Case-insensitive de-duplicating append; returns True only when added.
+		wanted = subject.upper()
+		if any(known.upper() == wanted for known in self.subjects):
+			return False
+		self.subjects.append(subject)
+		return True
+
+	def _addCharacter(self, character):
+		# Case-insensitive de-duplicating append; returns True only when added.
+		wanted = character.upper()
+		if any(known.upper() == wanted for known in self.storyCharacters):
+			return False
+		self.storyCharacters.append(character)
+		return True
+
 	def extractIndividualUrls(self):
 		data = self.opener.open(self.url).read()
 		soup = bs.BeautifulSoup(data)
 		
 		links = soup.findAll('a')
+		def_chapurl = ''
+		def_chaptitle = ''
 		
 		for a in links:
 			if a['href'].find('psid') != -1:
 				self.storyName = a.string
+				logging.debug('self.storyName=%s' % self.storyName)
 			elif a['href'].find('viewuser.php') != -1:
 				self.authorName = a.string
+				self.authorURL = 'http://' + self.host + '/' + a['href']
+				(u1, self.authorId) = a['href'].split('=')
+				logging.debug('self.authorName=%s, self.authorId=%s' % (self.authorName, self.authorId))
+			elif a['href'].find('chapterid=') != -1 and len(def_chapurl) == 0:
+				def_chapurl = 'http://' + self.host + '/viewstory.php' + str(a['href'])
+				def_chaptitle = a.string
+				logging.debug('def_chapurl=%s, def_chaptitle=%s' % (def_chapurl, def_chaptitle))
+		
+		centers = soup.findAll('center')
+		for center in centers:
+			tds = center.findAll ('td')
+			if tds is not None and len(tds) > 0:
+				for td in tds:
+					s = re.split ("<[^>]+>", str(td).replace('\n','').replace('&nbsp;',' '))
+					logging.debug('s=%s' % s)
+					ii = 0
+					ll = len(s)
+					sss = ''
+					while ii < ll - 1:
+						if s[ii] is not None and len(s[ii]) > 0:
+							if s[ii] == 'Rating:':
+								self.storyRating = s[ii+1]
+								logging.debug('self.storyRating=%s' % self.storyRating)
+								ii = ii + 2
+							elif s[ii] == 'Chapters:':
+								self.numChapters = s[ii+1]
+								logging.debug('self.numChapters=%s' % self.numChapters)
+								ii = ii + 2
+							elif s[ii] == 'Characters:':
+								s2 = s[ii+1].split(', ')
+								for ss2 in s2:
+									self._addCharacter(ss2)
+								logging.debug('self.storyCharacters=%s' % self.storyCharacters)
+								ii = ii + 2
+							elif s[ii] == 'Genre(s):':
+								self.genre = s[ii+1]
+								logging.debug('self.genre=%s' % self.genre)
+								s2 = s[ii+1].split(', ')
+								for ss2 in s2:
+									self._addSubject(ss2)
+								logging.debug('self.subjects=%s' % self.subjects)
+								ii = ii + 2
+							elif s[ii] == 'Status:':
+								if s[ii+1].strip(' ') == "Work In Progress":
+									self.storyStatus = 'In-Progress'
+								else:
+									self.storyStatus = 'Completed'
+								ii = ii + 2
+							elif s[ii] == 'First Published:':
+								self.storyPublished = datetime.datetime.fromtimestamp(time.mktime(time.strptime(s[ii+1].strip(' '), "%Y.%m.%d")))
+								logging.debug('self.storyPublished=%s' % self.storyPublished)
+								ii = ii + 2
+							elif s[ii] == 'Last Updated:':
+								self.storyUpdated = datetime.datetime.fromtimestamp(time.mktime(time.strptime(s[ii+1].strip(' '), "%Y.%m.%d")))
+								logging.debug('self.storyUpdated=%s' % self.storyUpdated)
+								ii = ii + 2
+							elif s[ii] == 'Last Published Chapter:':
+								ii = ii + 2
+							elif s[ii] == 'Pairings:':
+								ii = ii + 2
+							elif s[ii] == 'Warnings:':
+								ii = ii + 2
+							else:
+								sss = sss + ' ' + s[ii]
+								ii = ii + 1
+						else:
+							ii = ii + 1
+					self.storyDescription = sss
+					logging.debug('self.storyDescription=%s' % self.storyDescription)
 		
 		urls = []
+		self.outputName = self.storyName.replace(" ", "_") + '-hp_' + self.storyId
+
 		select = soup.find('select', {'name' : 'chapterid'})
 		if select is None:
 			# no chapters found, try url by itself.
-			urls.append((self.url,self.storyName))
+			if len(def_chapurl) > 0:
+				urls.append((def_chapurl, def_chaptitle))
+			else:
+				urls.append((self.url,self.storyName))
 		else:
 			for o in select.findAll('option'):
 				if 'value' in o._getAttrMap():
@@ -69,11 +193,18 @@ class HPFiction(FanfictionSiteAdapter):
 					title = o.string
 					if title != "Story Index":
 						urls.append((url,title))
+
+		self.uuid = 'urn:uuid:' + self.host + '-u.' + self.authorId + '-s.' + self.storyId
+		logging.debug('self.uuid=%s' % self.uuid)
+		
 		return urls
 
 	def getStoryName(self):
 		return self.storyName
 
+	def getOutputName(self):
+		return self.outputName
+		
 	def getAuthorName(self):
 		return self.authorName
 	
@@ -84,9 +215,100 @@ class HPFiction(FanfictionSiteAdapter):
 		divtext = soup.find('div', {'id' : 'fluidtext'})
 		if None == divtext:
 			logging.error("Error downloading Chapter: %s" % url)
-			exit(1)
+			exit(20)
 		return divtext.__str__('utf8')
 
+	def getAuthorId(self):
+		logging.debug('self.authorId=%s' % self.authorId)
+		return self.authorId
+
+	def getStoryId(self):
+		logging.debug('self.storyId=%s' % self.storyId)
+		return self.storyId
+
+	def getStoryDescription(self):
+		logging.debug('self.storyDescription=%s' % self.storyDescription)
+		return self.storyDescription
+
+	def getStoryPublished(self):
+		logging.debug('self.storyPublished=%s' % self.storyPublished)
+		return self.storyPublished
+
+	def getStoryCreated(self):
+		self.storyCreated = datetime.datetime.now()
+		logging.debug('self.storyCreated=%s' % self.storyCreated)
+		return self.storyCreated
+
+	def getStoryUpdated(self):
+		logging.debug('self.storyUpdated=%s' % self.storyUpdated)
+		return self.storyUpdated
+
+	def getLanguage(self):
+		logging.debug('self.language=%s' % self.language)
+		return self.language
+
+	def getLanguageId(self):
+		logging.debug('self.languageId=%s' % self.languageId)
+		return self.languageId
+
+	def getSubjects(self):  # Return the story's list of subject tags after logging it at DEBUG level.
+		logging.debug('self.subjects=%s' % self.subjects)  # log the subjects themselves, not the author name
+		return self.subjects
+
+	def getPublisher(self):
+		logging.debug('self.publisher=%s' % self.publisher)
+		return self.publisher
+
+	def getNumChapters(self):
+		logging.debug('self.numChapters=%s' % self.numChapters)
+		return self.numChapters
+
+	def getNumWords(self):
+		logging.debug('self.numWords=%s' % self.numWords)
+		return self.numWords
+
+	def getStoryURL(self):
+		logging.debug('self.url=%s' % self.url)
+		return self.url
+
+	def getAuthorURL(self):
+		logging.debug('self.authorURL=%s' % self.authorURL)
+		return self.authorURL
+
+	def getUUID(self):
+		logging.debug('self.uuid=%s' % self.uuid)
+		return self.uuid
+
+	def getCategory(self):
+		logging.debug('self.category=%s' % self.category)
+		return self.category
+
+	def getGenre(self):
+		logging.debug('self.genre=%s' % self.genre)
+		return self.genre
+
+	def getStoryStatus(self):
+		logging.debug('self.storyStatus=%s' % self.storyStatus)
+		return self.storyStatus
+
+	def getStoryRating(self):
+		logging.debug('self.storyRating=%s' % self.storyRating)
+		return self.storyRating
+
+	def getStoryUserRating(self):
+		logging.debug('self.storyUserRating=%s' % self.storyUserRating)
+		return self.storyUserRating
+
+	def getStoryCharacters(self):
+		logging.debug('self.storyCharacters=%s' % self.storyCharacters)
+		return self.storyCharacters
+	
+	def getStorySeries(self):
+		logging.debug('self.storySeries=%s' % self.storySeries)
+		return self.storySeries
+		
+
+
 class FF_UnitTests(unittest.TestCase):
 	def setUp(self):
 		logging.basicConfig(level=logging.DEBUG)
diff --git a/output.py b/output.py
index 1700bfe7..9ffb1503 100644
--- a/output.py
+++ b/output.py
@@ -26,6 +26,7 @@ from constants import *
 
 
 import html2text
+import datetime
 
 
 class FanficWriter:
@@ -41,8 +42,8 @@ class FanficWriter:
 class TextWriter(FanficWriter):
 	htmlWriter = None
 	
-	def __init__(self, base, name, author, inmemory=False, compress=False):
-		self.htmlWriter = HTMLWriter(base, name, author, True, False)
+	def __init__(self, base, adapter, inmemory=False, compress=False):
+		self.htmlWriter = HTMLWriter(base, adapter, True, False)
 	
 	def writeChapter(self, index, title, text):
 		self.htmlWriter.writeChapter(index, title, text)
@@ -57,12 +58,13 @@ class TextWriter(FanficWriter):
 class HTMLWriter(FanficWriter):
 	body = ''
 	
-	def __init__(self, base, name, author, inmemory=False, compress=False):
+	def __init__(self, base, adapter, inmemory=False, compress=False):
 		self.basePath = base
-		self.storyTitle = removeEntities(name)
-		self.name = makeAcceptableFilename(name)
-		self.fileName =  self.basePath + '/' + self.name + '.html'
-		self.authorName = removeEntities(author)
+		self.storyTitle = removeEntities(adapter.getStoryName())
+		self.name = makeAcceptableFilename(adapter.getOutputName())
+		self.fileName = self.basePath + '/' + self.name + '.html'
+		self.authorName = removeEntities(adapter.getAuthorName())
+		self.adapter = adapter
 		
 		self.inmemory = inmemory
 
@@ -131,14 +133,14 @@ class EPubFanficWriter(FanficWriter):
 			for f in self.files:
 				self.files[f].close()
 	
-	def __init__(self, base, name, author, inmemory=False, compress=True):
+	def __init__(self, base, adapter, inmemory=False, compress=True):
 		self.basePath = base
-		self.storyTitle = removeEntities(name)
-		self.name = makeAcceptableFilename(name)
+		self.storyTitle = removeEntities(adapter.getStoryName())
+		self.name = makeAcceptableFilename(adapter.getOutputName())
 		self.directory = self.basePath + '/' + self.name
-		self.authorName = removeEntities(author)
-
+		self.authorName = removeEntities(adapter.getAuthorName())
 		self.inmemory = inmemory
+		self.adapter = adapter
 		
 		self.files = {}
 		self.chapters = []
@@ -226,17 +228,50 @@ class EPubFanficWriter(FanficWriter):
 		tocFilePath = "OEBPS/toc.ncx"
 #		toc = open(tocFilePath, 'w')
 #		print >> toc, TOC_START % self.storyTitle
-		self._writeFile(tocFilePath, TOC_START % self.storyTitle)
+		self._writeFile(tocFilePath, TOC_START % (self.adapter.getUUID(), self.storyTitle))
+
+		published = self.adapter.getStoryPublished().strftime("%Y-%m-%d")
+		createda = self.adapter.getStoryCreated().strftime("%Y-%m-%d %H:%M:%S")
+		created = self.adapter.getStoryCreated().strftime("%Y-%m-%d")
+		updated = self.adapter.getStoryUpdated().strftime("%Y-%m-%d")
+		calibre = self.adapter.getStoryUpdated().strftime("%Y-%m-%dT%H:%M:%S")
+		
+		### writing content -- title page
+		titleFilePath = "OEBPS/title_page.xhtml"
+		self._writeFile(titleFilePath, TITLE_PAGE % (self.authorName, self.storyTitle, self.adapter.getStoryURL(), self.storyTitle, self.adapter.getAuthorURL(), self.authorName, self.adapter.getCategory(), self.adapter.getGenre(), self.adapter.getStoryStatus(), published, updated, createda, self.adapter.getStoryRating(), self.adapter.getStoryUserRating(), self.adapter.getNumChapters(), self.adapter.getNumWords(), self.adapter.getStoryURL(), self.adapter.getStoryURL(), self.adapter.getStoryDescription()))
+
 		### writing content -- opf file
 		opfFilePath = "OEBPS/content.opf"
-		
+
 #		opf = open(opfFilePath, 'w')
-		self._writeFile(opfFilePath, CONTENT_START % (self.storyTitle, self.authorName, uuid.uuid4().urn))
+		self._writeFile(opfFilePath, CONTENT_START % (uuid.uuid4().urn, self.storyTitle, self.authorName, self.adapter.getLanguageId(), published, created, updated, calibre, self.adapter.getStoryDescription()))
+
+		i = 0
+		subjs = []
+		subjs = self.adapter.getSubjects()
+		for subj in subjs:
+			self._writeFile(opfFilePath, CONTENT_SUBJECT % subj)
+			i = i + 1
+		if (i <= 0):
+			self._writeFile(opfFilePath, CONTENT_SUBJECT % "FanFiction")
+
+		self._writeFile(opfFilePath, CONTENT_END_METADATA % (self.adapter.getPublisher(), self.adapter.getUUID(), self.adapter.getStoryURL(), self.adapter.getStoryURL(), self.adapter.getStoryUserRating()))
 #		print >> opf, CONTENT_START % (uuid.uuid4().urn, self.storyTitle, self.authorName)
 
 		ids = []
 		
-		i = 1
+		i = 0
+
+		t = "Title Page"
+		f = "title_page.xhtml"
+		chapterId = "Title Page"		
+		self._writeFile(tocFilePath, TOC_ITEM % (chapterId, i, t, f))
+		self._writeFile(opfFilePath, CONTENT_ITEM % (chapterId, f))
+		
+		ids.append(chapterId)
+		
+		i = i + 1
+		
 		for t,f in self.chapters:
 			chapterId = "chapter%04d" % i
 			
diff --git a/twilighted.py b/twilighted.py
index a7e77a53..f7654041 100644
--- a/twilighted.py
+++ b/twilighted.py
@@ -11,119 +11,360 @@ import urllib2 as u2
 import urlparse as up
 import BeautifulSoup as bs
 import htmlentitydefs as hdefs
+import time
+import datetime
 
 from adapter import *
 import twipassword
 
 class Twilighted(FanfictionSiteAdapter):
-  def __init__(self, url):
-    self.url = url
-    parsedUrl = up.urlparse(url)
-    self.host = parsedUrl.netloc
-    self.path = parsedUrl.path
-    self.opener = u2.build_opener(u2.HTTPCookieProcessor())
-    self.password=twipassword.password
-    self.login='sigizmund'
-    logging.debug("Created Twilighted: url=%s" % (self.url))
-
-
-  def requiresLogin(self, url = None):
-    # potionsandsnitches.net doesn't require login.
-    if self.host == 'potionsandsnitches.net':
-      return False
-    else:
-      return True
-
-  def performLogin(self, url = None):
-    data = {}
-
-    data['penname'] = self.login
-    data['password'] = self.password
-    data['cookiecheck'] = '1'
-    data['submit'] = 'Submit'
-
-    urlvals = u.urlencode(data)
-    loginUrl = 'http://' + self.host + self._getLoginScript()
-    logging.debug("Will now login to URL %s" % loginUrl)
-
-    req = self.opener.open(loginUrl, urlvals)
-
-    d = req.read().decode('utf-8')
-
-    if self.reqLoginData(d) :
-      return False
-    else:
-      return True
-
-
-  def setLogin(self, login):
-    self.login = login
-
-  def setPassword(self, password):
-    self.password = password
-
-  def extractIndividualUrls(self):
-    data = self.opener.open(self.url).read()
+    def __init__(self, url):
+        self.url = url
+        parsedUrl = up.urlparse(url)
+        self.host = parsedUrl.netloc
+        self.path = parsedUrl.path
+        self.opener = u2.build_opener(u2.HTTPCookieProcessor())
+        self.password=twipassword.password
+        self.login='sigizmund'
+        self.storyDescription = 'Fanfiction Story'
+        self.authorId = '0'
+        self.authorURL = ''
+        self.storyId = '0'
+        self.storyPublished = datetime.date(1970, 01, 31)
+        self.storyCreated = datetime.datetime.now()
+        self.storyUpdated = datetime.date(1970, 01, 31)
+        self.languageId = 'en-UK'
+        self.language = 'English'
+        self.subjects = []
+        self.subjects.append ('fanfiction')
+        self.subjects.append ('Twilight')
+        self.publisher = self.host
+        self.numChapters = 0
+        self.numWords = 0
+        self.genre = 'FanFiction'
+        self.category = 'Category'
+        self.storyStatus = 'In-Progress'
+        self.storyRating = 'PG'
+        self.storyUserRating = '0'
+        self.storyCharacters = []
+        self.storySeries = ''
+        self.uuid = 'urn:uuid:' + self.host + '-u.' + self.authorId + '-s.' + self.storyId
+        logging.debug('self.uuid=%s' % self.uuid)
     
-    if self.reqLoginData(data):
-      self.performLogin()
-      data = self.opener.open(self.url).read()
-      if self.reqLoginData(data):
-        return None
+        logging.debug("Created Twilighted: url=%s" % (self.url))
+
+
+    def requiresLogin(self, url = None):
+        # potionsandsnitches.net doesn't require login.
+        if self.host == 'potionsandsnitches.net':
+          return False
+        else:
+          return True
+
+    def performLogin(self, url = None):
+        data = {}
     
-    soup = bs.BeautifulStoneSoup(data)
-
-    title = soup.find('title').string
-    self.storyName = title.split(' by ')[0].strip()
-    self.authorName = title.split(' by ')[1].strip()
-
-    select = soup.find('select', { 'name' : 'chapter' } )
-	 
-    result = []
-    if select is None:
-	   # no chapters found, try url by itself.
-	   result.append((self.url,self.storyName))
-    else:
-	   allOptions = select.findAll('option')
-	   for o in allOptions:
-	     url = self.url + "&chapter=%s" % o['value']
-	     title = o.string
-	     result.append((url,title))
-
-    return result
-
-  def getStoryName(self):
-    return self.storyName
-
-  def getAuthorName(self):
-    return self.authorName
-
-  def getText(self, url):
-    if url.find('http://') == -1:
-      url = 'http://' + self.host + '/' + url
-
-    logging.debug('Getting data from: %s' % url)
-
-    data = self.opener.open(url).read()
+        data['penname'] = self.login
+        data['password'] = self.password
+        data['cookiecheck'] = '1'
+        data['submit'] = 'Submit'
     
-    soup = bs.BeautifulStoneSoup(data, convertEntities=bs.BeautifulStoneSoup.HTML_ENTITIES)
+        urlvals = u.urlencode(data)
+        loginUrl = 'http://' + self.host + self._getLoginScript()
+        logging.debug("Will now login to URL %s" % loginUrl)
+    
+        req = self.opener.open(loginUrl, urlvals)
+    
+        d = req.read().decode('utf-8')
+    
+        if self.reqLoginData(d) :
+          return False
+        else:
+          return True
 
-    div = soup.find('div', {'id' : 'story'})
 
-    if None == div:
-      return '<html/>'
+    def setLogin(self, login):
+        self.login = login
 
-    return div.__str__('utf8')
+    def setPassword(self, password):
+        self.password = password
 
-  def _getLoginScript(self):
-    return '/user.php?action=login'
+    def _addSubject(self, subject):
+        subj = subject.upper()
+        for s in self.subjects:
+            if s.upper() == subj:
+                return False
+        self.subjects.append(subject)
+        return True
 
-  def reqLoginData(self, data):
-    if data.find('Registered Users Only. Please click OK to login or register.') != -1 or data.find('There is no such account on our website') != -1:
-      return True
-    else:
-      return False
+    def _addCharacter(self, character):
+        chara = character.upper()
+        for c in self.storyCharacters:
+            if c.upper() == chara:
+                return False
+        self.storyCharacters.append(character)
+        return True
 
+    def extractIndividualUrls(self):
+        data = self.opener.open(self.url).read()
+        
+        if self.reqLoginData(data):
+          self.performLogin()
+          data = self.opener.open(self.url).read()
+          if self.reqLoginData(data):
+            return None
+        
+        soup = bs.BeautifulStoneSoup(data)
+    
+        title = soup.find('title').string
+        self.storyName = title.split(' by ')[0].strip()
+        self.authorName = title.split(' by ')[1].strip()
+        self.outputName = self.storyName.replace(" ", "_")
+    
+        select = soup.find('select', { 'name' : 'chapter' } )
+    	 
+        result = []
+        if select is None:
+    	   # no chapters found, try url by itself.
+    	   result.append((self.url,self.storyName))
+        else:
+    	   allOptions = select.findAll('option')
+    	   for o in allOptions:
+    	     url = self.url + "&chapter=%s" % o['value']
+    	     title = o.string
+    	     result.append((url,title))
+    
+        url = self.url + "&index=1"
+        data = self.opener.open(url).read()
+        lines = data.split('\n')
+        soup = bs.BeautifulStoneSoup(data)
+        metas = soup.findAll('meta')
+        for meta in metas:
+            if 'name' in meta._getAttrMap() and meta['name'].find('description') != -1:
+                #logging.debug('Meta: %s' % meta)
+                if 'content' in meta._getAttrMap():
+                    s1 = bs.BeautifulStoneSoup(meta['content'])
+                    ps = s1.findAll('p')
+                    if len(ps) > 0:
+                        self.storyDescription = ps[0]
+                        logging.debug('self.storyDescription=%s' % (self.storyDescription))
+                    else:
+                        divs = meta.findAll('div')
+                        #logging.debug('Divs: %s' % divs)
+                        
+                        for div in divs:
+                            #logging.debug('Div: %s' % div)
+                            if 'id' in div._getAttrMap() and div['id'].find('pagetitle') != -1:
+                                #logging.debug('Div PAGETITLE: %s' % div)
+                                allA = div.findAll('a')
+                                for a in allA:
+                                    if 'href' in a._getAttrMap(): 
+                                        if a['href'].find('viewstory.php?sid=') != -1:
+                                            str1 = a.string
+                                            (vs, self.storyId) = a['href'].split('=')
+                                            logging.debug('self.storyId=%s self.storyName=%s' % (self.storyId, self.storyName))
+                                            self.outputName = self.outputName + "-tw_" + self.storyId
+                                            logging.debug('self.outputName=%s' % self.outputName)
+                                        if a['href'].find('viewuser.php?uid=') != -1:
+                                            str1 = a.string
+                                            (vs, self.authorId) = a['href'].split('=')
+                                            logging.debug('self.authorId=%s self.authorName=%s' % (self.authorId, self.authorName))
+                                            self.authorURL = 'http://'+self.host+'/viewuser.php?uid='+self.authorId
+                                            logging.debug('self.authorURL=%s' % self.authorURL)
+                            if 'class' in div._getAttrMap() and div['class'].find('content') !=   -1:
+                                #logging.debug('Div CONTENT: %s' % div)        
+                                brs = div.findAll('br')
+                                for br in brs:
+                                    buf = unicode(br).encode('utf-8')  
+                                    strs = re.split ('<[^>]+>', buf)
+                                    #logging.debug('BUF: %s' % strs)
+                                    ii = 2
+                                    stlen = len(strs)
+                                    while stlen > ii+1:
+                                        if len(strs[ii]) == 0:
+                                            ii = ii+1
+                                            continue
+                                        if strs[ii] == 'Categories:':
+                                            ii = ii+1
+                                            while stlen > ii and len(strs[ii]) != 0 and strs[ii].find(':') == -1:
+                                                if strs[ii] != ' ' and strs[ii] != ', ':
+                                                    if self.category == 'Category':
+                                                        self.category = strs[ii].strip(' ')
+                                                    self._addSubject(strs[ii].strip(' '))
+                                                ii = ii+1
+                                            logging.debug('self.subjects=%s' % self.subjects)
+                                        if strs[ii] == 'Characters: ':
+                                            ii = ii+1
+                                            while stlen > ii and len(strs[ii]) != 0 and strs[ii].find(':') == -1:
+                                                if strs[ii] != ' ' and strs[ii] != ', ':
+                                                    self._addCharacter(strs[ii].strip(' '))
+                                                ii = ii+1
+                                            logging.debug('self.storyCharacters=%s' % self.storyCharacters)
+                                        elif strs[ii] == 'Completed:':
+                                            if strs[ii+1].strip(' ') == "No":
+                                                self.storyStatus = 'In-Progress'
+                                            else:
+                                                self.storyStatus = 'Completed'
+                                            ii = ii+2
+                                            logging.debug('self.storyStatus=%s' % self.storyStatus)
+                                        elif strs[ii] == 'Rated:':
+                                            self.storyRating = strs[ii+1].strip(' ')
+                                            ii = ii+2
+                                            logging.debug('self.storyRating=%s' % self.storyRating)
+                                        elif strs[ii] == 'Series:':
+                                            self.storySeries = strs[ii+1].strip(' ')
+                                            if self.storySeries == 'None':
+                                                self.storySeries = ''
+                                            ii = ii+2
+                                            logging.debug('self.storySeries=%s' % self.storySeries)
+                                        elif strs[ii] == 'Chapters: ':
+                                            self.numChapters = strs[ii+1].strip(' ')
+                                            ii = ii+2
+                                            logging.debug('self.numChapters=%s' % self.numChapters)
+                                        elif strs[ii] == 'Word count:':
+                                            self.numWords = strs[ii+1].strip(' ')
+                                            ii = ii+2
+                                            logging.debug('self.numWords=%s' % self.numWords)
+                                        elif strs[ii] == ' Published: ':
+                                            self.storyPublished = datetime.datetime.fromtimestamp(time.mktime(time.strptime(strs[ii+1].strip(' '), "%B %d, %Y")))
+                                            ii = ii+2
+                                            logging.debug('self.storyPublished=%s' % self.storyPublished)
+                                        elif strs[ii] == 'Updated:':
+                                            self.storyUpdated = datetime.datetime.fromtimestamp(time.mktime(time.strptime(strs[ii+1].strip(' '), "%B %d, %Y")))
+                                            ii = ii+2
+                                            logging.debug('self.storyUpdated=%s' % self.storyUpdated)
+                                        else:
+                                            logging.debug('Skipped Label \"%s\" Value \"%s\"' % (strs[ii], strs[ii+1]))
+                                            ii = ii+2
+                                
+        self.uuid = 'urn:uuid:' + self.host + '-u.' + self.authorId + '-s.' + self.storyId
+        logging.debug('self.uuid=%s' % self.uuid)
+
+        return result
+
+    def getStoryName(self):
+        return self.storyName
+
+    def getOutputName(self):
+        return self.outputName
+		
+    def getAuthorName(self):
+        return self.authorName
+    
+    def getText(self, url):
+        if url.find('http://') == -1:
+          url = 'http://' + self.host + '/' + url
+    
+        logging.debug('Getting data from: %s' % url)
+    
+        data = self.opener.open(url).read()
+        
+        soup = bs.BeautifulStoneSoup(data, convertEntities=bs.BeautifulStoneSoup.HTML_ENTITIES)
+    
+        div = soup.find('div', {'id' : 'story'})
+    
+        if None == div:
+          return '<html/>'
+    
+        return div.__str__('utf8')
+
+    def _getLoginScript(self):
+        return '/user.php?action=login'
+
+    def reqLoginData(self, data):
+        if data.find('Registered Users Only. Please click OK to login or register.') != -1 or data.find('There is no such account on our website') != -1:
+          return True
+        else:
+          return False
+
+    def getStoryURL(self):
+        logging.debug('self.url=%s' % self.url)
+        return self.url
+
+    def getAuthorURL(self):
+        logging.debug('self.authorURL=%s' % self.authorURL)
+        return self.authorURL
+
+    def getUUID(self):
+        logging.debug('self.uuid=%s' % self.uuid)
+        return self.uuid
+    
+    def getStoryDescription(self):
+        logging.debug('self.storyDescription=%s' % self.storyDescription)
+        return self.storyDescription
+    
+    def getStoryPublished(self):
+        logging.debug('self.storyPublished=%s' % self.storyPublished)
+        return self.storyPublished
+    
+    def getStoryCreated(self):
+        self.storyCreated = datetime.datetime.now()
+        logging.debug('self.storyCreated=%s' % self.storyCreated)
+        return self.storyCreated
+    
+    def getStoryUpdated(self):
+        logging.debug('self.storyUpdated=%s' % self.storyUpdated)
+        return self.storyUpdated
+    
+    def getLanguage(self):
+        logging.debug('self.language=%s' % self.language)
+        return self.language
+    
+    def getLanguageId(self):
+        logging.debug('self.languageId=%s' % self.languageId)
+        return self.languageId
+    
+    def getSubjects(self):
+        logging.debug('self.subjects=%s' % self.authorName)
+        return self.subjects
+    
+    def getPublisher(self):
+        logging.debug('self.publisher=%s' % self.publisher)
+        return self.publisher
+    
+    def getNumChapters(self):
+        logging.debug('self.numChapters=%s' % self.numChapters)
+        return self.numChapters
+    
+    def getNumWords(self):
+        logging.debug('self.numWords=%s' % self.numWords)
+        return self.numWords
+    
+    def getAuthorId(self):
+        logging.debug('self.authorId=%s' % self.authorId)
+        return self.authorId
+    
+    def getStoryId(self):
+        logging.debug('self.storyId=%s' % self.storyId)
+        return self.storyId
+    
+    def getCategory(self):
+        logging.debug('self.category=%s' % self.category)
+        return self.category
+    
+    def getGenre(self):
+        logging.debug('self.genre=%s' % self.genre)
+        return self.genre
+    
+    def getStoryStatus(self):
+        logging.debug('self.storyStatus=%s' % self.storyStatus)
+        return self.storyStatus
+    
+    def getStoryRating(self):
+        logging.debug('self.storyRating=%s' % self.storyRating)
+        return self.storyRating
+    
+    def getStoryUserRating(self):
+        logging.debug('self.storyUserRating=%s' % self.storyUserRating)
+        return self.storyUserRating
+    
+    def getStoryCharacters(self):
+        logging.debug('self.storyCharacters=%s' % self.storyCharacters)
+        return self.storyCharacters
+
+    def getStorySeries(self):
+        logging.debug('self.storySeries=%s' % self.storySeries)
+        return self.storySeries
 
 class Twilighted_UnitTests(unittest.TestCase):
   def setUp(self):

From 363c211401f783643b0d869f020d77f43de9ce24 Mon Sep 17 00:00:00 2001
From: wsuetholz <wsuetholz@localhost>
Date: Tue, 9 Nov 2010 18:18:42 -0600
Subject: [PATCH 51/94] Had left in debugging statements that should have
 been removed.

---
 hpfiction.py | 1 -
 1 file changed, 1 deletion(-)

diff --git a/hpfiction.py b/hpfiction.py
index 9f6cd467..27d8c28f 100644
--- a/hpfiction.py
+++ b/hpfiction.py
@@ -120,7 +120,6 @@ class HPFiction(FanfictionSiteAdapter):
 			if tds is not None and len(tds) > 0:
 				for td in tds:
 					s = re.split ("<[^>]+>", str(td).replace('\n','').replace('&nbsp;',' '))
-					logging.debug('s=%s' % s)
 					ii = 0
 					ll = len(s)
 					sss = ''

From d67668de230bcb3e17c388abc4acef4dcd29b112 Mon Sep 17 00:00:00 2001
From: wsuetholz <wsuetholz@localhost>
Date: Tue, 9 Nov 2010 18:20:37 -0600
Subject: [PATCH 52/94] Changes to the format of the title page.  Tried to fix
 the description field on the title page and the content.opf page.

---
 constants.py | 43 ++++++++++++++++---------------------------
 output.py    | 11 +++++++++--
 2 files changed, 25 insertions(+), 29 deletions(-)

diff --git a/constants.py b/constants.py
index 6ea1f086..9f14afb0 100644
--- a/constants.py
+++ b/constants.py
@@ -2,12 +2,14 @@
 
 CSS = '''body { margin-left: 5%; margin-right: 5%; margin-top: 5%; margin-bottom: 5%; text-align: justify; }
 pre { font-size: x-small; }
+sml { font-size: small; }
 h1 { text-align: center; }
 h2 { text-align: center; }
 h3 { text-align: center; }
 h4 { text-align: center; }
 h5 { text-align: center; }
 h6 { text-align: center; }
+h7 { text-align: left; font-size: large; font-weight: bold; }
 .CI {
     text-align:center;
     margin-top:0px;
@@ -26,34 +28,21 @@ h6 { text-align: center; }
 MIMETYPE = '''application/epub+zip'''
 
 TITLE_PAGE = '''<html xmlns="http://www.w3.org/1999/xhtml" xmlns:xlink="http://www.w3.org/1999/xlink"><head><meta http-equiv="Content-Type" content="text/html; charset=utf-8"/>
-<title>%s - %s</title><link href="stylesheet.css" type="text/css" charset="UTF-8" rel="stylesheet"/></head>
-<body><div class="cover">
-<h1 id="cfs_0"><a id="StoryLink" href="%s">%s</a></h1>
-<h2 id="cfs_1">by <a id="AuthorLink" href="%s">%s</a></h2>
-</div><div style="text-align:center">
+<title>%s - %s</title><link href="stylesheet.css" type="text/css" charset="UTF-8" rel="stylesheet"/></head><body>
+<p><h7 id="lnks"><b><a id="StoryLink" href="%s">%s</a></b> by <b><a id="AuthorLink" href="%s">%s</a></b></h7></p>
 <table class="full">
-<colgroup span="2"></colgroup>
-<tr><td> </td>
-<td> </td>
-</tr><tr><td> </td>
-<td> </td>
-</tr><tr><td><b>Category:</b></td><td>%s</td>
-</tr><tr><td><b>Genre:</b></td><td>%s</td>
-</tr><tr><td><b>Status:</b></td><td>%s</td>
-</tr><tr><td><b>Published:</b></td><td>%s</td>
-</tr><tr><td><b>Updated:</b></td><td>%s</td>
-</tr><tr><td><b>Packaged:</b></td><td>%s</td>
-</tr><tr><td><b>Rating Age/User:</b></td><td>%s / %s</td>
-</tr><tr><td><b>Chapters/Words:</b></td><td>%s / %s</td>
-</tr><tr><td><b>URL:</b></td><td><h3 id="url0"><a id="StoryURL" href="%s">%s</a></h3></td>
-</tr><tr><td><b>Summary:</b></td>
-</tr><tr><td colspan="2">%s</td>
-</tr><tr><td> </td>
-<td> </td>
-</tr><tr><td> </td>
-<td> </td>
-</tr></table></div>
-<div class="full" id="pb_0"/></body></html>
+<tr><td><b>Category:</b></td><td>%s</td></tr>
+<tr><td><b>Genre:</b></td><td>%s</td></tr>
+<tr><td><b>Status:</b></td><td>%s</td></tr>
+<tr><td><b>Published:</b></td><td>%s</td></tr>
+<tr><td><b>Updated:</b></td><td>%s</td></tr>
+<tr><td><b>Packaged:</b></td><td>%s</td></tr>
+<tr><td><b>Rating Age/User:</b></td><td>%s / %s</td></tr>
+<tr><td><b>Chapters/Words:</b></td><td>%s / %s</td></tr>
+</table>
+<p><b>URL:</b><pre id="url0"><br /><a id="StoryURL" href="%s">%s</a></pre></p>
+<p><b>Summary:</b><br />%s</p>
+</body></html>
 '''
 
 CONTAINER = '''<?xml version="1.0"?>
diff --git a/output.py b/output.py
index 9ffb1503..e756ca5c 100644
--- a/output.py
+++ b/output.py
@@ -236,15 +236,22 @@ class EPubFanficWriter(FanficWriter):
 		updated = self.adapter.getStoryUpdated().strftime("%Y-%m-%d")
 		calibre = self.adapter.getStoryUpdated().strftime("%Y-%m-%dT%H:%M:%S")
 		
+		description = self.adapter.getStoryDescription()
+		if hasattr(description, "text"):
+			description = str(description.text)
+		else:
+			description = str(description)
+		if description is not None and len(description) > 0:
+			description =  removeEntities(description.replace('&nbsp;',' ').replace('&rsquo;',''))
 		### writing content -- title page
 		titleFilePath = "OEBPS/title_page.xhtml"
-		self._writeFile(titleFilePath, TITLE_PAGE % (self.authorName, self.storyTitle, self.adapter.getStoryURL(), self.storyTitle, self.adapter.getAuthorURL(), self.authorName, self.adapter.getCategory(), self.adapter.getGenre(), self.adapter.getStoryStatus(), published, updated, createda, self.adapter.getStoryRating(), self.adapter.getStoryUserRating(), self.adapter.getNumChapters(), self.adapter.getNumWords(), self.adapter.getStoryURL(), self.adapter.getStoryURL(), self.adapter.getStoryDescription()))
+		self._writeFile(titleFilePath, TITLE_PAGE % (self.authorName, self.storyTitle, self.adapter.getStoryURL(), self.storyTitle, self.adapter.getAuthorURL(), self.authorName, self.adapter.getCategory(), self.adapter.getGenre(), self.adapter.getStoryStatus(), published, updated, createda, self.adapter.getStoryRating(), self.adapter.getStoryUserRating(), self.adapter.getNumChapters(), self.adapter.getNumWords(), self.adapter.getStoryURL(), self.adapter.getStoryURL(), description))
 
 		### writing content -- opf file
 		opfFilePath = "OEBPS/content.opf"
 
 #		opf = open(opfFilePath, 'w')
-		self._writeFile(opfFilePath, CONTENT_START % (uuid.uuid4().urn, self.storyTitle, self.authorName, self.adapter.getLanguageId(), published, created, updated, calibre, self.adapter.getStoryDescription()))
+		self._writeFile(opfFilePath, CONTENT_START % (uuid.uuid4().urn, self.storyTitle, self.authorName, self.adapter.getLanguageId(), published, created, updated, calibre, description))
 
 		i = 0
 		subjs = []

From c326aa47b09745b60b25d07de3028f76a119c811 Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Tue, 9 Nov 2010 23:02:33 -0600
Subject: [PATCH 53/94] Need to reverse sort entities list to get entities with
 ';' ahead of versions without.  Like '&quot;' and '&quot'.  Otherwise
 '&quot;' becomes '";'.

---
 constants.py | 1 -
 output.py    | 3 ++-
 2 files changed, 2 insertions(+), 2 deletions(-)

diff --git a/constants.py b/constants.py
index 9f14afb0..89b0ef0e 100644
--- a/constants.py
+++ b/constants.py
@@ -157,7 +157,6 @@ acceptable_elements = ['a', 'abbr', 'acronym', 'address', 'area', 'b', 'big',
 acceptable_attributes = ['href']
 
 # entity list from http://code.google.com/p/doctype/wiki/CharacterEntitiesConsistent
-# when version without ; is allowed, make sure to put the version with first.
 entities = { '&aacute;' : 'á',
              '&Aacute;' : 'Á',
              '&Aacute' : 'Á',
diff --git a/output.py b/output.py
index e756ca5c..5244ceb7 100644
--- a/output.py
+++ b/output.py
@@ -339,7 +339,8 @@ def removeEntities(text):
 
 	# replace several named entities with character, such as &mdash; -> -
 	# see constants.py for the list.
-	for e in entities:
+	# reverse sort will put entities with ; before the same one without, when valid.
+	for e in reversed(sorted(entities.keys())):
 		v = entities[e]
 		try:
 			text = text.replace(e, v)

From 33d1fabd11915ecc1e64e74e42764bdadee32feb Mon Sep 17 00:00:00 2001
From: wsuetholz <wsuetholz@localhost>
Date: Wed, 10 Nov 2010 10:18:46 -0600
Subject: [PATCH 54/94] Changeset	Tag	Branch	User	Date
 Summary 53:c93e07566456			wsuetholz	2010-11-10
 10:11	Ficwad wants you to log in in order to view some stories.  The old
 ficwad.py got around that by starting with the first chapter instead of the
 story index page.  Since I needed the story index page I had changed it to
 switch to that page, and then scrape the chapter information from there,
 which doesn't work if the chapters are blocked.  While it still won't work if
 you pass in the URL for the story index page, I now switch back to the page
 that you passed in originally when looking for the chapters to download.
 The one problem I have with this is that I change self.url to the story index
 page, which should probably remain so that we have a consistent self.url even
 if the user starts with chapter 9 this time instead of chapter 1.

---
 ficwad.py | 6 ++++++
 1 file changed, 6 insertions(+)

diff --git a/ficwad.py b/ficwad.py
index 133d424a..4fa0b87d 100644
--- a/ficwad.py
+++ b/ficwad.py
@@ -71,6 +71,7 @@ class FicWad(FanfictionSiteAdapter):
 		self.storyUserRating = '0'
 		self.storyCharacters = []
 		self.storySeries = ''
+		oldurl = ''
 		
 		data = u2.urlopen(self.url).read()
 		soup = bs.BeautifulStoneSoup(data)
@@ -84,6 +85,7 @@ class FicWad(FanfictionSiteAdapter):
 		if u1 == "story":
 			# This page does not have the correct information on it..  Need to get the Story Title Page
 			logging.debug('URL %s is a chapter URL.  Getting Title Page http://%s/%s/%s.' % (self.url, self.host, u1, storyid))
+			oldurl = self.url
 			self.url = 'http://' + self.host + '/' + u1 + '/' + storyid
 			data = u2.urlopen(self.url).read()
 			soup = bs.BeautifulStoneSoup(data)
@@ -177,6 +179,10 @@ class FicWad(FanfictionSiteAdapter):
 		result = []
 		ii = 1
 
+		if oldurl is not None and len(oldurl) > 0:
+			data = u2.urlopen(oldurl).read()
+			soup = bs.BeautifulStoneSoup(data)
+			
 		storylist = soup.find('ul', {'id' : 'storylist'})
 		if storylist is not None:
 			allH4s = storylist.findAll('h4')

From b2ea9c3e738063aa0b312c07db0bfbf1644884f7 Mon Sep 17 00:00:00 2001
From: wsuetholz <wsuetholz@localhost>
Date: Wed, 10 Nov 2010 11:18:48 -0600
Subject: [PATCH 55/94] Changed the title page generation to allow for easily
 adding and removing entries from the table of information shown.

Modified ffnet.py to use the mangled story title if given instead of the name portion of the URL.  As part of this, the Name and chapter number are now optional in the URL passed in.
---
 adapter.py      |  3 +++
 constants.py    | 18 +++++++-----------
 ffnet.py        | 34 ++++++++++++++++++++++++----------
 fictionalley.py |  4 ++++
 ficwad.py       |  4 ++++
 hpfiction.py    |  4 ++++
 output.py       | 21 ++++++++++++++++++++-
 twilighted.py   |  4 ++++
 8 files changed, 70 insertions(+), 22 deletions(-)

diff --git a/adapter.py b/adapter.py
index 246f4177..b7708f48 100644
--- a/adapter.py
+++ b/adapter.py
@@ -29,6 +29,9 @@ class FanfictionSiteAdapter:
 	def setPassword(self, password):
 		pass
 
+	def getHost(self):
+		pass
+	
 	def getStoryURL(self):
 		pass
 
diff --git a/constants.py b/constants.py
index 89b0ef0e..294ae4bb 100644
--- a/constants.py
+++ b/constants.py
@@ -27,20 +27,16 @@ h7 { text-align: left; font-size: large; font-weight: bold; }
 
 MIMETYPE = '''application/epub+zip'''
 
-TITLE_PAGE = '''<html xmlns="http://www.w3.org/1999/xhtml" xmlns:xlink="http://www.w3.org/1999/xlink"><head><meta http-equiv="Content-Type" content="text/html; charset=utf-8"/>
+TITLE_HEADER = '''<html xmlns="http://www.w3.org/1999/xhtml" xmlns:xlink="http://www.w3.org/1999/xlink"><head><meta http-equiv="Content-Type" content="text/html; charset=utf-8"/>
 <title>%s - %s</title><link href="stylesheet.css" type="text/css" charset="UTF-8" rel="stylesheet"/></head><body>
 <p><h7 id="lnks"><b><a id="StoryLink" href="%s">%s</a></b> by <b><a id="AuthorLink" href="%s">%s</a></b></h7></p>
 <table class="full">
-<tr><td><b>Category:</b></td><td>%s</td></tr>
-<tr><td><b>Genre:</b></td><td>%s</td></tr>
-<tr><td><b>Status:</b></td><td>%s</td></tr>
-<tr><td><b>Published:</b></td><td>%s</td></tr>
-<tr><td><b>Updated:</b></td><td>%s</td></tr>
-<tr><td><b>Packaged:</b></td><td>%s</td></tr>
-<tr><td><b>Rating Age/User:</b></td><td>%s / %s</td></tr>
-<tr><td><b>Chapters/Words:</b></td><td>%s / %s</td></tr>
-</table>
-<p><b>URL:</b><pre id="url0"><br /><a id="StoryURL" href="%s">%s</a></pre></p>
+'''
+
+TITLE_ENTRY = '''<tr><td><b>%s</b></td><td>%s</td></tr>
+'''
+
+TITLE_FOOTER = '''</table>
 <p><b>Summary:</b><br />%s</p>
 </body></html>
 '''
diff --git a/ffnet.py b/ffnet.py
index 7320ec5a..3f9f41e5 100644
--- a/ffnet.py
+++ b/ffnet.py
@@ -68,21 +68,29 @@ class FFNet(FanfictionSiteAdapter):
 		
 		logging.debug('self.path=%s' % self.path)
 
-		spl = self.path.split('/')
-		logging.debug('spl=%s' % spl)
-		if len(spl) == 5:
-			self.path = "/".join(spl[1:-1])
-			self.outputName = spl[4] + '-ffnet_' + spl[2]
-		
 		if self.path.startswith('/'):
 			self.path = self.path[1:]
 		
+		spl = self.path.split('/')
+		logging.debug('spl=%s' % spl)
+		if spl is not None:
+			if len(spl) > 0 and spl[0] != 's':
+				logging.error("Error URL \"%s\" is not a story." % self.url)
+				exit (20)				
+			if len(spl) > 1:
+				self.storyId = spl[1]
+			if len(spl) > 2:
+				chapter = spl[1]
+			else:
+				chapter = '1'
+			if len(spl) == 5:
+				self.path = "/".join(spl[1:-1])
+				self.outputName = spl[4] + '-ffnet_' + spl[2]
+		
 		if self.path.endswith('/'):
 			self.path = self.path[:-1]
 		
 		logging.debug('self.path=%s' % self.path)
-
-		(s, self.storyId, chapter) = self.path.split('/')
 		
 		self.uuid = 'urn:uuid:' + self.host + '-u.' + self.authorId + '-s.' + self.storyId
 		logging.debug('self.uuid=%s' % self.uuid)
@@ -190,12 +198,14 @@ class FFNet(FanfictionSiteAdapter):
 			if l.find("&#187;") != -1 and l.find('<b>') != -1:
 				s2 = bs.BeautifulStoneSoup(l)
 				self.storyName = str(s2.find('b').string)
-				logging.debug('self.storyId=%s self.storyName=%s' % (self.storyId, self.storyName))
+				# mangling storyName replaces url for outputName 
+				self.outputName = self.storyName.replace(" ", "_") + '-ffnet_' + self.storyId
+				logging.debug('self.storyId=%s, self.storyName=%s, self.outputName=%s' % (self.storyId, self.storyName, self.outputName))
 			elif l.find("<a href='/u/") != -1:
 				s2 = bs.BeautifulStoneSoup(l)
 				self.authorName = str(s2.a.string)
 				(u1, u2, self.authorId, u3) = s2.a['href'].split('/')
-				logging.debug('self.authorId=%s self.authorName=%s' % (self.authorId, self.authorName))
+				logging.debug('self.authorId=%s, self.authorName=%s' % (self.authorId, self.authorName))
 			elif l.find("Rated: <a href=") != -1:
 				s2 = bs.BeautifulStoneSoup(l)
 				self.storyRating = str(s2.a.string).strip()
@@ -321,6 +331,10 @@ class FFNet(FanfictionSiteAdapter):
 	def setPassword(self, password):
 		self.password = password
 
+	def getHost(self):
+		logging.debug('self.host=%s' % self.host)
+		return self.host
+
 	def getStoryURL(self):
 		logging.debug('self.url=%s' % self.url)
 		return self.url
diff --git a/fictionalley.py b/fictionalley.py
index 20763bf9..56d14f0e 100644
--- a/fictionalley.py
+++ b/fictionalley.py
@@ -229,6 +229,10 @@ class FictionAlley(FanfictionSiteAdapter):
 		
 		return result
 	
+	def getHost(self):
+		logging.debug('self.host=%s' % self.host)
+		return self.host
+
 	def getStoryName(self):
 		return self.storyName
 
diff --git a/ficwad.py b/ficwad.py
index 4fa0b87d..8ea76b60 100644
--- a/ficwad.py
+++ b/ficwad.py
@@ -229,6 +229,10 @@ class FicWad(FanfictionSiteAdapter):
 		
 		return result
 	
+	def getHost(self):
+		logging.debug('self.host=%s' % self.host)
+		return self.host
+
 	def getStoryName(self):
 		return self.storyName
 
diff --git a/hpfiction.py b/hpfiction.py
index 27d8c28f..f83f713e 100644
--- a/hpfiction.py
+++ b/hpfiction.py
@@ -198,6 +198,10 @@ class HPFiction(FanfictionSiteAdapter):
 		
 		return urls
 
+	def getHost(self):
+		logging.debug('self.host=%s' % self.host)
+		return self.host
+
 	def getStoryName(self):
 		return self.storyName
 
diff --git a/output.py b/output.py
index 5244ceb7..1d208256 100644
--- a/output.py
+++ b/output.py
@@ -242,10 +242,29 @@ class EPubFanficWriter(FanficWriter):
 		else:
 			description = str(description)
 		if description is not None and len(description) > 0:
+			description = description.replace ('\\\'', '').replace('\\\"', '')
 			description =  removeEntities(description.replace('&nbsp;',' ').replace('&rsquo;',''))
+		else:
+			description = ' '
+
 		### writing content -- title page
 		titleFilePath = "OEBPS/title_page.xhtml"
-		self._writeFile(titleFilePath, TITLE_PAGE % (self.authorName, self.storyTitle, self.adapter.getStoryURL(), self.storyTitle, self.adapter.getAuthorURL(), self.authorName, self.adapter.getCategory(), self.adapter.getGenre(), self.adapter.getStoryStatus(), published, updated, createda, self.adapter.getStoryRating(), self.adapter.getStoryUserRating(), self.adapter.getNumChapters(), self.adapter.getNumWords(), self.adapter.getStoryURL(), self.adapter.getStoryURL(), description))
+		self._writeFile(titleFilePath, TITLE_HEADER % (self.authorName, self.storyTitle, self.adapter.getStoryURL(), self.storyTitle, self.adapter.getAuthorURL(), self.authorName))
+		self._writeFile(titleFilePath, TITLE_ENTRY % ('Category:', self.adapter.getCategory()))		 
+		self._writeFile(titleFilePath, TITLE_ENTRY % ('Genre:', self.adapter.getGenre())) 
+		self._writeFile(titleFilePath, TITLE_ENTRY % ('Status:', self.adapter.getStoryStatus()))		 
+		self._writeFile(titleFilePath, TITLE_ENTRY % ('Published:', published))		 
+		self._writeFile(titleFilePath, TITLE_ENTRY % ('Updated:', updated))		 
+		self._writeFile(titleFilePath, TITLE_ENTRY % ('Packaged:', createda))
+		tmpstr = self.adapter.getStoryRating() + " / " + self.adapter.getStoryUserRating()		 
+		self._writeFile(titleFilePath, TITLE_ENTRY % ('Rating Age/User:', tmpstr))
+		tmpstr = self.adapter.getNumChapters() + " / " + self.adapter.getNumWords()
+		self._writeFile(titleFilePath, TITLE_ENTRY % ('Chapters/Words:', tmpstr))
+		self._writeFile(titleFilePath, TITLE_ENTRY % ('Publisher:', self.adapter.getHost()))
+		self._writeFile(titleFilePath, TITLE_ENTRY % ('Story ID:', self.adapter.getStoryId()))
+		self._writeFile(titleFilePath, TITLE_ENTRY % ('Author ID:', self.adapter.getAuthorId()))
+
+		self._writeFile(titleFilePath, TITLE_FOOTER % description )
 
 		### writing content -- opf file
 		opfFilePath = "OEBPS/content.opf"
diff --git a/twilighted.py b/twilighted.py
index f7654041..5551f0e1 100644
--- a/twilighted.py
+++ b/twilighted.py
@@ -277,6 +277,10 @@ class Twilighted(FanfictionSiteAdapter):
         else:
           return False
 
+    def getHost(self):
+        logging.debug('self.host=%s' % self.host)
+        return self.host
+
     def getStoryURL(self):
         logging.debug('self.url=%s' % self.url)
         return self.url

From d4c18fe1a862832f6a7ec04edecf331aef273bf2 Mon Sep 17 00:00:00 2001
From: wsuetholz <wsuetholz@localhost>
Date: Wed, 10 Nov 2010 11:29:17 -0600
Subject: [PATCH 56/94] Changed all references to downaloder.py to
 downloader.py.

---
 readme.txt | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/readme.txt b/readme.txt
index 996efe64..108eff20 100644
--- a/readme.txt
+++ b/readme.txt
@@ -1,10 +1,10 @@
 To use, do:
 
-python downaloder.py <url> (epub|html)
+python downloader.py <url> (epub|html)
 
 Eg:
 
-python downaloder.py http://www.fanfiction.net/s/5192986/1/A_Fox_in_Tokyo epub
+python downloader.py http://www.fanfiction.net/s/5192986/1/A_Fox_in_Tokyo epub
 
 This tool uses Python 2.5.2, but should work with newer versions.
 

From 7c252e83a1eeaecb36cc9f40710077f90cf7460f Mon Sep 17 00:00:00 2001
From: wsuetholz <wsuetholz@localhost>
Date: Wed, 10 Nov 2010 12:34:25 -0600
Subject: [PATCH 57/94] It seems that self.numWords and self.numChapters can on
 occasion be numeric instead of string, so use the str() function when
 building the string for the title page.

---
 output.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/output.py b/output.py
index 1d208256..c2f87c26 100644
--- a/output.py
+++ b/output.py
@@ -258,7 +258,7 @@ class EPubFanficWriter(FanficWriter):
 		self._writeFile(titleFilePath, TITLE_ENTRY % ('Packaged:', createda))
 		tmpstr = self.adapter.getStoryRating() + " / " + self.adapter.getStoryUserRating()		 
 		self._writeFile(titleFilePath, TITLE_ENTRY % ('Rating Age/User:', tmpstr))
-		tmpstr = self.adapter.getNumChapters() + " / " + self.adapter.getNumWords()
+		tmpstr = str(self.adapter.getNumChapters()) + " / " + str(self.adapter.getNumWords())
 		self._writeFile(titleFilePath, TITLE_ENTRY % ('Chapters/Words:', tmpstr))
 		self._writeFile(titleFilePath, TITLE_ENTRY % ('Publisher:', self.adapter.getHost()))
 		self._writeFile(titleFilePath, TITLE_ENTRY % ('Story ID:', self.adapter.getStoryId()))

From 3f40df82dda7bff1ced46a5ccfc17d9095ecd344 Mon Sep 17 00:00:00 2001
From: wsuetholz <wsuetholz@localhost>
Date: Wed, 10 Nov 2010 12:36:21 -0600
Subject: [PATCH 58/94] Change to allow a chapter url to be passed in, yet
 still get the information it needs from the story index page.  This will get
 the chapter links from the passed in url.

---
 hpfiction.py | 56 +++++++++++++++++++++++++++++++++++++++++++++++-----
 1 file changed, 51 insertions(+), 5 deletions(-)

diff --git a/hpfiction.py b/hpfiction.py
index f83f713e..1bf46f55 100644
--- a/hpfiction.py
+++ b/hpfiction.py
@@ -39,11 +39,24 @@ class HPFiction(FanfictionSiteAdapter):
 		logging.debug('self.path=%s' % self.path)
 	
 		self.opener = u2.build_opener(u2.HTTPCookieProcessor())
-	
+
+		self.chapurl = False
+		self.storyId = '0'
+		
+		sss = self.url.split('?')
+		logging.debug('sss=%s' % sss)
+		if sss is not None and len(sss) > 1:
+			sc = sss[1].split('=')
+			logging.debug('sc=%s' % sc)
+			if sc is not None and len(sc) > 1:
+				if sc[0] == 'chapterid':
+					self.chapurl = True
+				elif sc[0] == 'psid' or sc[0] == 'sid':
+					self.storyId = sc[1]
+
 		self.storyDescription = 'Fanfiction Story'
 		self.authorId = '0'
 		self.authorURL = ''
-		(u1, self.storyId) = self.url.split('=')
 		self.storyPublished = datetime.date(1970, 01, 31)
 		self.storyCreated = datetime.datetime.now()
 		self.storyUpdated = datetime.date(1970, 01, 31)
@@ -93,6 +106,7 @@ class HPFiction(FanfictionSiteAdapter):
 		return True
 
 	def extractIndividualUrls(self):
+		
 		data = self.opener.open(self.url).read()
 		soup = bs.BeautifulSoup(data)
 		
@@ -100,10 +114,42 @@ class HPFiction(FanfictionSiteAdapter):
 		def_chapurl = ''
 		def_chaptitle = ''
 		
+		if self.chapurl:
+			foundid = False
+			for a in links:
+				if a['href'].find('psid') != -1:
+					sp = a['href'].split('?')
+					if sp is not None and len(sp) > 1:
+						for sp1 in sp:
+							if sp1.find('psid') != -1:
+								ps = sp1.split('=')
+								if ps is not None and len(ps) > 1:
+									self.storyId = ps[1].replace('\'','')
+									foundid = True
+					self.storyName = a.string
+					logging.debug('self.storyId=%s, self.storyName=%s' % (self.storyId, self.storyName))
+					break
+			if foundid:
+				self.url = "http://" + self.host + "/viewstory.php?psid=" + self.storyId
+				logging.debug('Title Page URL=%s' % self.url)
+				data1 = self.opener.open(self.url).read()
+				hdrsoup = bs.BeautifulSoup(data1)
+			else:
+				hdrsoup = soup
+		else:
+			hdrsoup = soup
+			
 		for a in links:
-			if a['href'].find('psid') != -1:
+			if not self.chapurl and a['href'].find('psid') != -1:
+				sp = a['href'].split('?')
+				if sp is not None and len(sp) > 1:
+					for sp1 in sp:
+						if sp1.find('psid') != -1:
+							ps = sp1.split('=')
+							if ps is not None and len(ps) > 1:
+								self.storyId = ps[1].replace('\'','')
 				self.storyName = a.string
-				logging.debug('self.storyName=%s' % self.storyName)
+				logging.debug('self.storyId=%s, self.storyName=%s' % (self.storyId, self.storyName))
 			elif a['href'].find('viewuser.php') != -1:
 				self.authorName = a.string
 				self.authorURL = 'http://' + self.host + '/' + a['href']
@@ -114,7 +160,7 @@ class HPFiction(FanfictionSiteAdapter):
 				def_chaptitle = a.string
 				logging.debug('def_chapurl=%s, def_chaptitle=%s' % (def_chapurl, def_chaptitle))
 		
-		centers = soup.findAll('center')
+		centers = hdrsoup.findAll('center')
 		for center in centers:
 			tds = center.findAll ('td')
 			if tds is not None and len(tds) > 0:

From ed4ff4b6ab67c57b156fa51b6da5ed41ce467cf4 Mon Sep 17 00:00:00 2001
From: wsuetholz <wsuetholz@localhost>
Date: Wed, 10 Nov 2010 13:47:13 -0600
Subject: [PATCH 59/94] Trying to fix outputting some utf-8 text.  Added the
 utf-8 header to all the source code. Ended up modifying the removeEntities
 function to do a weird decode/encode step on the text passed in.  This seems
 to at least stop things from crashing.

---
 BeautifulSoup.py  |  2 ++
 __init__.py       |  1 +
 adapter.py        |  2 ++
 constants.py      |  4 ++--
 downloader.py     |  2 ++
 fictionalley.py   |  2 ++
 html2text.py      |  2 ++
 html_constants.py |  2 ++
 output.py         | 14 ++++++++++++--
 twilighted.py     |  2 ++
 twipassword.py    |  2 ++
 zipdir.py         |  2 ++
 12 files changed, 33 insertions(+), 4 deletions(-)

diff --git a/BeautifulSoup.py b/BeautifulSoup.py
index 748e6fe4..31ff0e5f 100644
--- a/BeautifulSoup.py
+++ b/BeautifulSoup.py
@@ -1,3 +1,5 @@
+# -*- coding: utf-8 -*-
+
 """Beautiful Soup
 Elixir and Tonic
 "The Screen-Scraper's Friend"
diff --git a/__init__.py b/__init__.py
index e69de29b..40a96afc 100644
--- a/__init__.py
+++ b/__init__.py
@@ -0,0 +1 @@
+# -*- coding: utf-8 -*-
diff --git a/adapter.py b/adapter.py
index b7708f48..03c3b59d 100644
--- a/adapter.py
+++ b/adapter.py
@@ -1,3 +1,5 @@
+# -*- coding: utf-8 -*-
+
 class LoginRequiredException(Exception):
 	def __init__(self, url):
 		self.url = url
diff --git a/constants.py b/constants.py
index 294ae4bb..dc185eb6 100644
--- a/constants.py
+++ b/constants.py
@@ -27,7 +27,7 @@ h7 { text-align: left; font-size: large; font-weight: bold; }
 
 MIMETYPE = '''application/epub+zip'''
 
-TITLE_HEADER = '''<html xmlns="http://www.w3.org/1999/xhtml" xmlns:xlink="http://www.w3.org/1999/xlink"><head><meta http-equiv="Content-Type" content="text/html; charset=utf-8"/>
+TITLE_HEADER = '''<?xml version="1.0" encoding="utf-8"?><html xmlns="http://www.w3.org/1999/xhtml" xmlns:xlink="http://www.w3.org/1999/xlink"><head><meta http-equiv="Content-Type" content="text/html; charset=utf-8"/>
 <title>%s - %s</title><link href="stylesheet.css" type="text/css" charset="UTF-8" rel="stylesheet"/></head><body>
 <p><h7 id="lnks"><b><a id="StoryLink" href="%s">%s</a></b> by <b><a id="AuthorLink" href="%s">%s</a></b></h7></p>
 <table class="full">
@@ -41,7 +41,7 @@ TITLE_FOOTER = '''</table>
 </body></html>
 '''
 
-CONTAINER = '''<?xml version="1.0"?>
+CONTAINER = '''<?xml version="1.0" encoding="utf-8"?>
 <container version="1.0" xmlns="urn:oasis:names:tc:opendocument:xmlns:container">
   <rootfiles>
     <rootfile full-path="OEBPS/content.opf" media-type="application/oebps-package+xml"/>
diff --git a/downloader.py b/downloader.py
index f8ca80c6..bee778c0 100644
--- a/downloader.py
+++ b/downloader.py
@@ -1,3 +1,5 @@
+# -*- coding: utf-8 -*-
+
 import os
 import re
 import sys
diff --git a/fictionalley.py b/fictionalley.py
index 56d14f0e..da81a4ce 100644
--- a/fictionalley.py
+++ b/fictionalley.py
@@ -1,3 +1,5 @@
+# -*- coding: utf-8 -*-
+
 import os
 import re
 import sys
diff --git a/html2text.py b/html2text.py
index 5d61b9a4..ce6e1d3d 100644
--- a/html2text.py
+++ b/html2text.py
@@ -1,4 +1,6 @@
 #!/usr/bin/env python
+# -*- coding: utf-8 -*-
+
 """html2text: Turn HTML into equivalent Markdown-structured text."""
 __version__ = "2.37"
 __author__ = "Aaron Swartz (me@aaronsw.com)"
diff --git a/html_constants.py b/html_constants.py
index c698e8f4..f160a8a1 100644
--- a/html_constants.py
+++ b/html_constants.py
@@ -1,3 +1,5 @@
+# -*- coding: utf-8 -*-
+
 XHTML_START = '''<?xml version="1.0" encoding="UTF-8"?>
 <!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.1//EN" "http://www.w3.org/TR/xhtml11/DTD/xhtml11.dtd">
 <html xmlns="http://www.w3.org/1999/xhtml">
diff --git a/output.py b/output.py
index c2f87c26..e028237e 100644
--- a/output.py
+++ b/output.py
@@ -5,6 +5,7 @@ import re
 import sys
 import cgi
 import uuid
+import unicodedata
 import codecs
 import shutil
 import string
@@ -123,7 +124,7 @@ class EPubFanficWriter(FanficWriter):
 			if self.inmemory:
 				self.files[fileName] = StringIO.StringIO()
 			else:
-				self.files[fileName] = open(self.directory + '/' + fileName, 'w')
+				self.files[fileName] = open(self.directory + '/' + fileName, encoding='utf-8', mode='w')
 			
 			self._writeFile(fileName, data)
 		
@@ -182,7 +183,7 @@ class EPubFanficWriter(FanficWriter):
 		# BeautifulStoneSoup doesn't have any selfClosingTags by default.  
 		# hr & br needs to be if they're going to work.
 		# Some stories do use multiple br tags as their section breaks...
-		self.soup = bs.BeautifulStoneSoup(text.decode('utf-8'), selfClosingTags=('br','hr'))
+		self.soup = bs.BeautifulStoneSoup(text, selfClosingTags=('br','hr'))
 
 		allTags = self.soup.findAll(recursive=True)
 		for t in allTags:
@@ -349,6 +350,15 @@ def replaceNumberEntities(data):
 
 def removeEntities(text):
 	# replace numeric versions of [&<>] with named versions.
+	
+	try:
+		t = text.decode('utf-8')
+	except UnicodeEncodeError, e:
+		try:
+			t = text.encode ('ascii', 'xmlcharrefreplace') 
+		except UnicodeEncodeError, e:
+			t = text
+	text = t 
 	text = re.sub(r'&#0*38;','&amp;',text)
 	text = re.sub(r'&#0*60;','&lt;',text)
 	text = re.sub(r'&#0*62;','&gt;',text)
diff --git a/twilighted.py b/twilighted.py
index 5551f0e1..764502e9 100644
--- a/twilighted.py
+++ b/twilighted.py
@@ -1,3 +1,5 @@
+# -*- coding: utf-8 -*-
+
 import os
 import re
 import sys
diff --git a/twipassword.py b/twipassword.py
index 466686ff..105c09c3 100644
--- a/twipassword.py
+++ b/twipassword.py
@@ -1,2 +1,4 @@
+# -*- coding: utf-8 -*-
+
 # This is really for the web version.  downalod.py will ask.
 password='somepass'
diff --git a/zipdir.py b/zipdir.py
index f9a79acf..597b4f8c 100644
--- a/zipdir.py
+++ b/zipdir.py
@@ -1,3 +1,5 @@
+# -*- coding: utf-8 -*-
+
 import os
 import zipfile
 import logging

From 30b914788c3759473c9908aebcb39a707abeb2c1 Mon Sep 17 00:00:00 2001
From: wsuetholz <wsuetholz@localhost>
Date: Wed, 10 Nov 2010 23:11:08 -0600
Subject: [PATCH 60/94] Add a new adapter for the potionsandsnitches web site. 
 Once we started looking for the additional information for the title page,
 things were sufficiently different from the twilighted adapter that it
 couldn't be used anymore.

---
 downloader.py       |   5 +-
 potionsNsnitches.py | 498 ++++++++++++++++++++++++++++++++++++++++++++
 twilighted.py       |  37 +++-
 3 files changed, 534 insertions(+), 6 deletions(-)
 create mode 100644 potionsNsnitches.py

diff --git a/downloader.py b/downloader.py
index bee778c0..cbcc7aeb 100644
--- a/downloader.py
+++ b/downloader.py
@@ -22,6 +22,7 @@ import adapter
 import fictionalley
 import hpfiction
 import twilighted
+import potionsNsnitches
 
 import time
 
@@ -99,8 +100,10 @@ if __name__ == '__main__':
 		adapter = ffnet.FFNet(url)
 	elif url.find('harrypotterfanfiction.com') != -1:
 		adapter = hpfiction.HPFiction(url)
-	elif url.find('twilighted.net') != -1 or url.find('potionsandsnitches.net') != -1:
+	elif url.find('twilighted.net') != -1:
 		adapter = twilighted.Twilighted(url)
+	elif url.find('potionsandsnitches.net') != -1:
+		adapter = potionsNsnitches.PotionsNSnitches(url)
 	else:
 		print >> sys.stderr, "Oi! I can haz not appropriate adapter for URL %s!" % url
 		sys.exit(1)
diff --git a/potionsNsnitches.py b/potionsNsnitches.py
new file mode 100644
index 00000000..95ac435c
--- /dev/null
+++ b/potionsNsnitches.py
@@ -0,0 +1,498 @@
+# -*- coding: utf-8 -*-
+
+# Copied from the twilighted.py because site is almost the same..
+# of course, now that we're trying to scrape more detail about the
+# story, there were differences in how headers are displayed
+
+import os
+import re
+import sys
+import shutil
+import os.path
+import urllib as u
+import logging
+import pprint as pp
+import unittest
+import urllib2 as u2
+import urlparse as up
+import BeautifulSoup as bs
+import htmlentitydefs as hdefs
+import time
+import datetime
+
+from adapter import *
+
+class PotionsNSnitches(FanfictionSiteAdapter):
+    def __init__(self, url):
+        self.url = url
+        parsedUrl = up.urlparse(url)
+        self.host = parsedUrl.netloc
+        self.path = parsedUrl.path
+        self.opener = u2.build_opener(u2.HTTPCookieProcessor())
+        self.password = ''
+        self.login='sigizmund'
+        self.storyDescription = 'Fanfiction Story'
+        self.authorId = '0'
+        self.authorURL = ''
+        self.storyId = '0'
+        self.storyPublished = datetime.date(1970, 01, 31)
+        self.storyCreated = datetime.datetime.now()
+        self.storyUpdated = datetime.date(1970, 01, 31)
+        self.languageId = 'en-UK'
+        self.language = 'English'
+        self.subjects = []
+        self.subjects.append ('fanfiction')
+        self.subjects.append ('Harry Potter')
+        self.publisher = self.host
+        self.numChapters = 0
+        self.numWords = 0
+        self.genre = 'FanFiction'
+        self.category = 'Category'
+        self.storyStatus = 'In-Progress'
+        self.storyRating = 'PG'
+        self.storyUserRating = '0'
+        self.storyCharacters = []
+        self.storySeries = ''
+        
+        self.chapurl = False
+        ss=self.url.split('?')
+        logging.debug('ss=%s' % ss)
+        if ss is not None and len(ss) > 1:
+            sss = ss[1].replace('&amp;','&').split('&')
+            logging.debug('sss=%s' % sss)
+            if sss is not None and len(sss) > 0:
+                ssss = sss[0].split('=')
+                logging.debug('ssss=%s' % ssss)
+                if ssss is not None and len(ssss) > 1 and ssss[0] == 'sid':
+                    self.storyId = ssss[1]
+                if len(sss) > 1:
+                    ssss = sss[1].split('=')
+                    logging.debug('ssss=%s' % ssss)
+                    if ssss is not None and len(ssss) > 1 and ssss[0] == 'chapter':
+                        self.chapurl = True
+
+        self.url = 'http://' + self.host + '/' + self.path + '?sid=' + self.storyId
+        logging.debug('self.url=%s' % self.url)
+        
+        self.uuid = 'urn:uuid:' + self.host + '-u.' + self.authorId + '-s.' + self.storyId
+        logging.debug('self.uuid=%s' % self.uuid)
+    
+        logging.debug("Created PotionsNSnitches: url=%s" % (self.url))
+
+
+    def requiresLogin(self, url = None):
+        # potionsandsnitches.net doesn't require login.
+        if self.host == 'potionsandsnitches.net':
+          return False
+        else:
+          return True
+
+    def performLogin(self, url = None):
+        data = {}
+    
+        data['penname'] = self.login
+        data['password'] = self.password
+        data['cookiecheck'] = '1'
+        data['submit'] = 'Submit'
+    
+        urlvals = u.urlencode(data)
+        loginUrl = 'http://' + self.host + self._getLoginScript()
+        logging.debug("Will now login to URL %s" % loginUrl)
+    
+        req = self.opener.open(loginUrl, urlvals)
+    
+        d = req.read().decode('utf-8')
+    
+        if self.reqLoginData(d) :
+          return False
+        else:
+          return True
+
+
+    def setLogin(self, login):
+        self.login = login
+
+    def setPassword(self, password):
+        self.password = password
+
+    def _addSubject(self, subject):
+        subj = subject.upper()
+        for s in self.subjects:
+            if s.upper() == subj:
+                return False
+        self.subjects.append(subject)
+        return True
+
+    def _addCharacter(self, character):
+        chara = character.upper()
+        for c in self.storyCharacters:
+            if c.upper() == chara:
+                return False
+        self.storyCharacters.append(character)
+        return True 
+    
+    def _fillCharacters(self, strlist, idx, maxlen):
+        ii = idx
+        while ii < maxlen:
+            chara = strlist[ii].strip()
+            if len(chara) > 0:
+                if chara.find(':') != -1:
+                    return (ii-1)
+                elif chara.find(',') == -1:
+                    self._addCharacter (chara)
+            ii = ii + 1
+        return (ii) 
+
+    def _buildGenre(self, strlist, idx, maxlen):
+        self.genre = ''
+        ii = idx
+        while ii < maxlen:
+            genre = strlist[ii].strip()
+            if len(genre) > 0:
+                if genre.find(':') != -1:
+                    return (ii-1)
+                elif genre.find(',') != -1:
+                    genre = ', '
+                else:
+                    self._addSubject (genre)
+                self.genre = self.genre + genre
+            ii = ii + 1
+        return (ii) 
+
+    def _buildCategory(self, strlist, idx, maxlen):
+        self.category = ''
+        ii = idx
+        while ii < maxlen:
+            cat = strlist[ii].strip()
+            if len(cat) > 0:
+                if cat.find(':') != -1:
+                    return (ii-1)
+                elif cat.find(',') != -1:
+                    cat = ', '
+                else:
+                    self._addSubject (cat)
+                self.category = self.category + cat
+            ii = ii + 1
+        return (ii) 
+
+    def extractIndividualUrls(self):
+        url = self.url + '&chapter=1'
+        data = self.opener.open(url).read()
+        
+        if self.reqLoginData(data):
+          self.performLogin()
+          data = self.opener.open(url).read()
+          if self.reqLoginData(data):
+            return None
+        
+        soup = bs.BeautifulStoneSoup(data)
+
+        self.storyName = ''
+        self.authorName = ''
+        self.storyId = '0'
+        title = soup.find('title').string
+        if title is not None and len(title) > 0:
+            logging.debug('Title: %s' % title)
+            ss = title.split(' by ')
+            if ss is not None and len(ss) > 1:
+                self.storyName = ss[0].strip()
+                self.authorName = ss[1].strip()
+                self.outputName = self.storyName.replace(" ", "_") + '-pNs_' + self.storyId
+
+        logging.debug('self.storyId=%s, self.storyName=%s, self.outputName=%s' % (self.storyId, self.storyName, self.outputName))
+        logging.debug('self.authorId=%s, self.authorName=%s' % (self.authorId, self.authorName))
+                
+        select = soup.find('select', { 'name' : 'chapter' } )
+    	 
+        result = []
+        if select is None:
+    	   # no chapters found, try url by itself.
+           chaptitle = soup.find('div', { 'id' : 'chaptertitle' } )
+           if chaptitle is not None and chaptitle.string is not None and len(chaptitle.string) > 0:
+               result.append((url,chaptitle.string))
+           else:
+    	       result.append((url,self.storyName))
+        else:
+    	   allOptions = select.findAll('option')
+    	   for o in allOptions:
+    	     url = self.url + "&chapter=%s" % o['value']
+    	     title = o.string
+    	     result.append((url,title))
+    
+        url = self.url + "&index=1"
+        data = self.opener.open(url).read()
+        lines = data.split('\n')
+        soup = bs.BeautifulStoneSoup(data)
+        pgt = soup.find('div', {'id' : 'pagetitle'})
+        #logging.debug('pagetitle: %s' % pgt)
+        pgtAs = pgt.findAll('a')
+        #logging.debug('pgtAs: %s' % pgtAs)
+        for a in pgtAs:
+            if a['href'].find('viewstory.php') != -1:
+                (u1, self.storyId) = a['href'].split('=')
+                self.storyName = a.string
+                logging.debug('self.storyId=%s, self.storyName=%s' % (self.storyId, self.storyName))
+            elif a['href'].find('viewuser.php') != -1:
+                self.authorName = a.string
+                self.authorURL = 'http://' + self.host + '/' + a['href']
+                (u1, self.authorId) = a['href'].split('=')
+                logging.debug('self.authorName=%s, self.authorId=%s' % (self.authorName, self.authorId))
+
+        output = soup.find('div', {'id' : 'output'})
+        #logging.debug('output: %s' % str(output))
+        if output is not None and len(str(output)) > 1:
+            s2 = re.split ('<[^>]+>', str(output))
+            #logging.debug('s2=%s' % s2)
+            ii = 0
+            ll = len(s2)
+            while ii < ll:
+                if s2[ii] == 'Summary:' and ii+1 < ll:
+                    self.storyDescription = s2[ii+1].strip()
+                    logging.debug('self.storyDescription: %s' % self.storyDescription)
+                    break;
+                ii = ii+1
+            
+        cnt = soup.find('div', {'class' : 'content'})
+        #logging.debug('content: %s' % cnt)
+        cnttd = cnt.findAll('td')
+        #logging.debug('cnttd: %s' % cnttd)
+        for td in cnttd:
+            #logging.debug('td: %s' % str(td))
+            ss = str(td).replace('\n','').replace('\r','').replace('&nbsp;', ' ')
+            if len(ss) > 1:
+                s2 = re.split ('<[^>]+>', ss)
+                #logging.debug('s2=%s' % s2)
+                ii = 0
+                ll = len(s2)
+                while ii < ll-1:
+                    if s2[ii] is not None and len(s2[ii]) > 0 and s2[ii].find(':') != -1:
+                        skey = s2[ii].strip()
+                        ii = ii+1
+                        if skey == 'Rated:':
+                            self.storyRating = s2[ii].strip()
+                            logging.debug('self.storyRating=%s' % self.storyRating)
+                            ii = ii + 1
+                        elif skey == 'Chapters:':
+                            self.numChapters = s2[ii].strip()
+                            logging.debug('self.numChapters=%s' % self.numChapters)
+                            ii = ii + 1
+                        elif skey == 'Characters:':
+                            ii = self._fillCharacters(s2, ii, ll)
+                            logging.debug('self.storyCharacters=%s' % self.storyCharacters)
+                            ii = ii + 1
+                        elif skey == 'Genres:':
+                            ii = self._buildGenre(s2, ii, ll)
+                            logging.debug('self.genre=%s' % self.genre)
+                            logging.debug('self.subjects=%s' % self.subjects)
+                        elif skey == 'Categories:':
+                            ii = self._buildCategory(s2, ii, ll)
+                            logging.debug('self.category=%s' % self.category)
+                            logging.debug('self.subjects=%s' % self.subjects)
+                        elif skey == 'Completed:':
+                            if s2[ii].strip(' ') == "No":
+                                self.storyStatus = 'In-Progress'
+                            else:
+                                self.storyStatus = 'Completed'
+                            ii = ii + 1
+                        elif skey == 'Word count:':
+                            self.numWords = s2[ii].strip()
+                            if self.numWords is None or len(self.numWords) == 0:
+                                self.numWords = '0'
+                            logging.debug('self.numWords=%s' % self.numWords)
+                            ii = ii + 1
+                        elif skey == 'Takes Place:':
+                            ii = ii + 1
+                        elif skey == 'Awards:':
+                            ii = ii + 1
+                        elif skey == 'Series:':
+                            ii = ii + 1
+                        elif skey == 'Read:':
+                            ii = ii + 1
+                        elif skey == 'Warnings:':
+                            ii = ii + 1
+                    else:
+                        ii = ii + 1
+                                        
+        tls = soup.findAll('div', {'style' : 'text-align: center;'})
+        for tl in tls:
+            #logging.debug('tl: %s' % tl)
+            ss = str(tl).replace('\n','').replace('\r','').replace('&nbsp;', ' ')
+            if ss.find('Published:') != -1:
+                s2 = re.split ('<[^>]+>', ss)
+                #logging.debug('s2: %s' % s2)
+                ii = 0
+                ll = len(s2)
+                while ii < ll-1:
+                    if s2[ii] is not None and len(s2[ii]) > 0 and s2[ii].find(':') != -1:
+                        skey = s2[ii].strip()
+                        #logging.debug('skey: %s' % skey)
+                        ii = ii+1
+                        if skey == 'Published:':
+                            self.storyPublished = datetime.datetime.fromtimestamp(time.mktime(time.strptime(s2[ii].strip(' '), "%b %d %Y")))
+                            logging.debug('self.storyPublished=%s' % self.storyPublished)
+                            ii = ii + 1
+                        elif skey == 'Updated:':
+                            self.storyUpdated = datetime.datetime.fromtimestamp(time.mktime(time.strptime(s2[ii].strip(' '), "%b %d %Y")))
+                            logging.debug('self.storyUpdated=%s' % self.storyUpdated)
+                            ii = ii + 1
+                    else:
+                        ii = ii + 1
+            
+        if (self.storyName is None or len(self.storyName) == 0) and self.storyId == '0': 
+            logging.error('self.storyName is empty!!  Exitting!')
+            exit(1)
+            
+        self.outputName = self.storyName.replace(" ", "_") + '-pNs_' + self.storyId
+        logging.debug('self.outputName=%s' % self.outputName)
+        
+        self.uuid = 'urn:uuid:' + self.host + '-u.' + self.authorId + '-s.' + self.storyId
+        logging.debug('self.uuid=%s' % self.uuid)
+
+        return result
+
+    def getStoryName(self):
+        return self.storyName
+
+    def getOutputName(self):
+        return self.outputName
+		
+    def getAuthorName(self):
+        return self.authorName
+    
+    def getText(self, url):
+        if url.find('http://') == -1:
+          url = 'http://' + self.host + '/' + url
+    
+        logging.debug('Getting data from: %s' % url)
+    
+        data = self.opener.open(url).read()
+        
+        # need to do this, because for some reason the <br /> tag in the story causes problems
+        data = data.replace('<br />', ' SOMETHING_BR ')
+        soup = bs.BeautifulStoneSoup(data, convertEntities=bs.BeautifulStoneSoup.HTML_ENTITIES)
+    
+        div = soup.find('div', {'id' : 'story'})
+    
+        if None == div:
+          return '<html/>'
+
+        # put the <br /> tags back in..
+        text = div.__str__('utf8').replace(' SOMETHING_BR ','<br />')    
+        return text
+
+    def _getLoginScript(self):
+        return '/user.php?action=login'
+
+    def reqLoginData(self, data):
+        if data.find('Registered Users Only. Please click OK to login or register.') != -1 or data.find('There is no such account on our website') != -1:
+          return True
+        else:
+          return False
+
+    def getHost(self):
+        logging.debug('self.host=%s' % self.host)
+        return self.host
+
+    def getStoryURL(self):
+        logging.debug('self.url=%s' % self.url)
+        return self.url
+
+    def getAuthorURL(self):
+        logging.debug('self.authorURL=%s' % self.authorURL)
+        return self.authorURL
+
+    def getUUID(self):
+        logging.debug('self.uuid=%s' % self.uuid)
+        return self.uuid
+    
+    def getStoryDescription(self):
+        logging.debug('self.storyDescription=%s' % self.storyDescription)
+        return self.storyDescription
+    
+    def getStoryPublished(self):
+        logging.debug('self.storyPublished=%s' % self.storyPublished)
+        return self.storyPublished
+    
+    def getStoryCreated(self):
+        self.storyCreated = datetime.datetime.now()
+        logging.debug('self.storyCreated=%s' % self.storyCreated)
+        return self.storyCreated
+    
+    def getStoryUpdated(self):
+        logging.debug('self.storyUpdated=%s' % self.storyUpdated)
+        return self.storyUpdated
+    
+    def getLanguage(self):
+        logging.debug('self.language=%s' % self.language)
+        return self.language
+    
+    def getLanguageId(self):
+        logging.debug('self.languageId=%s' % self.languageId)
+        return self.languageId
+    
+    def getSubjects(self):  # Return self.subjects, logging it at debug level first.
+        logging.debug('self.subjects=%s' % self.subjects)  # log the value that is returned (was self.authorName)
+        return self.subjects
+    
+    def getPublisher(self):
+        logging.debug('self.publisher=%s' % self.publisher)
+        return self.publisher
+    
+    def getNumChapters(self):
+        logging.debug('self.numChapters=%s' % self.numChapters)
+        return self.numChapters
+    
+    def getNumWords(self):
+        logging.debug('self.numWords=%s' % self.numWords)
+        return self.numWords
+    
+    def getAuthorId(self):
+        logging.debug('self.authorId=%s' % self.authorId)
+        return self.authorId
+    
+    def getStoryId(self):
+        logging.debug('self.storyId=%s' % self.storyId)
+        return self.storyId
+    
+    def getCategory(self):
+        logging.debug('self.category=%s' % self.category)
+        return self.category
+    
+    def getGenre(self):
+        logging.debug('self.genre=%s' % self.genre)
+        return self.genre
+    
+    def getStoryStatus(self):
+        logging.debug('self.storyStatus=%s' % self.storyStatus)
+        return self.storyStatus
+    
+    def getStoryRating(self):
+        logging.debug('self.storyRating=%s' % self.storyRating)
+        return self.storyRating
+    
+    def getStoryUserRating(self):
+        logging.debug('self.storyUserRating=%s' % self.storyUserRating)
+        return self.storyUserRating
+    
+    def getStoryCharacters(self):
+        logging.debug('self.storyCharacters=%s' % self.storyCharacters)
+        return self.storyCharacters
+
+    def getStorySeries(self):
+        logging.debug('self.storySeries=%s' % self.storySeries)
+        return self.storySeries
+
+class PotionsNSnitches_UnitTests(unittest.TestCase):
+    def setUp(self):
+        logging.basicConfig(level=logging.DEBUG)
+        pass
+  
+    def testLoginWorks(self):
+        pass
+  
+    def testGetUrlsWorks(self):
+        url = 'http://potionsandsnitches.net/fanfiction/viewstory.php?sid=2230'
+        self.assertEquals(32, len(Twilighted(url).extractIndividualUrls()))
+
+if __name__ == '__main__':
+    unittest.main()
diff --git a/twilighted.py b/twilighted.py
index 764502e9..d45e4688 100644
--- a/twilighted.py
+++ b/twilighted.py
@@ -50,6 +50,27 @@ class Twilighted(FanfictionSiteAdapter):
         self.storyUserRating = '0'
         self.storyCharacters = []
         self.storySeries = ''
+        
+        self.chapurl = False
+        ss=self.url.split('?')
+        logging.debug('ss=%s' % ss)
+        if ss is not None and len(ss) > 1:
+            sss = ss[1].replace('&amp;','&').split('&')
+            logging.debug('sss=%s' % sss)
+            if sss is not None and len(sss) > 0:
+                ssss = sss[0].split('=')
+                logging.debug('ssss=%s' % ssss)
+                if ssss is not None and len(ssss) > 1 and ssss[0] == 'sid':
+                    self.storyId = ssss[1]
+                if len(sss) > 1:
+                    ssss = sss[1].split('=')
+                    logging.debug('ssss=%s' % ssss)
+                    if ssss is not None and len(ssss) > 1 and ssss[0] == 'chapter':
+                        self.chapurl = True
+
+        self.url = 'http://' + self.host + '/' + self.path + '?sid=' + self.storyId
+        logging.debug('self.url=%s' % self.url)
+        
         self.uuid = 'urn:uuid:' + self.host + '-u.' + self.authorId + '-s.' + self.storyId
         logging.debug('self.uuid=%s' % self.uuid)
     
@@ -108,21 +129,26 @@ class Twilighted(FanfictionSiteAdapter):
         return True
 
     def extractIndividualUrls(self):
-        data = self.opener.open(self.url).read()
+        url = self.url + '&chapter=1'
+        data = self.opener.open(url).read()
         
         if self.reqLoginData(data):
           self.performLogin()
-          data = self.opener.open(self.url).read()
+          data = self.opener.open(url).read()
           if self.reqLoginData(data):
             return None
         
         soup = bs.BeautifulStoneSoup(data)
-    
+
         title = soup.find('title').string
+        logging.debug('Title: %s' % title)
         self.storyName = title.split(' by ')[0].strip()
         self.authorName = title.split(' by ')[1].strip()
-        self.outputName = self.storyName.replace(" ", "_")
-    
+        self.outputName = self.storyName.replace(" ", "_") + '-tw_' + self.storyId
+
+        logging.debug('self.storyId=%s, self.storyName=%s, self.outputName=%s' % (self.storyId, self.storyName, self.outputName))
+        logging.debug('self.authorId=%s, self.authorName=%s' % (self.authorId, self.authorName))
+                
         select = soup.find('select', { 'name' : 'chapter' } )
     	 
         result = []
@@ -141,6 +167,7 @@ class Twilighted(FanfictionSiteAdapter):
         lines = data.split('\n')
         soup = bs.BeautifulStoneSoup(data)
         metas = soup.findAll('meta')
+        
         for meta in metas:
             if 'name' in meta._getAttrMap() and meta['name'].find('description') != -1:
                 #logging.debug('Meta: %s' % meta)

From 696223a456646cb11072591dbc760cfb720c2640 Mon Sep 17 00:00:00 2001
From: wsuetholz <wsuetholz@localhost>
Date: Thu, 11 Nov 2010 09:55:37 -0600
Subject: [PATCH 61/94] Added in an adapter for FictionPress.com.  This started
 out as a copy of ffnet.py, but the extractIndividualUrls rapidly became
 completly different.  I have not found a field that says total number of
 words for the story.

---
 downloader.py |   5 +-
 fpcom.py      | 507 ++++++++++++++++++++++++++++++++++++++++++++++++++
 2 files changed, 511 insertions(+), 1 deletion(-)
 create mode 100644 fpcom.py

diff --git a/downloader.py b/downloader.py
index cbcc7aeb..431bbad4 100644
--- a/downloader.py
+++ b/downloader.py
@@ -16,6 +16,7 @@ import htmlentitydefs as hdefs
 
 
 import ffnet
+import fpcom
 import ficwad
 import output
 import adapter
@@ -96,8 +97,10 @@ if __name__ == '__main__':
 		adapter = fictionalley.FictionAlley(url)
 	elif url.find('ficwad') != -1:
 		adapter = ficwad.FicWad(url)
-	elif url.find('fanfiction.net') != -1 or url.find('fictionpress.com') != -1:
+	elif url.find('fanfiction.net') != -1:
 		adapter = ffnet.FFNet(url)
+	elif url.find('fictionpress.com') != -1:
+		adapter = fpcom.FPCom(url)
 	elif url.find('harrypotterfanfiction.com') != -1:
 		adapter = hpfiction.HPFiction(url)
 	elif url.find('twilighted.net') != -1:
diff --git a/fpcom.py b/fpcom.py
new file mode 100644
index 00000000..0389e9a9
--- /dev/null
+++ b/fpcom.py
@@ -0,0 +1,507 @@
+# -*- coding: utf-8 -*-
+
+import os
+import re
+import sys
+import cgi
+import uuid
+import shutil
+import os.path
+import logging
+import unittest
+import urllib as u
+import pprint as pp
+import urllib2 as u2
+import urlparse as up
+import BeautifulSoup as bs
+import htmlentitydefs as hdefs
+import time
+import datetime
+
+from constants import *
+from adapter import *
+
+try:
+	import login_password
+except:
+	# tough luck
+	pass
+
+try:
+	from google.appengine.api.urlfetch import fetch as googlefetch
+	appEngine = True
+except:
+	appEngine = False
+
+class FPCom(FanfictionSiteAdapter):
+	def __init__(self, url):  # Parse a /s/<storyId>/<chapter>/<title> story URL and set default metadata.
+		self.url = url
+		parsedUrl = up.urlparse(url)
+		self.host = parsedUrl.netloc
+		self.path = parsedUrl.path
+		
+		self.storyName = 'Story'
+		self.authorName = 'Author'
+		self.outputName = 'Story'
+		self.storyDescription = 'A Story'
+		self.storyCharacters = []
+		self.storySeries = ''
+		self.authorId = '0'
+		self.authorURL = self.path
+		self.storyId = '0'
+		self.storyPublished = datetime.date(1970, 01, 31)
+		self.storyCreated = datetime.datetime.now()
+		self.storyUpdated = datetime.date(1970, 01, 31)
+		self.languageId = 'en-UK'
+		self.language = 'English'
+		self.subjects = []
+		logging.debug('self.subjects=%s' % self.subjects)
+		self.publisher = self.host
+		self.numChapters = 0
+		self.numWords = 0
+		self.genre = 'Fiction'
+		self.category = 'Category'
+		self.storyStatus = 'In-Progress'
+		self.storyRating = 'K'
+		self.storyUserRating = '0'
+		
+		logging.debug('self.path=%s' % self.path)
+
+		if self.path.startswith('/'):
+			self.path = self.path[1:]
+		
+		spl = self.path.split('/')  # expected shape: ['s', storyId, chapter, title]
+		logging.debug('spl=%s' % spl)
+		if spl is not None:
+			if len(spl) > 0 and spl[0] != 's':
+				logging.error("Error URL \"%s\" is not a story." % self.url)
+				exit (20)				
+			if len(spl) > 1:
+				self.storyId = spl[1]
+			if len(spl) > 2:
+				chapter = spl[2]  # chapter is the third path segment; spl[1] is the story id
+			else:
+				chapter = '1'
+			if len(spl) == 5:
+				self.path = "/".join(spl[1:-1])
+				self.outputName = spl[4] + '-ffnet_' + spl[2]
+		
+		if self.path.endswith('/'):
+			self.path = self.path[:-1]
+		
+		logging.debug('self.path=%s' % self.path)
+		
+		self.uuid = 'urn:uuid:' + self.host + '-u.' + self.authorId + '-s.' + self.storyId
+		logging.debug('self.uuid=%s' % self.uuid)
+
+		logging.debug('self.storyId=%s, chapter=%s, self.outputName=%s' % (self.storyId, chapter, self.outputName))
+		if not appEngine:
+			self.opener = u2.build_opener(u2.HTTPCookieProcessor())  # cookie-aware urllib2 opener
+		else:
+			self.opener = None  # under App Engine, _fetchUrl uses googlefetch instead
+	
+		logging.debug("Created FPCom: url=%s" % (self.url))
+	
+	def _getLoginScript(self):
+		return self.path
+
+	def requiresLogin(self, url = None):
+		return False
+
+	def performLogin(self, url = None):
+		return True
+
+	def _getVarValue(self, varstr):  # Return the text after the first '=' in varstr, minus one leading space and one trailing ';'.
+		#logging.debug('_getVarValue varstr=%s' % varstr)
+		vals = varstr.split('=', 1)  # split once only, so '=' characters inside the value are kept
+		#logging.debug('vals=%s' % vals)
+		retstr="".join(vals[1:])  # empty string when varstr contains no '='
+		#logging.debug('retstr=%s' % retstr)
+		if retstr.startswith(' '):
+			retstr = retstr[1:]
+		if retstr.endswith(';'):
+			retstr = retstr[:-1]
+		return retstr
+	
+	def _splitCrossover(self, subject):  # Add subject to self.subjects; "X and Y Crossover" is split into 'Crossover', X and Y. Always returns True.
+		if "Crossover" in subject:
+			self._addSubject ("Crossover")
+			logging.debug('Crossover=%s' % subject)
+			if subject.find(' and ') != -1:
+				words = subject.split(' ')
+				logging.debug('words=%s' % words)
+				subj = ''
+				for s in words:
+					if s in ("and", "Crossover"):  # whole-word match; a substring test against "and Crossover" also matched "an", "over", ""
+						if len(subj) > 0:
+							self._addSubject(subj)
+						subj = ''
+					else:
+						if len(subj) > 0:
+							subj = subj + ' '
+						subj = subj + s
+				if len(subj) > 0:
+					self._addSubject(subj)
+			else:
+				self._addSubject(subject)
+		else:
+			self._addSubject(subject)
+		return True
+
+	def _splitGenre(self, subject):  # Add each non-empty '/'-separated piece of subject to self.subjects. Always returns True.
+		if len(subject) > 0:
+			words = subject.split('/')
+			logging.debug('words=%s' % words)
+			for subj in words:
+				if len(subj) > 0:  # tabs only: the original mixed tabs and spaces on these two lines
+					self._addSubject(subj)
+		return True
+
+	def _addSubject(self, subject):
+		subj = subject.upper()
+		for s in self.subjects:
+			if s.upper() == subj:
+				return False
+
+		self.subjects.append(subject)
+		return True
+
+	def _addCharacter(self, character):
+		chara = character.upper()
+		for c in self.storyCharacters:
+			if c.upper() == chara:
+				return False
+		self.storyCharacters.append(character)
+		return True
+
+	def _fetchUrl(self, url):
+		if not appEngine:
+			return self.opener.open(url).read().decode('utf-8')
+		else:
+			return googlefetch(url).content
+	
+	def extractIndividualUrls(self):  # Fetch self.url, fill in story metadata attributes, and return a list of (chapterUrl, chapterTitle) tuples.
+		data = self._fetchUrl(self.url)
+		d2 = re.sub('&\#[0-9]+;', ' ', data)  # replace numeric character references with a space before parsing
+		soup = bs.BeautifulStoneSoup(d2)
+		allA = soup.findAll('a')
+		for a in allA:
+			if 'href' in a._getAttrMap() and a['href'].find('/u/') != -1:
+				self.authorName = a.string
+				self.authorId = a['href'].split('/u/', 1)[1].split('/')[0]  # id segment after '/u/'; avoids a fixed-arity unpack and a local named u2
+				logging.debug('self.authorId=%s self.authorName=%s' % (self.authorId, self.authorName))
+
+		urls = []
+		
+		metas = soup.findAll ('meta', {'name' : 'description'})
+		if metas is not None:
+			for meta in metas:
+				if 'content' in meta._getAttrMap():
+					self.storyDescription = str(meta['content'])
+					logging.debug('self.storyDescription=%s' % self.storyDescription)
+					
+					title=meta.find('title')  # NOTE(review): relies on <title> being parsed as a descendant of the <meta> tag - confirm
+					logging.debug('title=%s' % (title.string if title is not None else None))
+					tt = title.string.split(',') if title is not None and title.string is not None else None
+					if tt is not None:
+						if len(tt) > 0:
+							self.storyName = tt[0]
+							self.outputName = self.storyName.replace(" ", "_") + '-fpcom_' + self.storyId
+							logging.debug('self.storyId=%s, self.storyName=%s, self.outputName=%s' % (self.storyId, self.storyName, self.outputName))
+						if len(tt) > 1:
+							tt1 = tt[1].split(' - ')
+							if tt1 is not None and len(tt1) > 0:
+								self.category = tt1[0].strip()
+								logging.debug('self.category=%s' % self.category)
+								cc = self.category.split(' ')
+								for cc1 in cc:
+									if cc1 is not None and cc1 != 'a':
+										if cc1 == 'fanfic':
+											self._addSubject('FanFiction')
+										else:
+											self._addSubject(cc1)
+								logging.debug('self.subjects=%s' % self.subjects)
+								
+
+		fidochap = soup.find('form', {'name':'fidochap'})
+		sl = fidochap.find('select', {'title':'chapter navigation'})
+		logging.debug('sl=%s' % sl )
+		urlstory = ''
+		if 'onchange' in sl._getAttrMap():
+			ocs = sl['onchange'].split('\'')
+			logging.debug('ocs=%s' % ocs)
+			if ocs is not None and len(ocs) > 3:
+				urlstory = ocs[3]  # fourth quote-delimited piece of the onchange script, appended to every chapter URL
+				logging.debug('urlstory=%s' % urlstory)
+			
+		numchapters = 0
+		opts = sl.findAll('option')
+		for o in opts:
+			if 'value' in o._getAttrMap():
+				url = 'http://' + self.host + '/s/' + self.storyId  + '/' + o['value'] + urlstory
+				logging.debug('URL=%s, Title=%s' % (url, o.string))
+				urls.append((url, o.string))
+				numchapters = numchapters + 1
+		
+		if numchapters == 0:
+			numchapters = 1
+			url = 'http://' + self.host + '/s/' + self.storyId  + '/1' +  urlstory
+			logging.debug('URL=%s, Title=%s' % (url, self.storyName))
+			urls.append((url, self.storyName))
+			
+		self.numChapters = str(numchapters)
+		logging.debug('self.numChapters=%s' % self.numChapters)
+		logging.debug('urls=%s' % urls)
+		
+		self.genre = ''
+		tds = fidochap.findAll('td')
+		for td in tds:
+			tdb = td.find('b')
+			if tdb is not None and tdb.string == self.storyName:
+				tdas = td.findAll('a')
+				for tda in tdas:
+					ss = tda.string
+					if ss is not None:
+						if len(self.genre) > 0:
+							self.genre = self.genre + ', '
+						self.genre = self.genre + ss
+						self._addSubject(ss)
+				logging.debug('self.genre=%s' % self.genre)
+				logging.debug('self.subjects=%s' % self.subjects)
+			tda = td.find ('a')
+			if tda is not None and tda.string is not None and tda.string.find('Rated:') != -1:  # .string is None when the anchor has nested markup
+				tdas = re.split ("<[^>]+>", str(td).replace('\n','').replace('&nbsp;',' '))  # text pieces between tags
+				if tdas is not None:
+					ll = len(tdas)
+					if ll > 2:
+						ss = tdas[2].split(': ')
+						if ss is not None and len(ss) > 1:
+							self.storyRating = ss[1]
+							logging.debug('self.storyRating=%s' % self.storyRating)
+					if ll > 3:
+						ss = tdas[3].split(' - ')
+						if ss is not None:
+							lls = len(ss)
+							if lls > 1:
+								language = ss[1]
+								logging.debug('language=%s' % language)
+							if lls > 2:
+								self.category = ss[2]
+								logging.debug('self.category=%s' % self.category)
+								sgs = self.category.split('/')
+								for sg in sgs:
+									self._addSubject(sg)
+								logging.debug('self.subjects=%s' % self.subjects)
+							if lls > 3 and ss[3].strip() == 'Reviews:' and ll > 4:
+								reviews = tdas[4] 
+								logging.debug('reviews=%s' % reviews)
+					if ll > 5:
+						ss = tdas[5].split(' - ')
+						if ss is not None:
+							lls = len(ss)
+							if lls > 1:
+								sds = ss[1].split(': ')
+								logging.debug('sds=%s' % sds)
+								if sds is not None and len(sds) > 1 and sds[0] == 'Published':
+									self.storyPublished = datetime.datetime.fromtimestamp(time.mktime(time.strptime(sds[1].strip(' '), "%m-%d-%y")))
+									logging.debug('self.storyPublished=%s' % self.storyPublished)
+							lls = len(ss)
+							if lls > 2:
+								sds = ss[2].split(': ')
+								logging.debug('sds=%s' % sds)
+								if sds is not None and len(sds) > 1 and sds[0] == 'Updated':
+									self.storyUpdated = datetime.datetime.fromtimestamp(time.mktime(time.strptime(sds[1].strip(' '), "%m-%d-%y")))
+									logging.debug('self.storyUpdated=%s' % self.storyUpdated)
+									
+
+
+		self.uuid = 'urn:uuid:' + self.host + '-a.' + self.authorId + '-s.' + self.storyId  # NOTE(review): __init__ builds this with '-u.' - confirm which is intended
+		self.authorURL = 'http://' + self.host + '/u/' + self.authorId
+		logging.debug('self.uuid=%s' % self.uuid)
+
+		return urls
+	
+	def getText(self, url):  # Fetch one chapter page and return its <div id="storytext"> serialized as UTF-8; exits with status 20 if it is missing.
+		time.sleep( 2.0 )  # fixed two-second pause before every chapter fetch
+		data = self._fetchUrl(url)
+		lines = data.split('\n')
+		
+		textbuf = ''
+		emit = False
+		
+		olddata = data
+		try:
+			data = data.decode('utf8')
+		except Exception:  # keep the undecoded data; no longer swallows SystemExit/KeyboardInterrupt
+			data = olddata
+		
+		try:
+			soup = bs.BeautifulStoneSoup(data)
+		except Exception:
+			logging.info("Failed to decode: <%s>" % data)
+			soup = None
+		div = soup.find('div', {'id' : 'storytext'}) if soup is not None else None  # a failed parse takes the error path below instead of raising AttributeError
+		if None == div:
+			logging.error("Error downloading Chapter: %s" % url)
+			exit (20)
+			return '<html/>'  # unreachable after exit(); left in place
+			
+		return div.__str__('utf8')
+					
+	def setLogin(self, login):
+		self.login = login
+
+	def setPassword(self, password):
+		self.password = password
+
+	def getHost(self):
+		logging.debug('self.host=%s' % self.host)
+		return self.host
+
+	def getStoryURL(self):
+		logging.debug('self.url=%s' % self.url)
+		return self.url
+
+	def getUUID(self):
+		logging.debug('self.uuid=%s' % self.uuid)
+		return self.uuid
+
+	def getOutputName(self):
+		logging.debug('self.storyId=%s, self.storyName=%s self.outputName=%s' % (self.storyId, self.storyName, self.outputName))
+		return self.outputName
+
+	def getAuthorName(self):
+		logging.debug('self.authorName=%s' % self.authorName)
+		return self.authorName
+
+	def getAuthorId(self):
+		logging.debug('self.authorId=%s' % self.authorId)
+		return self.authorId
+
+	def getAuthorURL(self):
+		logging.debug('self.authorURL=%s' % self.authorURL)
+		return self.authorURL
+
+	def getStoryId(self):
+		logging.debug('self.storyId=%s' % self.storyId)
+		return self.storyId
+
+	def getStoryName(self):
+		logging.debug('self.storyName=%s' % self.storyName)
+		return self.storyName
+
+	def getStoryDescription(self):
+		logging.debug('self.storyDescription=%s' % self.storyDescription)
+		return self.storyDescription
+
+	def getStoryPublished(self):
+		logging.debug('self.storyPublished=%s' % self.storyPublished)
+		return self.storyPublished
+
+	def getStoryCreated(self):
+		self.storyCreated = datetime.datetime.now()
+		logging.debug('self.storyCreated=%s' % self.storyCreated)
+		return self.storyCreated
+
+	def getStoryUpdated(self):
+		logging.debug('self.storyUpdated=%s' % self.storyUpdated)
+		return self.storyUpdated
+
+	def getLanguage(self):
+		logging.debug('self.language=%s' % self.language)
+		return self.language
+
+	def getLanguageId(self):
+		logging.debug('self.languageId=%s' % self.languageId)
+		return self.languageId
+
+	def getSubjects(self):  # Return self.subjects, logging it at debug level first.
+		logging.debug('self.subjects=%s' % self.subjects)  # log the value that is returned (was self.authorName)
+		return self.subjects
+
+	def getPublisher(self):
+		logging.debug('self.publisher=%s' % self.publisher)
+		return self.publisher
+
+	def getNumChapters(self):
+		logging.debug('self.numChapters=%s' % self.numChapters)
+		return self.numChapters
+
+	def getNumWords(self):
+		logging.debug('self.numWords=%s' % self.numWords)
+		return self.numWords
+
+	def getCategory(self):
+		logging.debug('self.category=%s' % self.category)
+		return self.category
+
+	def getGenre(self):
+		logging.debug('self.genre=%s' % self.genre)
+		return self.genre
+
+	def getStoryStatus(self):
+		logging.debug('self.storyStatus=%s' % self.storyStatus)
+		return self.storyStatus
+
+	def getStoryRating(self):
+		logging.debug('self.storyRating=%s' % self.storyRating)
+		return self.storyRating
+
+	def getStoryUserRating(self):
+		logging.debug('self.storyUserRating=%s' % self.storyUserRating)
+		return self.storyUserRating
+
+	def getPrintableUrl(self, url):
+		pass
+
+	def getStoryCharacters(self):
+		logging.debug('self.storyCharacters=%s' % self.storyCharacters)
+		return self.storyCharacters
+	
+	def getStorySeries(self):
+		logging.debug('self.storySeries=%s' % self.storySeries)
+		return self.storySeries
+		
+class FFA_UnitTests(unittest.TestCase):
+	def setUp(self):
+		logging.basicConfig(level=logging.DEBUG)
+		pass
+	
+	def testChaptersAuthStory(self):
+		f = FFNet('http://www.fanfiction.net/s/5257563/1')
+		f.extractIndividualUrls()
+		
+		self.assertEquals('Beka0502', f.getAuthorName())
+		self.assertEquals("Draco's Redemption", f.getStoryName())
+
+	def testChaptersCountNames(self):
+		f = FFNet('http://www.fanfiction.net/s/5257563/1')
+		urls = f.extractIndividualUrls()
+		
+		self.assertEquals(10, len(urls))
+	
+	def testGetText(self):
+		url = 'http://www.fanfiction.net/s/5257563/1'
+		f = FFNet(url)
+		text = f.getText(url)
+		self.assertTrue(text.find('He was just about to look at some photos when he heard a crack') != -1)
+	
+	def testBrokenWands(self):
+		url = 'http://www.fanfiction.net/s/1527263/30/Harry_Potter_and_Broken_Wands'
+		f = FFNet(url)
+		text = f.getText(url)
+		
+		urls = f.extractIndividualUrls()
+	
+	def testFictionPress(self):
+		url = 'http://www.fictionpress.com/s/2725180/1/Behind_This_Facade'
+		f = FFNet(url)
+		urls = f.extractIndividualUrls()
+		
+		self.assertEquals('Behind This Facade', f.getStoryName())
+		self.assertEquals('IntoxicatingMelody', f.getAuthorName())
+	
+		text = f.getText(url)
+		self.assertTrue(text.find('Kale Resgerald at your service" He answered, "So, can we go now? Or do you want to') != -1)
+if __name__ == '__main__':
+	unittest.main()

From 35065593afdf9cc5767f29f1536f92103fd7f940 Mon Sep 17 00:00:00 2001
From: wsuetholz <wsuetholz@localhost>
Date: Thu, 11 Nov 2010 13:14:15 -0600
Subject: [PATCH 62/94] Refactored source code to remove redundant code.. 
 Moved most of the adapter get and set functions for variables into the
 adapter.py.  Define all the adapter variables in adapter.py.  Remove the
 unneeded functions from the various adapter sources.

Fix a couple of problems with fpcom.py.  Rearrange the Genre and Category for some of the adapters.
---
 adapter.py          | 161 +++++++++++++++++++++------
 ffnet.py            | 173 ++--------------------------
 fictionalley.py     | 167 +++------------------------
 ficwad.py           | 178 ++++-------------------------
 fpcom.py            | 266 ++++++++------------------------------------
 hpfiction.py        | 137 +----------------------
 potionsNsnitches.py | 190 +++----------------------------
 twilighted.py       | 173 ++++------------------------
 8 files changed, 257 insertions(+), 1188 deletions(-)

diff --git a/adapter.py b/adapter.py
index 03c3b59d..d4f80cc5 100644
--- a/adapter.py
+++ b/adapter.py
@@ -1,5 +1,9 @@
 # -*- coding: utf-8 -*-
 
+import logging
+import datetime
+
+
 class LoginRequiredException(Exception):
 	def __init__(self, url):
 		self.url = url
@@ -8,16 +12,56 @@ class LoginRequiredException(Exception):
 		return repr(self.url + ' requires user to be logged in')
 
 class FanfictionSiteAdapter:
+	try:
+		from google.appengine.api.urlfetch import fetch as googlefetch
+		appEngine = True
+	except:
+		appEngine = False
 	login = ''
 	password = ''
+	url = ''
+	host = ''
+	path = ''
+	uuid = ''
+	storyName = ''
+	storyId = ''
+	authorName = ''
+	authorId = ''
+	authorURL = ''
+	outputStorySep = '-Ukn_'
+	outputName = ''
+	storyDescription = ''
+	storyCharacters = []
+	storySeries = ''
+	storyPublished = datetime.date(1970, 01, 31)
+	storyCreated = datetime.datetime.now()
+	storyUpdated = datetime.date(1970, 01, 31)
+	languageId = 'en-UK'
+	language = 'English'
+	subjects = []
+	publisher = ''
+	numChapters = '0'
+	numWords = '0'
+	genre = ''
+	category = ''
+	storyStatus = 'In-Progress'
+	storyRating = ''
+	storyUserRating = '0'
 	def __init__(self, url):
-		pass
+		import urlparse as up  # basic plain url parsing; imported locally because this module has no module-level urlparse import
+		self.url = url
+		parsedUrl = up.urlparse(url)
+		self.host = parsedUrl.netloc
+		self.path = parsedUrl.path
+			
+	def hasAppEngine(self):
+		return self.appEngine
 	
 	def requiresLogin(self, url = None):
-		pass
+		return False
 	
 	def performLogin(self, url = None):
-		pass
+		return True
 	
 	def extractIndividualUrls(self):
 		pass
@@ -26,88 +70,133 @@ class FanfictionSiteAdapter:
 		pass
 
 	def setLogin(self, login):
-		pass
+		self.login = login
 
 	def setPassword(self, password):
-		pass
+		self.password = password
 
 	def getHost(self):
-		pass
+		logging.debug('self.host=%s' % self.host)
+		return self.host
 	
-	def getStoryURL(self):
-		pass
-
 	def getUUID(self):
-		pass
+		self.uuid = 'urn:uuid:' + self.host + '-u.' + self.authorId + '-s.' + self.storyId
+		logging.debug('self.uuid=%s' % self.uuid)
+		return self.uuid
 
 	def getOutputName(self):
-		pass
+		self.outputName = self.storyName.replace(" ", "_") + self.outputStorySep + self.storyId
+		logging.debug('self.storyId=%s, self.storyName=%s self.outputName=%s' % (self.storyId, self.storyName, self.outputName))
+		return self.outputName
 
 	def getAuthorURL(self):
-		pass
+		logging.debug('self.authorURL=%s' % self.authorURL)
+		return self.authorURL
 
 	def getAuthorId(self):
-		pass
+		logging.debug('self.authorId=%s' % self.authorId)
+		return self.authorId
 
 	def getAuthorName(self):
-		pass
+		logging.debug('self.authorName=%s' % self.authorName)
+		return self.authorName
+
+	def getStoryURL(self):
+		logging.debug('self.url=%s' % self.url)
+		return self.url
 
 	def getStoryId(self):
-		pass
+		logging.debug('self.storyId=%s' % self.storyId)
+		return self.storyId
 
 	def getStoryName(self):
-		pass
+		logging.debug('self.storyName=%s' % self.storyName)
+		return self.storyName
 
 	def getStoryDescription(self):
-		pass
+		logging.debug('self.storyDescription=%s' % self.storyDescription)
+		return self.storyDescription
 
 	def getStoryCreated(self):
-		pass
+		self.storyCreated = datetime.datetime.now()
+		logging.debug('self.storyCreated=%s' % self.storyCreated)
+		return self.storyCreated
 
+	def addCharacter(self, character):
+		chara = character.upper()
+		for c in self.storyCharacters:
+			if c.upper() == chara:
+				return False
+		self.storyCharacters.append(character)
+		return True
+
+	def getStoryCharacters(self):
+		logging.debug('self.storyCharacters=%s' % self.storyCharacters)
+		return self.storyCharacters
+	
 	def getStoryPublished(self):
-		pass
+		logging.debug('self.storyPublished=%s' % self.storyPublished)
+		return self.storyPublished
 
 	def getStoryUpdated(self):
-		pass
+		logging.debug('self.storyUpdated=%s' % self.storyUpdated)
+		return self.storyUpdated
 
 	def getStorySeries(self):
-		pass
+		logging.debug('self.storySeries=%s' % self.storySeries)
+		return self.storySeries
 
 	def getLanguage(self):
-		pass
+		logging.debug('self.language=%s' % self.language)
+		return self.language
 
 	def getLanguageId(self):
-		pass
+		logging.debug('self.languageId=%s' % self.languageId)
+		return self.languageId
+
+	def addSubject(self, subject):
+		subj = subject.upper()
+		for s in self.subjects:
+			if s.upper() == subj:
+				return False
+		self.subjects.append(subject)
+		return True
 
 	def getSubjects(self):
-		pass
-
-	def getCharacters(self):
-		pass
+		logging.debug('self.subjects=%s' % self.authorName)
+		return self.subjects
 
 	def getPublisher(self):
-		pass
+		logging.debug('self.publisher=%s' % self.publisher)
+		return self.publisher
 
 	def getNumChapters(self):
-		pass
+		logging.debug('self.numChapters=%s' % self.numChapters)
+		return self.numChapters
 
 	def getNumWords(self):
-		pass
+		logging.debug('self.numWords=%s' % self.numWords)
+		return self.numWords
 
 	def getCategory(self):
-		pass
+		logging.debug('self.category=%s' % self.category)
+		return self.category
 
 	def getGenre(self):
-		pass
+		logging.debug('self.genre=%s' % self.genre)
+		return self.genre
 
 	def getStoryStatus(self):
-		pass
+		logging.debug('self.storyStatus=%s' % self.storyStatus)
+		return self.storyStatus
 
 	def getStoryRating(self):
-		pass
+		logging.debug('self.storyRating=%s' % self.storyRating)
+		return self.storyRating
 
 	def getStoryUserRating(self):
-		pass
+		logging.debug('self.storyUserRating=%s' % self.storyUserRating)
+		return self.storyUserRating
 
 	def getPrintableUrl(self, url):
-		pass
+		return url
diff --git a/ffnet.py b/ffnet.py
index 3f9f41e5..a036988e 100644
--- a/ffnet.py
+++ b/ffnet.py
@@ -27,12 +27,6 @@ except:
 	# tough luck
 	pass
 
-try:
-	from google.appengine.api.urlfetch import fetch as googlefetch
-	appEngine = True
-except:
-	appEngine = False
-
 class FFNet(FanfictionSiteAdapter):
 	def __init__(self, url):
 		self.url = url
@@ -42,7 +36,6 @@ class FFNet(FanfictionSiteAdapter):
 		
 		self.storyName = 'FF.Net story'
 		self.authorName = 'FF.Net author'
-		self.outputName = 'FF.Net_story'
 		self.storyDescription = 'Fanfiction Story'
 		self.storyCharacters = []
 		self.storySeries = ''
@@ -65,6 +58,8 @@ class FFNet(FanfictionSiteAdapter):
 		self.storyStatus = 'In-Progress'
 		self.storyRating = 'K'
 		self.storyUserRating = '0'
+		self.outputName = ''
+		self.outputStorySep = '-ffnet_'
 		
 		logging.debug('self.path=%s' % self.path)
 
@@ -85,18 +80,14 @@ class FFNet(FanfictionSiteAdapter):
 				chapter = '1'
 			if len(spl) == 5:
 				self.path = "/".join(spl[1:-1])
-				self.outputName = spl[4] + '-ffnet_' + spl[2]
 		
 		if self.path.endswith('/'):
 			self.path = self.path[:-1]
 		
 		logging.debug('self.path=%s' % self.path)
 		
-		self.uuid = 'urn:uuid:' + self.host + '-u.' + self.authorId + '-s.' + self.storyId
-		logging.debug('self.uuid=%s' % self.uuid)
-
-		logging.debug('self.storyId=%s, chapter=%s, self.outputName=%s' % (self.storyId, chapter, self.outputName))
-		if not appEngine:
+		logging.debug('self.storyId=%s, chapter=%s' % (self.storyId, chapter))
+		if not self.appEngine:
 			self.opener = u2.build_opener(u2.HTTPCookieProcessor())
 		else:
 			self.opener = None
@@ -106,12 +97,6 @@ class FFNet(FanfictionSiteAdapter):
 	def _getLoginScript(self):
 		return self.path
 
-	def requiresLogin(self, url = None):
-		return False
-
-	def performLogin(self, url = None):
-		return True
-
 	def _getVarValue(self, varstr):
 		#logging.debug('_getVarValue varstr=%s' % varstr)
 		vals = varstr.split('=')
@@ -126,7 +111,7 @@ class FFNet(FanfictionSiteAdapter):
 	
 	def _splitCrossover(self, subject):
 		if "Crossover" in subject:
-			self._addSubject ("Crossover")
+			self.addSubject ("Crossover")
 			logging.debug('Crossover=%s' % subject)
 			if subject.find(' and ') != -1:
 				words = subject.split(' ')
@@ -135,18 +120,18 @@ class FFNet(FanfictionSiteAdapter):
 				for s in words:
 					if s in "and Crossover":
 						if len(subj) > 0:
-							self._addSubject(subj)
+							self.addSubject(subj)
 						subj = ''
 					else:
 						if len(subj) > 0:
 							subj = subj + ' '
 						subj = subj + s
 				if len(subj) > 0:
-					self._addSubject(subj)
+					self.addSubject(subj)
 			else:
-				self._addSubject(subject)
+				self.addSubject(subject)
 		else:
-			self._addSubject(subject)
+			self.addSubject(subject)
 		return True
 
 	def _splitGenre(self, subject):
@@ -155,28 +140,11 @@ class FFNet(FanfictionSiteAdapter):
 			logging.debug('words=%s' % words)
 			for subj in words:
 			    if len(subj) > 0:
-				self._addSubject(subj)
-		return True
-
-	def _addSubject(self, subject):
-		subj = subject.upper()
-		for s in self.subjects:
-			if s.upper() == subj:
-				return False
-
-		self.subjects.append(subject)
-		return True
-
-	def _addCharacter(self, character):
-		chara = character.upper()
-		for c in self.storyCharacters:
-			if c.upper() == chara:
-				return False
-		self.storyCharacters.append(character)
+				self.addSubject(subj)
 		return True
 
 	def _fetchUrl(self, url):
-		if not appEngine:
+		if not self.appEngine:
 			return self.opener.open(url).read().decode('utf-8')
 		else:
 			return googlefetch(url).content
@@ -198,9 +166,7 @@ class FFNet(FanfictionSiteAdapter):
 			if l.find("&#187;") != -1 and l.find('<b>') != -1:
 				s2 = bs.BeautifulStoneSoup(l)
 				self.storyName = str(s2.find('b').string)
-				# mangling storyName replaces url for outputName 
-				self.outputName = self.storyName.replace(" ", "_") + '-ffnet_' + self.storyId
-				logging.debug('self.storyId=%s, self.storyName=%s, self.outputName=%s' % (self.storyId, self.storyName, self.outputName))
+				logging.debug('self.storyId=%s, self.storyName=%s' % (self.storyId, self.storyName))
 			elif l.find("<a href='/u/") != -1:
 				s2 = bs.BeautifulStoneSoup(l)
 				self.authorName = str(s2.a.string)
@@ -291,9 +257,7 @@ class FFNet(FanfictionSiteAdapter):
 			# no chapters found, try url by itself.
 			urls.append((self.url,self.storyName))
 
-		self.uuid = 'urn:uuid:' + self.host + '-a.' + self.authorId + '-s.' + self.storyId
 		self.authorURL = 'http://' + self.host + '/u/' + self.authorId
-		logging.debug('self.uuid=%s' % self.uuid)
 
 		#logging.debug('urls=%s' % urls)
 		return urls
@@ -325,119 +289,6 @@ class FFNet(FanfictionSiteAdapter):
 			
 		return div.__str__('utf8')
 					
-	def setLogin(self, login):
-		self.login = login
-
-	def setPassword(self, password):
-		self.password = password
-
-	def getHost(self):
-		logging.debug('self.host=%s' % self.host)
-		return self.host
-
-	def getStoryURL(self):
-		logging.debug('self.url=%s' % self.url)
-		return self.url
-
-	def getUUID(self):
-		logging.debug('self.uuid=%s' % self.uuid)
-		return self.uuid
-
-	def getOutputName(self):
-		logging.debug('self.storyId=%s, self.storyName=%s self.outputName=%s' % (self.storyId, self.storyName, self.outputName))
-		return self.outputName
-
-	def getAuthorName(self):
-		logging.debug('self.authorName=%s' % self.authorName)
-		return self.authorName
-
-	def getAuthorId(self):
-		logging.debug('self.authorId=%s' % self.authorId)
-		return self.authorId
-
-	def getAuthorURL(self):
-		logging.debug('self.authorURL=%s' % self.authorURL)
-		return self.authorURL
-
-	def getStoryId(self):
-		logging.debug('self.storyId=%s' % self.storyId)
-		return self.storyId
-
-	def getStoryName(self):
-		logging.debug('self.storyName=%s' % self.storyName)
-		return self.storyName
-
-	def getStoryDescription(self):
-		logging.debug('self.storyDescription=%s' % self.storyDescription)
-		return self.storyDescription
-
-	def getStoryPublished(self):
-		logging.debug('self.storyPublished=%s' % self.storyPublished)
-		return self.storyPublished
-
-	def getStoryCreated(self):
-		self.storyCreated = datetime.datetime.now()
-		logging.debug('self.storyCreated=%s' % self.storyCreated)
-		return self.storyCreated
-
-	def getStoryUpdated(self):
-		logging.debug('self.storyUpdated=%s' % self.storyUpdated)
-		return self.storyUpdated
-
-	def getLanguage(self):
-		logging.debug('self.language=%s' % self.language)
-		return self.language
-
-	def getLanguageId(self):
-		logging.debug('self.languageId=%s' % self.languageId)
-		return self.languageId
-
-	def getSubjects(self):
-		logging.debug('self.subjects=%s' % self.authorName)
-		return self.subjects
-
-	def getPublisher(self):
-		logging.debug('self.publisher=%s' % self.publisher)
-		return self.publisher
-
-	def getNumChapters(self):
-		logging.debug('self.numChapters=%s' % self.numChapters)
-		return self.numChapters
-
-	def getNumWords(self):
-		logging.debug('self.numWords=%s' % self.numWords)
-		return self.numWords
-
-	def getCategory(self):
-		logging.debug('self.category=%s' % self.category)
-		return self.category
-
-	def getGenre(self):
-		logging.debug('self.genre=%s' % self.genre)
-		return self.genre
-
-	def getStoryStatus(self):
-		logging.debug('self.storyStatus=%s' % self.storyStatus)
-		return self.storyStatus
-
-	def getStoryRating(self):
-		logging.debug('self.storyRating=%s' % self.storyRating)
-		return self.storyRating
-
-	def getStoryUserRating(self):
-		logging.debug('self.storyUserRating=%s' % self.storyUserRating)
-		return self.storyUserRating
-
-	def getPrintableUrl(self, url):
-		pass
-
-	def getStoryCharacters(self):
-		logging.debug('self.storyCharacters=%s' % self.storyCharacters)
-		return self.storyCharacters
-	
-	def getStorySeries(self):
-		logging.debug('self.storySeries=%s' % self.storySeries)
-		return self.storySeries
 		
 class FFA_UnitTests(unittest.TestCase):
 	def setUp(self):
diff --git a/fictionalley.py b/fictionalley.py
index da81a4ce..00d34815 100644
--- a/fictionalley.py
+++ b/fictionalley.py
@@ -63,45 +63,30 @@ class FictionAlley(FanfictionSiteAdapter):
 		self.language = 'English'
 		self.subjects = []
 		self.subjects.append ('fanfiction')
+		self.subjects.append ('Harry Potter')
 		self.publisher = self.host
 		self.numChapters = 0
 		self.numWords = 0
-		self.genre = 'FanFiction'
-		self.category = 'Category'
+		self.genre = ''
+		self.category = 'Harry Potter'
 		self.storyStatus = 'In-Progress'
 		self.storyRating = 'K'
 		self.storyUserRating = '0'
 		self.storyCharacters = []
 		self.storySeries = ''
-	
+		self.outputName = ''
+		self.outputStorySep = '-fa_'	
 		
-	def requiresLogin(self, url = None):
-		return False
-	
-	def performLogin(self, url = None):
-		pass
-		
-	def setLogin(self, login):
-		self.login = login
-	
-	def setPassword(self, password):
-		self.password = password
-	
-	def _addSubject(self, subject):
-		subj = subject.upper()
-		for s in self.subjects:
-			if s.upper() == subj:
-				return False
-		self.subjects.append(subject)
-		return True
+	def getPasswordLine(self):
+		return 'opaopapassword'
 
-	def _addCharacter(self, character):
-		chara = character.upper()
-		for c in self.storyCharacters:
-			if c.upper() == chara:
-				return False
-		self.storyCharacters.append(character)
-		return True
+	def getLoginScript(self):
+		return 'opaopaloginscript'
+
+	def getLoginPasswordOthers(self):
+		login = dict(login = 'name', password = 'pass')
+		other = dict(submit = 'Log In', remember='yes')
+		return (login, other)
 
 	def _processChapterHeaders(self, div):
 		brs = div.findAll ('br')
@@ -125,12 +110,12 @@ class FictionAlley(FanfictionSiteAdapter):
 					logging.debug('self.genre=%s' % self.genre)
 					s2 = valstr.split(', ')
 					for ss2 in s2:
-						self._addSubject(ss2)
+						self.addSubject(ss2)
 					logging.debug('self.subjects=%s' % self.subjects)
 				elif keystr == 'Main Character(s):':
 					s2 = valstr.split(', ')
 					for ss2 in s2:
-						self._addCharacter(ss2)
+						self.addCharacter(ss2)
 					logging.debug('self.storyCharacters=%s' % self.storyCharacters)
 				elif keystr == 'Summary:':
 					self.storyDescription = valstr
@@ -147,7 +132,6 @@ class FictionAlley(FanfictionSiteAdapter):
 		# Get title from <title>, remove before '-'.
 		title = soup.find('title').string
 		self.storyName = "-".join(title.split('-')[1:]).strip().replace(" (Story Text)","")
-		self.outputName = self.storyName.replace(" ", "_") + '-fa_' + self.storyId
 		
 		links = soup.findAll('li')
 
@@ -226,24 +210,8 @@ class FictionAlley(FanfictionSiteAdapter):
 
 		print('Story "%s" by %s' % (self.storyName, self.authorName))
 		
-		self.uuid = 'urn:uuid:' + self.host + '-u.' + self.authorId + '-s.' + self.storyId
-		logging.debug('self.uuid=%s' % self.uuid)
-		
 		return result
 	
-	def getHost(self):
-		logging.debug('self.host=%s' % self.host)
-		return self.host
-
-	def getStoryName(self):
-		return self.storyName
-
-	def getAuthorName(self):
-		return self.authorName
-	
-	def getOutputName(self):
-		return self.outputName
-
 	def getText(self, url):
 		# fictionalley uses full URLs in chapter list.
 		data = self.opener.open(url).read()
@@ -268,109 +236,6 @@ class FictionAlley(FanfictionSiteAdapter):
 		else:
 			return div.__str__('utf8').replace('crazytagstringnobodywouldstumbleonaccidently','div')
 	
-	def getStoryURL(self):
-		logging.debug('self.url=%s' % self.url)
-		return self.url
-
-	def getAuthorURL(self):
-		logging.debug('self.authorURL=%s' % self.authorURL)
-		return self.authorURL
-
-	def getUUID(self):
-		logging.debug('self.uuid=%s' % self.uuid)
-		return self.uuid
-
-	def getAuthorId(self):
-		logging.debug('self.authorId=%s' % self.authorId)
-		return self.authorId
-
-	def getStoryId(self):
-		logging.debug('self.storyId=%s' % self.storyId)
-		return self.storyId
-
-	def getStoryDescription(self):
-		logging.debug('self.storyDescription=%s' % self.storyDescription)
-		return self.storyDescription
-
-	def getStoryPublished(self):
-		logging.debug('self.storyPublished=%s' % self.storyPublished)
-		return self.storyPublished
-
-	def getStoryCreated(self):
-		self.storyCreated = datetime.datetime.now()
-		logging.debug('self.storyCreated=%s' % self.storyCreated)
-		return self.storyCreated
-
-	def getStoryUpdated(self):
-		logging.debug('self.storyUpdated=%s' % self.storyUpdated)
-		return self.storyUpdated
-
-	def getLanguage(self):
-		logging.debug('self.language=%s' % self.language)
-		return self.language
-
-	def getLanguageId(self):
-		logging.debug('self.languageId=%s' % self.languageId)
-		return self.languageId
-
-	def getSubjects(self):
-		logging.debug('self.subjects=%s' % self.authorName)
-		return self.subjects
-
-	def getPublisher(self):
-		logging.debug('self.publisher=%s' % self.publisher)
-		return self.publisher
-
-	def getNumChapters(self):
-		logging.debug('self.numChapters=%s' % self.numChapters)
-		return self.numChapters
-
-	def getNumWords(self):
-		logging.debug('self.numWords=%s' % self.numWords)
-		return self.numWords
-
-	def getCategory(self):
-		logging.debug('self.category=%s' % self.category)
-		return self.category
-
-	def getGenre(self):
-		logging.debug('self.genre=%s' % self.genre)
-		return self.genre
-
-	def getStoryStatus(self):
-		logging.debug('self.storyStatus=%s' % self.storyStatus)
-		return self.storyStatus
-
-	def getStoryRating(self):
-		logging.debug('self.storyRating=%s' % self.storyRating)
-		return self.storyRating
-
-	def getStoryUserRating(self):
-		logging.debug('self.storyUserRating=%s' % self.storyUserRating)
-		return self.storyUserRating
-
-	def getPrintableUrl(self, url):
-		return url
-	
-	def getPasswordLine(self):
-		return 'opaopapassword'
-
-	def getLoginScript(self):
-		return 'opaopaloginscript'
-
-	def getLoginPasswordOthers(self):
-		login = dict(login = 'name', password = 'pass')
-		other = dict(submit = 'Log In', remember='yes')
-		return (login, other)
-
-	def getStoryCharacters(self):
-		logging.debug('self.storyCharacters=%s' % self.storyCharacters)
-		return self.storyCharacters
-	
-	def getStorySeries(self):
-		logging.debug('self.storySeries=%s' % self.storySeries)
-		return self.storySeries
-		
 	
 		
 if __name__ == '__main__':
diff --git a/ficwad.py b/ficwad.py
index 8ea76b60..ddac91a8 100644
--- a/ficwad.py
+++ b/ficwad.py
@@ -21,36 +21,6 @@ class FicWad(FanfictionSiteAdapter):
 	def __init__(self, url):
 		self.url = url
 		self.host = up.urlparse(url).netloc
-	
-	def requiresLogin(self, url = None):
-		return False
-	
-	def performLogin(self, url = None):
-		pass
-		
-	def setLogin(self, login):
-		self.login = login
-	
-	def setPassword(self, password):
-		self.password = password
-	
-	def _addSubject(self, subject):
-		subj = subject.upper()
-		for s in self.subjects:
-			if s.upper() == subj:
-				return False
-		self.subjects.append(subject)
-		return True
-
-	def _addCharacter(self, character):
-		chara = character.upper()
-		for c in self.storyCharacters:
-			if c.upper() == chara:
-				return False
-		self.storyCharacters.append(character)
-		return True
-
-	def extractIndividualUrls(self):
 		self.storyDescription = 'Fanfiction Story'
 		self.authorId = '0'
 		self.storyId = '0'
@@ -71,6 +41,21 @@ class FicWad(FanfictionSiteAdapter):
 		self.storyUserRating = '0'
 		self.storyCharacters = []
 		self.storySeries = ''
+		self.outputName = ''
+		self.outputStorySep = '-fw_'
+
+	def getPasswordLine(self):
+		return 'opaopapassword'
+
+	def getLoginScript(self):
+		return 'opaopaloginscript'
+
+	def getLoginPasswordOthers(self):
+		login = dict(login = 'name', password = 'pass')
+		other = dict(submit = 'Log In', remember='yes')
+		return (login, other)
+
+	def extractIndividualUrls(self):
 		oldurl = ''
 		
 		data = u2.urlopen(self.url).read()
@@ -98,9 +83,8 @@ class FicWad(FanfictionSiteAdapter):
 		storyinfo = story.find('h4').find('a')
 		(u0, u1, self.storyId) = storyinfo['href'].split('/')
 		self.storyName = storyinfo.string.strip()
-		self.outputName = self.storyName.replace(" ", "_") + '-fw_' + self.storyId
 
-		logging.debug('self.storyName=%s, self.storyId=%s, self.outputName=%s' % (self.storyName, self.storyId, self.outputName))
+		logging.debug('self.storyName=%s, self.storyId=%s' % (self.storyName, self.storyId))
 		
 		author = soup.find('span', {'class' : 'author'})
 		self.authorName = str(author.a.string)
@@ -134,7 +118,7 @@ class FicWad(FanfictionSiteAdapter):
 							if self.category == 'Category':
 								self.category = str(a.string)
 								logging.debug('self.category=%s' % self.category)
-							self._addSubject(self.category)
+							self.addSubject(self.category)
 						logging.debug('self.subjects=%s' % self.subjects)
 					elif skey == 'Rating':
 						self.storyRating = s1[1]
@@ -144,12 +128,12 @@ class FicWad(FanfictionSiteAdapter):
 						logging.debug('self.genre=%s' % self.genre)
 						s2 = s1[1].split(', ')
 						for ss2 in s2:
-							self._addSubject(ss2)
+							self.addSubject(ss2)
 						logging.debug('self.subjects=%s' % self.subjects)
 					elif skey == 'Characters':
 						s2 = s1[1].split(', ')
 						for ss2 in s2:
-							self._addCharacter(ss2)
+							self.addCharacter(ss2)
 						logging.debug('self.storyCharacters=%s' % self.storyCharacters)
 					elif skey == 'Chapters':
 						self.numChapters = s1[1]
@@ -208,6 +192,7 @@ class FicWad(FanfictionSiteAdapter):
 			select = soup.find('select', { 'name' : 'goto' } )
 
 			if select is None:
+				self.numChapters = '1'
 				result.append((self.url,self.storyName))
 				logging.debug('Chapter[%s]=%s %s' % (ii, self.url, self.storyName))
 			else:
@@ -223,25 +208,12 @@ class FicWad(FanfictionSiteAdapter):
 						ii = ii+1
 					else:
 						logging.debug('Skipping Story Index.  URL %s' % url)
-			
-		self.uuid = 'urn:uuid:' + self.host + '-u.' + self.authorId + '-s.' + self.storyId
-		logging.debug('self.uuid=%s' % self.uuid)
+		
+		self.numChapters = str(ii)
+		logging.debug('self.numChapters=%s' % self.numChapters)
 		
 		return result
 	
-	def getHost(self):
-		logging.debug('self.host=%s' % self.host)
-		return self.host
-
-	def getStoryName(self):
-		return self.storyName
-
-	def getOutputName(self):
-		return self.outputName
-		
-	def getAuthorName(self):
-		return self.authorName
-	
 	def getText(self, url):
 		if url.find('http://') == -1:
 			url = 'http://' + self.host + '/' + url
@@ -256,110 +228,6 @@ class FicWad(FanfictionSiteAdapter):
 			return '<html/>'
 		return div.__str__('utf8')
 	
-	def getStoryURL(self):
-		logging.debug('self.url=%s' % self.url)
-		return self.url
-
-	def getAuthorURL(self):
-		logging.debug('self.authorURL=%s' % self.authorURL)
-		return self.authorURL
-
-	def getUUID(self):
-		logging.debug('self.uuid=%s' % self.uuid)
-		return self.uuid
-
-	def getAuthorId(self):
-		logging.debug('self.authorId=%s' % self.authorId)
-		return self.authorId
-
-	def getStoryId(self):
-		logging.debug('self.storyId=%s' % self.storyId)
-		return self.storyId
-
-	def getStoryDescription(self):
-		logging.debug('self.storyDescription=%s' % self.storyDescription)
-		return self.storyDescription
-
-	def getStoryPublished(self):
-		logging.debug('self.storyPublished=%s' % self.storyPublished)
-		return self.storyPublished
-
-	def getStoryCreated(self):
-		self.storyCreated = datetime.datetime.now()
-		logging.debug('self.storyCreated=%s' % self.storyCreated)
-		return self.storyCreated
-
-	def getStoryUpdated(self):
-		logging.debug('self.storyUpdated=%s' % self.storyUpdated)
-		return self.storyUpdated
-
-	def getLanguage(self):
-		logging.debug('self.language=%s' % self.language)
-		return self.language
-
-	def getLanguageId(self):
-		logging.debug('self.languageId=%s' % self.languageId)
-		return self.languageId
-
-	def getSubjects(self):
-		logging.debug('self.subjects=%s' % self.authorName)
-		return self.subjects
-
-	def getPublisher(self):
-		logging.debug('self.publisher=%s' % self.publisher)
-		return self.publisher
-
-	def getNumChapters(self):
-		logging.debug('self.numChapters=%s' % self.numChapters)
-		return self.numChapters
-
-	def getNumWords(self):
-		logging.debug('self.numWords=%s' % self.numWords)
-		return self.numWords
-
-	def getCategory(self):
-		logging.debug('self.category=%s' % self.category)
-		return self.category
-
-	def getGenre(self):
-		logging.debug('self.genre=%s' % self.genre)
-		return self.genre
-
-	def getStoryStatus(self):
-		logging.debug('self.storyStatus=%s' % self.storyStatus)
-		return self.storyStatus
-
-	def getStoryRating(self):
-		logging.debug('self.storyRating=%s' % self.storyRating)
-		return self.storyRating
-
-	def getStoryUserRating(self):
-		logging.debug('self.storyUserRating=%s' % self.storyUserRating)
-		return self.storyUserRating
-
-	def getPrintableUrl(self, url):
-		return url
-	
-	def getPasswordLine(self):
-		return 'opaopapassword'
-
-	def getLoginScript(self):
-		return 'opaopaloginscript'
-
-	def getLoginPasswordOthers(self):
-		login = dict(login = 'name', password = 'pass')
-		other = dict(submit = 'Log In', remember='yes')
-		return (login, other)
-
-	def getStoryCharacters(self):
-		logging.debug('self.storyCharacters=%s' % self.storyCharacters)
-		return self.storyCharacters
-	
-	def getStorySeries(self):
-		logging.debug('self.storySeries=%s' % self.storySeries)
-		return self.storySeries
-		
-
 		
 if __name__ == '__main__':
 	url = 'http://www.ficwad.com/story/14536'
diff --git a/fpcom.py b/fpcom.py
index 0389e9a9..04266888 100644
--- a/fpcom.py
+++ b/fpcom.py
@@ -27,23 +27,16 @@ except:
 	# tough luck
 	pass
 
-try:
-	from google.appengine.api.urlfetch import fetch as googlefetch
-	appEngine = True
-except:
-	appEngine = False
-
 class FPCom(FanfictionSiteAdapter):
-	def __init__(self, url):
+	def __init__(self, url):		
 		self.url = url
 		parsedUrl = up.urlparse(url)
 		self.host = parsedUrl.netloc
 		self.path = parsedUrl.path
 		
-		self.storyName = 'Story'
-		self.authorName = 'Author'
-		self.outputName = 'Story'
-		self.storyDescription = 'A Story'
+		self.storyName = ''
+		self.authorName = ''
+		self.storyDescription = ''
 		self.storyCharacters = []
 		self.storySeries = ''
 		self.authorId = '0'
@@ -55,23 +48,21 @@ class FPCom(FanfictionSiteAdapter):
 		self.languageId = 'en-UK'
 		self.language = 'English'
 		self.subjects = []
-		logging.debug('self.subjects=%s' % self.subjects)
 		self.publisher = self.host
 		self.numChapters = 0
 		self.numWords = 0
-		self.genre = 'Fiction'
-		self.category = 'Category'
+		self.genre = ''
+		self.category = ''
 		self.storyStatus = 'In-Progress'
 		self.storyRating = 'K'
 		self.storyUserRating = '0'
+		self.outputName = ''
+		self.outputStorySep = '-fpcom_'
 		
-		logging.debug('self.path=%s' % self.path)
-
 		if self.path.startswith('/'):
 			self.path = self.path[1:]
 		
 		spl = self.path.split('/')
-		logging.debug('spl=%s' % spl)
 		if spl is not None:
 			if len(spl) > 0 and spl[0] != 's':
 				logging.error("Error URL \"%s\" is not a story." % self.url)
@@ -84,33 +75,22 @@ class FPCom(FanfictionSiteAdapter):
 				chapter = '1'
 			if len(spl) == 5:
 				self.path = "/".join(spl[1:-1])
-				self.outputName = spl[4] + '-ffnet_' + spl[2]
 		
 		if self.path.endswith('/'):
 			self.path = self.path[:-1]
 		
 		logging.debug('self.path=%s' % self.path)
 		
-		self.uuid = 'urn:uuid:' + self.host + '-u.' + self.authorId + '-s.' + self.storyId
-		logging.debug('self.uuid=%s' % self.uuid)
-
-		logging.debug('self.storyId=%s, chapter=%s, self.outputName=%s' % (self.storyId, chapter, self.outputName))
-		if not appEngine:
+		if not self.appEngine:
 			self.opener = u2.build_opener(u2.HTTPCookieProcessor())
 		else:
 			self.opener = None
 	
-		logging.debug("Created FF.Net: url=%s" % (self.url))
+		logging.debug("Created FP.Com: url=%s" % (self.url))
 	
 	def _getLoginScript(self):
 		return self.path
 
-	def requiresLogin(self, url = None):
-		return False
-
-	def performLogin(self, url = None):
-		return True
-
 	def _getVarValue(self, varstr):
 		#logging.debug('_getVarValue varstr=%s' % varstr)
 		vals = varstr.split('=')
@@ -125,7 +105,7 @@ class FPCom(FanfictionSiteAdapter):
 	
 	def _splitCrossover(self, subject):
 		if "Crossover" in subject:
-			self._addSubject ("Crossover")
+			self.addSubject ("Crossover")
 			logging.debug('Crossover=%s' % subject)
 			if subject.find(' and ') != -1:
 				words = subject.split(' ')
@@ -134,18 +114,18 @@ class FPCom(FanfictionSiteAdapter):
 				for s in words:
 					if s in "and Crossover":
 						if len(subj) > 0:
-							self._addSubject(subj)
+							self.addSubject(subj)
 						subj = ''
 					else:
 						if len(subj) > 0:
 							subj = subj + ' '
 						subj = subj + s
 				if len(subj) > 0:
-					self._addSubject(subj)
+					self.addSubject(subj)
 			else:
-				self._addSubject(subject)
+				self.addSubject(subject)
 		else:
-			self._addSubject(subject)
+			self.addSubject(subject)
 		return True
 
 	def _splitGenre(self, subject):
@@ -154,28 +134,11 @@ class FPCom(FanfictionSiteAdapter):
 			logging.debug('words=%s' % words)
 			for subj in words:
 			    if len(subj) > 0:
-				self._addSubject(subj)
-		return True
-
-	def _addSubject(self, subject):
-		subj = subject.upper()
-		for s in self.subjects:
-			if s.upper() == subj:
-				return False
-
-		self.subjects.append(subject)
-		return True
-
-	def _addCharacter(self, character):
-		chara = character.upper()
-		for c in self.storyCharacters:
-			if c.upper() == chara:
-				return False
-		self.storyCharacters.append(character)
+				self.addSubject(subj)
 		return True
 
 	def _fetchUrl(self, url):
-		if not appEngine:
+		if not self.appEngine:
 			return self.opener.open(url).read().decode('utf-8')
 		else:
 			return googlefetch(url).content
@@ -206,8 +169,7 @@ class FPCom(FanfictionSiteAdapter):
 					if tt is not None:
 						if len(tt) > 0:
 							self.storyName = tt[0]
-							self.outputName = self.storyName.replace(" ", "_") + '-fpcom_' + self.storyId
-							logging.debug('self.storyId=%s, self.storyName=%s, self.outputName=%s' % (self.storyId, self.storyName, self.outputName))
+							logging.debug('self.storyId=%s, self.storyName=%s' % (self.storyId, self.storyName))
 						if len(tt) > 1:
 							tt1 = tt[1].split(' - ')
 							if tt1 is not None and len(tt1) > 0:
@@ -217,31 +179,33 @@ class FPCom(FanfictionSiteAdapter):
 								for cc1 in cc:
 									if cc1 is not None and cc1 != 'a':
 										if cc1 == 'fanfic':
-											self._addSubject('FanFiction')
+											self.addSubject('FanFiction')
 										else:
-											self._addSubject(cc1)
+											self.addSubject(cc1)
 								logging.debug('self.subjects=%s' % self.subjects)
 								
 
+		numchapters = 0
+		urlstory = ''
+
 		fidochap = soup.find('form', {'name':'fidochap'})
 		sl = fidochap.find('select', {'title':'chapter navigation'})
-		logging.debug('sl=%s' % sl )
-		urlstory = ''
-		if 'onchange' in sl._getAttrMap():
-			ocs = sl['onchange'].split('\'')
-			logging.debug('ocs=%s' % ocs)
-			if ocs is not None and len(ocs) > 3:
-				urlstory = ocs[3]
-				logging.debug('urlstory=%s' % urlstory)
-			
-		numchapters = 0
-		opts = sl.findAll('option')
-		for o in opts:
-			if 'value' in o._getAttrMap():
-				url = 'http://' + self.host + '/s/' + self.storyId  + '/' + o['value'] + urlstory
-				logging.debug('URL=%s, Title=%s' % (url, o.string))
-				urls.append((url, o.string))
-				numchapters = numchapters + 1
+		if sl is not None:
+			logging.debug('sl=%s' % sl )
+			if 'onchange' in sl._getAttrMap():
+				ocs = sl['onchange'].split('\'')
+				logging.debug('ocs=%s' % ocs)
+				if ocs is not None and len(ocs) > 3:
+					urlstory = ocs[3]
+					logging.debug('urlstory=%s' % urlstory)
+				
+			opts = sl.findAll('option')
+			for o in opts:
+				if 'value' in o._getAttrMap():
+					url = 'http://' + self.host + '/s/' + self.storyId  + '/' + o['value'] + urlstory
+					logging.debug('URL=%s, Title=%s' % (url, o.string))
+					urls.append((url, o.string))
+					numchapters = numchapters + 1
 		
 		if numchapters == 0:
 			numchapters = 1
@@ -265,7 +229,7 @@ class FPCom(FanfictionSiteAdapter):
 						if len(self.genre) > 0:
 							self.genre = self.genre + ', '
 						self.genre = self.genre + ss
-						self._addSubject(ss)
+						self.addSubject(ss)
 				logging.debug('self.genre=%s' % self.genre)
 				logging.debug('self.subjects=%s' % self.subjects)
 			tda = td.find ('a')
@@ -290,7 +254,7 @@ class FPCom(FanfictionSiteAdapter):
 								logging.debug('self.category=%s' % self.category)
 								sgs = self.category.split('/')
 								for sg in sgs:
-									self._addSubject(sg)
+									self.addSubject(sg)
 								logging.debug('self.subjects=%s' % self.subjects)
 							if lls > 3 and ss[3].strip() == 'Reviews:' and ll > 4:
 								reviews = tdas[4] 
@@ -301,23 +265,19 @@ class FPCom(FanfictionSiteAdapter):
 							lls = len(ss)
 							if lls > 1:
 								sds = ss[1].split(': ')
-								logging.debug('sds=%s' % sds)
 								if sds is not None and len(sds) > 1 and sds[0] == 'Published':
 									self.storyPublished = datetime.datetime.fromtimestamp(time.mktime(time.strptime(sds[1].strip(' '), "%m-%d-%y")))
 									logging.debug('self.storyPublished=%s' % self.storyPublished)
 							lls = len(ss)
 							if lls > 2:
 								sds = ss[2].split(': ')
-								logging.debug('sds=%s' % sds)
 								if sds is not None and len(sds) > 1 and sds[0] == 'Updated':
 									self.storyUpdated = datetime.datetime.fromtimestamp(time.mktime(time.strptime(sds[1].strip(' '), "%m-%d-%y")))
 									logging.debug('self.storyUpdated=%s' % self.storyUpdated)
 									
 
-		self.uuid = 'urn:uuid:' + self.host + '-a.' + self.authorId + '-s.' + self.storyId
 		self.authorURL = 'http://' + self.host + '/u/' + self.authorId
-		logging.debug('self.uuid=%s' % self.uuid)
 
 		return urls
 	
@@ -348,154 +308,15 @@ class FPCom(FanfictionSiteAdapter):
 			
 		return div.__str__('utf8')
 					
-	def setLogin(self, login):
-		self.login = login
-
-	def setPassword(self, password):
-		self.password = password
-
-	def getHost(self):
-		logging.debug('self.host=%s' % self.host)
-		return self.host
-
-	def getStoryURL(self):
-		logging.debug('self.url=%s' % self.url)
-		return self.url
-
-	def getUUID(self):
-		logging.debug('self.uuid=%s' % self.uuid)
-		return self.uuid
-
-	def getOutputName(self):
-		logging.debug('self.storyId=%s, self.storyName=%s self.outputName=%s' % (self.storyId, self.storyName, self.outputName))
-		return self.outputName
-
-	def getAuthorName(self):
-		logging.debug('self.authorName=%s' % self.authorName)
-		return self.authorName
-
-	def getAuthorId(self):
-		logging.debug('self.authorId=%s' % self.authorId)
-		return self.authorId
-
-	def getAuthorURL(self):
-		logging.debug('self.authorURL=%s' % self.authorURL)
-		return self.authorURL
-
-	def getStoryId(self):
-		logging.debug('self.storyId=%s' % self.storyId)
-		return self.storyId
-
-	def getStoryName(self):
-		logging.debug('self.storyName=%s' % self.storyName)
-		return self.storyName
-
-	def getStoryDescription(self):
-		logging.debug('self.storyDescription=%s' % self.storyDescription)
-		return self.storyDescription
-
-	def getStoryPublished(self):
-		logging.debug('self.storyPublished=%s' % self.storyPublished)
-		return self.storyPublished
-
-	def getStoryCreated(self):
-		self.storyCreated = datetime.datetime.now()
-		logging.debug('self.storyCreated=%s' % self.storyCreated)
-		return self.storyCreated
-
-	def getStoryUpdated(self):
-		logging.debug('self.storyUpdated=%s' % self.storyUpdated)
-		return self.storyUpdated
-
-	def getLanguage(self):
-		logging.debug('self.language=%s' % self.language)
-		return self.language
-
-	def getLanguageId(self):
-		logging.debug('self.languageId=%s' % self.languageId)
-		return self.languageId
-
-	def getSubjects(self):
-		logging.debug('self.subjects=%s' % self.authorName)
-		return self.subjects
-
-	def getPublisher(self):
-		logging.debug('self.publisher=%s' % self.publisher)
-		return self.publisher
-
-	def getNumChapters(self):
-		logging.debug('self.numChapters=%s' % self.numChapters)
-		return self.numChapters
-
-	def getNumWords(self):
-		logging.debug('self.numWords=%s' % self.numWords)
-		return self.numWords
-
-	def getCategory(self):
-		logging.debug('self.category=%s' % self.category)
-		return self.category
-
-	def getGenre(self):
-		logging.debug('self.genre=%s' % self.genre)
-		return self.genre
-
-	def getStoryStatus(self):
-		logging.debug('self.storyStatus=%s' % self.storyStatus)
-		return self.storyStatus
-
-	def getStoryRating(self):
-		logging.debug('self.storyRating=%s' % self.storyRating)
-		return self.storyRating
-
-	def getStoryUserRating(self):
-		logging.debug('self.storyUserRating=%s' % self.storyUserRating)
-		return self.storyUserRating
-
-	def getPrintableUrl(self, url):
-		pass
-
-	def getStoryCharacters(self):
-		logging.debug('self.storyCharacters=%s' % self.storyCharacters)
-		return self.storyCharacters
-	
-	def getStorySeries(self):
-		logging.debug('self.storySeries=%s' % self.storySeries)
-		return self.storySeries
 		
-class FFA_UnitTests(unittest.TestCase):
+class FPC_UnitTests(unittest.TestCase):
 	def setUp(self):
 		logging.basicConfig(level=logging.DEBUG)
 		pass
 	
-	def testChaptersAuthStory(self):
-		f = FFNet('http://www.fanfiction.net/s/5257563/1')
-		f.extractIndividualUrls()
-		
-		self.assertEquals('Beka0502', f.getAuthorName())
-		self.assertEquals("Draco's Redemption", f.getStoryName())
-
-	def testChaptersCountNames(self):
-		f = FFNet('http://www.fanfiction.net/s/5257563/1')
-		urls = f.extractIndividualUrls()
-		
-		self.assertEquals(10, len(urls))
-	
-	def testGetText(self):
-		url = 'http://www.fanfiction.net/s/5257563/1'
-		f = FFNet(url)
-		text = f.getText(url)
-		self.assertTrue(text.find('He was just about to look at some photos when he heard a crack') != -1)
-	
-	def testBrokenWands(self):
-		url = 'http://www.fanfiction.net/s/1527263/30/Harry_Potter_and_Broken_Wands'
-		f = FFNet(url)
-		text = f.getText(url)
-		
-		urls = f.extractIndividualUrls()
-	
 	def testFictionPress(self):
 		url = 'http://www.fictionpress.com/s/2725180/1/Behind_This_Facade'
-		f = FFNet(url)
+		f = FPCom(url)
 		urls = f.extractIndividualUrls()
 		
 		self.assertEquals('Behind This Facade', f.getStoryName())
@@ -503,5 +324,6 @@ class FFA_UnitTests(unittest.TestCase):
 	
 		text = f.getText(url)
 		self.assertTrue(text.find('Kale Resgerald at your service" He answered, "So, can we go now? Or do you want to') != -1)
+
 if __name__ == '__main__':
 	unittest.main()
diff --git a/hpfiction.py b/hpfiction.py
index 1bf46f55..38509391 100644
--- a/hpfiction.py
+++ b/hpfiction.py
@@ -75,36 +75,14 @@ class HPFiction(FanfictionSiteAdapter):
 		self.storyUserRating = '0'
 		self.storyCharacters = []
 		self.storySeries = ''
-		self.uuid = 'urn:uuid:' + self.host + '-u.' + self.authorId + '-s.' + self.storyId
-		logging.debug('self.uuid=%s' % self.uuid)
+		self.outputName = ''
+		self.outputStorySep = '-hp_'
 		
 		logging.debug("Created HPFiction: url=%s" % (self.url))
 	
 	def _getLoginScript(self):
 		return self.path
-
-	def requiresLogin(self, url = None):
-		return False
-
-	def performLogin(self, url = None):
-		return True
 	
-	def _addSubject(self, subject):
-		subj = subject.upper()
-		for s in self.subjects:
-			if s.upper() == subj:
-				return False
-		self.subjects.append(subject)
-		return True
-
-	def _addCharacter(self, character):
-		chara = character.upper()
-		for c in self.storyCharacters:
-			if c.upper() == chara:
-				return False
-		self.storyCharacters.append(character)
-		return True
-
 	def extractIndividualUrls(self):
 		
 		data = self.opener.open(self.url).read()
@@ -182,7 +160,7 @@ class HPFiction(FanfictionSiteAdapter):
 							elif s[ii] == 'Characters:':
 								s2 = s[ii+1].split(', ')
 								for ss2 in s2:
-									self._addCharacter(ss2)
+									self.addCharacter(ss2)
 								logging.debug('self.storyCharacters=%s' % self.storyCharacters)
 								ii = ii + 2
 							elif s[ii] == 'Genre(s):':
@@ -190,7 +168,7 @@ class HPFiction(FanfictionSiteAdapter):
 								logging.debug('self.genre=%s' % self.genre)
 								s2 = s[ii+1].split(', ')
 								for ss2 in s2:
-									self._addSubject(ss2)
+									self.addSubject(ss2)
 								logging.debug('self.subjects=%s' % self.subjects)
 								ii = ii + 2
 							elif s[ii] == 'Status:':
@@ -222,7 +200,6 @@ class HPFiction(FanfictionSiteAdapter):
 					logging.debug('self.storyDescription=%s' % self.storyDescription)
 		
 		urls = []
-		self.outputName = self.storyName.replace(" ", "_") + '-hp_' + self.storyId
 
 		select = soup.find('select', {'name' : 'chapterid'})
 		if select is None:
@@ -239,24 +216,8 @@ class HPFiction(FanfictionSiteAdapter):
 					if title != "Story Index":
 						urls.append((url,title))
 
-		self.uuid = 'urn:uuid:' + self.host + '-u.' + self.authorId + '-s.' + self.storyId
-		logging.debug('self.uuid=%s' % self.uuid)
-		
 		return urls
 
-	def getHost(self):
-		logging.debug('self.host=%s' % self.host)
-		return self.host
-
-	def getStoryName(self):
-		return self.storyName
-
-	def getOutputName(self):
-		return self.outputName
-		
-	def getAuthorName(self):
-		return self.authorName
-	
 	def getText(self, url):
 		logging.debug('Downloading from URL: %s' % url)
 		data = self.opener.open(url).read()
@@ -267,96 +228,6 @@ class HPFiction(FanfictionSiteAdapter):
 			exit(20)
 		return divtext.__str__('utf8')
 
-	def getAuthorId(self):
-		logging.debug('self.authorId=%s' % self.authorId)
-		return self.authorId
-
-	def getStoryId(self):
-		logging.debug('self.storyId=%s' % self.storyId)
-		return self.storyId
-
-	def getStoryDescription(self):
-		logging.debug('self.storyDescription=%s' % self.storyDescription)
-		return self.storyDescription
-
-	def getStoryPublished(self):
-		logging.debug('self.storyPublished=%s' % self.storyPublished)
-		return self.storyPublished
-
-	def getStoryCreated(self):
-		self.storyCreated = datetime.datetime.now()
-		logging.debug('self.storyCreated=%s' % self.storyCreated)
-		return self.storyCreated
-
-	def getStoryUpdated(self):
-		logging.debug('self.storyUpdated=%s' % self.storyUpdated)
-		return self.storyUpdated
-
-	def getLanguage(self):
-		logging.debug('self.language=%s' % self.language)
-		return self.language
-
-	def getLanguageId(self):
-		logging.debug('self.languageId=%s' % self.languageId)
-		return self.languageId
-
-	def getSubjects(self):
-		logging.debug('self.subjects=%s' % self.authorName)
-		return self.subjects
-
-	def getPublisher(self):
-		logging.debug('self.publisher=%s' % self.publisher)
-		return self.publisher
-
-	def getNumChapters(self):
-		logging.debug('self.numChapters=%s' % self.numChapters)
-		return self.numChapters
-
-	def getNumWords(self):
-		logging.debug('self.numWords=%s' % self.numWords)
-		return self.numWords
-
-	def getStoryURL(self):
-		logging.debug('self.url=%s' % self.url)
-		return self.url
-
-	def getAuthorURL(self):
-		logging.debug('self.authorURL=%s' % self.authorURL)
-		return self.authorURL
-
-	def getUUID(self):
-		logging.debug('self.uuid=%s' % self.uuid)
-		return self.uuid
-
-	def getCategory(self):
-		logging.debug('self.category=%s' % self.category)
-		return self.category
-
-	def getGenre(self):
-		logging.debug('self.genre=%s' % self.genre)
-		return self.genre
-
-	def getStoryStatus(self):
-		logging.debug('self.storyStatus=%s' % self.storyStatus)
-		return self.storyStatus
-
-	def getStoryRating(self):
-		logging.debug('self.storyRating=%s' % self.storyRating)
-		return self.storyRating
-
-	def getStoryUserRating(self):
-		logging.debug('self.storyUserRating=%s' % self.storyUserRating)
-		return self.storyUserRating
-
-	def getStoryCharacters(self):
-		logging.debug('self.storyCharacters=%s' % self.storyCharacters)
-		return self.storyCharacters
-	
-	def getStorySeries(self):
-		logging.debug('self.storySeries=%s' % self.storySeries)
-		return self.storySeries
-		
-
 
 class FF_UnitTests(unittest.TestCase):
 	def setUp(self):
diff --git a/potionsNsnitches.py b/potionsNsnitches.py
index 95ac435c..3868e934 100644
--- a/potionsNsnitches.py
+++ b/potionsNsnitches.py
@@ -53,84 +53,37 @@ class PotionsNSnitches(FanfictionSiteAdapter):
         self.storyUserRating = '0'
         self.storyCharacters = []
         self.storySeries = ''
-        
+        self.outputName = ''
+        self.outputStorySep = '-pns_'
+
         self.chapurl = False
         ss=self.url.split('?')
-        logging.debug('ss=%s' % ss)
         if ss is not None and len(ss) > 1:
             sss = ss[1].replace('&amp;','&').split('&')
-            logging.debug('sss=%s' % sss)
             if sss is not None and len(sss) > 0:
                 ssss = sss[0].split('=')
-                logging.debug('ssss=%s' % ssss)
                 if ssss is not None and len(ssss) > 1 and ssss[0] == 'sid':
                     self.storyId = ssss[1]
                 if len(sss) > 1:
                     ssss = sss[1].split('=')
-                    logging.debug('ssss=%s' % ssss)
                     if ssss is not None and len(ssss) > 1 and ssss[0] == 'chapter':
                         self.chapurl = True
 
         self.url = 'http://' + self.host + '/' + self.path + '?sid=' + self.storyId
         logging.debug('self.url=%s' % self.url)
         
-        self.uuid = 'urn:uuid:' + self.host + '-u.' + self.authorId + '-s.' + self.storyId
-        logging.debug('self.uuid=%s' % self.uuid)
-    
         logging.debug("Created PotionsNSnitches: url=%s" % (self.url))
 
 
-    def requiresLogin(self, url = None):
-        # potionsandsnitches.net doesn't require login.
-        if self.host == 'potionsandsnitches.net':
-          return False
-        else:
+    def _getLoginScript(self):
+        return '/user.php?action=login'
+
+    def reqLoginData(self, data):
+        if data.find('Registered Users Only. Please click OK to login or register.') != -1 or data.find('There is no such account on our website') != -1:
           return True
-
-    def performLogin(self, url = None):
-        data = {}
-    
-        data['penname'] = self.login
-        data['password'] = self.password
-        data['cookiecheck'] = '1'
-        data['submit'] = 'Submit'
-    
-        urlvals = u.urlencode(data)
-        loginUrl = 'http://' + self.host + self._getLoginScript()
-        logging.debug("Will now login to URL %s" % loginUrl)
-    
-        req = self.opener.open(loginUrl, urlvals)
-    
-        d = req.read().decode('utf-8')
-    
-        if self.reqLoginData(d) :
-          return False
         else:
-          return True
+          return False
 
-
-    def setLogin(self, login):
-        self.login = login
-
-    def setPassword(self, password):
-        self.password = password
-
-    def _addSubject(self, subject):
-        subj = subject.upper()
-        for s in self.subjects:
-            if s.upper() == subj:
-                return False
-        self.subjects.append(subject)
-        return True
-
-    def _addCharacter(self, character):
-        chara = character.upper()
-        for c in self.storyCharacters:
-            if c.upper() == chara:
-                return False
-        self.storyCharacters.append(character)
-        return True 
-    
     def _fillCharacters(self, strlist, idx, maxlen):
         ii = idx
         while ii < maxlen:
@@ -139,7 +92,7 @@ class PotionsNSnitches(FanfictionSiteAdapter):
                 if chara.find(':') != -1:
                     return (ii-1)
                 elif chara.find(',') == -1:
-                    self._addCharacter (chara)
+                    self.addCharacter (chara)
             ii = ii + 1
         return (ii) 
 
@@ -154,7 +107,7 @@ class PotionsNSnitches(FanfictionSiteAdapter):
                 elif genre.find(',') != -1:
                     genre = ', '
                 else:
-                    self._addSubject (genre)
+                    self.addSubject (genre)
                 self.genre = self.genre + genre
             ii = ii + 1
         return (ii) 
@@ -170,7 +123,7 @@ class PotionsNSnitches(FanfictionSiteAdapter):
                 elif cat.find(',') != -1:
                     cat = ', '
                 else:
-                    self._addSubject (cat)
+                    self.addSubject (cat)
                 self.category = self.category + cat
             ii = ii + 1
         return (ii) 
@@ -197,9 +150,8 @@ class PotionsNSnitches(FanfictionSiteAdapter):
             if ss is not None and len(ss) > 1:
                 self.storyName = ss[0].strip()
                 self.authorName = ss[1].strip()
-                self.outputName = self.storyName.replace(" ", "_") + '-pNs_' + self.storyId
 
-        logging.debug('self.storyId=%s, self.storyName=%s, self.outputName=%s' % (self.storyId, self.storyName, self.outputName))
+        logging.debug('self.storyId=%s, self.storyName=%s' % (self.storyId, self.storyName))
         logging.debug('self.authorId=%s, self.authorName=%s' % (self.authorId, self.authorName))
                 
         select = soup.find('select', { 'name' : 'chapter' } )
@@ -342,22 +294,7 @@ class PotionsNSnitches(FanfictionSiteAdapter):
             logging.error('self.storyName is empty!!  Exitting!')
             exit(1)
             
-        self.outputName = self.storyName.replace(" ", "_") + '-pNs_' + self.storyId
-        logging.debug('self.outputName=%s' % self.outputName)
-        
-        self.uuid = 'urn:uuid:' + self.host + '-u.' + self.authorId + '-s.' + self.storyId
-        logging.debug('self.uuid=%s' % self.uuid)
-
         return result
-
-    def getStoryName(self):
-        return self.storyName
-
-    def getOutputName(self):
-        return self.outputName
-		
-    def getAuthorName(self):
-        return self.authorName
     
     def getText(self, url):
         if url.find('http://') == -1:
@@ -380,107 +317,6 @@ class PotionsNSnitches(FanfictionSiteAdapter):
         text = div.__str__('utf8').replace(' SOMETHING_BR ','<br />')    
         return text
 
-    def _getLoginScript(self):
-        return '/user.php?action=login'
-
-    def reqLoginData(self, data):
-        if data.find('Registered Users Only. Please click OK to login or register.') != -1 or data.find('There is no such account on our website') != -1:
-          return True
-        else:
-          return False
-
-    def getHost(self):
-        logging.debug('self.host=%s' % self.host)
-        return self.host
-
-    def getStoryURL(self):
-        logging.debug('self.url=%s' % self.url)
-        return self.url
-
-    def getAuthorURL(self):
-        logging.debug('self.authorURL=%s' % self.authorURL)
-        return self.authorURL
-
-    def getUUID(self):
-        logging.debug('self.uuid=%s' % self.uuid)
-        return self.uuid
-    
-    def getStoryDescription(self):
-        logging.debug('self.storyDescription=%s' % self.storyDescription)
-        return self.storyDescription
-    
-    def getStoryPublished(self):
-        logging.debug('self.storyPublished=%s' % self.storyPublished)
-        return self.storyPublished
-    
-    def getStoryCreated(self):
-        self.storyCreated = datetime.datetime.now()
-        logging.debug('self.storyCreated=%s' % self.storyCreated)
-        return self.storyCreated
-    
-    def getStoryUpdated(self):
-        logging.debug('self.storyUpdated=%s' % self.storyUpdated)
-        return self.storyUpdated
-    
-    def getLanguage(self):
-        logging.debug('self.language=%s' % self.language)
-        return self.language
-    
-    def getLanguageId(self):
-        logging.debug('self.languageId=%s' % self.languageId)
-        return self.languageId
-    
-    def getSubjects(self):
-        logging.debug('self.subjects=%s' % self.authorName)
-        return self.subjects
-    
-    def getPublisher(self):
-        logging.debug('self.publisher=%s' % self.publisher)
-        return self.publisher
-    
-    def getNumChapters(self):
-        logging.debug('self.numChapters=%s' % self.numChapters)
-        return self.numChapters
-    
-    def getNumWords(self):
-        logging.debug('self.numWords=%s' % self.numWords)
-        return self.numWords
-    
-    def getAuthorId(self):
-        logging.debug('self.authorId=%s' % self.authorId)
-        return self.authorId
-    
-    def getStoryId(self):
-        logging.debug('self.storyId=%s' % self.storyId)
-        return self.storyId
-    
-    def getCategory(self):
-        logging.debug('self.category=%s' % self.category)
-        return self.category
-    
-    def getGenre(self):
-        logging.debug('self.genre=%s' % self.genre)
-        return self.genre
-    
-    def getStoryStatus(self):
-        logging.debug('self.storyStatus=%s' % self.storyStatus)
-        return self.storyStatus
-    
-    def getStoryRating(self):
-        logging.debug('self.storyRating=%s' % self.storyRating)
-        return self.storyRating
-    
-    def getStoryUserRating(self):
-        logging.debug('self.storyUserRating=%s' % self.storyUserRating)
-        return self.storyUserRating
-    
-    def getStoryCharacters(self):
-        logging.debug('self.storyCharacters=%s' % self.storyCharacters)
-        return self.storyCharacters
-
-    def getStorySeries(self):
-        logging.debug('self.storySeries=%s' % self.storySeries)
-        return self.storySeries
 
 class PotionsNSnitches_UnitTests(unittest.TestCase):
     def setUp(self):
diff --git a/twilighted.py b/twilighted.py
index d45e4688..ed293406 100644
--- a/twilighted.py
+++ b/twilighted.py
@@ -43,13 +43,15 @@ class Twilighted(FanfictionSiteAdapter):
         self.publisher = self.host
         self.numChapters = 0
         self.numWords = 0
-        self.genre = 'FanFiction'
-        self.category = 'Category'
+        self.genre = ''
+        self.category = 'Fanfiction'
         self.storyStatus = 'In-Progress'
         self.storyRating = 'PG'
         self.storyUserRating = '0'
         self.storyCharacters = []
         self.storySeries = ''
+        self.outputName = ''
+        self.outputStorySep = '-tw_'
         
         self.chapurl = False
         ss=self.url.split('?')
@@ -71,18 +73,19 @@ class Twilighted(FanfictionSiteAdapter):
         self.url = 'http://' + self.host + '/' + self.path + '?sid=' + self.storyId
         logging.debug('self.url=%s' % self.url)
         
-        self.uuid = 'urn:uuid:' + self.host + '-u.' + self.authorId + '-s.' + self.storyId
-        logging.debug('self.uuid=%s' % self.uuid)
-    
         logging.debug("Created Twilighted: url=%s" % (self.url))
 
+    def _getLoginScript(self):
+        return '/user.php?action=login'
+
+    def reqLoginData(self, data):
+        if data.find('Registered Users Only. Please click OK to login or register.') != -1 or data.find('There is no such account on our website') != -1:
+          return True
+        else:
+          return False
 
     def requiresLogin(self, url = None):
-        # potionsandsnitches.net doesn't require login.
-        if self.host == 'potionsandsnitches.net':
-          return False
-        else:
-          return True
+        return True
 
     def performLogin(self, url = None):
         data = {}
@@ -105,29 +108,6 @@ class Twilighted(FanfictionSiteAdapter):
         else:
           return True
 
-
-    def setLogin(self, login):
-        self.login = login
-
-    def setPassword(self, password):
-        self.password = password
-
-    def _addSubject(self, subject):
-        subj = subject.upper()
-        for s in self.subjects:
-            if s.upper() == subj:
-                return False
-        self.subjects.append(subject)
-        return True
-
-    def _addCharacter(self, character):
-        chara = character.upper()
-        for c in self.storyCharacters:
-            if c.upper() == chara:
-                return False
-        self.storyCharacters.append(character)
-        return True
-
     def extractIndividualUrls(self):
         url = self.url + '&chapter=1'
         data = self.opener.open(url).read()
@@ -144,9 +124,8 @@ class Twilighted(FanfictionSiteAdapter):
         logging.debug('Title: %s' % title)
         self.storyName = title.split(' by ')[0].strip()
         self.authorName = title.split(' by ')[1].strip()
-        self.outputName = self.storyName.replace(" ", "_") + '-tw_' + self.storyId
 
-        logging.debug('self.storyId=%s, self.storyName=%s, self.outputName=%s' % (self.storyId, self.storyName, self.outputName))
+        logging.debug('self.storyId=%s, self.storyName=%s' % (self.storyId, self.storyName))
         logging.debug('self.authorId=%s, self.authorName=%s' % (self.authorId, self.authorName))
                 
         select = soup.find('select', { 'name' : 'chapter' } )
@@ -192,8 +171,6 @@ class Twilighted(FanfictionSiteAdapter):
                                             str1 = a.string
                                             (vs, self.storyId) = a['href'].split('=')
                                             logging.debug('self.storyId=%s self.storyName=%s' % (self.storyId, self.storyName))
-                                            self.outputName = self.outputName + "-tw_" + self.storyId
-                                            logging.debug('self.outputName=%s' % self.outputName)
                                         if a['href'].find('viewuser.php?uid=') != -1:
                                             str1 = a.string
                                             (vs, self.authorId) = a['href'].split('=')
@@ -217,16 +194,19 @@ class Twilighted(FanfictionSiteAdapter):
                                             ii = ii+1
                                             while stlen > ii and len(strs[ii]) != 0 and strs[ii].find(':') == -1:
                                                 if strs[ii] != ' ' and strs[ii] != ', ':
-                                                    if self.category == 'Category':
+                                                    if len(self.genre) > 0:
+                                                        self.genre = self.genre + ', '
+                                                    self.genre = strs[ii].strip(' ')
+                                                    if len(self.category) == 0:
                                                         self.category = strs[ii].strip(' ')
-                                                    self._addSubject(strs[ii].strip(' '))
+                                                    self.addSubject(strs[ii].strip(' '))
                                                 ii = ii+1
                                             logging.debug('self.subjects=%s' % self.subjects)
                                         if strs[ii] == 'Characters: ':
                                             ii = ii+1
                                             while stlen > ii and len(strs[ii]) != 0 and strs[ii].find(':') == -1:
                                                 if strs[ii] != ' ' and strs[ii] != ', ':
-                                                    self._addCharacter(strs[ii].strip(' '))
+                                                    self.addCharacter(strs[ii].strip(' '))
                                                 ii = ii+1
                                             logging.debug('self.storyCharacters=%s' % self.storyCharacters)
                                         elif strs[ii] == 'Completed:':
@@ -266,20 +246,8 @@ class Twilighted(FanfictionSiteAdapter):
                                             logging.debug('Skipped Label \"%s\" Value \"%s\"' % (strs[ii], strs[ii+1]))
                                             ii = ii+2
                                 
-        self.uuid = 'urn:uuid:' + self.host + '-u.' + self.authorId + '-s.' + self.storyId
-        logging.debug('self.uuid=%s' % self.uuid)
-
         return result
 
-    def getStoryName(self):
-        return self.storyName
-
-    def getOutputName(self):
-        return self.outputName
-		
-    def getAuthorName(self):
-        return self.authorName
-    
     def getText(self, url):
         if url.find('http://') == -1:
           url = 'http://' + self.host + '/' + url
@@ -297,107 +265,6 @@ class Twilighted(FanfictionSiteAdapter):
     
         return div.__str__('utf8')
 
-    def _getLoginScript(self):
-        return '/user.php?action=login'
-
-    def reqLoginData(self, data):
-        if data.find('Registered Users Only. Please click OK to login or register.') != -1 or data.find('There is no such account on our website') != -1:
-          return True
-        else:
-          return False
-
-    def getHost(self):
-        logging.debug('self.host=%s' % self.host)
-        return self.host
-
-    def getStoryURL(self):
-        logging.debug('self.url=%s' % self.url)
-        return self.url
-
-    def getAuthorURL(self):
-        logging.debug('self.authorURL=%s' % self.authorURL)
-        return self.authorURL
-
-    def getUUID(self):
-        logging.debug('self.uuid=%s' % self.uuid)
-        return self.uuid
-    
-    def getStoryDescription(self):
-        logging.debug('self.storyDescription=%s' % self.storyDescription)
-        return self.storyDescription
-    
-    def getStoryPublished(self):
-        logging.debug('self.storyPublished=%s' % self.storyPublished)
-        return self.storyPublished
-    
-    def getStoryCreated(self):
-        self.storyCreated = datetime.datetime.now()
-        logging.debug('self.storyCreated=%s' % self.storyCreated)
-        return self.storyCreated
-    
-    def getStoryUpdated(self):
-        logging.debug('self.storyUpdated=%s' % self.storyUpdated)
-        return self.storyUpdated
-    
-    def getLanguage(self):
-        logging.debug('self.language=%s' % self.language)
-        return self.language
-    
-    def getLanguageId(self):
-        logging.debug('self.languageId=%s' % self.languageId)
-        return self.languageId
-    
-    def getSubjects(self):
-        logging.debug('self.subjects=%s' % self.authorName)
-        return self.subjects
-    
-    def getPublisher(self):
-        logging.debug('self.publisher=%s' % self.publisher)
-        return self.publisher
-    
-    def getNumChapters(self):
-        logging.debug('self.numChapters=%s' % self.numChapters)
-        return self.numChapters
-    
-    def getNumWords(self):
-        logging.debug('self.numWords=%s' % self.numWords)
-        return self.numWords
-    
-    def getAuthorId(self):
-        logging.debug('self.authorId=%s' % self.authorId)
-        return self.authorId
-    
-    def getStoryId(self):
-        logging.debug('self.storyId=%s' % self.storyId)
-        return self.storyId
-    
-    def getCategory(self):
-        logging.debug('self.category=%s' % self.category)
-        return self.category
-    
-    def getGenre(self):
-        logging.debug('self.genre=%s' % self.genre)
-        return self.genre
-    
-    def getStoryStatus(self):
-        logging.debug('self.storyStatus=%s' % self.storyStatus)
-        return self.storyStatus
-    
-    def getStoryRating(self):
-        logging.debug('self.storyRating=%s' % self.storyRating)
-        return self.storyRating
-    
-    def getStoryUserRating(self):
-        logging.debug('self.storyUserRating=%s' % self.storyUserRating)
-        return self.storyUserRating
-    
-    def getStoryCharacters(self):
-        logging.debug('self.storyCharacters=%s' % self.storyCharacters)
-        return self.storyCharacters
-
-    def getStorySeries(self):
-        logging.debug('self.storySeries=%s' % self.storySeries)
-        return self.storySeries
 
 class Twilighted_UnitTests(unittest.TestCase):
   def setUp(self):

From b51dd549f5b807e61f94ae93a0303560d8edf79a Mon Sep 17 00:00:00 2001
From: wsuetholz <wsuetholz@localhost>
Date: Thu, 11 Nov 2010 13:22:30 -0600
Subject: [PATCH 63/94] self.numChapters was one too many.

---
 ficwad.py | 4 +---
 1 file changed, 1 insertion(+), 3 deletions(-)

diff --git a/ficwad.py b/ficwad.py
index ddac91a8..7e9f3ae8 100644
--- a/ficwad.py
+++ b/ficwad.py
@@ -193,6 +193,7 @@ class FicWad(FanfictionSiteAdapter):
 
 			if select is None:
 				self.numChapters = '1'
+				logging.debug('self.numChapters=%s' % self.numChapters)
 				result.append((self.url,self.storyName))
 				logging.debug('Chapter[%s]=%s %s' % (ii, self.url, self.storyName))
 			else:
@@ -209,9 +210,6 @@ class FicWad(FanfictionSiteAdapter):
 					else:
 						logging.debug('Skipping Story Index.  URL %s' % url)
 		
-		self.numChapters = str(ii)
-		logging.debug('self.numChapters=%s' % self.numChapters)
-		
 		return result
 	
 	def getText(self, url):

From 981a922d00ae5b9663a5515896c9ddcadcd28e8f Mon Sep 17 00:00:00 2001
From: wsuetholz <wsuetholz@localhost>
Date: Thu, 11 Nov 2010 13:53:48 -0600
Subject: [PATCH 64/94] Deal with being passed in the first chapter as the url.

---
 fictionalley.py | 40 +++++++++++++++++++++++++++++++++++-----
 1 file changed, 35 insertions(+), 5 deletions(-)

diff --git a/fictionalley.py b/fictionalley.py
index 00d34815..fbbe95ee 100644
--- a/fictionalley.py
+++ b/fictionalley.py
@@ -74,6 +74,7 @@ class FictionAlley(FanfictionSiteAdapter):
 		self.storyUserRating = '0'
 		self.storyCharacters = []
 		self.storySeries = ''
+		self.storyName = ''
 		self.outputName = ''
 		self.outputStorySep = '-fa_'	
 		
@@ -129,18 +130,47 @@ class FictionAlley(FanfictionSiteAdapter):
 		data = data.replace('<!-- headerstart -->','<crazytagstringnobodywouldstumbleonaccidently id="storyheaders">').replace('<!-- headerend -->','</crazytagstringnobodywouldstumbleonaccidently>')
 		soup = bs.BeautifulStoneSoup(data)
 				
-		# Get title from <title>, remove before '-'.
-		title = soup.find('title').string
-		self.storyName = "-".join(title.split('-')[1:]).strip().replace(" (Story Text)","")
-		
-		links = soup.findAll('li')
+		breadcrumbs = soup.find('div', {'class': 'breadcrumbs'})
+		if breadcrumbs is not None:
+			# Be aware that this means that the user has entered the {STORY}01.html 
+			# We will not have valid Publised and Updated dates.  User should enter 
+			# the {STORY}.html instead.  We should force that instead of this.
+			logging.debug('breadcrumbs=%s' % breadcrumbs )
+			bcas = breadcrumbs.findAll('a')
+			logging.debug('bcas=%s' % bcas )
+			if bcas is not None and len(bcas) > 1:
+				bca = bcas[1]
+				logging.debug('bca=%s' % bca )
+				if 'href' in bca._getAttrMap():
+					logging.debug('bca.href=%s' % bca['href'] )
+					url = str(bca['href'])
+					if url is not None and len(url) > 0:
+						self.url = url
+						logging.debug('self.url=%s' % self.url )
+						ss = self.url.split('/')
+						self.storyId = ss[-1].replace('.html','')
+						self.storyName = bca.string
+						logging.debug('self.storyId=%s, self.storyName=%s' % (self.storyId, self.storyName))
 
+						data = self.opener.open(self.url).read()		
+						
+						# There is some usefull information in the headers of the first chapter page..
+						data = data.replace('<!-- headerstart -->','<crazytagstringnobodywouldstumbleonaccidently id="storyheaders">').replace('<!-- headerend -->','</crazytagstringnobodywouldstumbleonaccidently>')
+						soup = bs.BeautifulStoneSoup(data)
+		
 		# If it is decided that we really do care about number of words..  It's only available on the author's page..
 		#d0 = self.opener.open(self.authorURL).read()
 		#soupA = bs.BeautifulStoneSoup(d0)
 		#dls = soupA.findAll('dl')
 		#logging.debug('dls=%s' % dls)
 		
+		# Get title from <title>, remove before '-'.
+		if len(self.storyName) == 0:
+			title = soup.find('title').string
+			self.storyName = "-".join(title.split('-')[1:]).strip().replace(" (Story Text)","")
+		
+		links = soup.findAll('li')
+
 		self.numChapters = 0;
 		result = []
 		if len(links) == 0:

From bdf429b41c5482b7e9078db81c06ecac8cfd9ebf Mon Sep 17 00:00:00 2001
From: wsuetholz <wsuetholz@localhost>
Date: Fri, 12 Nov 2010 20:25:55 -0600
Subject: [PATCH 65/94] Added in mediaminer.org adapter.  Still has problems
 because mm seems to use the &#8820; type character encoding, and I couldn't
 manage to replace them.

---
 downloader.py |   3 +
 mediaminer.py | 402 ++++++++++++++++++++++++++++++++++++++++++++++++++
 2 files changed, 405 insertions(+)
 create mode 100644 mediaminer.py

diff --git a/downloader.py b/downloader.py
index 431bbad4..310eac41 100644
--- a/downloader.py
+++ b/downloader.py
@@ -24,6 +24,7 @@ import fictionalley
 import hpfiction
 import twilighted
 import potionsNsnitches
+import mediaminer
 
 import time
 
@@ -107,6 +108,8 @@ if __name__ == '__main__':
 		adapter = twilighted.Twilighted(url)
 	elif url.find('potionsandsnitches.net') != -1:
 		adapter = potionsNsnitches.PotionsNSnitches(url)
+	elif url.find('mediaminer.org') != -1:
+		adapter = mediaminer.MediaMiner(url)
 	else:
 		print >> sys.stderr, "Oi! I can haz not appropriate adapter for URL %s!" % url
 		sys.exit(1)
diff --git a/mediaminer.py b/mediaminer.py
new file mode 100644
index 00000000..dd2ef3ea
--- /dev/null
+++ b/mediaminer.py
@@ -0,0 +1,402 @@
+# -*- coding: utf-8 -*-
+
+import os
+import re
+import sys
+import cgi
+import uuid
+import shutil
+import os.path
+import logging
+import unittest
+import urllib as u
+import pprint as pp
+import urllib2 as u2
+import urlparse as up
+import BeautifulSoup as bs
+import htmlentitydefs as hdefs
+import time
+import datetime
+
+from constants import *
+from adapter import *
+
+try:
+	import login_password
+except:
+	# tough luck
+	pass
+
+class MediaMiner(FanfictionSiteAdapter):
+	def __init__(self, url):		
+		self.url = url
+		parsedUrl = up.urlparse(url)
+		self.host = parsedUrl.netloc
+		self.path = parsedUrl.path
+		
+		self.storyName = ''
+		self.authorName = ''
+		self.storyDescription = ''
+		self.storyCharacters = []
+		self.storySeries = ''
+		self.authorId = '0'
+		self.authorURL = self.path
+		self.storyId = '0'
+		self.storyPublished = datetime.date(1970, 01, 31)
+		self.storyCreated = datetime.datetime.now()
+		self.storyUpdated = datetime.date(1970, 01, 31)
+		self.languageId = 'en-UK'
+		self.language = 'English'
+		self.subjects = []
+		self.publisher = self.host
+		self.numChapters = 0
+		self.numWords = 0
+		self.genre = ''
+		self.category = ''
+		self.storyStatus = 'In-Progress'
+		self.storyRating = 'K'
+		self.storyUserRating = '0'
+		self.outputName = ''
+		self.outputStorySep = '-mm_'
+				
+		logging.debug('self.url=%s' % self.url)
+		
+		if self.url.find('view_st.php') != -1:
+			ss = self.url.split('view_st.php')
+			logging.debug('ss=%s' % ss)
+			if ss is not None and len(ss) > 1:
+				self.storyId = ss[1].replace('/','').strip()
+		elif self.url.find('view_ch.php?') != -1:
+			ss = self.url.split('=')
+			logging.debug('ss=%s' % ss)
+			if ss is not None and len(ss) > 1:
+				self.storyId = ss[-1].replace('/','').strip()
+				self.path = '/fanfic/view_st.php/' + self.storyId
+				self.url = 'http://' + self.host + self.path
+				logging.debug('self.url=%s' % self.url)
+		elif self.url.find('view_ch.php/') != -1:
+			ss = self.url.split('/')
+			logging.debug('ss=%s' % ss)
+			if ss is not None and len(ss) > 2:
+				self.storyId = ss[-2].strip()
+				self.path = '/fanfic/view_st.php/' + self.storyId
+				self.url = 'http://' + self.host + self.path
+				logging.debug('self.url=%s' % self.url)			
+			
+		logging.debug('self.storyId=%s' % self.storyId)
+		
+		logging.debug('self.path=%s' % self.path)
+		
+		if not self.appEngine:
+			self.opener = u2.build_opener(u2.HTTPCookieProcessor())
+		else:
+			self.opener = None
+	
+		logging.debug("Created MediaMiner: url=%s" % (self.url))
+	
+	def _getLoginScript(self):
+		return self.path
+
+	def _getVarValue(self, varstr):
+		#logging.debug('_getVarValue varstr=%s' % varstr)
+		vals = varstr.split('=')
+		#logging.debug('vals=%s' % vals)
+		retstr="".join(vals[+1:])
+		#logging.debug('retstr=%s' % retstr)
+		if retstr.startswith(' '):
+			retstr = retstr[1:]
+		if retstr.endswith(';'):
+			retstr = retstr[:-1]
+		return retstr
+	
+	def _splitCrossover(self, subject):
+		if "Crossover" in subject:
+			self.addSubject ("Crossover")
+			logging.debug('Crossover=%s' % subject)
+			if subject.find(' and ') != -1:
+				words = subject.split(' ')
+				logging.debug('words=%s' % words)
+				subj = ''
+				for s in words:
+					if s in "and Crossover":
+						if len(subj) > 0:
+							self.addSubject(subj)
+						subj = ''
+					else:
+						if len(subj) > 0:
+							subj = subj + ' '
+						subj = subj + s
+				if len(subj) > 0:
+					self.addSubject(subj)
+			else:
+				self.addSubject(subject)
+		else:
+			self.addSubject(subject)
+		return True
+
+	def _splitGenre(self, subject):
+		if len(subject) > 0:
+			words = subject.split('/')
+			logging.debug('words=%s' % words)
+			for subj in words:
+			    if len(subj) > 0:
+				self.addSubject(subj)
+		return True
+
+	def _fetchUrl(self, url):
+		if not self.appEngine:
+			return self.opener.open(url).read().decode('utf-8')
+		else:
+			return googlefetch(url).content
+	
+	def extractIndividualUrls(self):
+		data = self._fetchUrl(self.url)
+		#data.replace('<br />',' ').replace('<br>',' ').replace('</br>',' ')
+		soup = bs.BeautifulSoup(data)
+		#logging.debug('soap=%s' % soup)
+		urls = []
+		
+		td_ffh = soup.find('td', {'class' : 'ffh'})
+		#logging.debug('td_ffh=%s' % td_ffh)
+		if td_ffh is not None:
+			#logging.debug('td_ffh.text=%s' % td_ffh.find(text=True))
+			self.storyName = str(td_ffh.find(text=True)).strip()
+			logging.debug('self.storyId=%s, self.storyName=%s' % (self.storyId, self.storyName))
+			fft = td_ffh.find('font', {'class' : 'smtxt'})
+			#logging.debug('fft=%s' % fft)
+			if fft is not None:
+				ffts = fft.string.split(' ')
+				if ffts is not None:
+					if len(ffts) > 1:
+						self.storyRating = ffts[1]
+						logging.debug('self.storyRating=%s' % self.storyRating)
+		self.genre = ''
+		td_smtxt = soup.findAll('td')
+		if td_smtxt is None:
+			logging.debug('td_smtxt is NONE!')
+			pass
+		else:
+			ll = len(td_smtxt)
+			#logging.debug('td_smtxt=%s, len=%s' % (td_smtxt, ll))
+			for ii in range(ll):
+				td = td_smtxt[ii]
+				if 'class' in td._getAttrMap() and td['class'] != 'smtxt':
+					logging.debug('td has class attribute but is not smtxt')
+					continue
+				ss = str(td).replace('\n','').replace('\r','').replace('&nbsp;', ' ')
+				#logging.debug('ss=%s' % ss)
+				if len(ss) > 1 and (ss.find('Genre(s):') != -1 or ss.find('Type:') != -1):
+					#logging.debug('ss=%s' % ss)
+					ssbs = td.findAll('b')
+					#logging.debug('ssbs=%s' % ssbs)
+					bb = 0
+					while bb < len(ssbs):
+						nvs = bs.NavigableString('')
+						sst=''
+						ssb = ssbs[bb]
+						ssbt = str(ssb.text).strip()
+						#logging.debug('ssb=%s' % ssb)
+						#logging.debug('ssbt=%s' % ssbt)
+						ssbn = ssb.nextSibling
+						while ssbn is not None:
+							#logging.debug('ssbn=%s' % ssbn)
+							#logging.debug('ssbn.class=%s' % ssbn.__class__)
+							if nvs.__class__ == ssbn.__class__:
+								st = str(ssbn)
+								if st.strip() != '|':
+									sst = sst + st
+							else:
+								#logging.debug('ssbn.name=%s' % ssbn.name)
+								if ssbn.name == 'b':
+									break								
+								ssbnts = ssbn.findAll(text=True)
+								for ssbnt in ssbnts:
+									sst = sst + ssbnt
+							ssbn = ssbn.nextSibling
+						sst = sst.replace('&nbsp;',' ').strip()
+						#logging.debug('sst=%s' % sst)
+						if bb == 0:
+							ssbt = ssbt.replace(':','')
+							self.addSubject(ssbt)
+							self.addSubject(sst)
+							logging.debug('self.subjects=%s' % self.subjects)
+						else:
+							if ssbt == 'Genre(s):':
+								self.genre = sst
+								logging.debug('self.genre=%s' % self.genre)
+								sts = sst.split(' / ')
+								for st in sts:
+									self.addSubject(st.strip())
+								logging.debug('self.subjects=%s' % self.subjects)
+							elif ssbt == 'Type:':
+								self.category = sst
+								logging.debug('self.category=%s' % self.category)
+								self.addSubject(sst)
+								logging.debug('self.subjects=%s' % self.subjects)
+							elif ssbt == 'Author:':
+								pass
+							elif ssbt == 'Visits:':
+								pass
+							elif ssbt == 'Size:':
+								pass
+							elif ssbt == 'Pages:':
+								pass
+							elif ssbt == 'Status:':
+								if sst == "Completed":
+									self.storyStatus = 'Completed'
+								else:
+									self.storyStatus = 'In-Progress'
+							elif ssbt == 'Words:':
+								self.numWords = sst.replace('|','').strip()
+								logging.debug('self.numWords=%s' % self.numWords)
+								pass
+							elif ssbt == 'Summary:':
+								self.storyDescription = sst.strip()
+								logging.debug('self.storyDescription=%s' % self.storyDescription)
+							elif ssbt == 'Latest Revision:' or ssbt == 'Uploaded On:':
+								logging.debug('sst=%s' % sst)
+								self.storyUpdated = datetime.datetime.fromtimestamp(time.mktime(time.strptime(sst.strip(' '), "%B %d, %Y %H:%M %Z")))
+								logging.debug('self.storyUpdated=%s' % self.storyUpdated)
+							else:
+								pass
+						bb = bb+1
+						
+					smtxt_as = td_smtxt[ii].findAll('a')
+					#logging.debug('smtxt_as=%s' % smtxt_as)
+					for smtxt_a in smtxt_as:
+						if 'href' in smtxt_a._getAttrMap() and smtxt_a['href'].find('/u/'):
+							sta = smtxt_a['href']
+							#logging.debug('sta=%s' % sta)
+							stas = sta.split('/u/')
+							#logging.debug('stas=%s' % stas)
+							if stas is not None and len(stas) > 1:
+								self.authorId = stas[1]
+								self.authorURL = 'http://' + self.host + sta
+								self.authorName = smtxt_a.string
+								logging.debug('self.authorName=%s, self.authorId=%s' % (self.authorName, self.authorId))
+				
+		urlstory=''
+		numchapters = 0
+		td_tbbrdr = soup.find('td', {'class' : 'tbbrdr'})
+		if td_tbbrdr is not None:
+			#logging.debug('td_tbbrdr=%s' % td_tbbrdr )
+
+			sl = td_tbbrdr.find('select', {'name':'cid'})
+			if sl is not None:
+				#logging.debug('sl=%s' % sl )
+				opts = sl.findAll('option')
+				for o in opts:
+					#logging.debug('o=%s' % o)				
+					if 'value' in o._getAttrMap():
+						url = 'http://' + self.host + '/fanfic/view_ch.php/' + self.storyId  + '/' + o['value']
+						logging.debug('URL=%s, Title=%s' % (url, o.string))
+						if numchapters == 0:
+							ss = o.string.split('[')
+							if ss is not None and len(ss) > 1:
+								ssd = ss[-1].replace(']','') 
+								#logging.debug('ssd=%s' % ssd)
+								self.storyPublished = datetime.datetime.fromtimestamp(time.mktime(time.strptime(ssd.strip(' '), "%b %d, %Y")))
+								logging.debug('self.storyPublished=%s' % self.storyPublished)
+						urls.append((url, o.string))
+						numchapters = numchapters + 1
+		
+		if numchapters == 0:
+			numchapters = 1
+			url = 'http://' + self.host + '/fanfic/view_st.php/' + self.storyId
+			self.storyPublished = self.storyUpdated
+			logging.debug('self.storyPublished=%s' % self.storyPublished)
+			ssd = self.storyName + ' [' + self.storyPublished.strftime("%b %d, %Y") + ']'
+			logging.debug('URL=%s, Title=%s' % (url, ssd))
+			urls.append((url, ssd))
+			
+		self.numChapters = str(numchapters)
+		logging.debug('self.numChapters=%s' % self.numChapters)
+		logging.debug('urls=%s' % urls)
+		
+		return urls
+	
+	def getText(self, url):
+		time.sleep( 2.0 )
+		logging.debug('url=%s' % url)
+		data = self._fetchUrl(url)
+
+		try:
+			soup = bs.BeautifulSoup(data)
+		except:
+			logging.info("Failed to decode: <%s>" % data)
+			soup = None
+			exit(20)
+			return '<html/>'
+		
+		#div = soup.find('div', {'id' : 'storytext'})
+		#if div is None:
+			#logging.error("Error downloading Chapter: %s" % url)
+			#exit (20)
+			#return '<html/>'
+			
+		#logging.info("Soup: %s" % soup.prettify())
+
+		nvs = bs.NavigableString('')
+		sst=''
+		allAs = soup.findAll ('a', { 'name' : 'fic_c' })
+		#logging.debug('allAs=%s' % allAs)
+		for a in allAs:
+			#logging.debug('a=%s' % a)
+			foundfirst = False
+			done = False
+			nxta = a.nextSibling
+			while nxta is not None and not done:
+				#logging.debug('nxta=%s' % nxta)
+				#logging.debug('nxta.class=%s' % nxta.__class__)
+				st = str(nxta)
+				if nvs.__class__ != nxta.__class__:
+					#logging.debug('nxta.name=%s' % nxta.name)
+					if nxta.name == 'table':
+						st = ''
+						if foundfirst:
+							done = True
+					if nxta.name == 'div' and 'class' in nxta._getAttrMap() and nxta['class'] == 'acl' and foundfirst:
+						st = ''
+						done = True
+				
+					if nxta.name == 'br':
+						if not foundfirst:
+							st = ''
+					else:
+						foundfirst = True
+				else:
+					foundfirst = True
+					
+				sst = sst + st
+				nxta = nxta.nextSibling
+
+		#sst = sst.replace('&nbsp;',' ').strip()
+		#logging.debug('sst=%s' % sst)
+		
+		#logging.debug('sst.0=%s' % sst)
+		#sst0 = sst.replace(u'&#8820;', u'&ldquo;').replace(u'&#8821;','&rdquo;').replace(u'&#8816;',u'&lsquo;').replace(u'&#8817;',u'&rsquo;')
+		#sst0 = sst.replace(u"&#8821;","&rdquo;")
+		#logging.debug('sst.1=%s' % sst0)
+		#sst1 = sst.replace(u'&#8820;', u'\"').replace('&#8821;','\"').replace('&#8816;','\'').replace('&#8817;','\'')
+		#logging.debug('sst.2=%s' % sst1)
+					
+		return sst
+			
+class FPC_UnitTests(unittest.TestCase):
+	def setUp(self):
+		logging.basicConfig(level=logging.DEBUG)
+		pass
+	
+	def testFictionPress(self):
+		url = 'http://www.fictionpress.com/s/2725180/1/Behind_This_Facade'
+		f = FPCom(url)
+		urls = f.extractIndividualUrls()
+		
+		self.assertEquals('Behind This Facade', f.getStoryName())
+		self.assertEquals('IntoxicatingMelody', f.getAuthorName())
+	
+		text = f.getText(url)
+		self.assertTrue(text.find('Kale Resgerald at your service" He answered, "So, can we go now? Or do you want to') != -1)
+
+if __name__ == '__main__':
+	unittest.main()

From 99ba1b48aadc20401549096ca57ec06ab7a3e689 Mon Sep 17 00:00:00 2001
From: wsuetholz <wsuetholz@localhost>
Date: Fri, 12 Nov 2010 20:27:17 -0600
Subject: [PATCH 66/94] The getSubjects function was returning the author.

---
 adapter.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/adapter.py b/adapter.py
index d4f80cc5..054267b9 100644
--- a/adapter.py
+++ b/adapter.py
@@ -163,7 +163,7 @@ class FanfictionSiteAdapter:
 		return True
 
 	def getSubjects(self):
-		logging.debug('self.subjects=%s' % self.authorName)
+		logging.debug('self.subjects=%s' % self.subjects)
 		return self.subjects
 
 	def getPublisher(self):

From c77498e6ea9dc4ee66ab2ec804b85883abf9a307 Mon Sep 17 00:00:00 2001
From: wsuetholz <wsuetholz@localhost>
Date: Fri, 12 Nov 2010 21:28:25 -0600
Subject: [PATCH 67/94] Some changes in order to allow the refactoring of
 functions to work from within the appEngine.

---
 adapter.py    | 25 +++++++++++++++++++------
 downloader.py | 11 +++++++----
 ffnet.py      | 10 ++--------
 fpcom.py      | 10 ++--------
 mediaminer.py | 10 ++--------
 5 files changed, 32 insertions(+), 34 deletions(-)

diff --git a/adapter.py b/adapter.py
index 054267b9..9c1d6d5a 100644
--- a/adapter.py
+++ b/adapter.py
@@ -3,6 +3,11 @@
 import logging
 import datetime
 
+try:
+	from google.appengine.api.urlfetch import fetch as googlefetch
+	appEngineGlob = True
+except:
+	appEngineGlob = False
 
 class LoginRequiredException(Exception):
 	def __init__(self, url):
@@ -12,11 +17,7 @@ class LoginRequiredException(Exception):
 		return repr(self.url + ' requires user to be logged in')
 
 class FanfictionSiteAdapter:
-	try:
-		from google.appengine.api.urlfetch import fetch as googlefetch
-		appEngine = True
-	except:
-		appEngine = False
+	appEngine = appEngineGlob
 	login = ''
 	password = ''
 	url = ''
@@ -30,6 +31,7 @@ class FanfictionSiteAdapter:
 	authorURL = ''
 	outputStorySep = '-Ukn_'
 	outputName = ''
+	outputFileName = ''
 	storyDescription = ''
 	storyCharacters = []
 	storySeries = ''
@@ -57,6 +59,12 @@ class FanfictionSiteAdapter:
 	def hasAppEngine(self):
 		return self.appEngine
 	
+	def fetchUrl(self, url):
+		if not self.appEngine:
+			return self.opener.open(url).read().decode('utf-8')
+		else:
+			return googlefetch(url).content
+	
 	def requiresLogin(self, url = None):
 		return False
 	
@@ -86,9 +94,14 @@ class FanfictionSiteAdapter:
 
 	def getOutputName(self):
 		self.outputName = self.storyName.replace(" ", "_") + self.outputStorySep + self.storyId
-		logging.debug('self.storyId=%s, self.storyName=%s self.outputName=%s' % (self.storyId, self.storyName, self.outputName))
+		logging.debug('self.outputName=%s' % self.outputName)
 		return self.outputName
 
+	def getOutputFileName(self, booksDirectory, format):
+		self.outputFileName = booksDirectory + "/" + self.getOutputName() + "." + format
+		logging.debug('self.outputFileName=%s' % self.outputFileName)
+		return self.outputNameFileName
+
 	def getAuthorURL(self):
 		logging.debug('self.authorURL=%s' % self.authorURL)
 		return self.authorURL
diff --git a/downloader.py b/downloader.py
index 310eac41..ee0120f3 100644
--- a/downloader.py
+++ b/downloader.py
@@ -55,10 +55,13 @@ class FanficLoader:
 		
 		urls = self.adapter.extractIndividualUrls()
 
-		s = self.booksDirectory + "/" + self.adapter.getOutputName() + "." + format
-		if not self.overWrite and os.path.isfile(s):
-			print >> sys.stderr, "File " + s + " already exists!  Skipping!"
-			exit(10)
+		if (self.adapter.hasAppEngine):
+			self.overWrite = True
+		else:
+			s = self.adapter.getOutputFileName(self.booksDirectory, format)
+			if not self.overWrite and os.path.isfile(s):
+				print >> sys.stderr, "File " + s + " already exists!  Skipping!"
+				exit(10)
 
 		self.writer = self.writerClass(self.booksDirectory, self.adapter, inmemory=self.inmemory, compress=self.compress)
 		
diff --git a/ffnet.py b/ffnet.py
index a036988e..d0eff9e7 100644
--- a/ffnet.py
+++ b/ffnet.py
@@ -143,14 +143,8 @@ class FFNet(FanfictionSiteAdapter):
 				self.addSubject(subj)
 		return True
 
-	def _fetchUrl(self, url):
-		if not self.appEngine:
-			return self.opener.open(url).read().decode('utf-8')
-		else:
-			return googlefetch(url).content
-	
 	def extractIndividualUrls(self):
-		data = self._fetchUrl(self.url)
+		data = self.fetchUrl(self.url)
 		d2 = re.sub('&\#[0-9]+;', ' ', data)
 		soup = bs.BeautifulStoneSoup(d2)
 		allA = soup.findAll('a')
@@ -264,7 +258,7 @@ class FFNet(FanfictionSiteAdapter):
 	
 	def getText(self, url):
 		time.sleep( 2.0 )
-		data = self._fetchUrl(url)
+		data = self.fetchUrl(url)
 		lines = data.split('\n')
 		
 		textbuf = ''
diff --git a/fpcom.py b/fpcom.py
index 04266888..b9431322 100644
--- a/fpcom.py
+++ b/fpcom.py
@@ -136,15 +136,9 @@ class FPCom(FanfictionSiteAdapter):
 			    if len(subj) > 0:
 				self.addSubject(subj)
 		return True
-
-	def _fetchUrl(self, url):
-		if not self.appEngine:
-			return self.opener.open(url).read().decode('utf-8')
-		else:
-			return googlefetch(url).content
 	
 	def extractIndividualUrls(self):
-		data = self._fetchUrl(self.url)
+		data = self.fetchUrl(self.url)
 		d2 = re.sub('&\#[0-9]+;', ' ', data)
 		soup = bs.BeautifulStoneSoup(d2)
 		allA = soup.findAll('a')
@@ -283,7 +277,7 @@ class FPCom(FanfictionSiteAdapter):
 	
 	def getText(self, url):
 		time.sleep( 2.0 )
-		data = self._fetchUrl(url)
+		data = self.fetchUrl(url)
 		lines = data.split('\n')
 		
 		textbuf = ''
diff --git a/mediaminer.py b/mediaminer.py
index dd2ef3ea..77ff29bd 100644
--- a/mediaminer.py
+++ b/mediaminer.py
@@ -143,14 +143,8 @@ class MediaMiner(FanfictionSiteAdapter):
 				self.addSubject(subj)
 		return True
 
-	def _fetchUrl(self, url):
-		if not self.appEngine:
-			return self.opener.open(url).read().decode('utf-8')
-		else:
-			return googlefetch(url).content
-	
 	def extractIndividualUrls(self):
-		data = self._fetchUrl(self.url)
+		data = self.fetchUrl(self.url)
 		#data.replace('<br />',' ').replace('<br>',' ').replace('</br>',' ')
 		soup = bs.BeautifulSoup(data)
 		#logging.debug('soap=%s' % soup)
@@ -318,7 +312,7 @@ class MediaMiner(FanfictionSiteAdapter):
 	def getText(self, url):
 		time.sleep( 2.0 )
 		logging.debug('url=%s' % url)
-		data = self._fetchUrl(url)
+		data = self.fetchUrl(url)
 
 		try:
 			soup = bs.BeautifulSoup(data)

From dbec6c95b2ae5bdd31b22f55bb41508d59a21a52 Mon Sep 17 00:00:00 2001
From: wsuetholz <wsuetholz@localhost>
Date: Fri, 12 Nov 2010 21:51:46 -0600
Subject: [PATCH 68/94] Changed to deal with somebody putting in the mobile url
 for fanfiction.net...  ie <http://m.fanfiction.net/s/11> will get changed to
 <http://www.fanfiction.net/s/11>

---
 ffnet.py | 8 +++++++-
 1 file changed, 7 insertions(+), 1 deletion(-)

diff --git a/ffnet.py b/ffnet.py
index d0eff9e7..7a201e2b 100644
--- a/ffnet.py
+++ b/ffnet.py
@@ -86,7 +86,13 @@ class FFNet(FanfictionSiteAdapter):
 		
 		logging.debug('self.path=%s' % self.path)
 		
-		logging.debug('self.storyId=%s, chapter=%s' % (self.storyId, chapter))
+		if self.host is not None and self.host == "m.fanfiction.net":
+			self.host = "www.fanfiction.net"
+			logging.debug('self.host=%s' % self.host)
+			self.url = "http://" + self.host + "/" + self.path
+			logging.debug('self.url=%s' % self.url)
+			
+		logging.debug('self.storyId=%s' % self.storyId)
 		if not self.appEngine:
 			self.opener = u2.build_opener(u2.HTTPCookieProcessor())
 		else:

From 5618d8036be2b70f8774e4e0c2e62afc66d458ee Mon Sep 17 00:00:00 2001
From: wsuetholz <wsuetholz@localhost>
Date: Sat, 13 Nov 2010 23:30:47 -0600
Subject: [PATCH 69/94] MediaMiner was not sending the date with the correct
 timezone info, so strip it off.  We don't need the time anyways.

---
 mediaminer.py | 10 +++++++---
 1 file changed, 7 insertions(+), 3 deletions(-)

diff --git a/mediaminer.py b/mediaminer.py
index 77ff29bd..e8389abc 100644
--- a/mediaminer.py
+++ b/mediaminer.py
@@ -167,7 +167,7 @@ class MediaMiner(FanfictionSiteAdapter):
 		self.genre = ''
 		td_smtxt = soup.findAll('td')
 		if td_smtxt is None:
-			logging.debug('td_smtxt is NONE!')
+			#logging.debug('td_smtxt is NONE!')
 			pass
 		else:
 			ll = len(td_smtxt)
@@ -248,8 +248,12 @@ class MediaMiner(FanfictionSiteAdapter):
 								self.storyDescription = sst.strip()
 								logging.debug('self.storyDescription=%s' % self.storyDescription)
 							elif ssbt == 'Latest Revision:' or ssbt == 'Uploaded On:':
-								logging.debug('sst=%s' % sst)
-								self.storyUpdated = datetime.datetime.fromtimestamp(time.mktime(time.strptime(sst.strip(' '), "%B %d, %Y %H:%M %Z")))
+								#logging.debug('sst=%s' % sst)
+								ssts = sst.split(' ')
+								if ssts is not None and len(ssts) > 3:
+									sst = ssts[0] + ' ' + ssts[1] + ' ' + ssts[2]
+								#logging.debug('sst=%s' % sst)
+								self.storyUpdated = datetime.datetime.fromtimestamp(time.mktime(time.strptime(sst.strip(' '), "%B %d, %Y")))
 								logging.debug('self.storyUpdated=%s' % self.storyUpdated)
 							else:
 								pass

From e3b4769bfb95cdf9ea45511ae7724d6fdbbff1b7 Mon Sep 17 00:00:00 2001
From: wsuetholz <wsuetholz@localhost>
Date: Tue, 16 Nov 2010 09:09:26 -0600
Subject: [PATCH 70/94] Misspelled the return variable from getOutputFileName.

---
 adapter.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/adapter.py b/adapter.py
index 9c1d6d5a..13608244 100644
--- a/adapter.py
+++ b/adapter.py
@@ -100,7 +100,7 @@ class FanfictionSiteAdapter:
 	def getOutputFileName(self, booksDirectory, format):
 		self.outputFileName = booksDirectory + "/" + self.getOutputName() + "." + format
 		logging.debug('self.outputFileName=%s' % self.outputFileName)
-		return self.outputNameFileName
+		return self.outputFileName
 
 	def getAuthorURL(self):
 		logging.debug('self.authorURL=%s' % self.authorURL)

From 9b6fdb4540b5620cc62427ca4158d5407d57f291 Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Thu, 18 Nov 2010 14:26:16 -0600
Subject: [PATCH 71/94] Fix numeric entities--correctly this time.  Reduce
 margins slightly, tweak description escaping slightly.

---
 constants.py | 2 +-
 output.py    | 9 ++++-----
 2 files changed, 5 insertions(+), 6 deletions(-)

diff --git a/constants.py b/constants.py
index dc185eb6..bd35546a 100644
--- a/constants.py
+++ b/constants.py
@@ -1,6 +1,6 @@
 # -*- coding: utf-8 -*-
 
-CSS = '''body { margin-left: 5%; margin-right: 5%; margin-top: 5%; margin-bottom: 5%; text-align: justify; }
+CSS = '''body { margin-left: 2%; margin-right: 2%; margin-top: 2%; margin-bottom: 2%; text-align: justify; }
 pre { font-size: x-small; }
 sml { font-size: small; }
 h1 { text-align: center; }
diff --git a/output.py b/output.py
index e028237e..a320a42e 100644
--- a/output.py
+++ b/output.py
@@ -243,8 +243,8 @@ class EPubFanficWriter(FanficWriter):
 		else:
 			description = str(description)
 		if description is not None and len(description) > 0:
-			description = description.replace ('\\\'', '').replace('\\\"', '')
-			description =  removeEntities(description.replace('&nbsp;',' ').replace('&rsquo;',''))
+			description = description.replace ('\\', '\'').replace('\\\"', '\"')
+			description =  removeEntities(description)
 		else:
 			description = ' '
 
@@ -336,12 +336,11 @@ class EPubFanficWriter(FanficWriter):
 
 def unirepl(match):
 	"Return the unicode string for a decimal number"
-	s = match.group()
-	if s[2].lower()=='x':
+	if match.group(1)=='x':
 		radix=16
 	else:
 		radix=10
-	value = int(s[3:-1], radix )
+	value = int(match.group(2), radix )
 	return unichr(value)
 
 def replaceNumberEntities(data):

From 22d0989d0ab4acdf32664a21e205aa06b02513c8 Mon Sep 17 00:00:00 2001
From: wsuetholz <wsuetholz@localhost>
Date: Thu, 18 Nov 2010 16:07:58 -0600
Subject: [PATCH 72/94] Raise exceptions instead of an exit when errors are
 detected. Added static functions to the writer classes that contain the type
 name and type extension to use when writing out the destination file. Added a
 function to the zipdir that will check the date the fic was last updated in
 the current archive of a fic against the current last updated date and return
 whether the fic is newer than the archive file.  This is not useful at this
 time for when this is running under appEngine. Added a flag to indicate if
 the program is running from appEngine or not.

---
 adapter.py          |  20 +++++++--
 downloader.py       |  86 ++++++++++++++++++++++++++++++-------
 ffnet.py            |  40 ++++++++++++-----
 fictionalley.py     |  45 ++++++++++++++-----
 ficwad.py           |  48 +++++++++++++++++----
 fpcom.py            |  39 +++++++++++++----
 hpfiction.py        |  39 ++++++++++++++---
 mediaminer.py       |  62 +++++++++++++++------------
 output.py           | 102 ++++++++++++++++++++++++++++----------------
 potionsNsnitches.py |  53 ++++++++++++++++++-----
 twilighted.py       |  53 ++++++++++++++++++-----
 zipdir.py           |  68 +++++++++++++++++++++++++++++
 12 files changed, 506 insertions(+), 149 deletions(-)

diff --git a/adapter.py b/adapter.py
index 13608244..f4dd116a 100644
--- a/adapter.py
+++ b/adapter.py
@@ -2,6 +2,7 @@
 
 import logging
 import datetime
+from output import makeAcceptableFilename
 
 try:
 	from google.appengine.api.urlfetch import fetch as googlefetch
@@ -15,6 +16,18 @@ class LoginRequiredException(Exception):
 	
 	def __str__(self):
 		return repr(self.url + ' requires user to be logged in')
+	
+class StoryArchivedAlready(Exception):
+	pass
+
+class StoryDoesNotExist(Exception):
+	pass
+
+class FailedToDownload(Exception):
+	pass
+
+class InvalidStoryURL(Exception):
+	pass
 
 class FanfictionSiteAdapter:
 	appEngine = appEngineGlob
@@ -93,12 +106,13 @@ class FanfictionSiteAdapter:
 		return self.uuid
 
 	def getOutputName(self):
-		self.outputName = self.storyName.replace(" ", "_") + self.outputStorySep + self.storyId
+		self.outputName = makeAcceptableFilename(self.storyName.replace(" ", "_") + self.outputStorySep + self.storyId)
 		logging.debug('self.outputName=%s' % self.outputName)
 		return self.outputName
 
-	def getOutputFileName(self, booksDirectory, format):
-		self.outputFileName = booksDirectory + "/" + self.getOutputName() + "." + format
+	def getOutputFileName(self, booksDirectory, bookExt):
+		self.getOutputName()	# make sure self.outputName is populated
+		self.outputFileName = booksDirectory + "/" + self.outputName + bookExt
 		logging.debug('self.outputFileName=%s' % self.outputFileName)
 		return self.outputFileName
 
diff --git a/downloader.py b/downloader.py
index ee0120f3..3dfd7fc0 100644
--- a/downloader.py
+++ b/downloader.py
@@ -14,12 +14,18 @@ import urlparse as up
 import BeautifulSoup as bs
 import htmlentitydefs as hdefs
 
+import zipdir
 
+import output
+import adapter
+from adapter import StoryArchivedAlready
+from adapter import StoryDoesNotExist
+from adapter import FailedToDownload
+from adapter import InvalidStoryURL
+from adapter import LoginRequiredException
 import ffnet
 import fpcom
 import ficwad
-import output
-import adapter
 import fictionalley
 import hpfiction
 import twilighted
@@ -31,15 +37,30 @@ import time
 class FanficLoader:
 	'''A controller class which handles the interaction between various specific downloaders and writers'''
 	booksDirectory = "books"
+	standAlone = False
 	
-	def __init__(self, adapter, writerClass, quiet = False, inmemory = False, compress=True):
+	def __init__(self, adapter, writerClass, quiet = False, inmemory = False, compress=True, overwrite=False):
 		self.adapter = adapter
 		self.writerClass = writerClass
 		self.quiet = quiet
 		self.inmemory = inmemory
 		self.compress = compress
 		self.badLogin = False
-		self.overWrite = True
+		self.overWrite = overwrite
+			
+	def getBooksDirectory(self):
+		return self.booksDirectory
+
+	def setBooksDirectory(self, bd):
+		self.booksDirectory = bd
+		return self.booksDirectory
+	
+	def getStandAlone(self):
+		return self.standAlone
+
+	def setStandAlone(self, sa):
+		self.standAlone = sa
+		return self.standAlone
 	
 	def getAdapter():
 		return self.adapter
@@ -55,13 +76,16 @@ class FanficLoader:
 		
 		urls = self.adapter.extractIndividualUrls()
 
-		if (self.adapter.hasAppEngine):
-			self.overWrite = True
+		logging.debug("self.writerClass=%s" % self.writerClass)
+		if self.standAlone and not self.inmemory:
+			s = self.adapter.getOutputFileName(self.booksDirectory, self.writerClass.getFormatExt())
+			logging.debug("Always overwrite? %s" % self.overWrite)
+			if not self.overWrite:
+				logging.debug("Checking if current archive of the story exists.  Filename=%s" % s)
+				if not zipdir.checkNewer ( s, self.adapter.getStoryUpdated() ):
+					raise StoryArchivedAlready("A Current archive file \"" + s + "\" already exists!  Skipping!")
 		else:
-			s = self.adapter.getOutputFileName(self.booksDirectory, format)
-			if not self.overWrite and os.path.isfile(s):
-				print >> sys.stderr, "File " + s + " already exists!  Skipping!"
-				exit(10)
+			logging.debug("Do not check for existance of archive file.")
 
 		self.writer = self.writerClass(self.booksDirectory, self.adapter, inmemory=self.inmemory, compress=self.compress)
 		
@@ -83,10 +107,17 @@ class FanficLoader:
 
 if __name__ == '__main__':
 	logging.basicConfig(level=logging.DEBUG)
-	(url, format) = sys.argv[1:]
-	# (url) = sys.argv[1]
-	# format = 'epub'
+	argvlen = len(sys.argv)
+	url, bookFormat = None, 'epub'	# default to epub so a URL-only invocation cannot hit a NameError on bookFormat
+	if argvlen > 1:
+		url = sys.argv[1]
+	if argvlen > 2:
+		bookFormat = sys.argv[2]
 	
+	if url is None: 
+		print >> sys.stderr, "Usage: downloader.py URL Type"
+		sys.exit(-1)
+		
 	if type(url) is unicode:
 		print('URL is unicode')
 		url = url.encode('latin1')
@@ -117,9 +148,9 @@ if __name__ == '__main__':
 		print >> sys.stderr, "Oi! I can haz not appropriate adapter for URL %s!" % url
 		sys.exit(1)
 
-	if format == 'epub':
+	if bookFormat == 'epub':
 		writerClass = output.EPubFanficWriter
-	elif format == 'html':
+	elif bookFormat == 'html':
 		writerClass = output.HTMLWriter
 	
 	if adapter.requiresLogin(url):
@@ -134,5 +165,28 @@ if __name__ == '__main__':
 		
 	
 	loader = FanficLoader(adapter, writerClass)
-	loader.download()
+	loader.setStandAlone(True)
+
+	try:
+		loader.download()
+	except FailedToDownload, ftd:
+		print >> sys.stderr, str(ftd)
+		sys.exit(2)		# Error Downloading
+	except InvalidStoryURL, isu:
+		print >> sys.stderr, str(isu)
+		sys.exit(3)		# Invalid story URL
+	except StoryArchivedAlready, se:
+		print >> sys.stderr, str(se)
+		sys.exit(10)	# Skipped
+	except StoryDoesNotExist, sdne:
+		print >> sys.stderr, str(sdne)
+		sys.exit(20) 	# Missing
+	except LoginRequiredException, lre:
+		print >> sys.stderr, str(lre)
+		sys.exit(30) 	# Login required
+	except Exception, e:
+		print >> sys.stderr, str(e)
+		sys.exit(99)		# Unknown Error
+	
+	sys.exit(0)
 	
diff --git a/ffnet.py b/ffnet.py
index 7a201e2b..a6fee2dc 100644
--- a/ffnet.py
+++ b/ffnet.py
@@ -70,8 +70,7 @@ class FFNet(FanfictionSiteAdapter):
 		logging.debug('spl=%s' % spl)
 		if spl is not None:
 			if len(spl) > 0 and spl[0] != 's':
-				logging.error("Error URL \"%s\" is not a story." % self.url)
-				exit (20)				
+				raise InvalidStoryURL("Error URL \"%s\" is not a story." % self.url)
 			if len(spl) > 1:
 				self.storyId = spl[1]
 			if len(spl) > 2:
@@ -150,9 +149,23 @@ class FFNet(FanfictionSiteAdapter):
 		return True
 
 	def extractIndividualUrls(self):
-		data = self.fetchUrl(self.url)
+		data = None	# None (not '') marks a failed fetch so the 'is None' check below can fire
+		try:
+			data = self.fetchUrl(self.url)
+		except Exception, e:
+			data = None
+			logging.error("Caught an exception reading URL " + self.url + ".  Exception " + str(e) + ".")
+		if data is None:
+			raise StoryDoesNotExist("Problem reading story URL " + self.url + "!")
+		
 		d2 = re.sub('&\#[0-9]+;', ' ', data)
-		soup = bs.BeautifulStoneSoup(d2)
+		soup = None
+		try:
+			soup = bs.BeautifulStoneSoup(d2)
+		except:
+			logging.error("Failed to decode: <%s>" % d2)
+			raise FailedToDownload("Error downloading Story: %s!  Problem decoding page!" % self.url)
+
 		allA = soup.findAll('a')
 		for a in allA:
 			if 'href' in a._getAttrMap() and a['href'].find('/u/') != -1:
@@ -264,7 +277,15 @@ class FFNet(FanfictionSiteAdapter):
 	
 	def getText(self, url):
 		time.sleep( 2.0 )
-		data = self.fetchUrl(url)
+		data = None	# None (not '') marks a failed fetch so the 'is None' check below can fire
+		try:
+			data = self.fetchUrl(url)
+		except Exception, e:
+			data = None
+			logging.error("Caught an exception reading URL " + url + ".  Exception " + str(e) + ".")
+		if data is None:
+			raise FailedToDownload("Error downloading Chapter: %s!  Problem getting page!" % url)
+		
 		lines = data.split('\n')
 		
 		textbuf = ''
@@ -276,16 +297,15 @@ class FFNet(FanfictionSiteAdapter):
 		except:
 			data = olddata
 		
+		soup = None
 		try:
 			soup = bs.BeautifulStoneSoup(data)
 		except:
-			logging.info("Failed to decode: <%s>" % data)
-			soup = None
+			raise FailedToDownload("Error downloading Chapter: %s!  Problem decoding page!" % url)
+
 		div = soup.find('div', {'id' : 'storytext'})
 		if None == div:
-			logging.error("Error downloading Chapter: %s" % url)
-			exit (20)
-			return '<html/>'
+			raise FailedToDownload("Error downloading Chapter: %s!  Missing required element!" % url)
 			
 		return div.__str__('utf8')
 					
diff --git a/fictionalley.py b/fictionalley.py
index fbbe95ee..31f43b5d 100644
--- a/fictionalley.py
+++ b/fictionalley.py
@@ -124,25 +124,36 @@ class FictionAlley(FanfictionSiteAdapter):
 	
 		
 	def extractIndividualUrls(self):
-		data = self.opener.open(self.url).read()		
+		data = None	# None (not '') marks a failed fetch so the 'is None' check below can fire
+		try:
+			data = self.opener.open(self.url).read()		
+		except Exception, e:
+			data = None
+			logging.error("Caught an exception reading URL " + self.url + ".  Exception " + str(e) + ".")
+		if data is None:
+			raise StoryDoesNotExist("Problem reading story URL " + self.url + "!")
 		
 		# There is some usefull information in the headers of the first chapter page..
 		data = data.replace('<!-- headerstart -->','<crazytagstringnobodywouldstumbleonaccidently id="storyheaders">').replace('<!-- headerend -->','</crazytagstringnobodywouldstumbleonaccidently>')
-		soup = bs.BeautifulStoneSoup(data)
+		soup = None
+		try:
+			soup = bs.BeautifulStoneSoup(data)
+		except:
+			raise FailedToDownload("Error downloading Story: %s!  Problem decoding page!" % self.url)
 				
 		breadcrumbs = soup.find('div', {'class': 'breadcrumbs'})
 		if breadcrumbs is not None:
 			# Be aware that this means that the user has entered the {STORY}01.html 
 			# We will not have valid Publised and Updated dates.  User should enter 
 			# the {STORY}.html instead.  We should force that instead of this.
-			logging.debug('breadcrumbs=%s' % breadcrumbs )
+			#logging.debug('breadcrumbs=%s' % breadcrumbs )
 			bcas = breadcrumbs.findAll('a')
-			logging.debug('bcas=%s' % bcas )
+			#logging.debug('bcas=%s' % bcas )
 			if bcas is not None and len(bcas) > 1:
 				bca = bcas[1]
-				logging.debug('bca=%s' % bca )
+				#logging.debug('bca=%s' % bca )
 				if 'href' in bca._getAttrMap():
-					logging.debug('bca.href=%s' % bca['href'] )
+					#logging.debug('bca.href=%s' % bca['href'] )
 					url = str(bca['href'])
 					if url is not None and len(url) > 0:
 						self.url = url
@@ -244,7 +255,15 @@ class FictionAlley(FanfictionSiteAdapter):
 	
 	def getText(self, url):
 		# fictionalley uses full URLs in chapter list.
-		data = self.opener.open(url).read()
+		data = None	# None (not '') marks a failed fetch so the 'is None' check below can fire
+		try:
+			data = self.opener.open(url).read()
+		except Exception, e:
+			data = None
+			logging.error("Caught an exception reading URL " + url + ".  Exception " + str(e) + ".")
+		if data is None:
+			raise FailedToDownload("Error downloading Chapter: %s!  Problem getting page!" % url)
+		
 		
 		# find <!-- headerend --> & <!-- footerstart --> and
 		# replaced with matching div pair for easier parsing.
@@ -252,13 +271,17 @@ class FictionAlley(FanfictionSiteAdapter):
 		# something other than div prevents soup from pairing
 		# our div with poor html inside the story text.
 		data = data.replace('<!-- headerend -->','<crazytagstringnobodywouldstumbleonaccidently id="storytext">').replace('<!-- footerstart -->','</crazytagstringnobodywouldstumbleonaccidently>')
-		soup = bs.BeautifulStoneSoup(data)
+		
+		soup = None
+		try:
+			soup = bs.BeautifulStoneSoup(data)
+		except:
+			logging.info("Failed to decode: <%s>" % data)
+			raise FailedToDownload("Error downloading Chapter: %s!  Problem decoding page!" % url)
 		
 		div = soup.find('crazytagstringnobodywouldstumbleonaccidently', {'id' : 'storytext'})
 		if None == div:
-			logging.error("Error downloading Chapter: %s" % url)
-			exit(20)
-			return '<html/>'
+			raise FailedToDownload("Error downloading Chapter: %s!  Missing required element!" % url)
 
 		html = soup.findAll('html')
 		if len(html) > 1:
diff --git a/ficwad.py b/ficwad.py
index 7e9f3ae8..a2aab789 100644
--- a/ficwad.py
+++ b/ficwad.py
@@ -57,9 +57,21 @@ class FicWad(FanfictionSiteAdapter):
 
 	def extractIndividualUrls(self):
 		oldurl = ''
-		
-		data = u2.urlopen(self.url).read()
-		soup = bs.BeautifulStoneSoup(data)
+		cururl = self.url
+		data = None	# None (not '') marks a failed fetch so the 'is None' check below can fire
+		try:
+			data = u2.urlopen(self.url).read()
+		except Exception, e:
+			data = None
+			logging.error("Caught an exception reading URL " + self.url + ".  Exception " + str(e) + ".")
+		if data is None:
+			raise StoryDoesNotExist("Problem reading story URL " + self.url + "!")
+
+		soup = None
+		try:
+			soup = bs.BeautifulStoneSoup(data)
+		except:
+			raise FailedToDownload("Error downloading Story: %s!  Problem decoding page!" % self.url)
 		
 		story = soup.find('div', {'id' : 'story'})
 		crumbtrail = story.find('h3') # the only h3 ficwad uses.
@@ -100,7 +112,7 @@ class FicWad(FanfictionSiteAdapter):
 		meta = soup.find('p', {'class' : 'meta'})
 		if meta is not None:
 			s = str(meta).replace('\n',' ').replace('\t','').split(' - ')
-			logging.debug('meta.s=%s' % s)
+			#logging.debug('meta.s=%s' % s)
 			for ss in s:
 				s1 = ss.replace('&nbsp;','').split(':')
 				#logging.debug('meta.s.s1=%s' % s1)
@@ -164,11 +176,18 @@ class FicWad(FanfictionSiteAdapter):
 		ii = 1
 
 		if oldurl is not None and len(oldurl) > 0:
+			logging.debug('Switching back to %s' % oldurl)
+			cururl = oldurl
 			data = u2.urlopen(oldurl).read()
 			soup = bs.BeautifulStoneSoup(data)
 			
 		storylist = soup.find('ul', {'id' : 'storylist'})
 		if storylist is not None:
+			allBlocked = storylist.findAll('li', {'class' : 'blocked'})
+			if allBlocked is not None and len(allBlocked) > 0:	# findAll returns a (possibly empty) list, never None
+				#logging.debug('allBlocked=%s' % allBlocked)
+				raise LoginRequiredException(cururl)
+
 			allH4s = storylist.findAll('h4')
 			#logging.debug('allH4s=%s' % allH4s)
 	
@@ -216,14 +235,25 @@ class FicWad(FanfictionSiteAdapter):
 		if url.find('http://') == -1:
 			url = 'http://' + self.host + '/' + url
 		
-		data = u2.urlopen(url).read()
+		data = None	# None (not '') marks a failed fetch so the 'is None' check below can fire
+		try:
+			data = u2.urlopen(url).read()
+		except Exception, e:
+			data = None
+			logging.error("Caught an exception reading URL " + url + ".  Exception " + str(e) + ".")
+		if data is None:
+			raise FailedToDownload("Error downloading Chapter: %s!  Problem getting page!" % url)
+		
+		try:
+			soup = bs.BeautifulStoneSoup(data)
+		except:
+			logging.info("Failed to decode: <%s>" % data)
+			raise FailedToDownload("Error downloading Chapter: %s!  Problem decoding page!" % url)
 		
-		soup = bs.BeautifulStoneSoup(data)
 		div = soup.find('div', {'id' : 'storytext'})
 		if None == div:
-			logging.error("Error downloading Chapter: %s" % url)
-			exit(20)
-			return '<html/>'
+			raise FailedToDownload("Error downloading Chapter: %s!  Missing required element!" % url)
+
 		return div.__str__('utf8')
 	
 		
diff --git a/fpcom.py b/fpcom.py
index b9431322..3598c2ec 100644
--- a/fpcom.py
+++ b/fpcom.py
@@ -65,8 +65,7 @@ class FPCom(FanfictionSiteAdapter):
 		spl = self.path.split('/')
 		if spl is not None:
 			if len(spl) > 0 and spl[0] != 's':
-				logging.error("Error URL \"%s\" is not a story." % self.url)
-				exit (20)				
+				raise InvalidStoryURL("Error URL \"%s\" is not a story." % self.url)
 			if len(spl) > 1:
 				self.storyId = spl[1]
 			if len(spl) > 2:
@@ -138,9 +137,23 @@ class FPCom(FanfictionSiteAdapter):
 		return True
 	
 	def extractIndividualUrls(self):
-		data = self.fetchUrl(self.url)
+		data = None	# None (not '') marks a failed fetch so the 'is None' check below can fire
+		try:
+			data = self.fetchUrl(self.url)
+		except Exception, e:
+			data = None
+			logging.error("Caught an exception reading URL " + self.url + ".  Exception " + str(e) + ".")
+		if data is None:
+			raise StoryDoesNotExist("Problem reading story URL " + self.url + "!")
+		
 		d2 = re.sub('&\#[0-9]+;', ' ', data)
-		soup = bs.BeautifulStoneSoup(d2)
+		soup = None
+		try:
+			soup = bs.BeautifulStoneSoup(d2)
+		except:
+			logging.error("Failed to decode: <%s>" % d2)
+			raise FailedToDownload("Error downloading Story: %s!  Problem decoding page!" % self.url)
+
 		allA = soup.findAll('a')
 		for a in allA:
 			if 'href' in a._getAttrMap() and a['href'].find('/u/') != -1:
@@ -277,7 +290,15 @@ class FPCom(FanfictionSiteAdapter):
 	
 	def getText(self, url):
 		time.sleep( 2.0 )
-		data = self.fetchUrl(url)
+		data = None	# None (not '') marks a failed fetch so the 'is None' check below can fire
+		try:
+			data = self.fetchUrl(url)
+		except Exception, e:
+			data = None
+			logging.error("Caught an exception reading URL " + url + ".  Exception " + str(e) + ".")
+		if data is None:
+			raise FailedToDownload("Error downloading Chapter: %s!  Problem getting page!" % url)
+		
 		lines = data.split('\n')
 		
 		textbuf = ''
@@ -289,16 +310,16 @@ class FPCom(FanfictionSiteAdapter):
 		except:
 			data = olddata
 		
+		soup = None
 		try:
 			soup = bs.BeautifulStoneSoup(data)
 		except:
 			logging.info("Failed to decode: <%s>" % data)
-			soup = None
+			raise FailedToDownload("Error downloading Chapter: %s!  Problem decoding page!" % url)
+
 		div = soup.find('div', {'id' : 'storytext'})
 		if None == div:
-			logging.error("Error downloading Chapter: %s" % url)
-			exit (20)
-			return '<html/>'
+			raise FailedToDownload("Error downloading Chapter: %s!  Missing required element!" % url)
 			
 		return div.__str__('utf8')
 					
diff --git a/hpfiction.py b/hpfiction.py
index 38509391..b2116efe 100644
--- a/hpfiction.py
+++ b/hpfiction.py
@@ -84,10 +84,21 @@ class HPFiction(FanfictionSiteAdapter):
 		return self.path
 	
 	def extractIndividualUrls(self):
+		data = None	# None (not '') marks a failed fetch so the 'is None' check below can fire
+		try:
+			data = self.opener.open(self.url).read()
+		except Exception, e:
+			data = None
+			logging.error("Caught an exception reading URL " + self.url + ".  Exception " + str(e) + ".")
+		if data is None:
+			raise StoryDoesNotExist("Problem reading story URL " + self.url + "!")
 		
-		data = self.opener.open(self.url).read()
-		soup = bs.BeautifulSoup(data)
-		
+		soup = None
+		try:
+			soup = bs.BeautifulSoup(data)
+		except:
+			raise FailedToDownload("Error downloading Story: %s!  Problem decoding page!" % self.url)
+				
 		links = soup.findAll('a')
 		def_chapurl = ''
 		def_chaptitle = ''
@@ -220,12 +231,26 @@ class HPFiction(FanfictionSiteAdapter):
 
 	def getText(self, url):
 		logging.debug('Downloading from URL: %s' % url)
-		data = self.opener.open(url).read()
-		soup = bs.BeautifulSoup(data)
+		data = None	# None (not '') marks a failed fetch so the 'is None' check below can fire
+		try:
+			data = self.opener.open(url).read()
+		except Exception, e:
+			data = None	# fetch failed: logged here, reported to the caller as FailedToDownload below
+			logging.error("Caught an exception reading URL " + url + ".  Exception " + str(e) + ".")
+		if data is None:
+			raise FailedToDownload("Error downloading Chapter: %s!  Problem getting page!" % url)
+		
+		soup = None
+		try:
+			soup = bs.BeautifulSoup(data)
+		except:
+			logging.info("Failed to decode: <%s>" % data)
+			raise FailedToDownload("Error downloading Chapter: %s!  Problem decoding page!" % url)
+		
 		divtext = soup.find('div', {'id' : 'fluidtext'})
 		if None == divtext:
-			logging.error("Error downloading Chapter: %s" % url)
-			exit(20)
+			raise FailedToDownload("Error downloading Chapter: %s!  Missing required element!" % url)	# chapter text lives in div#fluidtext
+
 		return divtext.__str__('utf8')
 
 
diff --git a/mediaminer.py b/mediaminer.py
index e8389abc..2b790f45 100644
--- a/mediaminer.py
+++ b/mediaminer.py
@@ -81,7 +81,9 @@ class MediaMiner(FanfictionSiteAdapter):
 				self.storyId = ss[-2].strip()
 				self.path = '/fanfic/view_st.php/' + self.storyId
 				self.url = 'http://' + self.host + self.path
-				logging.debug('self.url=%s' % self.url)			
+				logging.debug('self.url=%s' % self.url)
+		else:			
+			raise InvalidStoryURL("Error URL \"%s\" is not a story." % self.url)
 			
 		logging.debug('self.storyId=%s' % self.storyId)
 		
@@ -144,9 +146,23 @@ class MediaMiner(FanfictionSiteAdapter):
 		return True
 
 	def extractIndividualUrls(self):
-		data = self.fetchUrl(self.url)
+		data = None
+		try:
+			data = self.fetchUrl(self.url)
+		except Exception, e:
+			data = None
+			logging.error("Caught an exception reading URL " + self.url + ".  Exception " + str(e) + ".")
+		if data is None:
+			raise StoryDoesNotExist("Problem reading story URL " + self.url + "!")
+		
 		#data.replace('<br />',' ').replace('<br>',' ').replace('</br>',' ')
-		soup = bs.BeautifulSoup(data)
+		soup = None
+		try:
+			soup = bs.BeautifulSoup(data)
+		except:
+			logging.error("Failed to decode: <%s>" % data)
+			raise FailedToDownload("Error downloading Story: %s!  Problem decoding page!" % self.url)
+
 		#logging.debug('soap=%s' % soup)
 		urls = []
 		
@@ -175,7 +191,7 @@ class MediaMiner(FanfictionSiteAdapter):
 			for ii in range(ll):
 				td = td_smtxt[ii]
 				if 'class' in td._getAttrMap() and td['class'] != 'smtxt':
-					logging.debug('td has class attribute but is not smtxt')
+					#logging.debug('td has class attribute but is not smtxt')
 					continue
 				ss = str(td).replace('\n','').replace('\r','').replace('&nbsp;', ' ')
 				#logging.debug('ss=%s' % ss)
@@ -309,31 +325,28 @@ class MediaMiner(FanfictionSiteAdapter):
 			
 		self.numChapters = str(numchapters)
 		logging.debug('self.numChapters=%s' % self.numChapters)
-		logging.debug('urls=%s' % urls)
+		#logging.debug('urls=%s' % urls)
 		
 		return urls
 	
 	def getText(self, url):
 		time.sleep( 2.0 )
 		logging.debug('url=%s' % url)
-		data = self.fetchUrl(url)
-
+		data = None	# None (not '') marks a failed fetch so the 'is None' check below can fire
+		try:
+			data = self.fetchUrl(url)
+		except Exception, e:
+			data = None
+			logging.error("Caught an exception reading URL " + url + ".  Exception " + str(e) + ".")
+		if data is None:
+			raise FailedToDownload("Error downloading Chapter: %s!  Problem getting page!" % url)
+		
+		soup = None
 		try:
 			soup = bs.BeautifulSoup(data)
 		except:
-			logging.info("Failed to decode: <%s>" % data)
-			soup = None
-			exit(20)
-			return '<html/>'
+			raise FailedToDownload("Error downloading Chapter: %s!  Problem decoding page!" % url)
 		
-		#div = soup.find('div', {'id' : 'storytext'})
-		#if div is None:
-			#logging.error("Error downloading Chapter: %s" % url)
-			#exit (20)
-			#return '<html/>'
-			
-		#logging.info("Soup: %s" % soup.prettify())
-
 		nvs = bs.NavigableString('')
 		sst=''
 		allAs = soup.findAll ('a', { 'name' : 'fic_c' })
@@ -368,16 +381,9 @@ class MediaMiner(FanfictionSiteAdapter):
 				sst = sst + st
 				nxta = nxta.nextSibling
 
-		#sst = sst.replace('&nbsp;',' ').strip()
-		#logging.debug('sst=%s' % sst)
+		if sst is None:	
+			raise FailedToDownload("Error downloading Chapter: %s!  Missing required element!" % url)
 		
-		#logging.debug('sst.0=%s' % sst)
-		#sst0 = sst.replace(u'&#8820;', u'&ldquo;').replace(u'&#8821;','&rdquo;').replace(u'&#8816;',u'&lsquo;').replace(u'&#8817;',u'&rsquo;')
-		#sst0 = sst.replace(u"&#8821;","&rdquo;")
-		#logging.debug('sst.1=%s' % sst0)
-		#sst1 = sst.replace(u'&#8820;', u'\"').replace('&#8821;','\"').replace('&#8816;','\'').replace('&#8817;','\'')
-		#logging.debug('sst.2=%s' % sst1)
-					
 		return sst
 			
 class FPC_UnitTests(unittest.TestCase):
diff --git a/output.py b/output.py
index a320a42e..64a64d0c 100644
--- a/output.py
+++ b/output.py
@@ -40,9 +40,25 @@ class FanficWriter:
 	def finalise(self):
 		pass
 
+	@staticmethod
+	def getFormatName():
+		return 'base'
+	
+	@staticmethod	
+	def getFormatExt():
+		return '.bse'
+	
 class TextWriter(FanficWriter):
 	htmlWriter = None
 	
+	@staticmethod
+	def getFormatName():
+		return 'text'
+	
+	@staticmethod	
+	def getFormatExt():
+		return '.txt'
+	
 	def __init__(self, base, adapter, inmemory=False, compress=False):
 		self.htmlWriter = HTMLWriter(base, adapter, True, False)
 	
@@ -59,11 +75,19 @@ class TextWriter(FanficWriter):
 class HTMLWriter(FanficWriter):
 	body = ''
 	
+	@staticmethod
+	def getFormatName():
+		return 'html'
+	
+	@staticmethod	
+	def getFormatExt():
+		return '.html'
+	
 	def __init__(self, base, adapter, inmemory=False, compress=False):
 		self.basePath = base
 		self.storyTitle = removeEntities(adapter.getStoryName())
 		self.name = makeAcceptableFilename(adapter.getOutputName())
-		self.fileName = self.basePath + '/' + self.name + '.html'
+		self.fileName = self.basePath + '/' + self.name + self.getFormatExt()
 		self.authorName = removeEntities(adapter.getAuthorName())
 		self.adapter = adapter
 		
@@ -111,6 +135,45 @@ class EPubFanficWriter(FanficWriter):
 	
 	files = {}
 	
+	@staticmethod
+	def getFormatName():
+		return 'epub'
+	
+	@staticmethod	
+	def getFormatExt():
+		return '.epub'
+	
+	def __init__(self, base, adapter, inmemory=False, compress=True):
+		self.basePath = base
+		self.storyTitle = removeEntities(adapter.getStoryName())
+		self.name = makeAcceptableFilename(adapter.getOutputName())
+		self.directory = self.basePath + '/' + self.name
+		self.authorName = removeEntities(adapter.getAuthorName())
+		self.inmemory = inmemory
+		self.adapter = adapter
+		
+		self.files = {}
+		self.chapters = []
+		
+		if not self.inmemory:
+			self.inmemory = True
+			self.writeToFile = True
+		else:
+			self.writeToFile = False
+
+		if not self.inmemory:
+			if os.path.exists(self.directory):
+				shutil.rmtree(self.directory)
+		
+			os.mkdir(self.directory)
+		
+			os.mkdir(self.directory + '/META-INF')
+			os.mkdir(self.directory + '/OEBPS')
+		
+		self._writeFile('mimetype', MIMETYPE)
+		self._writeFile('META-INF/container.xml', CONTAINER)
+		self._writeFile('OEBPS/stylesheet.css', CSS)
+
 	def _writeFile(self, fileName, data):
 		#logging.debug('_writeFile(`%s`, data)' % fileName)
 		if fileName in self.files:
@@ -134,39 +197,6 @@ class EPubFanficWriter(FanficWriter):
 			for f in self.files:
 				self.files[f].close()
 	
-	def __init__(self, base, adapter, inmemory=False, compress=True):
-		self.basePath = base
-		self.storyTitle = removeEntities(adapter.getStoryName())
-		self.name = makeAcceptableFilename(adapter.getOutputName())
-		self.directory = self.basePath + '/' + self.name
-		self.authorName = removeEntities(adapter.getAuthorName())
-		self.inmemory = inmemory
-		self.adapter = adapter
-		
-		self.files = {}
-		self.chapters = []
-		
-		if not self.inmemory:
-			self.inmemory = True
-			self.writeToFile = True
-		else:
-			self.writeToFile = False
-		
-
-
-		if not self.inmemory:
-			if os.path.exists(self.directory):
-				shutil.rmtree(self.directory)
-		
-			os.mkdir(self.directory)
-		
-			os.mkdir(self.directory + '/META-INF')
-			os.mkdir(self.directory + '/OEBPS')
-		
-		self._writeFile('mimetype', MIMETYPE)
-		self._writeFile('META-INF/container.xml', CONTAINER)
-		self._writeFile('OEBPS/stylesheet.css', CSS)
-
 	def writeChapter(self, index, title, text):
 		title = removeEntities(title)
 		logging.debug("Writing chapter: %s" % title)
@@ -321,7 +351,7 @@ class EPubFanficWriter(FanficWriter):
 		
 		self._closeFiles()
 		
-		filename = self.directory + '.epub'
+		filename = self.directory + self.getFormatExt()
 		
 		zipdata = zipdir.inMemoryZip(self.files)
 		
@@ -382,4 +412,4 @@ def removeEntities(text):
 	return text
 	
 def makeAcceptableFilename(text):
-	return re.sub('[^a-zA-Z0-9_\'-]+','',removeEntities(text).replace(" ", "_").replace(":","_"))	
+	return re.sub('[^a-zA-Z0-9_-]+','',removeEntities(text).replace(" ", "_").replace(":","_"))	
diff --git a/potionsNsnitches.py b/potionsNsnitches.py
index 3868e934..d0c3fa53 100644
--- a/potionsNsnitches.py
+++ b/potionsNsnitches.py
@@ -130,15 +130,35 @@ class PotionsNSnitches(FanfictionSiteAdapter):
 
     def extractIndividualUrls(self):
         url = self.url + '&chapter=1'
-        data = self.opener.open(url).read()
+        data = None  # None (not '') marks a failed fetch so the 'is None' check below can fire
+        try:
+            data = self.opener.open(url).read()
+        except Exception, e:
+            data = None
+            logging.error("Caught an exception reading URL " + url + ".  Exception " + str(e) + ".")
+        if data is None:
+            raise StoryDoesNotExist("Problem reading story URL " + url + "!")
         
         if self.reqLoginData(data):
-          self.performLogin()
-          data = self.opener.open(url).read()
-          if self.reqLoginData(data):
-            return None
+            self.performLogin()
+            
+            data = None  # None (not '') marks a failed re-fetch after login so the check below can fire
+            try:
+                data = self.opener.open(url).read()
+            except Exception, e:
+                data = None
+                logging.error("Caught an exception reading URL " + url + ".  Exception " + str(e) + ".")
+            if data is None:
+                raise StoryDoesNotExist("Problem reading story URL " + url + "!")
         
-        soup = bs.BeautifulStoneSoup(data)
+            if self.reqLoginData(data):
+                raise FailedToDownload("Error downloading Story: %s!  Login Failed!" % url)    
+        
+        soup = None
+        try:
+            soup = bs.BeautifulStoneSoup(data)
+        except:
+            raise FailedToDownload("Error downloading Story: %s!  Problem decoding page!" % url)    
 
         self.storyName = ''
         self.authorName = ''
@@ -302,16 +322,29 @@ class PotionsNSnitches(FanfictionSiteAdapter):
     
         logging.debug('Getting data from: %s' % url)
     
-        data = self.opener.open(url).read()
+        data = None  # None (not '') marks a failed fetch so the 'is None' check below can fire
+        try:
+            data = self.opener.open(url).read()
+        except Exception, e:
+            data = None
+            logging.error("Caught an exception reading URL " + url + ".  Exception " + str(e) + ".")
+        if data is None:
+            raise FailedToDownload("Error downloading Chapter: %s!  Problem getting page!" % url)
         
         # need to do this, because for some reason the <br /> tag in the story causes problems
         data = data.replace('<br />', ' SOMETHING_BR ')
-        soup = bs.BeautifulStoneSoup(data, convertEntities=bs.BeautifulStoneSoup.HTML_ENTITIES)
-    
+
+        soup = None
+        try:
+            soup = bs.BeautifulStoneSoup(data, convertEntities=bs.BeautifulStoneSoup.HTML_ENTITIES)
+        except:
+            logging.info("Failed to decode: <%s>" % data)
+            raise FailedToDownload("Error downloading Chapter: %s!  Problem decoding page!" % url)
+        
         div = soup.find('div', {'id' : 'story'})
     
         if None == div:
-          return '<html/>'
+            raise FailedToDownload("Error downloading Chapter: %s!  Missing required element!" % url)
 
         # put the <br /> tags back in..
         text = div.__str__('utf8').replace(' SOMETHING_BR ','<br />')    
diff --git a/twilighted.py b/twilighted.py
index ed293406..00f59364 100644
--- a/twilighted.py
+++ b/twilighted.py
@@ -110,15 +110,36 @@ class Twilighted(FanfictionSiteAdapter):
 
     def extractIndividualUrls(self):
         url = self.url + '&chapter=1'
-        data = self.opener.open(url).read()
+
+        data = None  # None (not '') marks a failed fetch so the 'is None' check below can fire
+        try:
+            data = self.opener.open(url).read()
+        except Exception, e:
+            data = None
+            logging.error("Caught an exception reading URL " + url + ".  Exception " + str(e) + ".")
+        if data is None:
+            raise StoryDoesNotExist("Problem reading story URL " + url + "!")
         
         if self.reqLoginData(data):
-          self.performLogin()
-          data = self.opener.open(url).read()
-          if self.reqLoginData(data):
-            return None
+            self.performLogin()
+
+            data = None  # None (not '') marks a failed re-fetch after login so the check below can fire
+            try:
+                data = self.opener.open(url).read()
+            except Exception, e:
+                data = None
+                logging.error("Caught an exception reading URL " + url + ".  Exception " + str(e) + ".")
+            if data is None:
+                raise StoryDoesNotExist("Problem reading story URL " + url + "!")
         
-        soup = bs.BeautifulStoneSoup(data)
+            if self.reqLoginData(data):
+                raise FailedToDownload("Error downloading Story: %s!  Login Failed!" % url)    
+        
+        soup = None
+        try:
+            soup = bs.BeautifulStoneSoup(data)
+        except:
+            raise FailedToDownload("Error downloading Story: %s!  Problem decoding page!" % url)    
 
         title = soup.find('title').string
         logging.debug('Title: %s' % title)
@@ -254,14 +275,26 @@ class Twilighted(FanfictionSiteAdapter):
     
         logging.debug('Getting data from: %s' % url)
     
-        data = self.opener.open(url).read()
+        data = None  # None (not '') marks a failed fetch so the 'is None' check below can fire
+        try:
+            data = self.opener.open(url).read()
+        except Exception, e:
+            data = None
+            logging.error("Caught an exception reading URL " + url + ".  Exception " + str(e) + ".")
+        if data is None:
+            raise FailedToDownload("Error downloading Chapter: %s!  Problem getting page!" % url)
+                
+        soup = None
+        try:
+            soup = bs.BeautifulStoneSoup(data, convertEntities=bs.BeautifulStoneSoup.HTML_ENTITIES)
+        except:
+            logging.info("Failed to decode: <%s>" % data)
+            raise FailedToDownload("Error downloading Chapter: %s!  Problem decoding page!" % url)
         
-        soup = bs.BeautifulStoneSoup(data, convertEntities=bs.BeautifulStoneSoup.HTML_ENTITIES)
-    
         div = soup.find('div', {'id' : 'story'})
     
         if None == div:
-          return '<html/>'
+            raise FailedToDownload("Error downloading Chapter: %s!  Missing required element!" % url)
     
         return div.__str__('utf8')
 
diff --git a/zipdir.py b/zipdir.py
index 597b4f8c..6079e083 100644
--- a/zipdir.py
+++ b/zipdir.py
@@ -1,11 +1,79 @@
 # -*- coding: utf-8 -*-
 
+import sys
 import os
+import zlib
 import zipfile
+from zipfile import ZipFile, ZIP_STORED, ZIP_DEFLATED
+from contextlib import closing
 import logging
 
+import BeautifulSoup as bs
+import htmlentitydefs as hdefs
+import time
+import datetime
+from datetime import timedelta
+
 import StringIO
 
+class InvalidEPub(Exception):
+    pass
+
+def checkNewer(filename, curdte):
+	"""Return True if the EPUB at filename needs regenerating as of curdte.
+
+	Returns True when the file is missing, lacks the EPUB marker entries or
+	content.opf, or records no update date.  Returns False only when the
+	recorded update date is on or after curdte (compared as %Y-%m-%d days).
+	"""
+	ret = True
+
+	if not os.path.isfile(filename):
+		logging.debug('File %s does not already exist.' % filename)
+		return ret
+
+	lastdate = None
+	# Give ZipFile the path so that closing() also releases the file handle.
+	with closing(ZipFile(filename, 'r')) as epub:
+		titleFilePath = "OEBPS/title_page.xhtml"
+		contentFilePath = "OEBPS/content.opf"
+		namelist = set(epub.namelist())
+		if 'mimetype' not in namelist or \
+		   'META-INF/container.xml' not in namelist:
+			logging.debug('File %s is not a valid EPub format file.' % filename)
+			return ret
+
+		if contentFilePath not in namelist:
+			return ret	# no metadata to compare against, so regenerate
+
+		data = epub.read(contentFilePath)
+		soup = bs.BeautifulStoneSoup(data)
+		lstdte = soup.find ('dc:date', {'opf:event' : 'modification'})
+		if lstdte is not None and lstdte.string is not None:
+			lastdate = lstdte.string.strip(' ')
+		elif lstdte is None and titleFilePath in namelist:
+			# Fall back to the "Updated:" row of the title page table.
+			data = epub.read(titleFilePath)
+			soup = bs.BeautifulStoneSoup(data)
+			fld = ''
+			for td in soup.findAll ('td'):
+				b = td.find ('b')
+				if b is not None:
+					fld = b.string
+				if td.string is not None and fld == "Updated:":
+					lastdate = td.string
+
+	if lastdate is not None:
+		currUpdated = datetime.datetime.fromtimestamp(time.mktime(time.strptime(curdte.strftime('%Y-%m-%d'), "%Y-%m-%d")))
+		storyUpdated = datetime.datetime.fromtimestamp(time.mktime(time.strptime(lastdate, "%Y-%m-%d")))
+		logging.debug('File %s last update date is %s, comparing to %s' % (filename, storyUpdated, currUpdated))
+		if currUpdated <= storyUpdated :
+			ret = False
+
+	logging.debug("Does %s need to be updated? %s" % (filename, ret))
+	return ret
+
+
 def toZip(filename, directory):
 	zippedHelp = zipfile.ZipFile(filename, "w", compression=zipfile.ZIP_DEFLATED)
 	lst = os.listdir(directory)

From 26f6ddabd9674d949d3782f9c18c476a54774a53 Mon Sep 17 00:00:00 2001
From: wsuetholz <wsuetholz@localhost>
Date: Thu, 18 Nov 2010 20:08:55 -0600
Subject: [PATCH 73/94] The with statement is not automatic in Python 2.5, you
 need to import with_statement for it to work. The from __future__ import
 with_statement needs to be the first import statement as well.

---
 zipdir.py | 2 ++
 1 file changed, 2 insertions(+)

diff --git a/zipdir.py b/zipdir.py
index 6079e083..eb50c961 100644
--- a/zipdir.py
+++ b/zipdir.py
@@ -1,5 +1,7 @@
 # -*- coding: utf-8 -*-
 
+from __future__ import with_statement
+
 import sys
 import os
 import zlib

From df6b85b7238d642107af508e12a5dbaee920133b Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Thu, 18 Nov 2010 23:34:25 -0600
Subject: [PATCH 74/94] Fix desc escaping.  <sigh>

---
 output.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/output.py b/output.py
index 64a64d0c..3f4189d5 100644
--- a/output.py
+++ b/output.py
@@ -273,7 +273,7 @@ class EPubFanficWriter(FanficWriter):
 		else:
 			description = str(description)
 		if description is not None and len(description) > 0:
-			description = description.replace ('\\', '\'').replace('\\\"', '\"')
+			description = description.replace ('\\\'', '\'').replace('\\\"', '\"')
 			description =  removeEntities(description)
 		else:
 			description = ' '

From f584b3f1e8320bacc5358a0b55ff89c92d1212f4 Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Sun, 21 Nov 2010 11:52:11 -0600
Subject: [PATCH 75/94] Change calls for str() to unicode().  Default CL type
 to epub if not given.

---
 downloader.py       |  3 ++-
 ffnet.py            | 10 +++++-----
 fictionalley.py     | 12 ++++++------
 ficwad.py           | 12 ++++++------
 fpcom.py            | 10 +++++-----
 hpfiction.py        |  8 ++++----
 mediaminer.py       | 16 ++++++++--------
 output.py           |  6 +++---
 potionsNsnitches.py | 20 ++++++++++----------
 twilighted.py       |  6 +++---
 10 files changed, 52 insertions(+), 51 deletions(-)

diff --git a/downloader.py b/downloader.py
index 3dfd7fc0..cb4ca7d4 100644
--- a/downloader.py
+++ b/downloader.py
@@ -109,6 +109,7 @@ if __name__ == '__main__':
 	logging.basicConfig(level=logging.DEBUG)
 	argvlen = len(sys.argv)
 	url = None
+	bookFormat = 'epub'
 	if argvlen > 1:
 		url = sys.argv[1]
 	if argvlen > 2:
@@ -121,7 +122,7 @@ if __name__ == '__main__':
 	if type(url) is unicode:
 		print('URL is unicode')
 		url = url.encode('latin1')
-	
+	url = url.strip()
 	adapter = None
 	writerClass = None
 	
diff --git a/ffnet.py b/ffnet.py
index a6fee2dc..3963d529 100644
--- a/ffnet.py
+++ b/ffnet.py
@@ -154,7 +154,7 @@ class FFNet(FanfictionSiteAdapter):
 			data = self.fetchUrl(self.url)
 		except Exception, e:
 			data = ''
-			logging.error("Caught an exception reading URL " + self.url + ".  Exception " + str(e) + ".")
+			logging.error("Caught an exception reading URL " + self.url + ".  Exception " + unicode(e) + ".")
 		if data is None:
 			raise StoryDoesNotExist("Problem reading story URL " + self.url + "!")
 		
@@ -178,16 +178,16 @@ class FFNet(FanfictionSiteAdapter):
 		for l in lines:
 			if l.find("&#187;") != -1 and l.find('<b>') != -1:
 				s2 = bs.BeautifulStoneSoup(l)
-				self.storyName = str(s2.find('b').string)
+				self.storyName = unicode(s2.find('b').string)
 				logging.debug('self.storyId=%s, self.storyName=%s' % (self.storyId, self.storyName))
 			elif l.find("<a href='/u/") != -1:
 				s2 = bs.BeautifulStoneSoup(l)
-				self.authorName = str(s2.a.string)
+				self.authorName = unicode(s2.a.string)
 				(u1, u2, self.authorId, u3) = s2.a['href'].split('/')
 				logging.debug('self.authorId=%s, self.authorName=%s' % (self.authorId, self.authorName))
 			elif l.find("Rated: <a href=") != -1:
 				s2 = bs.BeautifulStoneSoup(l)
-				self.storyRating = str(s2.a.string).strip()
+				self.storyRating = unicode(s2.a.string).strip()
 				logging.debug('self.storyRating=%s' % self.storyRating)
 				logging.debug('s2.a=%s' % s2.a)
 				s3 = l.split('-')
@@ -282,7 +282,7 @@ class FFNet(FanfictionSiteAdapter):
 			data = self.fetchUrl(url)
 		except Exception, e:
 			data = ''
-			logging.error("Caught an exception reading URL " + url + ".  Exception " + str(e) + ".")
+			logging.error("Caught an exception reading URL " + url + ".  Exception " + unicode(e) + ".")
 		if data is None:
 			raise FailedToDownload("Error downloading Chapter: %s!  Problem getting page!" % url)
 		
diff --git a/fictionalley.py b/fictionalley.py
index 31f43b5d..332a08af 100644
--- a/fictionalley.py
+++ b/fictionalley.py
@@ -36,7 +36,7 @@ class FictionAlley(FanfictionSiteAdapter):
                   domain='www.fictionalley.org', domain_specified=False, domain_initial_dot=False,
                  path='/authors', path_specified=True,
                  secure=False,
-                 expires=time.time()+100,
+                 expires=time.time()+10000,
                  discard=False,
                  comment=None,
                  comment_url=None,
@@ -97,7 +97,7 @@ class FictionAlley(FanfictionSiteAdapter):
 			if len(br.contents) > 2:
 				keystr = br.contents[1]
 				if keystr is not None:
-					strs = re.split ("<[^>]+>", str(keystr))
+					strs = re.split ("<[^>]+>", unicode(keystr))
 					keystr=''
 					for s in strs:
 						keystr = keystr + s					
@@ -129,7 +129,7 @@ class FictionAlley(FanfictionSiteAdapter):
 			data = self.opener.open(self.url).read()		
 		except Exception, e:
 			data = ''
-			logging.error("Caught an exception reading URL " + self.url + ".  Exception " + str(e) + ".")
+			logging.error("Caught an exception reading URL " + self.url + ".  Exception " + unicode(e) + ".")
 		if data is None:
 			raise StoryDoesNotExist("Problem reading story URL " + self.url + "!")
 		
@@ -154,7 +154,7 @@ class FictionAlley(FanfictionSiteAdapter):
 				#logging.debug('bca=%s' % bca )
 				if 'href' in bca._getAttrMap():
 					#logging.debug('bca.href=%s' % bca['href'] )
-					url = str(bca['href'])
+					url = unicode(bca['href'])
 					if url is not None and len(url) > 0:
 						self.url = url
 						logging.debug('self.url=%s' % self.url )
@@ -207,7 +207,7 @@ class FictionAlley(FanfictionSiteAdapter):
 				if len(ss1) > 1 and ss1[0] == 'Rating':
 					self.storyRating = ss1[1]
 					logging.debug('self.storyRating=%s' % self.storyRating)
-				self.storyDescription = str(ss[1]).replace("<br>","").replace("</br>","").replace('\n','')
+				self.storyDescription = unicode(ss[1]).replace("<br>","").replace("</br>","").replace('\n','')
 				logging.debug('self.storyDescription=%s' % self.storyDescription)
 			
 			for li in links:
@@ -260,7 +260,7 @@ class FictionAlley(FanfictionSiteAdapter):
 			data = self.opener.open(url).read()
 		except Exception, e:
 			data = ''
-			logging.error("Caught an exception reading URL " + url + ".  Exception " + str(e) + ".")
+			logging.error("Caught an exception reading URL " + url + ".  Exception " + unicode(e) + ".")
 		if data is None:
 			raise FailedToDownload("Error downloading Chapter: %s!  Problem getting page!" % url)
 		
diff --git a/ficwad.py b/ficwad.py
index a2aab789..13e7a45d 100644
--- a/ficwad.py
+++ b/ficwad.py
@@ -63,7 +63,7 @@ class FicWad(FanfictionSiteAdapter):
 			data = u2.urlopen(self.url).read()
 		except Exception, e:
 			data = ''
-			logging.error("Caught an exception reading URL " + self.url + ".  Exception " + str(e) + ".")
+			logging.error("Caught an exception reading URL " + self.url + ".  Exception " + unicode(e) + ".")
 		if data is None:
 			raise StoryDoesNotExist("Problem reading story URL " + self.url + "!")
 
@@ -99,19 +99,19 @@ class FicWad(FanfictionSiteAdapter):
 		logging.debug('self.storyName=%s, self.storyId=%s' % (self.storyName, self.storyId))
 		
 		author = soup.find('span', {'class' : 'author'})
-		self.authorName = str(author.a.string)
+		self.authorName = unicode(author.a.string)
 		(u0, u1,self.authorId) = author.a['href'].split('/')
 		self.authorURL = 'http://' + self.host + author.a['href']
 		logging.debug('self.authorName=%s self.authorId=%s' % (self.authorName, self.authorId))
 		
 		description = soup.find('blockquote', {'class' : 'summary'})
 		if description is not None:
-			self.storyDescription = str(description.p.string)
+			self.storyDescription = unicode(description.p.string)
 		logging.debug('self.storyDescription=%s' % self.storyDescription)
 		
 		meta = soup.find('p', {'class' : 'meta'})
 		if meta is not None:
-			s = str(meta).replace('\n',' ').replace('\t','').split(' - ')
+			s = unicode(meta).replace('\n',' ').replace('\t','').split(' - ')
 			#logging.debug('meta.s=%s' % s)
 			for ss in s:
 				s1 = ss.replace('&nbsp;','').split(':')
@@ -128,7 +128,7 @@ class FicWad(FanfictionSiteAdapter):
 						allAs = soup1.findAll('a')
 						for a in allAs:
 							if self.category == 'Category':
-								self.category = str(a.string)
+								self.category = unicode(a.string)
 								logging.debug('self.category=%s' % self.category)
 							self.addSubject(self.category)
 						logging.debug('self.subjects=%s' % self.subjects)
@@ -240,7 +240,7 @@ class FicWad(FanfictionSiteAdapter):
 			data = u2.urlopen(url).read()
 		except Exception, e:
 			data = ''
-			logging.error("Caught an exception reading URL " + url + ".  Exception " + str(e) + ".")
+			logging.error("Caught an exception reading URL " + url + ".  Exception " + unicode(e) + ".")
 		if data is None:
 			raise FailedToDownload("Error downloading Chapter: %s!  Problem getting page!" % url)
 		
diff --git a/fpcom.py b/fpcom.py
index 3598c2ec..471c0b85 100644
--- a/fpcom.py
+++ b/fpcom.py
@@ -142,7 +142,7 @@ class FPCom(FanfictionSiteAdapter):
 			data = self.fetchUrl(self.url)
 		except Exception, e:
 			data = ''
-			logging.error("Caught an exception reading URL " + self.url + ".  Exception " + str(e) + ".")
+			logging.error("Caught an exception reading URL " + self.url + ".  Exception " + unicode(e) + ".")
 		if data is None:
 			raise StoryDoesNotExist("Problem reading story URL " + self.url + "!")
 		
@@ -167,7 +167,7 @@ class FPCom(FanfictionSiteAdapter):
 		if metas is not None:
 			for meta in metas:
 				if 'content' in meta._getAttrMap():
-					self.storyDescription = str(meta['content'])
+					self.storyDescription = unicode(meta['content'])
 					logging.debug('self.storyDescription=%s' % self.storyDescription)
 					
 					title=meta.find('title')
@@ -220,7 +220,7 @@ class FPCom(FanfictionSiteAdapter):
 			logging.debug('URL=%s, Title=%s' % (url, self.storyName))
 			urls.append((url, self.storyName))
 			
-		self.numChapters = str(numchapters)
+		self.numChapters = unicode(numchapters)
 		logging.debug('self.numChapters=%s' % self.numChapters)
 		logging.debug('urls=%s' % urls)
 		
@@ -241,7 +241,7 @@ class FPCom(FanfictionSiteAdapter):
 				logging.debug('self.subjects=%s' % self.subjects)
 			tda = td.find ('a')
 			if tda is not None and tda.string.find('Rated:') != -1:
-				tdas = re.split ("<[^>]+>", str(td).replace('\n','').replace('&nbsp;',' '))
+				tdas = re.split ("<[^>]+>", unicode(td).replace('\n','').replace('&nbsp;',' '))
 				if tdas is not None:
 					ll = len(tdas)
 					if ll > 2:
@@ -295,7 +295,7 @@ class FPCom(FanfictionSiteAdapter):
 			data = self.fetchUrl(url)
 		except Exception, e:
 			data = ''
-			logging.error("Caught an exception reading URL " + url + ".  Exception " + str(e) + ".")
+			logging.error("Caught an exception reading URL " + url + ".  Exception " + unicode(e) + ".")
 		if data is None:
 			raise FailedToDownload("Error downloading Chapter: %s!  Problem getting page!" % url)
 		
diff --git a/hpfiction.py b/hpfiction.py
index b2116efe..aeda7d36 100644
--- a/hpfiction.py
+++ b/hpfiction.py
@@ -89,7 +89,7 @@ class HPFiction(FanfictionSiteAdapter):
 			data = self.opener.open(self.url).read()
 		except Exception, e:
 			data = ''
-			logging.error("Caught an exception reading URL " + self.url + ".  Exception " + str(e) + ".")
+			logging.error("Caught an exception reading URL " + self.url + ".  Exception " + unicode(e) + ".")
 		if data is None:
 			raise StoryDoesNotExist("Problem reading story URL " + self.url + "!")
 		
@@ -145,7 +145,7 @@ class HPFiction(FanfictionSiteAdapter):
 				(u1, self.authorId) = a['href'].split('=')
 				logging.debug('self.authorName=%s, self.authorId=%s' % (self.authorName, self.authorId))
 			elif a['href'].find('chapterid=') != -1 and len(def_chapurl) == 0:
-				def_chapurl = 'http://' + self.host + '/viewstory.php' + str(a['href'])
+				def_chapurl = 'http://' + self.host + '/viewstory.php' + unicode(a['href'])
 				def_chaptitle = a.string
 				logging.debug('def_chapurl=%s, def_chaptitle=%s' % (def_chapurl, def_chaptitle))
 		
@@ -154,7 +154,7 @@ class HPFiction(FanfictionSiteAdapter):
 			tds = center.findAll ('td')
 			if tds is not None and len(tds) > 0:
 				for td in tds:
-					s = re.split ("<[^>]+>", str(td).replace('\n','').replace('&nbsp;',' '))
+					s = re.split ("<[^>]+>", unicode(td).replace('\n','').replace('&nbsp;',' '))
 					ii = 0
 					ll = len(s)
 					sss = ''
@@ -236,7 +236,7 @@ class HPFiction(FanfictionSiteAdapter):
 			data = self.opener.open(url).read()
 		except Exception, e:
 			data = ''
-			logging.error("Caught an exception reading URL " + url + ".  Exception " + str(e) + ".")
+			logging.error("Caught an exception reading URL " + url + ".  Exception " + unicode(e) + ".")
 		if data is None:
 			raise FailedToDownload("Error downloading Chapter: %s!  Problem getting page!" % url)
 		
diff --git a/mediaminer.py b/mediaminer.py
index 2b790f45..6a4c03a7 100644
--- a/mediaminer.py
+++ b/mediaminer.py
@@ -151,7 +151,7 @@ class MediaMiner(FanfictionSiteAdapter):
 			data = self.fetchUrl(self.url)
 		except Exception, e:
 			data = None
-			logging.error("Caught an exception reading URL " + self.url + ".  Exception " + str(e) + ".")
+			logging.error("Caught an exception reading URL " + self.url + ".  Exception " + unicode(e) + ".")
 		if data is None:
 			raise StoryDoesNotExist("Problem reading story URL " + self.url + "!")
 		
@@ -170,7 +170,7 @@ class MediaMiner(FanfictionSiteAdapter):
 		#logging.debug('td_ffh=%s' % td_ffh)
 		if td_ffh is not None:
 			#logging.debug('td_ffh.text=%s' % td_ffh.find(text=True))
-			self.storyName = str(td_ffh.find(text=True)).strip()
+			self.storyName = unicode(td_ffh.find(text=True)).strip()
 			logging.debug('self.storyId=%s, self.storyName=%s' % (self.storyId, self.storyName))
 			fft = td_ffh.find('font', {'class' : 'smtxt'})
 			#logging.debug('fft=%s' % fft)
@@ -193,7 +193,7 @@ class MediaMiner(FanfictionSiteAdapter):
 				if 'class' in td._getAttrMap() and td['class'] != 'smtxt':
 					#logging.debug('td has class attribute but is not smtxt')
 					continue
-				ss = str(td).replace('\n','').replace('\r','').replace('&nbsp;', ' ')
+				ss = unicode(td).replace('\n','').replace('\r','').replace('&nbsp;', ' ')
 				#logging.debug('ss=%s' % ss)
 				if len(ss) > 1 and (ss.find('Genre(s):') != -1 or ss.find('Type:') != -1):
 					#logging.debug('ss=%s' % ss)
@@ -204,7 +204,7 @@ class MediaMiner(FanfictionSiteAdapter):
 						nvs = bs.NavigableString('')
 						sst=''
 						ssb = ssbs[bb]
-						ssbt = str(ssb.text).strip()
+						ssbt = unicode(ssb.text).strip()
 						#logging.debug('ssb=%s' % ssb)
 						#logging.debug('ssbt=%s' % ssbt)
 						ssbn = ssb.nextSibling
@@ -212,7 +212,7 @@ class MediaMiner(FanfictionSiteAdapter):
 							#logging.debug('ssbn=%s' % ssbn)
 							#logging.debug('ssbn.class=%s' % ssbn.__class__)
 							if nvs.__class__ == ssbn.__class__:
-								st = str(ssbn)
+								st = unicode(ssbn)
 								if st.strip() != '|':
 									sst = sst + st
 							else:
@@ -323,7 +323,7 @@ class MediaMiner(FanfictionSiteAdapter):
 			logging.debug('URL=%s, Title=%s' % (url, ssd))
 			urls.append((url, ssd))
 			
-		self.numChapters = str(numchapters)
+		self.numChapters = unicode(numchapters)
 		logging.debug('self.numChapters=%s' % self.numChapters)
 		#logging.debug('urls=%s' % urls)
 		
@@ -337,7 +337,7 @@ class MediaMiner(FanfictionSiteAdapter):
 			data = self.fetchUrl(url)
 		except Exception, e:
 			data = ''
-			logging.error("Caught an exception reading URL " + url + ".  Exception " + str(e) + ".")
+			logging.error("Caught an exception reading URL " + url + ".  Exception " + unicode(e) + ".")
 		if data is None:
 			raise FailedToDownload("Error downloading Chapter: %s!  Problem getting page!" % url)
 		
@@ -359,7 +359,7 @@ class MediaMiner(FanfictionSiteAdapter):
 			while nxta is not None and not done:
 				#logging.debug('nxta=%s' % nxta)
 				#logging.debug('nxta.class=%s' % nxta.__class__)
-				st = str(nxta)
+				st = unicode(nxta)
 				if nvs.__class__ != nxta.__class__:
 					#logging.debug('nxta.name=%s' % nxta.name)
 					if nxta.name == 'table':
diff --git a/output.py b/output.py
index 3f4189d5..af6788ce 100644
--- a/output.py
+++ b/output.py
@@ -269,9 +269,9 @@ class EPubFanficWriter(FanficWriter):
 		
 		description = self.adapter.getStoryDescription()
 		if hasattr(description, "text"):
-			description = str(description.text)
+			description = unicode(description.text)
 		else:
-			description = str(description)
+			description = unicode(description)
 		if description is not None and len(description) > 0:
 			description = description.replace ('\\\'', '\'').replace('\\\"', '\"')
 			description =  removeEntities(description)
@@ -289,7 +289,7 @@ class EPubFanficWriter(FanficWriter):
 		self._writeFile(titleFilePath, TITLE_ENTRY % ('Packaged:', createda))
 		tmpstr = self.adapter.getStoryRating() + " / " + self.adapter.getStoryUserRating()		 
 		self._writeFile(titleFilePath, TITLE_ENTRY % ('Rating Age/User:', tmpstr))
-		tmpstr = str(self.adapter.getNumChapters()) + " / " + str(self.adapter.getNumWords())
+		tmpstr = unicode(self.adapter.getNumChapters()) + " / " + unicode(self.adapter.getNumWords())
 		self._writeFile(titleFilePath, TITLE_ENTRY % ('Chapters/Words:', tmpstr))
 		self._writeFile(titleFilePath, TITLE_ENTRY % ('Publisher:', self.adapter.getHost()))
 		self._writeFile(titleFilePath, TITLE_ENTRY % ('Story ID:', self.adapter.getStoryId()))
diff --git a/potionsNsnitches.py b/potionsNsnitches.py
index d0c3fa53..43dc47a7 100644
--- a/potionsNsnitches.py
+++ b/potionsNsnitches.py
@@ -69,7 +69,7 @@ class PotionsNSnitches(FanfictionSiteAdapter):
                     if ssss is not None and len(ssss) > 1 and ssss[0] == 'chapter':
                         self.chapurl = True
 
-        self.url = 'http://' + self.host + '/' + self.path + '?sid=' + self.storyId
+        self.url = 'http://' + self.host + self.path + '?sid=' + self.storyId
         logging.debug('self.url=%s' % self.url)
         
         logging.debug("Created PotionsNSnitches: url=%s" % (self.url))
@@ -135,7 +135,7 @@ class PotionsNSnitches(FanfictionSiteAdapter):
             data = self.opener.open(url).read()
         except Exception, e:
             data = ''
-            logging.error("Caught an exception reading URL " + url + ".  Exception " + str(e) + ".")
+            logging.error("Caught an exception reading URL " + url + ".  Exception " + unicode(e) + ".")
         if data is None:
             raise StoryDoesNotExist("Problem reading story URL " + url + "!")
         
@@ -147,7 +147,7 @@ class PotionsNSnitches(FanfictionSiteAdapter):
                 data = self.opener.open(url).read()
             except Exception, e:
                 data = ''
-                logging.error("Caught an exception reading URL " + url + ".  Exception " + str(e) + ".")
+                logging.error("Caught an exception reading URL " + url + ".  Exception " + unicode(e) + ".")
             if data is None:
                 raise StoryDoesNotExist("Problem reading story URL " + url + "!")
         
@@ -211,9 +211,9 @@ class PotionsNSnitches(FanfictionSiteAdapter):
                 logging.debug('self.authorName=%s, self.authorId=%s' % (self.authorName, self.authorId))
 
         output = soup.find('div', {'id' : 'output'})
-        #logging.debug('output: %s' % str(output))
-        if output is not None and len(str(output)) > 1:
-            s2 = re.split ('<[^>]+>', str(output))
+        #logging.debug('output: %s' % unicode(output))
+        if output is not None and len(unicode(output)) > 1:
+            s2 = re.split ('<[^>]+>', unicode(output))
             #logging.debug('s2=%s' % s2)
             ii = 0
             ll = len(s2)
@@ -229,8 +229,8 @@ class PotionsNSnitches(FanfictionSiteAdapter):
         cnttd = cnt.findAll('td')
         #logging.debug('cnttd: %s' % cnttd)
         for td in cnttd:
-            #logging.debug('td: %s' % str(td))
-            ss = str(td).replace('\n','').replace('\r','').replace('&nbsp;', ' ')
+            #logging.debug('td: %s' % unicode(td))
+            ss = unicode(td).replace('\n','').replace('\r','').replace('&nbsp;', ' ')
             if len(ss) > 1:
                 s2 = re.split ('<[^>]+>', ss)
                 #logging.debug('s2=%s' % s2)
@@ -288,7 +288,7 @@ class PotionsNSnitches(FanfictionSiteAdapter):
         tls = soup.findAll('div', {'style' : 'text-align: center;'})
         for tl in tls:
             #logging.debug('tl: %s' % tl)
-            ss = str(tl).replace('\n','').replace('\r','').replace('&nbsp;', ' ')
+            ss = unicode(tl).replace('\n','').replace('\r','').replace('&nbsp;', ' ')
             if ss.find('Published:') != -1:
                 s2 = re.split ('<[^>]+>', ss)
                 #logging.debug('s2: %s' % s2)
@@ -327,7 +327,7 @@ class PotionsNSnitches(FanfictionSiteAdapter):
             data = self.opener.open(url).read()
         except Exception, e:
             data = ''
-            logging.error("Caught an exception reading URL " + url + ".  Exception " + str(e) + ".")
+            logging.error("Caught an exception reading URL " + url + ".  Exception " + unicode(e) + ".")
         if data is None:
             raise FailedToDownload("Error downloading Chapter: %s!  Problem getting page!" % url)
         
diff --git a/twilighted.py b/twilighted.py
index 00f59364..f3b72e3c 100644
--- a/twilighted.py
+++ b/twilighted.py
@@ -116,7 +116,7 @@ class Twilighted(FanfictionSiteAdapter):
             data = self.opener.open(url).read()
         except Exception, e:
             data = ''
-            logging.error("Caught an exception reading URL " + url + ".  Exception " + str(e) + ".")
+            logging.error("Caught an exception reading URL " + url + ".  Exception " + unicode(e) + ".")
         if data is None:
             raise StoryDoesNotExist("Problem reading story URL " + url + "!")
         
@@ -128,7 +128,7 @@ class Twilighted(FanfictionSiteAdapter):
                 data = self.opener.open(url).read()
             except Exception, e:
                 data = ''
-                logging.error("Caught an exception reading URL " + url + ".  Exception " + str(e) + ".")
+                logging.error("Caught an exception reading URL " + url + ".  Exception " + unicode(e) + ".")
             if data is None:
                 raise StoryDoesNotExist("Problem reading story URL " + url + "!")
         
@@ -280,7 +280,7 @@ class Twilighted(FanfictionSiteAdapter):
             data = self.opener.open(url).read()
         except Exception, e:
             data = ''
-            logging.error("Caught an exception reading URL " + url + ".  Exception " + str(e) + ".")
+            logging.error("Caught an exception reading URL " + url + ".  Exception " + unicode(e) + ".")
         if data is None:
             raise FailedToDownload("Error downloading Chapter: %s!  Problem getting page!" % url)
                 

From 5549786946cd7b19ecc129b59414c9fceabc4418 Mon Sep 17 00:00:00 2001
From: sigizmund <sigizmund@gmail.com>
Date: Mon, 22 Nov 2010 07:04:17 +0000
Subject: [PATCH 76/94] Adding AppEngine files under the source control, moving
 downloaded code one directory deeper.

---
 app.yaml                                      |   31 +
 cron.yaml                                     |    4 +
 css/index.css                                 |   71 +
 delete_fic.py                                 |   59 +
 .../BeautifulSoup.py                          |    0
 __init__.py => fanficdownloader/__init__.py   |    0
 adapter.py => fanficdownloader/adapter.py     |    0
 constants.py => fanficdownloader/constants.py |    0
 .../downloader.py                             |    0
 ffnet.py => fanficdownloader/ffnet.py         |    5 +-
 .../fictionalley.py                           |    0
 ficwad.py => fanficdownloader/ficwad.py       |    0
 fpcom.py => fanficdownloader/fpcom.py         |    0
 hpfiction.py => fanficdownloader/hpfiction.py |    0
 html2text.py => fanficdownloader/html2text.py |    0
 .../html_constants.py                         |    0
 .../mediaminer.py                             |    0
 output.py => fanficdownloader/output.py       |    0
 .../potionsNsnitches.py                       |    0
 readme.txt => fanficdownloader/readme.txt     |    0
 .../twilighted.py                             |    0
 .../twipassword.py                            |    0
 zipdir.py => fanficdownloader/zipdir.py       |    0
 ffstorage.py                                  |   21 +
 index-ajax.html                               |  109 +
 index.html                                    |  189 +
 index.yaml                                    |   22 +
 js/fdownloader.js                             |  116 +
 js/jquery-1.3.2.js                            | 4376 +++++++++++++++++
 main.py                                       |  309 ++
 queue.yaml                                    |    5 +
 recent.html                                   |   69 +
 simplejson/__init__.py                        |  318 ++
 simplejson/__init__.pyc                       |  Bin 0 -> 12071 bytes
 simplejson/_speedups.c                        | 2329 +++++++++
 simplejson/decoder.py                         |  354 ++
 simplejson/decoder.pyc                        |  Bin 0 -> 11292 bytes
 simplejson/encoder.py                         |  440 ++
 simplejson/encoder.pyc                        |  Bin 0 -> 13938 bytes
 simplejson/scanner.py                         |   65 +
 simplejson/scanner.pyc                        |  Bin 0 -> 2340 bytes
 simplejson/tests/__init__.py                  |   23 +
 simplejson/tests/test_check_circular.py       |   30 +
 simplejson/tests/test_decode.py               |   22 +
 simplejson/tests/test_default.py              |    9 +
 simplejson/tests/test_dump.py                 |   21 +
 .../tests/test_encode_basestring_ascii.py     |   38 +
 simplejson/tests/test_fail.py                 |   76 +
 simplejson/tests/test_float.py                |   15 +
 simplejson/tests/test_indent.py               |   41 +
 simplejson/tests/test_pass1.py                |   76 +
 simplejson/tests/test_pass2.py                |   14 +
 simplejson/tests/test_pass3.py                |   20 +
 simplejson/tests/test_recursion.py            |   67 +
 simplejson/tests/test_scanstring.py           |  111 +
 simplejson/tests/test_separators.py           |   42 +
 simplejson/tests/test_unicode.py              |   64 +
 simplejson/tool.py                            |   37 +
 static/ajax-loader.gif                        |  Bin 0 -> 10819 bytes
 static/favicon.ico                            |  Bin 0 -> 21792 bytes
 utils/remover.py                              |   53 +
 61 files changed, 9650 insertions(+), 1 deletion(-)
 create mode 100644 app.yaml
 create mode 100644 cron.yaml
 create mode 100644 css/index.css
 create mode 100644 delete_fic.py
 rename BeautifulSoup.py => fanficdownloader/BeautifulSoup.py (100%)
 rename __init__.py => fanficdownloader/__init__.py (100%)
 rename adapter.py => fanficdownloader/adapter.py (100%)
 rename constants.py => fanficdownloader/constants.py (100%)
 rename downloader.py => fanficdownloader/downloader.py (100%)
 rename ffnet.py => fanficdownloader/ffnet.py (98%)
 rename fictionalley.py => fanficdownloader/fictionalley.py (100%)
 rename ficwad.py => fanficdownloader/ficwad.py (100%)
 rename fpcom.py => fanficdownloader/fpcom.py (100%)
 rename hpfiction.py => fanficdownloader/hpfiction.py (100%)
 rename html2text.py => fanficdownloader/html2text.py (100%)
 rename html_constants.py => fanficdownloader/html_constants.py (100%)
 rename mediaminer.py => fanficdownloader/mediaminer.py (100%)
 rename output.py => fanficdownloader/output.py (100%)
 rename potionsNsnitches.py => fanficdownloader/potionsNsnitches.py (100%)
 rename readme.txt => fanficdownloader/readme.txt (100%)
 rename twilighted.py => fanficdownloader/twilighted.py (100%)
 rename twipassword.py => fanficdownloader/twipassword.py (100%)
 rename zipdir.py => fanficdownloader/zipdir.py (100%)
 create mode 100644 ffstorage.py
 create mode 100644 index-ajax.html
 create mode 100644 index.html
 create mode 100644 index.yaml
 create mode 100644 js/fdownloader.js
 create mode 100644 js/jquery-1.3.2.js
 create mode 100644 main.py
 create mode 100644 queue.yaml
 create mode 100644 recent.html
 create mode 100644 simplejson/__init__.py
 create mode 100644 simplejson/__init__.pyc
 create mode 100644 simplejson/_speedups.c
 create mode 100644 simplejson/decoder.py
 create mode 100644 simplejson/decoder.pyc
 create mode 100644 simplejson/encoder.py
 create mode 100644 simplejson/encoder.pyc
 create mode 100644 simplejson/scanner.py
 create mode 100644 simplejson/scanner.pyc
 create mode 100644 simplejson/tests/__init__.py
 create mode 100644 simplejson/tests/test_check_circular.py
 create mode 100644 simplejson/tests/test_decode.py
 create mode 100644 simplejson/tests/test_default.py
 create mode 100644 simplejson/tests/test_dump.py
 create mode 100644 simplejson/tests/test_encode_basestring_ascii.py
 create mode 100644 simplejson/tests/test_fail.py
 create mode 100644 simplejson/tests/test_float.py
 create mode 100644 simplejson/tests/test_indent.py
 create mode 100644 simplejson/tests/test_pass1.py
 create mode 100644 simplejson/tests/test_pass2.py
 create mode 100644 simplejson/tests/test_pass3.py
 create mode 100644 simplejson/tests/test_recursion.py
 create mode 100644 simplejson/tests/test_scanstring.py
 create mode 100644 simplejson/tests/test_separators.py
 create mode 100644 simplejson/tests/test_unicode.py
 create mode 100644 simplejson/tool.py
 create mode 100644 static/ajax-loader.gif
 create mode 100644 static/favicon.ico
 create mode 100644 utils/remover.py

diff --git a/app.yaml b/app.yaml
new file mode 100644
index 00000000..6f1ccdc8
--- /dev/null
+++ b/app.yaml
@@ -0,0 +1,28 @@
+application: fanfictionloader
+version: 2-5-5
+runtime: python
+api_version: 1
+
+handlers:
+- url: /generate_mock_data
+  script: mocks/generate_mock_data.py
+  login: admin
+
+# Cleanup job target (see cron.yaml). The first matching handler wins, so each URL is listed once.
+- url: /r3m0v3r
+  script: utils/remover.py
+  login: admin
+
+- url: /css
+  static_dir: css
+
+- url: /js
+  static_dir: js
+
+- url: /static
+  static_dir: static
+
+
+- url: /.*
+  script: main.py
+ 
diff --git a/cron.yaml b/cron.yaml
new file mode 100644
index 00000000..1d9c70a0
--- /dev/null
+++ b/cron.yaml
@@ -0,0 +1,4 @@
+cron:
+- description: cleanup job
+  url: /r3m0v3r
+  schedule: every 3 hours
\ No newline at end of file
diff --git a/css/index.css b/css/index.css
new file mode 100644
index 00000000..f4aec452
--- /dev/null
+++ b/css/index.css
@@ -0,0 +1,71 @@
+body
+{
+	font: 0.9em "Helvetica Neue", Arial, Helvetica, Geneva, sans-serif;
+}
+
+#main
+{
+	width: 43%;
+	margin-left: 23%;
+	background-color: #dae6ff;
+	padding: 2em;
+}
+
+#greeting
+{
+	margin-bottom: 1em;
+	border-color: #efefef;
+}
+
+
+
+#logpassword:hover, #logpasswordtable:hover, #urlbox:hover, #typebox:hover, #helpbox:hover, #yourfile:hover
+{
+	border: thin solid #fffeff;	
+}
+
+h1
+{
+	text-decoration: none;
+}
+
+#logpasswordtable
+{
+	padding: 1em;
+}
+
+#logpassword, #logpasswordtable {
+  display: none;
+}
+
+#urlbox, #typebox, #logpasswordtable, #logpassword, #helpbox, #yourfile
+{
+	margin: 1em;
+	padding: 1em;
+	border: thin dotted #fffeff;	
+}
+
+div.field
+{
+	margin-bottom: 0.5em;
+}
+
+#submitbtn
+{
+	padding: 1em;
+}
+
+#typelabel
+{
+}
+
+#typeoptions
+{
+	margin-top: 0.5em;
+}
+
+#error
+{
+	font-size: small;
+	color: #f00;
+}
\ No newline at end of file
diff --git a/delete_fic.py b/delete_fic.py
new file mode 100644
index 00000000..73722724
--- /dev/null
+++ b/delete_fic.py
@@ -0,0 +1,81 @@
+import os
+import cgi
+import sys
+import logging
+import traceback
+import StringIO
+
+from google.appengine.api import users
+from google.appengine.ext import webapp
+from google.appengine.ext.webapp import util
+
+from fanficdownloader.downloader import *
+from fanficdownloader.ffnet import *
+from fanficdownloader.output import *
+
+from google.appengine.ext import db
+
+from fanficdownloader.zipdir import *
+
+from ffstorage import *
+
+# Imported after the star imports so that none of them can rebind the name.
+from google.appengine.ext.webapp import template
+
+def create_mac(user, fic_id, fic_url):
+	"""Return the token string derived from the user, the fic id and the fic URL.
+
+	NOTE(review): this is built on the builtin hash(), which is not keyed, so
+	it is not a real MAC. The algorithm is left unchanged because other code
+	may already depend on the exact value -- confirm before hardening it.
+	"""
+	return str(abs(hash(user)+hash(fic_id)))+str(abs(hash(fic_url)))
+
+def check_mac(user, fic_id, fic_url, mac):
+	"""Return True when mac equals the token create_mac() yields for the arguments."""
+	return (create_mac(user, fic_id, fic_url) == mac)
+
+def create_mac_for_fic(user, fic_id):
+	"""Return the token for the stored fic whose encoded datastore key is fic_id.
+
+	Returns None when fic_id is empty or not a valid key, when no such entity
+	exists, or when the entity belongs to a different user.
+	"""
+	if not fic_id:
+		return None
+	try:
+		key = db.Key(fic_id)
+	except db.BadKeyError:
+		return None
+	fanfic = db.get(key)
+	if fanfic is None or fanfic.user != user:
+		return None
+	return create_mac(user, key, fanfic.url)
+
+class DeleteFicHandler(webapp.RequestHandler):
+	"""Deletes one of the signed-in user's stored fics."""
+
+	def get(self):
+		"""Delete the fic named by 'fic_id' when 'key_id' carries its token."""
+		user = users.get_current_user()
+		if not user:
+			self.redirect('/login')
+			return
+
+		fic_id = self.request.get('fic_id')
+		fic_mac = self.request.get('key_id')
+
+		actual_mac = create_mac_for_fic(user, fic_id)
+		if actual_mac is not None and actual_mac == fic_mac:
+			# Token matches: remove the entity and send the user to /recent.
+			db.delete(db.Key(fic_id))
+			self.redirect('/recent')
+			return
+
+		# Unknown fic, someone else's fic or a wrong token: report it, then
+		# list the user's fics as the original fall-through code did.
+		self.response.out.write("Ooops")
+		fics = db.GqlQuery("Select * From DownloadedFanfic WHERE user = :1", user)
+		template_values = dict(fics = fics, nickname = user.nickname())
+		path = os.path.join(os.path.dirname(__file__), 'recent.html')
+		self.response.out.write(template.render(path, template_values))
\ No newline at end of file
diff --git a/BeautifulSoup.py b/fanficdownloader/BeautifulSoup.py
similarity index 100%
rename from BeautifulSoup.py
rename to fanficdownloader/BeautifulSoup.py
diff --git a/__init__.py b/fanficdownloader/__init__.py
similarity index 100%
rename from __init__.py
rename to fanficdownloader/__init__.py
diff --git a/adapter.py b/fanficdownloader/adapter.py
similarity index 100%
rename from adapter.py
rename to fanficdownloader/adapter.py
diff --git a/constants.py b/fanficdownloader/constants.py
similarity index 100%
rename from constants.py
rename to fanficdownloader/constants.py
diff --git a/downloader.py b/fanficdownloader/downloader.py
similarity index 100%
rename from downloader.py
rename to fanficdownloader/downloader.py
diff --git a/ffnet.py b/fanficdownloader/ffnet.py
similarity index 98%
rename from ffnet.py
rename to fanficdownloader/ffnet.py
index 3963d529..4caa13fa 100644
--- a/ffnet.py
+++ b/fanficdownloader/ffnet.py
@@ -276,9 +276,10 @@ class FFNet(FanfictionSiteAdapter):
 		return urls
 	
 	def getText(self, url):
-		time.sleep( 2.0 )
+		# time.sleep( 2.0 )
 		data = ''
 		try:
+			logging.debug("Fetching URL: %s" % url)
 			data = self.fetchUrl(url)
 		except Exception, e:
 			data = ''
@@ -301,10 +302,12 @@ class FFNet(FanfictionSiteAdapter):
 		try:
 			soup = bs.BeautifulStoneSoup(data)
 		except:
+			logging.debug(data)
 			raise FailedToDownload("Error downloading Chapter: %s!  Problem decoding page!" % url)
 
 		div = soup.find('div', {'id' : 'storytext'})
 		if None == div:
+			logging.debug(data)
 			raise FailedToDownload("Error downloading Chapter: %s!  Missing required element!" % url)
 			
 		return div.__str__('utf8')
diff --git a/fictionalley.py b/fanficdownloader/fictionalley.py
similarity index 100%
rename from fictionalley.py
rename to fanficdownloader/fictionalley.py
diff --git a/ficwad.py b/fanficdownloader/ficwad.py
similarity index 100%
rename from ficwad.py
rename to fanficdownloader/ficwad.py
diff --git a/fpcom.py b/fanficdownloader/fpcom.py
similarity index 100%
rename from fpcom.py
rename to fanficdownloader/fpcom.py
diff --git a/hpfiction.py b/fanficdownloader/hpfiction.py
similarity index 100%
rename from hpfiction.py
rename to fanficdownloader/hpfiction.py
diff --git a/html2text.py b/fanficdownloader/html2text.py
similarity index 100%
rename from html2text.py
rename to fanficdownloader/html2text.py
diff --git a/html_constants.py b/fanficdownloader/html_constants.py
similarity index 100%
rename from html_constants.py
rename to fanficdownloader/html_constants.py
diff --git a/mediaminer.py b/fanficdownloader/mediaminer.py
similarity index 100%
rename from mediaminer.py
rename to fanficdownloader/mediaminer.py
diff --git a/output.py b/fanficdownloader/output.py
similarity index 100%
rename from output.py
rename to fanficdownloader/output.py
diff --git a/potionsNsnitches.py b/fanficdownloader/potionsNsnitches.py
similarity index 100%
rename from potionsNsnitches.py
rename to fanficdownloader/potionsNsnitches.py
diff --git a/readme.txt b/fanficdownloader/readme.txt
similarity index 100%
rename from readme.txt
rename to fanficdownloader/readme.txt
diff --git a/twilighted.py b/fanficdownloader/twilighted.py
similarity index 100%
rename from twilighted.py
rename to fanficdownloader/twilighted.py
diff --git a/twipassword.py b/fanficdownloader/twipassword.py
similarity index 100%
rename from twipassword.py
rename to fanficdownloader/twipassword.py
diff --git a/zipdir.py b/fanficdownloader/zipdir.py
similarity index 100%
rename from zipdir.py
rename to fanficdownloader/zipdir.py
diff --git a/ffstorage.py b/ffstorage.py
new file mode 100644
index 00000000..78647803
--- /dev/null
+++ b/ffstorage.py
@@ -0,0 +1,33 @@
+from google.appengine.ext import db
+
+class OneDownload(db.Model):
+	"""Datastore model holding the parameters of a single download request."""
+	user = db.UserProperty()
+	url = db.StringProperty()
+	format = db.StringProperty()
+	# NOTE(review): login and password are kept as plain StringProperty values;
+	# presumably the story-site credentials typed into the form -- confirm that
+	# they have to be persisted at all.
+	login = db.StringProperty()
+	password = db.StringProperty()
+	# presumably the error text of a failed download -- verify against the writer
+	failure = db.StringProperty()
+	# auto_now_add: filled in automatically when the entity is first stored
+	date = db.DateTimeProperty(auto_now_add=True)
+	
+class DownloadedFanfic(db.Model):
+	"""Datastore model for one stored fanfic file and its metadata."""
+	user = db.UserProperty()
+	url = db.StringProperty()
+	name = db.StringProperty()
+	author = db.StringProperty()
+	format = db.StringProperty()
+	# auto_now_add: filled in automatically when the entity is first stored
+	date = db.DateTimeProperty(auto_now_add=True)
+	# presumably the bytes of the generated ebook -- TODO confirm
+	blob = db.BlobProperty()
+	# presumably the token produced by create_mac() in delete_fic.py -- TODO confirm
+	mac = db.StringProperty()
+	# index.yaml declares a (cleared, date) index on this kind; presumably set by
+	# the cleanup job -- TODO confirm
+	cleared = db.BooleanProperty(default=False)
\ No newline at end of file
diff --git a/index-ajax.html b/index-ajax.html
new file mode 100644
index 00000000..51dc6318
--- /dev/null
+++ b/index-ajax.html
@@ -0,0 +1,109 @@
+<!DOCTYPE html PUBLIC "-//W3C//DTD HTML 4.01//EN">
+<html>
+	<head>
+		<link href="css/index.css" rel="stylesheet" type="text/css">
+		<link type="text/css" href="http://jqueryui.com/latest/themes/base/ui.all.css" rel="stylesheet" />
+	 
+		<title>Fanfiction Downloader (fanfiction.net, fictionalley, ficwad to epub and HTML)</title>
+		<meta http-equiv="Content-Type" content="text/html; charset=UTF-8">
+		<script src="/js/jquery-1.3.2.js"></script>
+		<script src="/js/fdownloader.js"></script>
+		
+		<script type="text/javascript" src="http://jqueryui.com/latest/ui/ui.core.js"></script>
+	    <script type="text/javascript" src="http://jqueryui.com/latest/ui/ui.progressbar.js"></script>
+	  
+	</head>
+	<body>
+		<div id='main'>
+			<h1>
+				<a href="/" style="text-decoration: none; color: black;">FanFiction Downloader</a>
+			</h1>
+				
+<!--			<form action="/fdown" method="post"> -->
+				<div id='urlbox'>
+					<div id='greeting'>
+						Hi, {{ nickname }}! This is a fan fiction downloader, which makes reading stories from various websites much easier. Please paste a URL of the <em>first chapter</em> in the box to start. Alternatively, see your personal list of <a href="/recent">previously downloaded fanfics</a>.
+					</div>
+					<input type="text" id='url' name="url" size="50" value='{{ url }}'>
+					<div style="margin-top: 0.5em;">
+					Ebook format &nbsp;<select name="format" id="format">
+												<option value='epub'>ePub</option>
+												<option value='html'>HTML</option>
+											</select>
+					</div>
+					
+					<div id='error' style='color: red'>
+
+					</div>
+					
+					
+					
+				</div>
+				
+				<div id='yourfile' style='display:none'>
+				</div>
+				
+				<div id='typebox'>
+				</div>
+				
+				<h3>
+					Login and Password
+				</h3>
+				<div id='logpassword'>
+					If the story requires a login and password to download (e.g. marked as Mature on FFA), you may need to provide your credentials to download it, otherwise just leave it empty
+				</div>
+				<div id='logpasswordtable'>
+					<div class='fieldandlabel'>
+						<div class='label'>Login</div>
+						<div class='field'><input type='text' name='login' id='login' size='50'></div>
+					</div>
+					
+					<div class='fieldandlabel'>
+						<div class='label'>Password</div>
+						<div class='field'><input type='password' id='password' name='password' size='50'></div>
+					</div>
+				</div>
+				<div id='submitbtn'>
+					<span id='submit_button'><button onclick='downloadFanfic();'>Download</button></span>
+					<span id='ajax_loader' style='display:none'><img src="/static/ajax-loader.gif"></span>
+				</div>
+
+				
+				<div id="progressbar">
+					
+				</div>
+				<div id='helpbox'>
+				Few things to know, which will make your life substantially easier:
+				<ol>
+					<li>Small <a href="http://www.sigizmund.com/reading-fanfiction-off-line-in-stanza-and-oth">post written by me</a> &mdash; how to read fiction in Stanza or any other ebook reader.</li>
+					<li>Currently we support fanfiction.net, fictionpress.com, fanficauthors.net and ficwad.com</li>
+					<li>Paste a URL of the first chapter of the fanfic, not the index page</li>
+					<li>Fics with a single chapter are not supported (you can just copy and paste it)</li>
+					<li>Stories which are too long may not be downloaded correctly and the application will report a time-out error &mdash; this is a limitation which is currently imposed by Google AppEngine on long-running activities</li>
+					<li>FicWad support is somewhat flaky &mdash; if you feel it doesn't work for you, send all the details to me</li>
+					<li>You can download fanfics and store them for 'later' by just downloading them and visiting <a href="/recent">recent downloads</a> section, but in future they will be deleted after 5 days to save the space</li>
+					<li>If Downloader simply opens a download file window rather than saves the fanfic and gives you a link, it means it is too large to save in the database and you need to download it straight away</li>
+					<li>If you think that something that should work in fact doesn't, drop me a mail to <a href='mailto:sigizmund@gmail.com'>sigizmund@gmail.com</a></li>
+				</ol>
+				Otherwise, just have fun, and if you want to say thank you &mdash; use the email above.
+				</div>
+				<div style='text-align: center'>
+					<img src="http://code.google.com/appengine/images/appengine-silver-120x30.gif"
+					alt="Powered by Google App Engine" />
+					<br/><br/>
+					FanfictionLoader is a web front-end to <A href="http://code.google.com/p/fanficdownloader/">fanficdownloader</a><br/>
+					Copyright &copy; <a href="http://twitter.com/sigizmund">Roman Kirillov</a>
+				</div>
+<!--			</form> -->
+		</div>
+		<script type="text/javascript">
+		var gaJsHost = (("https:" == document.location.protocol) ? "https://ssl." : "http://www.");
+		document.write(unescape("%3Cscript src='" + gaJsHost + "google-analytics.com/ga.js' type='text/javascript'%3E%3C/script%3E"));
+		</script>
+		<script type="text/javascript">
+		try {
+		var pageTracker = _gat._getTracker("UA-12136939-1");
+		pageTracker._trackPageview();
+		} catch(err) {}</script>
+	</body>
+</html>
diff --git a/index.html b/index.html
new file mode 100644
index 00000000..4987804d
--- /dev/null
+++ b/index.html
@@ -0,0 +1,189 @@
+<!DOCTYPE html PUBLIC "-//W3C//DTD HTML 4.01//EN">
+<html>
+	<head>
+		<link href="css/index.css" rel="stylesheet" type="text/css">
+		<title>Fanfiction Downloader &mdash; twilighted.net, fanfiction.net, fictionpress.com, fictionalley.org, ficwad.com, potionsandsnitches.net, harrypotterfanfiction.com to epub and HTML to Stanza, Kindle, Nook, Sony Reader</title>
+		<meta http-equiv="Content-Type" content="text/html; charset=UTF-8">
+		<meta name="google-site-verification" content="kCFc-G4bka_pJN6Rv8CapPBcwmq0hbAUZPkKWqRsAYU" />
+	</head>
+	<body>
+		<div id='main'>
+			<h1>
+				<a href="/" style="text-decoration: none; color: black;">FanFiction Downloader</a>
+			</h1>
+			
+			<div style="text-align: center">
+                <script type="text/javascript"><!--
+                google_ad_client = "pub-2027714004231956";
+                /* FFD */
+                google_ad_slot = "7330682770";
+                google_ad_width = 468;
+                google_ad_height = 60;
+                //-->
+                </script>
+                <script type="text/javascript"
+                src="http://pagead2.googlesyndication.com/pagead/show_ads.js">
+                </script>
+            </div>
+<!--			<div id='yourfile'> -->
+			{{yourfile}}
+<!--			</div> -->
+
+			{% if authorized %}
+			<form action="/fdown" method="post">
+				<div id='urlbox'>
+					<div id='greeting'>
+					  Hi, {{ nickname }}! This is a fan fiction downloader, which makes reading stories from various websites
+					  much easier. 
+					  <ul>
+					    <li>
+					      For fictionalley.org, please paste the URL of the story's chapter list in the box, such as
+					      <a href="http://www.fictionalley.org/authors/drt/DA.html">this</a>.  Or the story text URL for
+					      fictionalley.org one-shots, such
+					      as <a href="http://www.fictionalley.org/authors/drt/JOTP01a.html">this</a>.
+					    </li>
+					    <li>
+					      For all other supported sites, please paste the URL of the <em>first chapter</em> in the box.  For
+					      one-shots, the first chapter is the whole story.
+					    </li>
+					    <li>
+					      Alternatively, see your personal list of <a href="/recent">previously downloaded fanfics</a>.
+					    </li>
+					  </ul>	
+					</div>
+					<div id='error'>
+					{{ error_message }}
+					</div>
+					<input type="text" name="url" size="50" value='{{ url }}'>
+				</div>
+				
+				<div id='typebox'>
+					<div id='typelabel'>Ebook format</div>
+					<div id='typeoptions'>
+						<label><input type='radio' name='format' value='epub' checked>EPub</label>
+						<label><input type='radio' name='format' value='html'>HTML</label>
+						<label><input type='radio' name='format' value='text'>Plain Text</label>
+					</div>
+				</div>
+				
+				<h3>Login and Password</h3>
+				<div id='logpassword'>
+				  
+					If the story requires a login and password to download (e.g. marked as Mature on FFA), you may need to provide
+					your credentials to download it, otherwise just leave it empty
+				</div>
+				<div id='logpasswordtable'>
+					<div class='fieldandlabel'>
+						<div class='label'>Login</div>
+						<div class='field'><input type='text' name='login' size='50'></div>
+					</div>
+					
+					<div class='fieldandlabel'>
+						<div class='label'>Password</div>
+						<div class='field'><input type='password' name='password' size='50'></div>
+					</div>
+				</div>
+				<div id='submitbtn'>
+					<input type="submit" value="Download">
+				</div>
+			</form>
+			{% else %}
+			<div id='urlbox'>
+				<div id='greeting'>
+					<p>
+					  This is a fan fiction downloader, which makes reading stories from various websites much easier. Before you
+					  can start downloading fanfics, you need to login, so downloader can remember your fanfics and store them.
+					</p>
+					<p><a href="{{ login_url }}">Login using Google account</a></p>
+				</div>
+			</div>
+			{% endif %}
+			
+				<div id='helpbox'>
+				Few things to know, which will make your life substantially easier:
+				<ol>
+				  <li>
+				    First thing to know: I do not use your login and password. In fact, all I know about it is your ID &ndash; password
+				    is being verified by Google and is absolutely, totally unknown to anyone but you.
+				  </li>
+				  <li>
+				    Small <a href="http://www.sigizmund.com/reading-fanfiction-off-line-in-stanza-and-oth">post written by me</a>
+				    &mdash; how to read fiction in Stanza or any other ebook reader.
+				  </li>
+				  <li>
+				    Currently we support fanfiction.net, fictionpress.com, ficwad.com, fictionalley.org, harrypotterfanfiction.com, potionsandsnitches.net, and twilighted.net.
+				    (fanficauthors.net withdrawn as they offer native ePub functionality now.)
+				  </li>
+				  <li>
+				    You can download fanfiction directly from your iPhone, Kindle or (possibly) other ebook reader.
+				  </li>
+				  <li>
+				    Paste a URL of the first chapter of the fanfic, not the index page, except for fictionalley.org.
+				  </li>
+				  <li>
+				    For fictionalley.org, you need to use the URL of the story's chapter list, such as
+				    <a href="http://www.fictionalley.org/authors/drt/DA.html">this</a>.  Or the story text URL for fictionalley.org
+				    one-shots, such as <a href="http://www.fictionalley.org/authors/drt/JOTP01a.html">this</a>.
+				  </li>
+				  <li>
+				    One-shots, fics with a single chapter, <em>are</em> now supported.
+				  </li>
+				  <li>
+				    You can download fanfics and store them for 'later' by just downloading them and visiting <a href="/recent">recent
+				    downloads</a> section.
+				  </li>
+				  <li>
+				    Downloaded stories are deleted after some time (which should give you enough time to download them and will keep
+				    Google happy about the app not going over the storage limit).
+				  </li>
+				  <li>
+				    If Downloader simply opens a download file window rather than saves the fanfic and gives you a link, it means it is
+				    too large to save in the database and you need to download it straight away.
+				  </li>
+				  <li>
+				    If you see some funny characters in downloaded Plain Text file, make sure you choose text file encoding UTF-8 and
+				    not something else.
+				  </li>
+				  <li>
+				    If you think that something that should work in fact doesn't, drop me a mail
+				    to <a href='mailto:sigizmund@gmail.com'>sigizmund@gmail.com</a>, or, even better, write an email to
+				    our <a href="http://groups.google.com/group/fanfic-downloader">Google Group</a>. I also encourage you to join it so
+				    you will find out about latest updates and fixes as soon as possible
+				  </li>
+				</ol>
+				Otherwise, just have fun, and if you want to say thank you &mdash; use the contacts above. 
+				</div>
+				<div style='text-align: center'>
+					<img src="http://code.google.com/appengine/images/appengine-silver-120x30.gif"
+					alt="Powered by Google App Engine" />
+					<br/><br/>
+					FanfictionLoader is a web front-end to <A href="http://code.google.com/p/fanficdownloader/">fanficdownloader</a><br/>
+					Copyright &copy; <a href="http://twitter.com/sigizmund">Roman Kirillov</a>
+				</div>
+
+			<div style="margin-top: 1em; text-align: center">
+                <script type="text/javascript"><!--
+                google_ad_client = "pub-2027714004231956";
+                /* FFD */
+                google_ad_slot = "7330682770";
+                google_ad_width = 468;
+                google_ad_height = 60;
+                //-->
+                </script>
+                <script type="text/javascript"
+                src="http://pagead2.googlesyndication.com/pagead/show_ads.js">
+                </script>
+            </div>
+			
+		</div>
+		<script type="text/javascript">
+		var gaJsHost = (("https:" == document.location.protocol) ? "https://ssl." : "http://www.");
+		document.write(unescape("%3Cscript src='" + gaJsHost + "google-analytics.com/ga.js' type='text/javascript'%3E%3C/script%3E"));
+		</script>
+		<script type="text/javascript">
+		try {
+		var pageTracker = _gat._getTracker("UA-12136939-1");
+		pageTracker._trackPageview();
+		} catch(err) {}</script>
+	</body>
+</html>
diff --git a/index.yaml b/index.yaml
new file mode 100644
index 00000000..bbed2dff
--- /dev/null
+++ b/index.yaml
@@ -0,0 +1,22 @@
+indexes:
+
+# AUTOGENERATED
+
+# This index.yaml is automatically updated whenever the dev_appserver
+# detects that a new type of query is run.  If you want to manage the
+# index.yaml file manually, remove the above marker line (the line
+# saying "# AUTOGENERATED").  If you want to manage some indexes
+# manually, move them above the marker line.  The index.yaml file is
+# automatically uploaded to the admin console when you next deploy
+# your application using appcfg.py.
+
+- kind: DownloadedFanfic
+  properties:
+  - name: cleared
+  - name: date
+
+- kind: DownloadedFanfic
+  properties:
+  - name: user
+  - name: date
+    direction: desc
diff --git a/js/fdownloader.js b/js/fdownloader.js
new file mode 100644
index 00000000..8f6ab0a8
--- /dev/null
+++ b/js/fdownloader.js
@@ -0,0 +1,132 @@
+// Client-side logic for index-ajax.html: submits a download request and
+// polls the server until the result is available.
+
+// Key returned by /submitDownload for the request being polled.
+var g_CurrentKey = null;
+// Number of polls issued so far for the current request.
+var g_Counter = 0;
+
+// Maximum number of polls; they are scheduled one second apart.
+var COUNTER_MAX = 50;
+
+
+// Shows an error message followed by a mailto link for reporting it.
+function setErrorState(error)
+{
+	// text() inserts the message as plain text so it cannot inject markup.
+	$('#error').text(error).append("<br/><a href='mailto:sigizmund@gmail.com?subject=Problem with the fanfiction downloader'>" + "Complain about this error</a>");
+}
+
+// Removes any error message currently shown.
+function clearErrorState()
+{
+	$('#error').html('');
+}
+
+// Shows a download link for the finished file described by data
+// (reads data.key, data.name and data.author).
+function showFile(data)
+{
+	// Built through the DOM so that story metadata cannot inject markup.
+	var link = $('<a></a>').attr('href', '/file?id=' + encodeURIComponent(data.key)).text(data.name + " by " + data.author);
+	$('#yourfile').empty().append(link).show();
+}
+
+// Hides the download link area.
+function hideFile()
+{
+	$('#yourfile').hide();
+}
+
+// Polls /progress once and schedules the next poll, until a result arrives
+// or COUNTER_MAX polls have been issued.
+function checkResults()
+{
+	if ( g_Counter >= COUNTER_MAX )
+	{
+		return;
+	}
+
+	g_Counter += 1;
+
+	$.getJSON('/progress', { 'key' : g_CurrentKey }, function(data)
+	{
+		// "Nope" means no result yet; the next scheduled poll will ask again.
+		if ( data.result == "Nope" )
+		{
+			return;
+		}
+
+		// Stop polling first, so that a failure below cannot leave it running.
+		g_Counter = COUNTER_MAX;
+		leaveLoadingState();
+
+		if ( data.result == "OK" )
+		{
+			showFile(data);
+		}
+		else
+		{
+			setErrorState(data.result);
+		}
+
+		$("#progressbar").progressbar('destroy');
+	});
+
+	if ( g_Counter < COUNTER_MAX )
+	{
+		setTimeout(checkResults, 1000);
+	}
+	else
+	{
+		leaveLoadingState();
+		setErrorState("Operation takes too long - terminating by timeout (story too long?)");
+	}
+}
+
+// Swaps the Download button for the loading indicator.
+function enterLoadingState()
+{
+	$('#submit_button').hide();
+	$('#ajax_loader').show();
+}
+
+// Swaps the loading indicator back for the Download button.
+function leaveLoadingState()
+{
+	$('#submit_button').show();
+	$('#ajax_loader').hide();
+}
+
+// Validates the form, submits the download request and starts polling.
+function downloadFanfic()
+{
+	clearErrorState();
+	hideFile();
+
+	var format = $("#format").val();
+	var url = $('#url').val();
+	var login = $('#login').val();
+	var password = $('#password').val();
+
+	if ( url == '' )
+	{
+		setErrorState('URL shouldn\'t be empty');
+		return;
+	}
+
+	if ( (url.indexOf('fanfiction.net') == -1 && url.indexOf('fanficauthors') == -1 && url.indexOf('ficwad') == -1  &&  url.indexOf('fictionpress') == -1) || (url.indexOf('adultfanfiction.net') != -1) )
+	{
+		setErrorState("This source is not yet supported. Ping me if you want it!");
+		return;
+	}
+
+	// The response body is the key that /progress is polled with.
+	$.post('/submitDownload', {'url' : url, 'login' : login, 'password' : password, 'format' : format}, function(data)
+	{
+		g_CurrentKey = data;
+		g_Counter = 0;
+		setTimeout(checkResults, 1000);
+		enterLoadingState();
+	});
+}
\ No newline at end of file
diff --git a/js/jquery-1.3.2.js b/js/jquery-1.3.2.js
new file mode 100644
index 00000000..92635743
--- /dev/null
+++ b/js/jquery-1.3.2.js
@@ -0,0 +1,4376 @@
+/*!
+ * jQuery JavaScript Library v1.3.2
+ * http://jquery.com/
+ *
+ * Copyright (c) 2009 John Resig
+ * Dual licensed under the MIT and GPL licenses.
+ * http://docs.jquery.com/License
+ *
+ * Date: 2009-02-19 17:34:21 -0500 (Thu, 19 Feb 2009)
+ * Revision: 6246
+ */
+(function(){
+
+var 
+	// Will speed up references to window, and allows munging its name.
+	window = this,
+	// Will speed up references to undefined, and allows munging its name.
+	undefined,
+	// Map over jQuery in case of overwrite
+	_jQuery = window.jQuery,
+	// Map over the $ in case of overwrite
+	_$ = window.$,
+
+	jQuery = window.jQuery = window.$ = function( selector, context ) {
+		// The jQuery object is actually just the init constructor 'enhanced'
+		return new jQuery.fn.init( selector, context );
+	},
+
+	// A simple way to check for HTML strings or ID strings
+	// (both of which we optimize for)
+	quickExpr = /^[^<]*(<(.|\s)+>)[^>]*$|^#([\w-]+)$/,
+	// Is it a simple selector
+	isSimple = /^.[^:#\[\.,]*$/;
+
+jQuery.fn = jQuery.prototype = {
+	init: function( selector, context ) {
+		// Make sure that a selection was provided
+		selector = selector || document;
+
+		// Handle $(DOMElement)
+		if ( selector.nodeType ) {
+			this[0] = selector;
+			this.length = 1;
+			this.context = selector;
+			return this;
+		}
+		// Handle HTML strings
+		if ( typeof selector === "string" ) {
+			// Are we dealing with HTML string or an ID?
+			var match = quickExpr.exec( selector );
+
+			// Verify a match, and that no context was specified for #id
+			if ( match && (match[1] || !context) ) {
+
+				// HANDLE: $(html) -> $(array)
+				if ( match[1] )
+					selector = jQuery.clean( [ match[1] ], context );
+
+				// HANDLE: $("#id")
+				else {
+					var elem = document.getElementById( match[3] );
+
+					// Handle the case where IE and Opera return items
+					// by name instead of ID
+					if ( elem && elem.id != match[3] )
+						return jQuery().find( selector );
+
+					// Otherwise, we inject the element directly into the jQuery object
+					var ret = jQuery( elem || [] );
+					ret.context = document;
+					ret.selector = selector;
+					return ret;
+				}
+
+			// HANDLE: $(expr, [context])
+			// (which is just equivalent to: $(content).find(expr)
+			} else
+				return jQuery( context ).find( selector );
+
+		// HANDLE: $(function)
+		// Shortcut for document ready
+		} else if ( jQuery.isFunction( selector ) )
+			return jQuery( document ).ready( selector );
+
+		// Make sure that old selector state is passed along
+		if ( selector.selector && selector.context ) {
+			this.selector = selector.selector;
+			this.context = selector.context;
+		}
+
+		return this.setArray(jQuery.isArray( selector ) ?
+			selector :
+			jQuery.makeArray(selector));
+	},
+
+	// Start with an empty selector
+	selector: "",
+
+	// The current version of jQuery being used
+	jquery: "1.3.2",
+
+	// The number of elements contained in the matched element set
+	size: function() {
+		return this.length;
+	},
+
+	// Get the Nth element in the matched element set OR
+	// Get the whole matched element set as a clean array
+	get: function( num ) {
+		return num === undefined ?
+
+			// Return a 'clean' array
+			Array.prototype.slice.call( this ) :
+
+			// Return just the object
+			this[ num ];
+	},
+
+	// Take an array of elements and push it onto the stack
+	// (returning the new matched element set)
+	pushStack: function( elems, name, selector ) {
+		// Build a new jQuery matched element set
+		var ret = jQuery( elems );
+
+		// Add the old object onto the stack (as a reference)
+		ret.prevObject = this;
+
+		ret.context = this.context;
+
+		if ( name === "find" )
+			ret.selector = this.selector + (this.selector ? " " : "") + selector;
+		else if ( name )
+			ret.selector = this.selector + "." + name + "(" + selector + ")";
+
+		// Return the newly-formed element set
+		return ret;
+	},
+
+	// Force the current matched set of elements to become
+	// the specified array of elements (destroying the stack in the process)
+	// You should use pushStack() in order to do this, but maintain the stack
+	setArray: function( elems ) {
+		// Resetting the length to 0, then using the native Array push
+		// is a super-fast way to populate an object with array-like properties
+		this.length = 0;
+		Array.prototype.push.apply( this, elems );
+
+		return this;
+	},
+
+	// Execute a callback for every element in the matched set.
+	// (You can seed the arguments with an array of args, but this is
+	// only used internally.)
+	each: function( callback, args ) {
+		return jQuery.each( this, callback, args );
+	},
+
+	// Determine the position of an element within
+	// the matched set of elements
+	index: function( elem ) {
+		// Locate the position of the desired element
+		return jQuery.inArray(
+			// If it receives a jQuery object, the first element is used
+			elem && elem.jquery ? elem[0] : elem
+		, this );
+	},
+
+	attr: function( name, value, type ) {
+		var options = name;
+
+		// Look for the case where we're accessing a style value
+		if ( typeof name === "string" )
+			if ( value === undefined )
+				return this[0] && jQuery[ type || "attr" ]( this[0], name );
+
+			else {
+				options = {};
+				options[ name ] = value;
+			}
+
+		// Check to see if we're setting style values
+		return this.each(function(i){
+			// Set all the styles
+			for ( name in options )
+				jQuery.attr(
+					type ?
+						this.style :
+						this,
+					name, jQuery.prop( this, options[ name ], type, i, name )
+				);
+		});
+	},
+
+	css: function( key, value ) {
+		// ignore negative width and height values
+		if ( (key == 'width' || key == 'height') && parseFloat(value) < 0 )
+			value = undefined;
+		return this.attr( key, value, "curCSS" );
+	},
+
+	text: function( text ) {
+		if ( typeof text !== "object" && text != null )
+			return this.empty().append( (this[0] && this[0].ownerDocument || document).createTextNode( text ) );
+
+		var ret = "";
+
+		jQuery.each( text || this, function(){
+			jQuery.each( this.childNodes, function(){
+				if ( this.nodeType != 8 )
+					ret += this.nodeType != 1 ?
+						this.nodeValue :
+						jQuery.fn.text( [ this ] );
+			});
+		});
+
+		return ret;
+	},
+
+	wrapAll: function( html ) {
+		if ( this[0] ) {
+			// The elements to wrap the target around
+			var wrap = jQuery( html, this[0].ownerDocument ).clone();
+
+			if ( this[0].parentNode )
+				wrap.insertBefore( this[0] );
+
+			wrap.map(function(){
+				var elem = this;
+
+				while ( elem.firstChild )
+					elem = elem.firstChild;
+
+				return elem;
+			}).append(this);
+		}
+
+		return this;
+	},
+
+	wrapInner: function( html ) {
+		return this.each(function(){
+			jQuery( this ).contents().wrapAll( html );
+		});
+	},
+
+	wrap: function( html ) {
+		return this.each(function(){
+			jQuery( this ).wrapAll( html );
+		});
+	},
+
+	append: function() {
+		return this.domManip(arguments, true, function(elem){
+			if (this.nodeType == 1)
+				this.appendChild( elem );
+		});
+	},
+
+	prepend: function() {
+		return this.domManip(arguments, true, function(elem){
+			if (this.nodeType == 1)
+				this.insertBefore( elem, this.firstChild );
+		});
+	},
+
+	before: function() {
+		return this.domManip(arguments, false, function(elem){
+			this.parentNode.insertBefore( elem, this );
+		});
+	},
+
+	after: function() {
+		return this.domManip(arguments, false, function(elem){
+			this.parentNode.insertBefore( elem, this.nextSibling );
+		});
+	},
+
+	end: function() {
+		return this.prevObject || jQuery( [] );
+	},
+
+	// For internal use only.
+	// Behaves like an Array's method, not like a jQuery method.
+	push: [].push,
+	sort: [].sort,
+	splice: [].splice,
+
+	find: function( selector ) {
+		if ( this.length === 1 ) {
+			var ret = this.pushStack( [], "find", selector );
+			ret.length = 0;
+			jQuery.find( selector, this[0], ret );
+			return ret;
+		} else {
+			return this.pushStack( jQuery.unique(jQuery.map(this, function(elem){
+				return jQuery.find( selector, elem );
+			})), "find", selector );
+		}
+	},
+
+	clone: function( events ) {
+		// Clone every element in the set (pass events === true to copy handlers too)
+		var ret = this.map(function(){
+			if ( !jQuery.support.noCloneEvent && !jQuery.isXMLDoc(this) ) {
+				// IE copies events bound via attachEvent when
+				// using cloneNode. Calling detachEvent on the
+				// clone will also remove the events from the original.
+				// In order to get around this, we use innerHTML.
+				// Unfortunately, this means some modifications to
+				// attributes in IE that are actually only stored
+				// as properties will not be copied (such as
+				// the name attribute on an input).
+				var html = this.outerHTML;
+				if ( !html ) {
+					var div = this.ownerDocument.createElement("div");
+					div.appendChild( this.cloneNode(true) );
+					html = div.innerHTML;
+				}
+				// Strip the jQuery expando attributes and leading whitespace, then rebuild the node
+				return jQuery.clean([html.replace(/ jQuery\d+="(?:\d+|null)"/g, "").replace(/^\s*/, "")])[0];
+			} else
+				return this.cloneNode(true);
+		});
+
+		// Copy the events from the original to the clone
+		if ( events === true ) {
+			var orig = this.find("*").andSelf(), i = 0;
+
+			ret.find("*").andSelf().each(function(){
+				if ( this.nodeName !== orig[i].nodeName )
+					return; // node names differ: skip this clone node without advancing i
+
+				var events = jQuery.data( orig[i], "events" );
+				// Re-bind every stored handler of every event type on the cloned node
+				for ( var type in events ) {
+					for ( var handler in events[ type ] ) {
+						jQuery.event.add( this, type, events[ type ][ handler ], events[ type ][ handler ].data );
+					}
+				}
+
+				i++;
+			});
+		}
+
+		// Return the cloned set
+		return ret;
+	},
+
+	filter: function( selector ) {
+		return this.pushStack(
+			jQuery.isFunction( selector ) &&
+			jQuery.grep(this, function(elem, i){
+				return selector.call( elem, i );
+			}) ||
+
+			jQuery.multiFilter( selector, jQuery.grep(this, function(elem){
+				return elem.nodeType === 1;
+			}) ), "filter", selector );
+	},
+
+	closest: function( selector ) {
+		var pos = jQuery.expr.match.POS.test( selector ) ? jQuery(selector) : null,
+			closer = 0;
+
+		return this.map(function(){
+			var cur = this;
+			while ( cur && cur.ownerDocument ) {
+				if ( pos ? pos.index(cur) > -1 : jQuery(cur).is(selector) ) {
+					jQuery.data(cur, "closest", closer);
+					return cur;
+				}
+				cur = cur.parentNode;
+				closer++;
+			}
+		});
+	},
+
+	not: function( selector ) {
+		if ( typeof selector === "string" )
+			// test special case where just one selector is passed in
+			if ( isSimple.test( selector ) )
+				return this.pushStack( jQuery.multiFilter( selector, this, true ), "not", selector );
+			else
+				selector = jQuery.multiFilter( selector, this );
+
+		var isArrayLike = selector.length && selector[selector.length - 1] !== undefined && !selector.nodeType;
+		return this.filter(function() {
+			return isArrayLike ? jQuery.inArray( this, selector ) < 0 : this != selector;
+		});
+	},
+
+	add: function( selector ) {
+		return this.pushStack( jQuery.unique( jQuery.merge(
+			this.get(),
+			typeof selector === "string" ?
+				jQuery( selector ) :
+				jQuery.makeArray( selector )
+		)));
+	},
+
+	is: function( selector ) {
+		return !!selector && jQuery.multiFilter( selector, this ).length > 0;
+	},
+
+	hasClass: function( selector ) {
+		return !!selector && this.is( "." + selector );
+	},
+
+	val: function( value ) { // getter (first element) when value is undefined, setter otherwise
+		if ( value === undefined ) {			
+			var elem = this[0];
+
+			if ( elem ) {
+				if( jQuery.nodeName( elem, 'option' ) )
+					return (elem.attributes.value || {}).specified ? elem.value : elem.text;
+				
+				// Select boxes need special handling
+				if ( jQuery.nodeName( elem, "select" ) ) {
+					var index = elem.selectedIndex,
+						values = [],
+						options = elem.options,
+						one = elem.type == "select-one";
+
+					// Nothing was selected
+					if ( index < 0 )
+						return null;
+
+					// Loop through all the selected options
+					for ( var i = one ? index : 0, max = one ? index + 1 : options.length; i < max; i++ ) {
+						var option = options[ i ];
+
+						if ( option.selected ) {
+							// Get the specific value for the option
+							value = jQuery(option).val();
+
+							// We don't need an array for one selects
+							if ( one )
+								return value;
+
+							// Multi-Selects return an array
+							values.push( value );
+						}
+					}
+
+					return values;				
+				}
+
+				// Everything else, we just grab the value (carriage returns removed)
+				return (elem.value || "").replace(/\r/g, "");
+
+			}
+
+			return undefined;
+		}
+		// Setter: a number is converted to a string first
+		if ( typeof value === "number" )
+			value += '';
+
+		return this.each(function(){
+			if ( this.nodeType != 1 )
+				return;
+			// An array checks the radios/checkboxes whose value or name it contains
+			if ( jQuery.isArray(value) && /radio|checkbox/.test( this.type ) )
+				this.checked = (jQuery.inArray(this.value, value) >= 0 ||
+					jQuery.inArray(this.name, value) >= 0);
+
+			else if ( jQuery.nodeName( this, "select" ) ) {
+				var values = jQuery.makeArray(value);
+				// Select the options whose value or text is listed, deselect the rest
+				jQuery( "option", this ).each(function(){
+					this.selected = (jQuery.inArray( this.value, values ) >= 0 ||
+						jQuery.inArray( this.text, values ) >= 0);
+				});
+
+				if ( !values.length )
+					this.selectedIndex = -1;
+
+			} else
+				this.value = value;
+		});
+	},
+
+	html: function( value ) {
+		return value === undefined ?
+			(this[0] ?
+				this[0].innerHTML.replace(/ jQuery\d+="(?:\d+|null)"/g, "") :
+				null) :
+			this.empty().append( value );
+	},
+
+	replaceWith: function( value ) { // insert `value` after each element, then remove the elements
+		return this.after( value ).remove();
+	},
+
+	eq: function( i ) {
+		return this.slice( i, +i + 1 );
+	},
+
+	slice: function() {
+		return this.pushStack( Array.prototype.slice.apply( this, arguments ),
+			"slice", Array.prototype.slice.call(arguments).join(",") );
+	},
+
+	map: function( callback ) {
+		return this.pushStack( jQuery.map(this, function(elem, i){
+			return callback.call( elem, i, elem );
+		}));
+	},
+
+	andSelf: function() { // add the previous set (prevObject) to the current one
+		return this.add( this.prevObject );
+	},
+
+	domManip: function( args, table, callback ) {
+		if ( this[0] ) {
+			var fragment = (this[0].ownerDocument || this[0]).createDocumentFragment(),
+				scripts = jQuery.clean( args, (this[0].ownerDocument || this[0]), fragment ),
+				first = fragment.firstChild;
+
+			if ( first )
+				for ( var i = 0, l = this.length; i < l; i++ )
+					callback.call( root(this[i], first), this.length > 1 || i > 0 ?
+							fragment.cloneNode(true) : fragment );
+		
+			if ( scripts )
+				jQuery.each( scripts, evalScript );
+		}
+
+		return this;
+		
+		function root( elem, cur ) {
+			return table && jQuery.nodeName(elem, "table") && jQuery.nodeName(cur, "tr") ?
+				(elem.getElementsByTagName("tbody")[0] ||
+				elem.appendChild(elem.ownerDocument.createElement("tbody"))) :
+				elem;
+		}
+	}
+};
+
+// Give the init function the jQuery prototype for later instantiation
+jQuery.fn.init.prototype = jQuery.fn;
+
+function evalScript( i, elem ) {
+	if ( elem.src )
+		jQuery.ajax({
+			url: elem.src,
+			async: false,
+			dataType: "script"
+		});
+
+	else
+		jQuery.globalEval( elem.text || elem.textContent || elem.innerHTML || "" );
+
+	if ( elem.parentNode )
+		elem.parentNode.removeChild( elem );
+}
+
+function now(){
+	return +new Date;
+}
+
+jQuery.extend = jQuery.fn.extend = function() {
+	// Merge the later arguments into the first one (the target); a leading boolean selects deep merging
+	var target = arguments[0] || {}, i = 1, length = arguments.length, deep = false, options;
+
+	// Handle a deep copy situation
+	if ( typeof target === "boolean" ) {
+		deep = target;
+		target = arguments[1] || {};
+		// skip the boolean and the target
+		i = 2;
+	}
+
+	// Handle case when target is a string or something (possible in deep copy)
+	if ( typeof target !== "object" && !jQuery.isFunction(target) )
+		target = {};
+
+	// extend the receiver itself (jQuery or jQuery.fn) if only one object is passed
+	if ( length == i ) {
+		target = this;
+		--i;
+	}
+
+	for ( ; i < length; i++ )
+		// Only deal with non-null/undefined values
+		if ( (options = arguments[ i ]) != null )
+			// Extend the base object
+			for ( var name in options ) {
+				var src = target[ name ], copy = options[ name ];
+
+				// Prevent never-ending loop
+				if ( target === copy )
+					continue;
+
+				// Recurse if we're merging object values (DOM nodes are copied by reference)
+				if ( deep && copy && typeof copy === "object" && !copy.nodeType )
+					target[ name ] = jQuery.extend( deep, 
+						// Never move original objects, clone them
+						src || ( copy.length != null ? [ ] : { } )
+					, copy );
+
+				// Don't bring in undefined values
+				else if ( copy !== undefined )
+					target[ name ] = copy;
+
+			}
+
+	// Return the modified object
+	return target;
+};
+
+// CSS properties whose numeric values do not get "px" appended (tested in jQuery.prop)
+var	exclude = /z-?index|font-?weight|opacity|zoom|line-?height/i,
+	// cache defaultView (an empty object when the document has none)
+	defaultView = document.defaultView || {},
+	toString = Object.prototype.toString; // used by isFunction / isArray
+
+jQuery.extend({
+	noConflict: function( deep ) {
+		window.$ = _$;
+
+		if ( deep )
+			window.jQuery = _jQuery;
+
+		return jQuery;
+	},
+
+	// See test/unit/core.js for details concerning isFunction.
+	// Since version 1.3, DOM methods and functions like alert
+	// aren't supported. They return false on IE (#2968).
+	isFunction: function( obj ) {
+		return toString.call(obj) === "[object Function]";
+	},
+
+	isArray: function( obj ) {
+		return toString.call(obj) === "[object Array]";
+	},
+
+	// check if an element is in a (or is an) XML document
+	isXMLDoc: function( elem ) {
+		return elem.nodeType === 9 && elem.documentElement.nodeName !== "HTML" ||
+			!!elem.ownerDocument && jQuery.isXMLDoc( elem.ownerDocument );
+	},
+
+	// Evalulates a script in a global context
+	globalEval: function( data ) {
+		if ( data && /\S/.test(data) ) {
+			// Inspired by code by Andrea Giammarchi
+			// http://webreflection.blogspot.com/2007/08/global-scope-evaluation-and-dom.html
+			var head = document.getElementsByTagName("head")[0] || document.documentElement,
+				script = document.createElement("script");
+
+			script.type = "text/javascript";
+			if ( jQuery.support.scriptEval )
+				script.appendChild( document.createTextNode( data ) );
+			else
+				script.text = data;
+
+			// Use insertBefore instead of appendChild  to circumvent an IE6 bug.
+			// This arises when a base node is used (#2709).
+			head.insertBefore( script, head.firstChild );
+			head.removeChild( script );
+		}
+	},
+
+	nodeName: function( elem, name ) { // case-insensitive node name test; a falsy nodeName is returned as-is
+		return elem.nodeName && elem.nodeName.toUpperCase() == name.toUpperCase();
+	},
+
+	// Iterate over an object's properties or an array-like's items; args is for internal usage only
+	each: function( object, callback, args ) {
+		var name, i = 0, length = object.length;
+
+		if ( args ) { // callback is applied with exactly `args`; returning false stops the loop
+			if ( length === undefined ) {
+				for ( name in object )
+					if ( callback.apply( object[ name ], args ) === false )
+						break;
+			} else
+				for ( ; i < length; )
+					if ( callback.apply( object[ i++ ], args ) === false )
+						break;
+
+		// A special, fast, case for the most common use of each
+		} else { // callback receives ( key or index, value ) with the value as `this`
+			if ( length === undefined ) {
+				for ( name in object )
+					if ( callback.call( object[ name ], name, object[ name ] ) === false )
+						break;
+			} else
+				for ( var value = object[0];
+					i < length && callback.call( value, i, value ) !== false; value = object[++i] ){}
+		}
+
+		return object;
+	},
+
+	prop: function( elem, value, type, i, name ) {
+		// Handle executable functions
+		if ( jQuery.isFunction( value ) )
+			value = value.call( elem, i );
+
+		// Handle passing in a number to a CSS property
+		return typeof value === "number" && type == "curCSS" && !exclude.test( name ) ?
+			value + "px" :
+			value;
+	},
+
+	className: {
+		// internal only, use addClass("class")
+		add: function( elem, classNames ) {
+			jQuery.each((classNames || "").split(/\s+/), function(i, className){
+				if ( elem.nodeType == 1 && !jQuery.className.has( elem.className, className ) )
+					elem.className += (elem.className ? " " : "") + className;
+			});
+		},
+
+		// internal only, use removeClass("class")
+		remove: function( elem, classNames ) {
+			if (elem.nodeType == 1)
+				elem.className = classNames !== undefined ?
+					jQuery.grep(elem.className.split(/\s+/), function(className){
+						return !jQuery.className.has( classNames, className );
+					}).join(" ") :
+					"";
+		},
+
+		// internal only, use hasClass("class")
+		has: function( elem, className ) {
+			return elem && jQuery.inArray( className, (elem.className || elem).toString().split(/\s+/) ) > -1;
+		}
+	},
+
+	// A method for quickly swapping in/out CSS properties to get correct calculations
+	swap: function( elem, options, callback ) {
+		var old = {};
+		// Remember the old values, and insert the new ones
+		for ( var name in options ) {
+			old[ name ] = elem.style[ name ];
+			elem.style[ name ] = options[ name ];
+		}
+
+		callback.call( elem );
+
+		// Revert the old values
+		for ( var name in options )
+			elem.style[ name ] = old[ name ];
+	},
+
+	css: function( elem, name, force, extra ) { // width/height are measured from offsets; other names go to curCSS
+		if ( name == "width" || name == "height" ) {
+			var val, props = { position: "absolute", visibility: "hidden", display:"block" }, which = name == "width" ? [ "Left", "Right" ] : [ "Top", "Bottom" ];
+			// Start from the offset size and adjust it per side according to `extra`
+			function getWH() {
+				val = name == "width" ? elem.offsetWidth : elem.offsetHeight;
+
+				if ( extra === "border" )
+					return; // the raw offset size is used as-is
+
+				jQuery.each( which, function() {
+					if ( !extra ) // no extra: padding is subtracted as well
+						val -= parseFloat(jQuery.curCSS( elem, "padding" + this, true)) || 0;
+					if ( extra === "margin" )
+						val += parseFloat(jQuery.curCSS( elem, "margin" + this, true)) || 0;
+					else
+						val -= parseFloat(jQuery.curCSS( elem, "border" + this + "Width", true)) || 0;
+				});
+			}
+			// A zero offsetWidth is re-measured with `props` temporarily applied
+			if ( elem.offsetWidth !== 0 )
+				getWH();
+			else
+				jQuery.swap( elem, props, getWH );
+
+			return Math.max(0, Math.round(val)); // never negative, rounded to an integer
+		}
+
+		return jQuery.curCSS( elem, name, force );
+	},
+
+	curCSS: function( elem, name, force ) { // current value of a style property; `force` skips the inline style
+		var ret, style = elem.style;
+
+		// We need to handle opacity special in IE
+		if ( name == "opacity" && !jQuery.support.opacity ) {
+			ret = jQuery.attr( style, "opacity" );
+
+			return ret == "" ?
+				"1" :
+				ret;
+		}
+
+		// Make sure we're using the right name for getting the float value
+		if ( name.match( /float/i ) )
+			name = styleFloat;
+		// An inline style value wins unless `force` is set
+		if ( !force && style && style[ name ] )
+			ret = style[ name ];
+
+		else if ( defaultView.getComputedStyle ) {
+
+			// Only "float" is needed here
+			if ( name.match( /float/i ) )
+				name = "float";
+			// camelCase to hyphenated, as passed to getPropertyValue below
+			name = name.replace( /([A-Z])/g, "-$1" ).toLowerCase();
+
+			var computedStyle = defaultView.getComputedStyle( elem, null );
+
+			if ( computedStyle )
+				ret = computedStyle.getPropertyValue( name );
+
+			// We should always get a number back from opacity
+			if ( name == "opacity" && ret == "" )
+				ret = "1";
+
+		} else if ( elem.currentStyle ) {
+			var camelCase = name.replace(/\-(\w)/g, function(all, letter){
+				return letter.toUpperCase();
+			});
+
+			ret = elem.currentStyle[ name ] || elem.currentStyle[ camelCase ];
+
+			// From the awesome hack by Dean Edwards
+			// http://erik.eae.net/archives/2007/07/27/18.54.15/#comment-102291
+
+			// If we're not dealing with a regular pixel number
+			// but a number that has a weird ending, we need to convert it to pixels
+			if ( !/^\d+(px)?$/i.test( ret ) && /^\d/.test( ret ) ) {
+				// Remember the original values
+				var left = style.left, rsLeft = elem.runtimeStyle.left;
+
+				// Put in the new values to get a computed value out
+				elem.runtimeStyle.left = elem.currentStyle.left;
+				style.left = ret || 0;
+				ret = style.pixelLeft + "px";
+
+				// Revert the changed values
+				style.left = left;
+				elem.runtimeStyle.left = rsLeft;
+			}
+		}
+
+		return ret;
+	},
+
+	clean: function( elems, context, fragment ) { // turn HTML strings / nodes into DOM nodes; see the return notes below
+		context = context || document;
+
+		// !context.createElement fails in IE with an error but returns typeof 'object'
+		if ( typeof context.createElement === "undefined" )
+			context = context.ownerDocument || context[0] && context[0].ownerDocument || document;
+
+		// If a single string is passed in and it's a single tag
+		// just do a createElement and skip the rest
+		if ( !fragment && elems.length === 1 && typeof elems[0] === "string" ) {
+			var match = /^<(\w+)\s*\/?>$/.exec(elems[0]);
+			if ( match )
+				return [ context.createElement( match[1] ) ];
+		}
+
+		var ret = [], scripts = [], div = context.createElement("div");
+
+		jQuery.each(elems, function(i, elem){
+			if ( typeof elem === "number" )
+				elem += '';
+
+			if ( !elem )
+				return;
+
+			// Convert html string into DOM nodes
+			if ( typeof elem === "string" ) {
+				// Fix "XHTML"-style tags in all browsers
+				elem = elem.replace(/(<(\w+)[^>]*?)\/>/g, function(all, front, tag){
+					return tag.match(/^(abbr|br|col|img|input|link|meta|param|hr|area|embed)$/i) ?
+						all :
+						front + "></" + tag + ">";
+				});
+
+				// Trim whitespace, otherwise indexOf won't work as expected
+				var tags = elem.replace(/^\s+/, "").substring(0, 10).toLowerCase();
+				// wrap = [ nesting depth, opening markup, closing markup ] required by the leading tag
+				var wrap =
+					// option or optgroup
+					!tags.indexOf("<opt") &&
+					[ 1, "<select multiple='multiple'>", "</select>" ] ||
+
+					!tags.indexOf("<leg") &&
+					[ 1, "<fieldset>", "</fieldset>" ] ||
+
+					tags.match(/^<(thead|tbody|tfoot|colg|cap)/) &&
+					[ 1, "<table>", "</table>" ] ||
+
+					!tags.indexOf("<tr") &&
+					[ 2, "<table><tbody>", "</tbody></table>" ] ||
+
+				 	// <thead> matched above
+					(!tags.indexOf("<td") || !tags.indexOf("<th")) &&
+					[ 3, "<table><tbody><tr>", "</tr></tbody></table>" ] ||
+
+					!tags.indexOf("<col") &&
+					[ 2, "<table><tbody></tbody><colgroup>", "</colgroup></table>" ] ||
+
+					// IE can't serialize <link> and <script> tags normally
+					!jQuery.support.htmlSerialize &&
+					[ 1, "div<div>", "</div>" ] ||
+
+					[ 0, "", "" ];
+
+				// Go to html and back, then peel off extra wrappers
+				div.innerHTML = wrap[1] + elem + wrap[2];
+
+				// Move to the right depth
+				while ( wrap[0]-- )
+					div = div.lastChild;
+
+				// Remove IE's autoinserted <tbody> from table fragments
+				if ( !jQuery.support.tbody ) {
+
+					// String was a <table>, *may* have spurious <tbody>
+					var hasBody = /<tbody/i.test(elem),
+						tbody = !tags.indexOf("<table") && !hasBody ?
+							div.firstChild && div.firstChild.childNodes :
+
+						// String was a bare <thead> or <tfoot>
+						wrap[1] == "<table>" && !hasBody ?
+							div.childNodes :
+							[];
+
+					for ( var j = tbody.length - 1; j >= 0 ; --j )
+						if ( jQuery.nodeName( tbody[ j ], "tbody" ) && !tbody[ j ].childNodes.length )
+							tbody[ j ].parentNode.removeChild( tbody[ j ] );
+
+					}
+
+				// IE completely kills leading whitespace when innerHTML is used
+				if ( !jQuery.support.leadingWhitespace && /^\s/.test( elem ) )
+					div.insertBefore( context.createTextNode( elem.match(/^\s*/)[0] ), div.firstChild );
+				
+				elem = jQuery.makeArray( div.childNodes );
+			}
+			// A single node is pushed; anything else is merged in as a list of nodes
+			if ( elem.nodeType )
+				ret.push( elem );
+			else
+				ret = jQuery.merge( ret, elem );
+
+		});
+		// With a fragment: nodes are appended to it and the JavaScript <script> elements are returned instead
+		if ( fragment ) {
+			for ( var i = 0; ret[i]; i++ ) {
+				if ( jQuery.nodeName( ret[i], "script" ) && (!ret[i].type || ret[i].type.toLowerCase() === "text/javascript") ) {
+					scripts.push( ret[i].parentNode ? ret[i].parentNode.removeChild( ret[i] ) : ret[i] );
+				} else {
+					if ( ret[i].nodeType === 1 ) // queue nested scripts right after this node so the loop visits them
+						ret.splice.apply( ret, [i + 1, 0].concat(jQuery.makeArray(ret[i].getElementsByTagName("script"))) );
+					fragment.appendChild( ret[i] );
+				}
+			}
+			
+			return scripts;
+		}
+
+		return ret;
+	},
+
+	attr: function( elem, name, value ) { // get (value undefined) or set an attribute, property or style entry
+		// don't set attributes on text and comment nodes
+		if (!elem || elem.nodeType == 3 || elem.nodeType == 8)
+			return undefined;
+
+		var notxml = !jQuery.isXMLDoc( elem ),
+			// Whether we are setting (or getting)
+			set = value !== undefined;
+
+		// Try to normalize/fix the name
+		name = notxml && jQuery.props[ name ] || name;
+
+		// Only do all the following if this is a node (faster for style)
+		// IE elem.getAttribute passes even for style
+		if ( elem.tagName ) {
+
+			// These attributes require special treatment
+			var special = /href|src|style/.test( name );
+
+			// Safari mis-reports the default selected property of a hidden option
+			// Accessing the parent's selectedIndex property fixes it
+			if ( name == "selected" && elem.parentNode )
+				elem.parentNode.selectedIndex;
+
+			// If applicable, access the attribute via the DOM 0 way
+			if ( name in elem && notxml && !special ) {
+				if ( set ){
+					// We can't allow the type property to be changed (since it causes problems in IE)
+					if ( name == "type" && jQuery.nodeName( elem, "input" ) && elem.parentNode )
+						throw "type property can't be changed";
+
+					elem[ name ] = value;
+				}
+
+				// browsers index elements by id/name on forms, give priority to attributes.
+				if( jQuery.nodeName( elem, "form" ) && elem.getAttributeNode(name) )
+					return elem.getAttributeNode( name ).nodeValue;
+
+				// elem.tabIndex doesn't always return the correct value when it hasn't been explicitly set
+				// http://fluidproject.org/blog/2008/01/09/getting-setting-and-removing-tabindex-values-with-javascript/
+				if ( name == "tabIndex" ) {
+					var attributeNode = elem.getAttributeNode( "tabIndex" );
+					return attributeNode && attributeNode.specified
+						? attributeNode.value
+						: elem.nodeName.match(/(button|input|object|select|textarea)/i)
+							? 0
+							: elem.nodeName.match(/^(a|area)$/i) && elem.href
+								? 0
+								: undefined;
+				}
+
+				return elem[ name ];
+			}
+			// Without native style attribute support, "style" is mapped onto style.cssText
+			if ( !jQuery.support.style && notxml &&  name == "style" )
+				return jQuery.attr( elem.style, "cssText", value );
+
+			if ( set )
+				// convert the value to a string (all browsers do this but IE) see #1070
+				elem.setAttribute( name, "" + value );
+
+			var attr = !jQuery.support.hrefNormalized && notxml && special
+					// Some attributes require a special call on IE
+					? elem.getAttribute( name, 2 )
+					: elem.getAttribute( name );
+
+			// Non-existent attributes return null, we normalize to undefined
+			return attr === null ? undefined : attr;
+		}
+
+		// elem is actually elem.style ... set the style
+
+		// IE uses filters for opacity
+		if ( !jQuery.support.opacity && name == "opacity" ) {
+			if ( set ) {
+				// IE has trouble with opacity if it does not have layout
+				// Force it by setting the zoom level
+				elem.zoom = 1;
+
+				// Set the alpha filter to set the opacity
+				elem.filter = (elem.filter || "").replace( /alpha\([^)]*\)/, "" ) +
+					(parseInt( value ) + '' == "NaN" ? "" : "alpha(opacity=" + value * 100 + ")");
+			}
+			// Read the opacity back out of the filter string as a 0..1 value ("" when absent)
+			return elem.filter && elem.filter.indexOf("opacity=") >= 0 ?
+				(parseFloat( elem.filter.match(/opacity=([^)]*)/)[1] ) / 100) + '':
+				"";
+		}
+		// Hyphenated style names are converted to camelCase
+		name = name.replace(/-([a-z])/ig, function(all, letter){
+			return letter.toUpperCase();
+		});
+
+		if ( set )
+			elem[ name ] = value;
+
+		return elem[ name ];
+	},
+
+	trim: function( text ) { // strip leading and trailing whitespace; falsy input yields ""
+		return (text || "").replace( /^\s+|\s+$/g, "" );
+	},
+
+	makeArray: function( array ) {
+		var ret = [];
+
+		if( array != null ){
+			var i = array.length;
+			// The window, strings (and functions) also have 'length'
+			if( i == null || typeof array === "string" || jQuery.isFunction(array) || array.setInterval )
+				ret[0] = array;
+			else
+				while( i )
+					ret[--i] = array[i];
+		}
+
+		return ret;
+	},
+
+	inArray: function( elem, array ) {
+		for ( var i = 0, length = array.length; i < length; i++ )
+		// Use === because on IE, window == document
+			if ( array[ i ] === elem )
+				return i;
+
+		return -1;
+	},
+
+	merge: function( first, second ) {
+		// We have to loop this way because IE & Opera overwrite the length
+		// expando of getElementsByTagName
+		var i = 0, elem, pos = first.length;
+		// Also, we need to make sure that the correct elements are being returned
+		// (IE returns comment nodes in a '*' query)
+		if ( !jQuery.support.getAll ) {
+			while ( (elem = second[ i++ ]) != null )
+				if ( elem.nodeType != 8 )
+					first[ pos++ ] = elem;
+
+		} else
+			while ( (elem = second[ i++ ]) != null )
+				first[ pos++ ] = elem;
+
+		return first;
+	},
+
+	unique: function( array ) {
+		var ret = [], done = {};
+
+		try {
+
+			for ( var i = 0, length = array.length; i < length; i++ ) {
+				var id = jQuery.data( array[ i ] );
+
+				if ( !done[ id ] ) {
+					done[ id ] = true;
+					ret.push( array[ i ] );
+				}
+			}
+
+		} catch( e ) {
+			ret = array;
+		}
+
+		return ret;
+	},
+
+	grep: function( elems, callback, inv ) {
+		var ret = [];
+
+		// Go through the array, only saving the items
+		// that pass the validator function
+		for ( var i = 0, length = elems.length; i < length; i++ )
+			if ( !inv != !callback( elems[ i ], i ) )
+				ret.push( elems[ i ] );
+
+		return ret;
+	},
+
+	map: function( elems, callback ) {
+		var ret = [];
+
+		// Go through the array, translating each of the items to their
+		// new value (or values).
+		for ( var i = 0, length = elems.length; i < length; i++ ) {
+			var value = callback( elems[ i ], i );
+
+			if ( value != null )
+				ret[ ret.length ] = value;
+		}
+
+		return ret.concat.apply( [], ret );
+	}
+});
+
+// Use of jQuery.browser is deprecated.
+// It's included for backwards compatibility and plugins,
+// although they should work to migrate away.
+
+var userAgent = navigator.userAgent.toLowerCase(); // lower-cased once so the tests below can be case-sensitive
+
+// Figure out what browser is being used
+jQuery.browser = {
+	version: (userAgent.match( /.+(?:rv|it|ra|ie)[\/: ]([\d.]+)/ ) || [0,'0'])[1], // '0' when nothing matches
+	safari: /webkit/.test( userAgent ),
+	opera: /opera/.test( userAgent ),
+	msie: /msie/.test( userAgent ) && !/opera/.test( userAgent ), // "msie" present and "opera" absent
+	mozilla: /mozilla/.test( userAgent ) && !/(compatible|webkit)/.test( userAgent )
+};
+
+jQuery.each({
+	parent: function(elem){return elem.parentNode;},
+	parents: function(elem){return jQuery.dir(elem,"parentNode");},
+	next: function(elem){return jQuery.nth(elem,2,"nextSibling");},
+	prev: function(elem){return jQuery.nth(elem,2,"previousSibling");},
+	nextAll: function(elem){return jQuery.dir(elem,"nextSibling");},
+	prevAll: function(elem){return jQuery.dir(elem,"previousSibling");},
+	siblings: function(elem){return jQuery.sibling(elem.parentNode.firstChild,elem);},
+	children: function(elem){return jQuery.sibling(elem.firstChild);},
+	contents: function(elem){return jQuery.nodeName(elem,"iframe")?elem.contentDocument||elem.contentWindow.document:jQuery.makeArray(elem.childNodes);}
+}, function(name, fn){
+	jQuery.fn[ name ] = function( selector ) {
+		var ret = jQuery.map( this, fn );
+
+		if ( selector && typeof selector == "string" )
+			ret = jQuery.multiFilter( selector, ret );
+
+		return this.pushStack( jQuery.unique( ret ), name, selector );
+	};
+});
+
+jQuery.each({
+	appendTo: "append",
+	prependTo: "prepend",
+	insertBefore: "before",
+	insertAfter: "after",
+	replaceAll: "replaceWith"
+}, function(name, original){
+	jQuery.fn[ name ] = function( selector ) {
+		var ret = [], insert = jQuery( selector );
+
+		for ( var i = 0, l = insert.length; i < l; i++ ) {
+			var elems = (i > 0 ? this.clone(true) : this).get();
+			jQuery.fn[ original ].apply( jQuery(insert[i]), elems );
+			ret = ret.concat( elems );
+		}
+
+		return this.pushStack( ret, name, selector );
+	};
+});
+
+jQuery.each({
+	removeAttr: function( name ) {
+		jQuery.attr( this, name, "" );
+		if (this.nodeType == 1)
+			this.removeAttribute( name );
+	},
+
+	addClass: function( classNames ) {
+		jQuery.className.add( this, classNames );
+	},
+
+	removeClass: function( classNames ) {
+		jQuery.className.remove( this, classNames );
+	},
+
+	toggleClass: function( classNames, state ) {
+		if( typeof state !== "boolean" )
+			state = !jQuery.className.has( this, classNames );
+		jQuery.className[ state ? "add" : "remove" ]( this, classNames );
+	},
+
+	remove: function( selector ) {
+		if ( !selector || jQuery.filter( selector, [ this ] ).length ) {
+			// Prevent memory leaks
+			jQuery( "*", this ).add([this]).each(function(){
+				jQuery.event.remove(this);
+				jQuery.removeData(this);
+			});
+			if (this.parentNode)
+				this.parentNode.removeChild( this );
+		}
+	},
+
+	empty: function() {
+		// Remove element nodes and prevent memory leaks
+		jQuery(this).children().remove();
+
+		// Remove any remaining nodes
+		while ( this.firstChild )
+			this.removeChild( this.firstChild );
+	}
+}, function(name, fn){
+	jQuery.fn[ name ] = function(){
+		return this.each( fn, arguments );
+	};
+});
+
+// Helper function used by the dimensions and offset modules
+function num(elem, prop) {
+	return elem[0] && parseInt( jQuery.curCSS(elem[0], prop, true), 10 ) || 0;
+}
+var expando = "jQuery" + now(), uuid = 0, windowData = {};
+
+jQuery.extend({
+	cache: {},
+
+	data: function( elem, name, data ) {
+		elem = elem == window ?
+			windowData :
+			elem;
+
+		var id = elem[ expando ];
+
+		// Compute a unique ID for the element
+		if ( !id )
+			id = elem[ expando ] = ++uuid;
+
+		// Only generate the data cache if we're
+		// trying to access or manipulate it
+		if ( name && !jQuery.cache[ id ] )
+			jQuery.cache[ id ] = {};
+
+		// Prevent overriding the named cache with undefined values
+		if ( data !== undefined )
+			jQuery.cache[ id ][ name ] = data;
+
+		// Return the named cache data, or the ID for the element
+		return name ?
+			jQuery.cache[ id ][ name ] :
+			id;
+	},
+
+	removeData: function( elem, name ) {
+		elem = elem == window ?
+			windowData :
+			elem;
+
+		var id = elem[ expando ];
+
+		// If we want to remove a specific section of the element's data
+		if ( name ) {
+			if ( jQuery.cache[ id ] ) {
+				// Remove the section of cache data
+				delete jQuery.cache[ id ][ name ];
+
+				// If we've removed all the data, remove the element's cache
+				name = "";
+
+				for ( name in jQuery.cache[ id ] )
+					break;
+
+				if ( !name )
+					jQuery.removeData( elem );
+			}
+
+		// Otherwise, we want to remove all of the element's data
+		} else {
+			// Clean up the element expando
+			try {
+				delete elem[ expando ];
+			} catch(e){
+				// IE has trouble directly removing the expando
+				// but it's ok with using removeAttribute
+				if ( elem.removeAttribute )
+					elem.removeAttribute( expando );
+			}
+
+			// Completely remove the data cache
+			delete jQuery.cache[ id ];
+		}
+	},
+	queue: function( elem, type, data ) {
+		if ( elem ){
+	
+			type = (type || "fx") + "queue";
+	
+			var q = jQuery.data( elem, type );
+	
+			if ( !q || jQuery.isArray(data) )
+				q = jQuery.data( elem, type, jQuery.makeArray(data) );
+			else if( data )
+				q.push( data );
+	
+		}
+		return q;
+	},
+
+	dequeue: function( elem, type ){
+		var queue = jQuery.queue( elem, type ),
+			fn = queue.shift();
+		
+		if( !type || type === "fx" )
+			fn = queue[0];
+			
+		if( fn !== undefined )
+			fn.call(elem);
+	}
+});
+
+jQuery.fn.extend({
+	data: function( key, value ){
+		var parts = key.split(".");
+		parts[1] = parts[1] ? "." + parts[1] : "";
+
+		if ( value === undefined ) {
+			var data = this.triggerHandler("getData" + parts[1] + "!", [parts[0]]);
+
+			if ( data === undefined && this.length )
+				data = jQuery.data( this[0], key );
+
+			return data === undefined && parts[1] ?
+				this.data( parts[0] ) :
+				data;
+		} else
+			return this.trigger("setData" + parts[1] + "!", [parts[0], value]).each(function(){
+				jQuery.data( this, key, value );
+			});
+	},
+
+	removeData: function( key ){
+		return this.each(function(){
+			jQuery.removeData( this, key );
+		});
+	},
+	queue: function(type, data){
+		if ( typeof type !== "string" ) {
+			data = type;
+			type = "fx";
+		}
+
+		if ( data === undefined )
+			return jQuery.queue( this[0], type );
+
+		return this.each(function(){
+			var queue = jQuery.queue( this, type, data );
+			
+			 if( type == "fx" && queue.length == 1 )
+				queue[0].call(this);
+		});
+	},
+	dequeue: function(type){
+		return this.each(function(){
+			jQuery.dequeue( this, type );
+		});
+	}
+});/*!
+ * Sizzle CSS Selector Engine - v0.9.3
+ *  Copyright 2009, The Dojo Foundation
+ *  Released under the MIT, BSD, and GPL Licenses.
+ *  More information: http://sizzlejs.com/
+ */
+(function(){
+
+// chunker splits a selector into parts: each match is either a run of
+// selector text (parenthesised and bracketed sections are kept whole) or a
+// single combinator (>, + or ~). Capture group 2 is set when the part is
+// followed by a comma.
+var chunker = /((?:\((?:\([^()]+\)|[^()]+)+\)|\[(?:\[[^[\]]*\]|['"][^'"]*['"]|[^[\]'"]+)+\]|\\.|[^ >+~,(\[\\]+)+|[>+~])(\s*,\s*)?/g,
+	// Counter that hands out the unique values used as doneName / CHILD cache keys
+	done = 0,
+	// Local reference used for the "[object Array]" checks
+	toString = Object.prototype.toString;
+
+// Main selector entry point.
+//  selector - selector string to evaluate
+//  context  - node to search from; defaults to document
+//  results  - optional array that matches are appended to
+//  seed     - optional set of candidate nodes to filter instead of searching
+// Returns results, or a new empty array when context is neither an element
+// nor a document node. Throws a string when no candidate set could be
+// produced for the expression.
+var Sizzle = function(selector, context, results, seed) {
+	results = results || [];
+	context = context || document;
+
+	if ( context.nodeType !== 1 && context.nodeType !== 9 )
+		return [];
+	
+	if ( !selector || typeof selector !== "string" ) {
+		return results;
+	}
+
+	var parts = [], m, set, checkSet, check, mode, extra, prune = true;
+	
+	// Reset the position of the chunker regexp (start from head)
+	chunker.lastIndex = 0;
+	
+	// Collect the parts up to the first comma; whatever follows the comma is
+	// kept in extra and handled by a recursive call further down
+	while ( (m = chunker.exec(selector)) !== null ) {
+		parts.push( m[1] );
+		
+		if ( m[2] ) {
+			extra = RegExp.rightContext;
+			break;
+		}
+	}
+
+	// Selectors containing a positional pseudo (origPOS) are evaluated from
+	// left to right through posProcess
+	if ( parts.length > 1 && origPOS.exec( selector ) ) {
+		if ( parts.length === 2 && Expr.relative[ parts[0] ] ) {
+			set = posProcess( parts[0] + parts[1], context );
+		} else {
+			set = Expr.relative[ parts[0] ] ?
+				[ context ] :
+				Sizzle( parts.shift(), context );
+
+			while ( parts.length ) {
+				selector = parts.shift();
+
+				// A combinator is glued to the part that follows it
+				if ( Expr.relative[ selector ] )
+					selector += parts.shift();
+
+				set = posProcess( selector, set );
+			}
+		}
+	// Everything else runs right to left: find candidates for the last part,
+	// then check the remaining parts against them
+	} else {
+		var ret = seed ?
+			{ expr: parts.pop(), set: makeArray(seed) } :
+			Sizzle.find( parts.pop(), parts.length === 1 && context.parentNode ? context.parentNode : context, isXML(context) );
+		set = Sizzle.filter( ret.expr, ret.set );
+
+		if ( parts.length > 0 ) {
+			checkSet = makeArray(set);
+		} else {
+			// Single part: the filtered set is the answer, nothing to prune
+			prune = false;
+		}
+
+		while ( parts.length ) {
+			var cur = parts.pop(), pop = cur;
+
+			// cur becomes the combinator ("" when none was written) and pop
+			// the part it relates the candidates to
+			if ( !Expr.relative[ cur ] ) {
+				cur = "";
+			} else {
+				pop = parts.pop();
+			}
+
+			if ( pop == null ) {
+				pop = context;
+			}
+
+			Expr.relative[ cur ]( checkSet, pop, isXML(context) );
+		}
+	}
+
+	if ( !checkSet ) {
+		checkSet = set;
+	}
+
+	if ( !checkSet ) {
+		throw "Syntax error, unrecognized expression: " + (cur || selector);
+	}
+
+	if ( toString.call(checkSet) === "[object Array]" ) {
+		if ( !prune ) {
+			results.push.apply( results, checkSet );
+		} else if ( context.nodeType === 1 ) {
+			// checkSet[i] tells whether set[i] survived the relative checks;
+			// with an element context the match must also lie inside it
+			for ( var i = 0; checkSet[i] != null; i++ ) {
+				if ( checkSet[i] && (checkSet[i] === true || checkSet[i].nodeType === 1 && contains(context, checkSet[i])) ) {
+					results.push( set[i] );
+				}
+			}
+		} else {
+			for ( var i = 0; checkSet[i] != null; i++ ) {
+				if ( checkSet[i] && checkSet[i].nodeType === 1 ) {
+					results.push( set[i] );
+				}
+			}
+		}
+	} else {
+		makeArray( checkSet, results );
+	}
+
+	// Evaluate the selector text after the comma into the same results array,
+	// then sort with sortOrder and drop adjacent duplicates
+	if ( extra ) {
+		Sizzle( extra, context, results, seed );
+
+		if ( sortOrder ) {
+			hasDuplicate = false;
+			results.sort(sortOrder);
+
+			if ( hasDuplicate ) {
+				for ( var i = 1; i < results.length; i++ ) {
+					if ( results[i] === results[i-1] ) {
+						results.splice(i--, 1);
+					}
+				}
+			}
+		}
+	}
+
+	return results;
+};
+
+Sizzle.matches = function(expr, set){
+	return Sizzle(expr, null, null, set);
+};
+
+Sizzle.find = function(expr, context, isXML){
+	var set, match;
+
+	if ( !expr ) {
+		return [];
+	}
+
+	for ( var i = 0, l = Expr.order.length; i < l; i++ ) {
+		var type = Expr.order[i], match;
+		
+		if ( (match = Expr.match[ type ].exec( expr )) ) {
+			var left = RegExp.leftContext;
+
+			if ( left.substr( left.length - 1 ) !== "\\" ) {
+				match[1] = (match[1] || "").replace(/\\/g, "");
+				set = Expr.find[ type ]( match, context, isXML );
+				if ( set != null ) {
+					expr = expr.replace( Expr.match[ type ], "" );
+					break;
+				}
+			}
+		}
+	}
+
+	if ( !set ) {
+		set = context.getElementsByTagName("*");
+	}
+
+	return {set: set, expr: expr};
+};
+
+// Reduce a set of nodes to those matching expr.
+//  expr    - filter expression; consumed one recognised piece at a time
+//  set     - array(-like) of nodes to test
+//  inplace - when truthy, failing entries of set are overwritten with false
+//            instead of a new array being built
+//  not     - when truthy, the sense of each test is inverted
+// Returns the filtered set, or [] as soon as one filter leaves nothing.
+// Throws a string when a pass over all filters consumes nothing and nothing
+// has matched so far.
+Sizzle.filter = function(expr, set, inplace, not){
+	var old = expr, result = [], curLoop = set, match, anyFound,
+		isXMLFilter = set && set[0] && isXML(set[0]);
+
+	while ( expr && set.length ) {
+		for ( var type in Expr.filter ) {
+			if ( (match = Expr.match[ type ].exec( expr )) != null ) {
+				var filter = Expr.filter[ type ], found, item;
+				anyFound = false;
+
+				// The previous pass's output is this pass's input, so start
+				// collecting into a fresh array
+				if ( curLoop == result ) {
+					result = [];
+				}
+
+				// A preFilter may rewrite match, return false after doing the
+				// filtering itself, or return true to skip this filter type
+				if ( Expr.preFilter[ type ] ) {
+					match = Expr.preFilter[ type ]( match, curLoop, inplace, result, not, isXMLFilter );
+
+					if ( !match ) {
+						anyFound = found = true;
+					} else if ( match === true ) {
+						continue;
+					}
+				}
+
+				if ( match ) {
+					for ( var i = 0; (item = curLoop[i]) != null; i++ ) {
+						if ( item ) {
+							found = filter( item, match, i, curLoop );
+							// XOR with not inverts the outcome when requested
+							var pass = not ^ !!found;
+
+							if ( inplace && found != null ) {
+								if ( pass ) {
+									anyFound = true;
+								} else {
+									curLoop[i] = false;
+								}
+							} else if ( pass ) {
+								result.push( item );
+								anyFound = true;
+							}
+						}
+					}
+				}
+
+				// The filter produced an answer: consume its text from expr
+				if ( found !== undefined ) {
+					if ( !inplace ) {
+						curLoop = result;
+					}
+
+					expr = expr.replace( Expr.match[ type ], "" );
+
+					if ( !anyFound ) {
+						return [];
+					}
+
+					break;
+				}
+			}
+		}
+
+		// Improper expression
+		if ( expr == old ) {
+			if ( anyFound == null ) {
+				throw "Syntax error, unrecognized expression: " + expr;
+			} else {
+				break;
+			}
+		}
+
+		old = expr;
+	}
+
+	return curLoop;
+};
+
+var Expr = Sizzle.selectors = {
+	order: [ "ID", "NAME", "TAG" ],
+	// Patterns recognising each kind of selector piece. Every entry gets two
+	// lookaheads appended by the loop that follows this object literal.
+	match: {
+		// #id
+		ID: /#((?:[\w\u00c0-\uFFFF_-]|\\.)+)/,
+		// .class
+		CLASS: /\.((?:[\w\u00c0-\uFFFF_-]|\\.)+)/,
+		// [name=value], value optionally quoted
+		NAME: /\[name=['"]*((?:[\w\u00c0-\uFFFF_-]|\\.)+)['"]*\]/,
+		// [attr] or [attr<op>value]; groups: 1 name, 2 operator, 3 quote, 4 value
+		ATTR: /\[\s*((?:[\w\u00c0-\uFFFF_-]|\\.)+)\s*(?:(\S?=)\s*(['"]*)(.*?)\3|)\s*\]/,
+		// Tag name (or *) at the very start of the expression
+		TAG: /^((?:[\w\u00c0-\uFFFF\*_-]|\\.)+)/,
+		// :only-child, :first-child, :last-child, :nth-child(...)
+		CHILD: /:(only|nth|last|first)-child(?:\((even|odd|[\dn+-]*)\))?/,
+		// Positional pseudos such as :eq(n), :first, :even (not followed by "-")
+		POS: /:(nth|eq|gt|lt|first|last|even|odd)(?:\((\d*)\))?(?=[^-]|$)/,
+		// Any other :name or :name(argument); groups: 1 name, 2 quote, 3 argument
+		PSEUDO: /:((?:[\w\u00c0-\uFFFF_-]|\\.)+)(?:\((['"]*)((?:\([^\)]+\)|[^\2\(\)]*)+)\2\))?/
+	},
+	attrMap: {
+		"class": "className",
+		"for": "htmlFor"
+	},
+	// Per-attribute readers consulted by the ATTR filter before it falls
+	// back to the property or getAttribute
+	attrHandle: {
+		// href is always read through getAttribute
+		href: function(elem){
+			return elem.getAttribute("href");
+		}
+	},
+	// Combinator handlers. Each one rewrites checkSet in place: entry i is
+	// replaced by the related node that satisfied part (or true when part is
+	// a node and matched), or by false when the relation does not hold.
+	relative: {
+		// "+": relate each entry to its closest preceding element sibling
+		"+": function(checkSet, part, isXML){
+			var isPartStr = typeof part === "string",
+				isTag = isPartStr && !/\W/.test(part),
+				isPartStrNotTag = isPartStr && !isTag;
+
+			// nodeName is compared in upper case outside XML documents
+			if ( isTag && !isXML ) {
+				part = part.toUpperCase();
+			}
+
+			for ( var i = 0, l = checkSet.length, elem; i < l; i++ ) {
+				if ( (elem = checkSet[i]) ) {
+					// Walk back to the nearest element node (or run out of siblings)
+					while ( (elem = elem.previousSibling) && elem.nodeType !== 1 ) {}
+
+					checkSet[i] = isPartStrNotTag || elem && elem.nodeName === part ?
+						elem || false :
+						elem === part;
+				}
+			}
+
+			// A non-tag selector string still has to be tested against the siblings
+			if ( isPartStrNotTag ) {
+				Sizzle.filter( part, checkSet, true );
+			}
+		},
+		// ">": relate each entry to its parent node
+		">": function(checkSet, part, isXML){
+			var isPartStr = typeof part === "string";
+
+			// Plain tag name: compare the parent's nodeName directly
+			if ( isPartStr && !/\W/.test(part) ) {
+				part = isXML ? part : part.toUpperCase();
+
+				for ( var i = 0, l = checkSet.length; i < l; i++ ) {
+					var elem = checkSet[i];
+					if ( elem ) {
+						var parent = elem.parentNode;
+						checkSet[i] = parent.nodeName === part ? parent : false;
+					}
+				}
+			} else {
+				for ( var i = 0, l = checkSet.length; i < l; i++ ) {
+					var elem = checkSet[i];
+					if ( elem ) {
+						checkSet[i] = isPartStr ?
+							elem.parentNode :
+							elem.parentNode === part;
+					}
+				}
+
+				// Selector string: filter the collected parents in place
+				if ( isPartStr ) {
+					Sizzle.filter( part, checkSet, true );
+				}
+			}
+		},
+		// "": no explicit combinator; walks the parentNode chain
+		"": function(checkSet, part, isXML){
+			var doneName = done++, checkFn = dirCheck;
+
+			// Plain tag names take the nodeName-only comparison path
+			if ( !part.match(/\W/) ) {
+				var nodeCheck = part = isXML ? part : part.toUpperCase();
+				checkFn = dirNodeCheck;
+			}
+
+			checkFn("parentNode", part, doneName, checkSet, nodeCheck, isXML);
+		},
+		// "~": walks the previousSibling chain
+		"~": function(checkSet, part, isXML){
+			var doneName = done++, checkFn = dirCheck;
+
+			if ( typeof part === "string" && !part.match(/\W/) ) {
+				var nodeCheck = part = isXML ? part : part.toUpperCase();
+				checkFn = dirNodeCheck;
+			}
+
+			checkFn("previousSibling", part, doneName, checkSet, nodeCheck, isXML);
+		}
+	},
+	find: {
+		ID: function(match, context, isXML){
+			if ( typeof context.getElementById !== "undefined" && !isXML ) {
+				var m = context.getElementById(match[1]);
+				return m ? [m] : [];
+			}
+		},
+		NAME: function(match, context, isXML){
+			if ( typeof context.getElementsByName !== "undefined" ) {
+				var ret = [], results = context.getElementsByName(match[1]);
+
+				for ( var i = 0, l = results.length; i < l; i++ ) {
+					if ( results[i].getAttribute("name") === match[1] ) {
+						ret.push( results[i] );
+					}
+				}
+
+				return ret.length === 0 ? null : ret;
+			}
+		},
+		TAG: function(match, context){
+			return context.getElementsByTagName(match[1]);
+		}
+	},
+	// Hooks run by Sizzle.filter before the per-element filter. Each returns
+	// the (possibly rewritten) match to hand to the filter, false when it
+	// already did the filtering itself, or true to make Sizzle.filter skip
+	// this filter type.
+	preFilter: {
+		// For XML, returns the space-padded class name for the CLASS filter;
+		// otherwise filters by className right here and returns false
+		CLASS: function(match, curLoop, inplace, result, not, isXML){
+			match = " " + match[1].replace(/\\/g, "") + " ";
+
+			if ( isXML ) {
+				return match;
+			}
+
+			for ( var i = 0, elem; (elem = curLoop[i]) != null; i++ ) {
+				if ( elem ) {
+					if ( not ^ (elem.className && (" " + elem.className + " ").indexOf(match) >= 0) ) {
+						if ( !inplace )
+							result.push( elem );
+					} else if ( inplace ) {
+						curLoop[i] = false;
+					}
+				}
+			}
+
+			return false;
+		},
+		// Returns the ID with backslash escapes removed
+		ID: function(match){
+			return match[1].replace(/\\/g, "");
+		},
+		// Returns the tag name, upper-cased unless the set belongs to an XML document
+		TAG: function(match, curLoop){
+			// Skip entries already knocked out (false) to find a node to test
+			for ( var i = 0; curLoop[i] === false; i++ ){}
+			return curLoop[i] && isXML(curLoop[i]) ? match[1] : match[1].toUpperCase();
+		},
+		// Turns an nth-child argument into numeric match[2] (first) and
+		// match[3] (last), and stores a unique cache key in match[0]
+		CHILD: function(match){
+			if ( match[1] == "nth" ) {
+				// parse equations like 'even', 'odd', '5', '2n', '3n+2', '4n-1', '-n+6'
+				var test = /(-?)(\d*)n((?:\+|-)?\d*)/.exec(
+					match[2] == "even" && "2n" || match[2] == "odd" && "2n+1" ||
+					!/\D/.test( match[2] ) && "0n+" + match[2] || match[2]);
+
+				// calculate the numbers (first)n+(last) including if they are negative
+				match[2] = (test[1] + (test[2] || 1)) - 0;
+				match[3] = test[3] - 0;
+			}
+
+			// TODO: Move to normal caching system
+			match[0] = done++;
+
+			return match;
+		},
+		// Maps the attribute name through attrMap (non-XML only) and pads the
+		// value with spaces for the ~= operator
+		ATTR: function(match, curLoop, inplace, result, not, isXML){
+			var name = match[1].replace(/\\/g, "");
+			
+			if ( !isXML && Expr.attrMap[name] ) {
+				match[1] = Expr.attrMap[name];
+			}
+
+			if ( match[2] === "~=" ) {
+				match[4] = " " + match[4] + " ";
+			}
+
+			return match;
+		},
+		// Resolves :not(...) and defers positional / child pseudos to their own filters
+		PSEUDO: function(match, curLoop, inplace, result, not){
+			if ( match[1] === "not" ) {
+				// If we're dealing with a complex expression, or a simple one
+				if ( match[3].match(chunker).length > 1 || /^\w/.test(match[3]) ) {
+					// Replace the argument with the nodes it selects from curLoop
+					match[3] = Sizzle(match[3], null, null, curLoop);
+				} else {
+					var ret = Sizzle.filter(match[3], curLoop, inplace, true ^ not);
+					if ( !inplace ) {
+						result.push.apply( result, ret );
+					}
+					return false;
+				}
+			} else if ( Expr.match.POS.test( match[0] ) || Expr.match.CHILD.test( match[0] ) ) {
+				return true;
+			}
+			
+			return match;
+		},
+		// Prepends true so that every captured group moves up one index
+		POS: function(match){
+			match.unshift( true );
+			return match;
+		}
+	},
+	filters: {
+		enabled: function(elem){
+			return elem.disabled === false && elem.type !== "hidden";
+		},
+		disabled: function(elem){
+			return elem.disabled === true;
+		},
+		checked: function(elem){
+			return elem.checked === true;
+		},
+		selected: function(elem){
+			// Accessing this property makes selected-by-default
+			// options in Safari work properly
+			elem.parentNode.selectedIndex;
+			return elem.selected === true;
+		},
+		parent: function(elem){
+			return !!elem.firstChild;
+		},
+		empty: function(elem){
+			return !elem.firstChild;
+		},
+		has: function(elem, i, match){
+			return !!Sizzle( match[3], elem ).length;
+		},
+		header: function(elem){
+			return /h\d/i.test( elem.nodeName );
+		},
+		text: function(elem){
+			return "text" === elem.type;
+		},
+		radio: function(elem){
+			return "radio" === elem.type;
+		},
+		checkbox: function(elem){
+			return "checkbox" === elem.type;
+		},
+		file: function(elem){
+			return "file" === elem.type;
+		},
+		password: function(elem){
+			return "password" === elem.type;
+		},
+		submit: function(elem){
+			return "submit" === elem.type;
+		},
+		image: function(elem){
+			return "image" === elem.type;
+		},
+		reset: function(elem){
+			return "reset" === elem.type;
+		},
+		button: function(elem){
+			return "button" === elem.type || elem.nodeName.toUpperCase() === "BUTTON";
+		},
+		input: function(elem){
+			return /input|select|textarea|button/i.test(elem.nodeName);
+		}
+	},
+	setFilters: {
+		first: function(elem, i){
+			return i === 0;
+		},
+		last: function(elem, i, match, array){
+			return i === array.length - 1;
+		},
+		even: function(elem, i){
+			return i % 2 === 0;
+		},
+		odd: function(elem, i){
+			return i % 2 === 1;
+		},
+		lt: function(elem, i, match){
+			return i < match[3] - 0;
+		},
+		gt: function(elem, i, match){
+			return i > match[3] - 0;
+		},
+		nth: function(elem, i, match){
+			return match[3] - 0 == i;
+		},
+		eq: function(elem, i, match){
+			return match[3] - 0 == i;
+		}
+	},
+	// Per-element tests, one per kind of selector piece. Each is called by
+	// Sizzle.filter with the element and the (pre-filtered) match and returns
+	// a truthy value when the element passes.
+	filter: {
+		// :name pseudos - a registered Expr.filters entry, :contains or :not
+		PSEUDO: function(elem, match, i, array){
+			var name = match[1], filter = Expr.filters[ name ];
+
+			if ( filter ) {
+				return filter( elem, i, match, array );
+			} else if ( name === "contains" ) {
+				return (elem.textContent || elem.innerText || "").indexOf(match[3]) >= 0;
+			} else if ( name === "not" ) {
+				// match[3] holds a list of nodes here; the element passes
+				// when it is not one of them
+				var not = match[3];
+
+				for ( var i = 0, l = not.length; i < l; i++ ) {
+					if ( not[i] === elem ) {
+						return false;
+					}
+				}
+
+				return true;
+			}
+		},
+		// :first-child, :last-child, :only-child and :nth-child
+		CHILD: function(elem, match){
+			var type = match[1], node = elem;
+			switch (type) {
+				case 'only':
+				case 'first':
+					// No element sibling may come before elem
+					while (node = node.previousSibling)  {
+						if ( node.nodeType === 1 ) return false;
+					}
+					if ( type == 'first') return true;
+					// 'only' falls through to also run the 'last' check
+					node = elem;
+				case 'last':
+					// No element sibling may come after elem
+					while (node = node.nextSibling)  {
+						if ( node.nodeType === 1 ) return false;
+					}
+					return true;
+				case 'nth':
+					var first = match[2], last = match[3];
+
+					// 1n+0 matches every element
+					if ( first == 1 && last == 0 ) {
+						return true;
+					}
+					
+					var doneName = match[0],
+						parent = elem.parentNode;
+	
+					// Number the parent's element children once per doneName
+					// and remember that on the parent via sizcache
+					if ( parent && (parent.sizcache !== doneName || !elem.nodeIndex) ) {
+						var count = 0;
+						for ( node = parent.firstChild; node; node = node.nextSibling ) {
+							if ( node.nodeType === 1 ) {
+								node.nodeIndex = ++count;
+							}
+						} 
+						parent.sizcache = doneName;
+					}
+					
+					// Passes when nodeIndex = first*k + last for some k >= 0
+					var diff = elem.nodeIndex - last;
+					if ( first == 0 ) {
+						return diff == 0;
+					} else {
+						return ( diff % first == 0 && diff / first >= 0 );
+					}
+			}
+		},
+		// match is the ID string returned by preFilter.ID
+		ID: function(elem, match){
+			return elem.nodeType === 1 && elem.getAttribute("id") === match;
+		},
+		// match is the tag name returned by preFilter.TAG
+		TAG: function(elem, match){
+			return (match === "*" && elem.nodeType === 1) || elem.nodeName === match;
+		},
+		// match is the space-padded class name returned by preFilter.CLASS
+		CLASS: function(elem, match){
+			return (" " + (elem.className || elem.getAttribute("class")) + " ")
+				.indexOf( match ) > -1;
+		},
+		// [attr], [attr=v], [attr!=v], [attr*=v], [attr~=v], [attr^=v],
+		// [attr$=v] and [attr|=v]
+		ATTR: function(elem, match){
+			var name = match[1],
+				// Value source: attrHandle reader, then the property, then getAttribute
+				result = Expr.attrHandle[ name ] ?
+					Expr.attrHandle[ name ]( elem ) :
+					elem[ name ] != null ?
+						elem[ name ] :
+						elem.getAttribute( name ),
+				value = result + "",
+				type = match[2],
+				check = match[4];
+
+			// A missing attribute only satisfies "!="; otherwise the operator
+			// selects the comparison, evaluated in the order written
+			return result == null ?
+				type === "!=" :
+				type === "=" ?
+				value === check :
+				type === "*=" ?
+				value.indexOf(check) >= 0 :
+				type === "~=" ?
+				(" " + value + " ").indexOf(check) >= 0 :
+				!check ?
+				value && result !== false :
+				type === "!=" ?
+				value != check :
+				type === "^=" ?
+				value.indexOf(check) === 0 :
+				type === "$=" ?
+				value.substr(value.length - check.length) === check :
+				type === "|=" ?
+				value === check || value.substr(0, check.length + 1) === check + "-" :
+				false;
+		},
+		// Positional pseudos; match was shifted by preFilter.POS, so the name
+		// sits at index 2. Unknown names yield undefined.
+		POS: function(elem, match, i, array){
+			var name = match[2], filter = Expr.setFilters[ name ];
+
+			if ( filter ) {
+				return filter( elem, i, match, array );
+			}
+		}
+	}
+};
+
+// Keep a reference to the POS pattern as written; the loop below replaces
+// every entry of Expr.match with an extended copy
+var origPOS = Expr.match.POS;
+
+// Append two negative lookaheads to each pattern: no match when the text that
+// follows reaches a "]" before any "[", or a ")" before any "("
+for ( var type in Expr.match ) {
+	Expr.match[ type ] = RegExp( Expr.match[ type ].source + /(?![^\[]*\])(?![^\(]*\))/.source );
+}
+
+var makeArray = function(array, results) {
+	array = Array.prototype.slice.call( array );
+
+	if ( results ) {
+		results.push.apply( results, array );
+		return results;
+	}
+	
+	return array;
+};
+
+// Perform a simple check to determine if the browser is capable of
+// converting a NodeList to an array using builtin methods.
+try {
+	Array.prototype.slice.call( document.documentElement.childNodes );
+
+// Provide a fallback method if it does not work
+} catch(e){
+	// Same contract as the slice-based makeArray: entries are appended to
+	// results when it is given, otherwise a new array is returned
+	makeArray = function(array, results) {
+		var ret = results || [];
+
+		if ( toString.call(array) === "[object Array]" ) {
+			Array.prototype.push.apply( ret, array );
+		} else {
+			if ( typeof array.length === "number" ) {
+				for ( var i = 0, l = array.length; i < l; i++ ) {
+					ret.push( array[i] );
+				}
+			} else {
+				// No usable length: copy until the first falsy entry
+				for ( var i = 0; array[i]; i++ ) {
+					ret.push( array[i] );
+				}
+			}
+		}
+
+		return ret;
+	};
+}
+
+var sortOrder;
+
+if ( document.documentElement.compareDocumentPosition ) {
+	sortOrder = function( a, b ) {
+		var ret = a.compareDocumentPosition(b) & 4 ? -1 : a === b ? 0 : 1;
+		if ( ret === 0 ) {
+			hasDuplicate = true;
+		}
+		return ret;
+	};
+} else if ( "sourceIndex" in document.documentElement ) {
+	sortOrder = function( a, b ) {
+		var ret = a.sourceIndex - b.sourceIndex;
+		if ( ret === 0 ) {
+			hasDuplicate = true;
+		}
+		return ret;
+	};
+} else if ( document.createRange ) {
+	sortOrder = function( a, b ) {
+		var aRange = a.ownerDocument.createRange(), bRange = b.ownerDocument.createRange();
+		aRange.selectNode(a);
+		aRange.collapse(true);
+		bRange.selectNode(b);
+		bRange.collapse(true);
+		var ret = aRange.compareBoundaryPoints(Range.START_TO_END, bRange);
+		if ( ret === 0 ) {
+			hasDuplicate = true;
+		}
+		return ret;
+	};
+}
+
+// Check to see if the browser returns elements by name when
+// querying by getElementById (and provide a workaround)
+(function(){
+	// We're going to inject a fake input element with a specified name
+	var form = document.createElement("form"),
+		id = "script" + (new Date).getTime();
+	form.innerHTML = "<input name='" + id + "'/>";
+
+	// Inject it into the root element, check its status, and remove it quickly
+	var root = document.documentElement;
+	root.insertBefore( form, root.firstChild );
+
+	// The workaround has to do additional checks after a getElementById
+	// Which slows things down for other browsers (hence the branching)
+	if ( !!document.getElementById( id ) ) {
+		// Accept the node only when its id really equals the requested one;
+		// returns undefined for a name-only hit so another finder is tried
+		Expr.find.ID = function(match, context, isXML){
+			if ( typeof context.getElementById !== "undefined" && !isXML ) {
+				var m = context.getElementById(match[1]);
+				return m ? m.id === match[1] || typeof m.getAttributeNode !== "undefined" && m.getAttributeNode("id").nodeValue === match[1] ? [m] : undefined : [];
+			}
+		};
+
+		// Compare against the id attribute node instead of getAttribute("id")
+		Expr.filter.ID = function(elem, match){
+			var node = typeof elem.getAttributeNode !== "undefined" && elem.getAttributeNode("id");
+			return elem.nodeType === 1 && node && node.nodeValue === match;
+		};
+	}
+
+	root.removeChild( form );
+})();
+
+// Two feature tests on a scratch div: comment nodes leaking into
+// getElementsByTagName("*"), and getAttribute("href") not returning the
+// attribute as written. Each installs a replacement handler when needed.
+(function(){
+	// Check to see if the browser returns only elements
+	// when doing getElementsByTagName("*")
+
+	// Create a fake element
+	var div = document.createElement("div");
+	div.appendChild( document.createComment("") );
+
+	// Make sure no comments are found
+	if ( div.getElementsByTagName("*").length > 0 ) {
+		Expr.find.TAG = function(match, context){
+			var results = context.getElementsByTagName(match[1]);
+
+			// Filter out possible comments
+			if ( match[1] === "*" ) {
+				var tmp = [];
+
+				for ( var i = 0; results[i]; i++ ) {
+					if ( results[i].nodeType === 1 ) {
+						tmp.push( results[i] );
+					}
+				}
+
+				results = tmp;
+			}
+
+			return results;
+		};
+	}
+
+	// Check to see if an attribute returns normalized href attributes
+	div.innerHTML = "<a href='#'></a>";
+	if ( div.firstChild && typeof div.firstChild.getAttribute !== "undefined" &&
+			div.firstChild.getAttribute("href") !== "#" ) {
+		// Pass 2 as the second getAttribute argument when reading href
+		Expr.attrHandle.href = function(elem){
+			return elem.getAttribute("href", 2);
+		};
+	}
+})();
+
+// When querySelectorAll exists and passes the class-name test below, wrap
+// Sizzle so that document-level queries try the native engine first and
+// fall back to the original implementation if it throws.
+if ( document.querySelectorAll ) (function(){
+	var oldSizzle = Sizzle, div = document.createElement("div");
+	div.innerHTML = "<p class='TEST'></p>";
+
+	// Safari can't handle uppercase or unicode characters when
+	// in quirks mode.
+	if ( div.querySelectorAll && div.querySelectorAll(".TEST").length === 0 ) {
+		return;
+	}
+	
+	Sizzle = function(query, context, extra, seed){
+		context = context || document;
+
+		// Only use querySelectorAll on non-XML documents
+		// (ID selectors don't work in non-HTML documents)
+		if ( !seed && context.nodeType === 9 && !isXML(context) ) {
+			try {
+				return makeArray( context.querySelectorAll(query), extra );
+			} catch(e){}
+		}
+		
+		return oldSizzle(query, context, extra, seed);
+	};
+
+	// Carry the static members over to the wrapper
+	Sizzle.find = oldSizzle.find;
+	Sizzle.filter = oldSizzle.filter;
+	Sizzle.selectors = oldSizzle.selectors;
+	Sizzle.matches = oldSizzle.matches;
+})();
+
+// Register a CLASS finder backed by getElementsByClassName, but only when
+// the native method passes the two sanity checks below.
+if ( document.getElementsByClassName && document.documentElement.getElementsByClassName ) (function(){
+	var div = document.createElement("div");
+	div.innerHTML = "<div class='test e'></div><div class='test'></div>";
+
+	// Opera can't find a second classname (in 9.6)
+	if ( div.getElementsByClassName("e").length === 0 )
+		return;
+
+	// Safari caches class attributes, doesn't catch changes (in 3.2)
+	div.lastChild.className = "e";
+
+	if ( div.getElementsByClassName("e").length === 1 )
+		return;
+
+	// Insert CLASS at index 1 of Expr.order, i.e. right after its first entry
+	Expr.order.splice(1, 0, "CLASS");
+	Expr.find.CLASS = function(match, context, isXML) {
+		if ( typeof context.getElementsByClassName !== "undefined" && !isXML ) {
+			return context.getElementsByClassName(match[1]);
+		}
+	};
+})();
+
+// For every entry of checkSet, walk along dir ("parentNode" or
+// "previousSibling") looking for a node whose nodeName equals cur, and
+// replace the entry with that node or with false.
+//  doneName  - unique value for this pass, stamped on visited nodes as sizcache
+//  nodeCheck - accepted for signature parity with dirCheck; not read here
+//  isXML     - when truthy, no sizcache/sizset expandos are written
+function dirNodeCheck( dir, cur, doneName, checkSet, nodeCheck, isXML ) {
+	var sibDir = dir == "previousSibling" && !isXML;
+	for ( var i = 0, l = checkSet.length; i < l; i++ ) {
+		var elem = checkSet[i];
+		if ( elem ) {
+			// When walking siblings, the starting element is marked as well
+			if ( sibDir && elem.nodeType === 1 ){
+				elem.sizcache = doneName;
+				elem.sizset = i;
+			}
+			elem = elem[dir];
+			var match = false;
+
+			while ( elem ) {
+				// Already visited in this pass: reuse the answer recorded
+				// for the entry that reached this node first
+				if ( elem.sizcache === doneName ) {
+					match = checkSet[elem.sizset];
+					break;
+				}
+
+				if ( elem.nodeType === 1 && !isXML ){
+					elem.sizcache = doneName;
+					elem.sizset = i;
+				}
+
+				if ( elem.nodeName === cur ) {
+					match = elem;
+					break;
+				}
+
+				elem = elem[dir];
+			}
+
+			checkSet[i] = match;
+		}
+	}
+}
+
+// Like dirNodeCheck, but cur is either a node (entry becomes true when that
+// exact node is reached) or a selector string (entry becomes the first
+// element along dir that passes Sizzle.filter). Entries with no hit become
+// false.
+//  doneName  - unique value for this pass, stamped on visited nodes as sizcache
+//  nodeCheck - not read by this function
+//  isXML     - when truthy, no sizcache/sizset expandos are written
+function dirCheck( dir, cur, doneName, checkSet, nodeCheck, isXML ) {
+	var sibDir = dir == "previousSibling" && !isXML;
+	for ( var i = 0, l = checkSet.length; i < l; i++ ) {
+		var elem = checkSet[i];
+		if ( elem ) {
+			// When walking siblings, the starting element is marked as well
+			if ( sibDir && elem.nodeType === 1 ) {
+				elem.sizcache = doneName;
+				elem.sizset = i;
+			}
+			elem = elem[dir];
+			var match = false;
+
+			while ( elem ) {
+				// Already visited in this pass: reuse the recorded answer
+				if ( elem.sizcache === doneName ) {
+					match = checkSet[elem.sizset];
+					break;
+				}
+
+				if ( elem.nodeType === 1 ) {
+					if ( !isXML ) {
+						elem.sizcache = doneName;
+						elem.sizset = i;
+					}
+					if ( typeof cur !== "string" ) {
+						if ( elem === cur ) {
+							match = true;
+							break;
+						}
+
+					} else if ( Sizzle.filter( cur, [elem] ).length > 0 ) {
+						match = elem;
+						break;
+					}
+				}
+
+				elem = elem[dir];
+			}
+
+			checkSet[i] = match;
+		}
+	}
+}
+
+var contains = document.compareDocumentPosition ?  function(a, b){
+	return a.compareDocumentPosition(b) & 16;
+} : function(a, b){
+	return a !== b && (a.contains ? a.contains(b) : true);
+};
+
+var isXML = function(elem){
+	return elem.nodeType === 9 && elem.documentElement.nodeName !== "HTML" ||
+		!!elem.ownerDocument && isXML( elem.ownerDocument );
+};
+
+var posProcess = function(selector, context){
+	var tmpSet = [], later = "", match,
+		root = context.nodeType ? [context] : context;
+
+	// Position selectors must be done after the filter
+	// And so must :not(positional) so we move all PSEUDOs to the end
+	while ( (match = Expr.match.PSEUDO.exec( selector )) ) {
+		later += match[0];
+		selector = selector.replace( Expr.match.PSEUDO, "" );
+	}
+
+	selector = Expr.relative[selector] ? selector + "*" : selector;
+
+	for ( var i = 0, l = root.length; i < l; i++ ) {
+		Sizzle( selector, root[i], tmpSet );
+	}
+
+	return Sizzle.filter( later, tmpSet );
+};
+
+// EXPOSE
+jQuery.find = Sizzle;
+jQuery.filter = Sizzle.filter;
+jQuery.expr = Sizzle.selectors;
+jQuery.expr[":"] = jQuery.expr.filters;
+
+Sizzle.selectors.filters.hidden = function(elem){
+	return elem.offsetWidth === 0 || elem.offsetHeight === 0;
+};
+
+Sizzle.selectors.filters.visible = function(elem){
+	return elem.offsetWidth > 0 || elem.offsetHeight > 0;
+};
+
+Sizzle.selectors.filters.animated = function(elem){
+	return jQuery.grep(jQuery.timers, function(fn){
+		return elem === fn.elem;
+	}).length;
+};
+
+jQuery.multiFilter = function( expr, elems, not ) {
+	if ( not ) {
+		expr = ":not(" + expr + ")";
+	}
+
+	return Sizzle.matches(expr, elems);
+};
+
+jQuery.dir = function( elem, dir ){
+	var matched = [], cur = elem[dir];
+	while ( cur && cur != document ) {
+		if ( cur.nodeType == 1 )
+			matched.push( cur );
+		cur = cur[dir];
+	}
+	return matched;
+};
+
+jQuery.nth = function(cur, result, dir, elem){
+	result = result || 1;
+	var num = 0;
+
+	for ( ; cur; cur = cur[dir] )
+		if ( cur.nodeType == 1 && ++num == result )
+			break;
+
+	return cur;
+};
+
+jQuery.sibling = function(n, elem){
+	var r = [];
+
+	for ( ; n; n = n.nextSibling ) {
+		if ( n.nodeType == 1 && n != elem )
+			r.push( n );
+	}
+
+	return r;
+};
+
+// The early return ends the closure here, so the window.Sizzle assignment
+// below is never executed.
+return;
+
+window.Sizzle = Sizzle;
+
+})();
+/*
+ * A number of helper functions used for managing events.
+ * Many of the ideas behind this code originated from
+ * Dean Edwards' addEvent library.
+ */
+jQuery.event = {
+
+	// Bind an event to an element
+	// Original by Dean Edwards
+	//  elem    - node to bind to (text and comment nodes are ignored)
+	//  types   - one or more space separated event types, each optionally
+	//            followed by ".namespace" parts
+	//  handler - function to register; it is given a guid if it has none
+	//  data    - optional value stored as handler.data on a proxy of handler
+	add: function(elem, types, handler, data) {
+		if ( elem.nodeType == 3 || elem.nodeType == 8 )
+			return;
+
+		// For whatever reason, IE has trouble passing the window object
+		// around, causing it to be cloned in the process
+		if ( elem.setInterval && elem != window )
+			elem = window;
+
+		// Make sure that the function being executed has a unique ID
+		if ( !handler.guid )
+			handler.guid = this.guid++;
+
+		// if data is passed, bind to handler
+		if ( data !== undefined ) {
+			// Create temporary function pointer to original handler
+			var fn = handler;
+
+			// Create unique handler function, wrapped around original handler
+			handler = this.proxy( fn );
+
+			// Store data in unique handler
+			handler.data = data;
+		}
+
+		// Init the element's event structure
+		// ("events" maps type -> handlers by guid; "handle" is the single
+		// native listener shared by all types on this element)
+		var events = jQuery.data(elem, "events") || jQuery.data(elem, "events", {}),
+			handle = jQuery.data(elem, "handle") || jQuery.data(elem, "handle", function(){
+				// Handle the second event of a trigger and when
+				// an event is called after a page has unloaded
+				return typeof jQuery !== "undefined" && !jQuery.event.triggered ?
+					jQuery.event.handle.apply(arguments.callee.elem, arguments) :
+					undefined;
+			});
+		// Add elem as a property of the handle function
+		// This is to prevent a memory leak with non-native
+		// event in IE.
+		handle.elem = elem;
+
+		// Handle multiple events separated by a space
+		// jQuery(...).bind("mouseover mouseout", fn);
+		jQuery.each(types.split(/\s+/), function(index, type) {
+			// Namespaced event handlers
+			var namespaces = type.split(".");
+			type = namespaces.shift();
+			// The sorted, dot-joined namespaces are kept on the handler as .type
+			handler.type = namespaces.slice().sort().join(".");
+
+			// Get the current list of functions bound to this event
+			var handlers = events[type];
+			
+			// specialAll setup runs on every bind of this type
+			if ( jQuery.event.specialAll[type] )
+				jQuery.event.specialAll[type].setup.call(elem, data, namespaces);
+
+			// Init the event handler queue
+			if (!handlers) {
+				handlers = events[type] = {};
+
+				// Check for a special event handler
+				// Only use addEventListener/attachEvent if the special
+				// events handler returns false
+				if ( !jQuery.event.special[type] || jQuery.event.special[type].setup.call(elem, data, namespaces) === false ) {
+					// Bind the global event handler to the element
+					if (elem.addEventListener)
+						elem.addEventListener(type, handle, false);
+					else if (elem.attachEvent)
+						elem.attachEvent("on" + type, handle);
+				}
+			}
+
+			// Add the function to the element's handler list
+			handlers[handler.guid] = handler;
+
+			// Keep track of which events have been used, for global triggering
+			jQuery.event.global[type] = true;
+		});
+
+		// Nullify elem to prevent memory leaks in IE
+		elem = null;
+	},
+
+	guid: 1,
+	global: {},
+
+	// Detach an event or set of events from an element
+	remove: function(elem, types, handler) {
+		// don't do events on text and comment nodes
+		if ( elem.nodeType == 3 || elem.nodeType == 8 )
+			return;
+
+		var events = jQuery.data(elem, "events"), ret, index;
+
+		if ( events ) {
+			// Unbind all events for the element
+			if ( types === undefined || (typeof types === "string" && types.charAt(0) == ".") )
+				for ( var type in events )
+					this.remove( elem, type + (types || "") );
+			else {
+				// types is actually an event object here
+				if ( types.type ) {
+					handler = types.handler;
+					types = types.type;
+				}
+
+				// Handle multiple events seperated by a space
+				// jQuery(...).unbind("mouseover mouseout", fn);
+				jQuery.each(types.split(/\s+/), function(index, type){
+					// Namespaced event handlers
+					var namespaces = type.split(".");
+					type = namespaces.shift();
+					var namespace = RegExp("(^|\\.)" + namespaces.slice().sort().join(".*\\.") + "(\\.|$)");
+
+					if ( events[type] ) {
+						// remove the given handler for the given type
+						if ( handler )
+							delete events[type][handler.guid];
+
+						// remove all handlers for the given type
+						else
+							for ( var handle in events[type] )
+								// Handle the removal of namespaced events
+								if ( namespace.test(events[type][handle].type) )
+									delete events[type][handle];
+									
+						if ( jQuery.event.specialAll[type] )
+							jQuery.event.specialAll[type].teardown.call(elem, namespaces);
+
+						// remove generic event handler if no more handlers exist
+						for ( ret in events[type] ) break;
+						if ( !ret ) {
+							if ( !jQuery.event.special[type] || jQuery.event.special[type].teardown.call(elem, namespaces) === false ) {
+								if (elem.removeEventListener)
+									elem.removeEventListener(type, jQuery.data(elem, "handle"), false);
+								else if (elem.detachEvent)
+									elem.detachEvent("on" + type, jQuery.data(elem, "handle"));
+							}
+							ret = null;
+							delete events[type];
+						}
+					}
+				});
+			}
+
+			// Remove the expando if it's no longer used
+			for ( ret in events ) break;
+			if ( !ret ) {
+				var handle = jQuery.data( elem, "handle" );
+				if ( handle ) handle.elem = null;
+				jQuery.removeData( elem, "events" );
+				jQuery.removeData( elem, "handle" );
+			}
+		}
+	},
+
+	// Fire event on elem, or on every cached element bound to its type when elem is omitted; bubbling is internal (set by the recursive call on the parent)
+	trigger: function( event, data, elem, bubbling ) {
+		// Event object or event type
+		var type = event.type || event;
+
+		if( !bubbling ){
+			event = typeof event === "object" ?
+				// jQuery.Event object
+				event[expando] ? event :
+				// Object literal
+				jQuery.extend( jQuery.Event(type), event ) :
+				// Just the event type (string)
+				jQuery.Event(type);
+
+			if ( type.indexOf("!") >= 0 ) { // a "!" marks the event exclusive; the last character is dropped from the type
+				event.type = type = type.slice(0, -1);
+				event.exclusive = true;
+			}
+
+			// Handle a global trigger
+			if ( !elem ) {
+				// Don't bubble custom events when global (to avoid too much overhead)
+				event.stopPropagation();
+				// Only trigger if we've ever bound an event for it
+				if ( this.global[type] )
+					jQuery.each( jQuery.cache, function(){
+						if ( this.events && this.events[type] )
+							jQuery.event.trigger( event, data, this.handle.elem );
+					});
+			}
+
+			// Handle triggering a single element
+
+			// don't do events on text and comment nodes (also ends the global case, where elem is missing)
+			if ( !elem || elem.nodeType == 3 || elem.nodeType == 8 )
+				return undefined;
+			
+			// Clean up in case it is reused
+			event.result = undefined;
+			event.target = elem;
+			
+			// Clone the incoming data, if any, and put the event object first
+			data = jQuery.makeArray(data);
+			data.unshift( event );
+		}
+
+		event.currentTarget = elem;
+
+		// Trigger the event, it is assumed that "handle" is a function
+		var handle = jQuery.data(elem, "handle");
+		if ( handle )
+			handle.apply( elem, data );
+
+		// Handle triggering native .onfoo handlers (and on links since we don't call .click() for links)
+		if ( (!elem[type] || (jQuery.nodeName(elem, 'a') && type == "click")) && elem["on"+type] && elem["on"+type].apply( elem, data ) === false )
+			event.result = false;
+
+		// Trigger the native events (except for clicks on links)
+		if ( !bubbling && elem[type] && !event.isDefaultPrevented() && !(jQuery.nodeName(elem, 'a') && type == "click") ) {
+			this.triggered = true;
+			try {
+				elem[ type ]();
+			// prevent IE from throwing an error for some hidden elements
+			} catch (e) {}
+		}
+
+		this.triggered = false;
+
+		if ( !event.isPropagationStopped() ) { // bubble: repeat on the parent node, or on the owner document
+			var parent = elem.parentNode || elem.ownerDocument;
+			if ( parent )
+				jQuery.event.trigger(event, data, parent, true);
+		}
+	},
+
+	handle: function(event) { // run the handlers stored for event.type on `this` (the element)
+		// NOTE(review): nothing is returned from this function; handler results are reported through event.result
+		var all, handlers;
+
+		event = arguments[0] = jQuery.event.fix( event || window.event );
+		event.currentTarget = this;
+		
+		// Namespaced event handlers
+		var namespaces = event.type.split(".");
+		event.type = namespaces.shift();
+
+		// Cache this now, all = true means, any handler
+		all = !namespaces.length && !event.exclusive;
+		
+		var namespace = RegExp("(^|\\.)" + namespaces.slice().sort().join(".*\\.") + "(\\.|$)");
+
+		handlers = ( jQuery.data(this, "events") || {} )[event.type];
+
+		for ( var j in handlers ) {
+			var handler = handlers[j];
+
+			// Filter the functions by class (the namespaces stored in handler.type)
+			if ( all || namespace.test(handler.type) ) {
+				// Pass in a reference to the handler function itself
+				// So that we can later remove it
+				event.handler = handler;
+				event.data = handler.data;
+
+				var ret = handler.apply(this, arguments);
+
+				if( ret !== undefined ){
+					event.result = ret;
+					if ( ret === false ) { // returning false both cancels the default and stops propagation
+						event.preventDefault();
+						event.stopPropagation();
+					}
+				}
+
+				if( event.isImmediatePropagationStopped() )
+					break;
+
+			}
+		}
+	},
+
+	props: "altKey attrChange attrName bubbles button cancelable charCode clientX clientY ctrlKey currentTarget data detail eventPhase fromElement handler keyCode metaKey newValue originalTarget pageX pageY prevValue relatedNode relatedTarget screenX screenY shiftKey srcElement target toElement view wheelDelta which".split(" "), // native event fields that fix() copies onto the jQuery.Event
+
+	fix: function(event) {
+		if ( event[expando] )
+			return event;
+
+		// store a copy of the original event object
+		// and "clone" to set read-only properties
+		var originalEvent = event;
+		event = jQuery.Event( originalEvent );
+
+		for ( var i = this.props.length, prop; i; ){
+			prop = this.props[ --i ];
+			event[ prop ] = originalEvent[ prop ];
+		}
+
+		// Fix target property, if necessary
+		if ( !event.target )
+			event.target = event.srcElement || document; // Fixes #1925 where srcElement might not be defined either
+
+		// check if target is a textnode (safari)
+		if ( event.target.nodeType == 3 )
+			event.target = event.target.parentNode;
+
+		// Add relatedTarget, if necessary
+		if ( !event.relatedTarget && event.fromElement )
+			event.relatedTarget = event.fromElement == event.target ? event.toElement : event.fromElement;
+
+		// Calculate pageX/Y if missing and clientX/Y available
+		if ( event.pageX == null && event.clientX != null ) {
+			var doc = document.documentElement, body = document.body;
+			event.pageX = event.clientX + (doc && doc.scrollLeft || body && body.scrollLeft || 0) - (doc.clientLeft || 0);
+			event.pageY = event.clientY + (doc && doc.scrollTop || body && body.scrollTop || 0) - (doc.clientTop || 0);
+		}
+
+		// Add which for key events
+		if ( !event.which && ((event.charCode || event.charCode === 0) ? event.charCode : event.keyCode) )
+			event.which = event.charCode || event.keyCode;
+
+		// Add metaKey to non-Mac browsers (use ctrl for PC's and Meta for Macs)
+		if ( !event.metaKey && event.ctrlKey )
+			event.metaKey = event.ctrlKey;
+
+		// Add which for click: 1 == left; 2 == middle; 3 == right
+		// Note: button is not normalized, so don't use it
+		if ( !event.which && event.button )
+			event.which = (event.button & 1 ? 1 : ( event.button & 2 ? 3 : ( event.button & 4 ? 2 : 0 ) ));
+
+		return event;
+	},
+
+	proxy: function( fn, proxy ){
+		proxy = proxy || function(){ return fn.apply(this, arguments); };
+		// Set the guid of unique handler to the same of original handler, so it can be removed
+		proxy.guid = fn.guid = fn.guid || proxy.guid || this.guid++;
+		// So proxy can be declared as an argument
+		return proxy;
+	},
+
+	special: { // per-type hooks; remove() skips native unbinding unless teardown returns false
+		ready: {
+			// Make sure the ready event is setup
+			setup: bindReady,
+			teardown: function() {} // nothing to undo
+		}
+	},
+	
+	specialAll: { // hooks whose teardown remove() calls on every removal of the type
+		live: {
+			setup: function( selector, namespaces ){
+				jQuery.event.add( this, namespaces[0], liveHandler ); // namespaces[0] is the type liveConvert() placed after "live."
+			},
+			teardown:  function( namespaces ){
+				if ( namespaces.length ) {
+					var remove = 0, name = RegExp("(^|\\.)" + namespaces[0] + "(\\.|$)");
+					
+					jQuery.each( (jQuery.data(this, "events").live || {}), function(){ // count live handlers still registered for that type
+						if ( name.test(this.type) )
+							remove++;
+					});
+					
+					if ( remove < 1 ) // none left: stop listening with liveHandler
+						jQuery.event.remove( this, namespaces[0], liveHandler );
+				}
+			}
+		}
+	}
+};
+
+jQuery.Event = function( src ){ // src is either a native event object or an event type
+	// Allow instantiation without the 'new' keyword
+	if( !this.preventDefault ) // `this` lacks the prototype method, so we were not called with new
+		return new jQuery.Event(src);
+	
+	// Event object
+	if( src && src.type ){
+		this.originalEvent = src;
+		this.type = src.type;
+	// Event type
+	}else
+		this.type = src;
+
+	// timeStamp is buggy for some events on Firefox(#3843)
+	// So we won't rely on the native value
+	this.timeStamp = now();
+	
+	// Mark it as fixed (event.fix and event.trigger test this flag)
+	this[expando] = true;
+};
+
+function returnFalse(){ // default for the is*() predicates on jQuery.Event.prototype
+	return false;
+}
+function returnTrue(){ // assigned over an is*() predicate once the matching action has been requested
+	return true;
+}
+
+// jQuery.Event is based on DOM3 Events as specified by the ECMAScript Language Binding
+// http://www.w3.org/TR/2003/WD-DOM-Level-3-Events-20030331/ecma-script-binding.html
+jQuery.Event.prototype = {
+	preventDefault: function() {
+		this.isDefaultPrevented = returnTrue; // recorded on this instance even when there is no native event
+
+		var e = this.originalEvent;
+		if( !e )
+			return;
+		// if preventDefault exists run it on the original event
+		if (e.preventDefault)
+			e.preventDefault();
+		// also set the returnValue property of the original event to false (IE); this runs unconditionally
+		e.returnValue = false;
+	},
+	stopPropagation: function() {
+		this.isPropagationStopped = returnTrue; // recorded on this instance even when there is no native event
+
+		var e = this.originalEvent;
+		if( !e )
+			return;
+		// if stopPropagation exists run it on the original event
+		if (e.stopPropagation)
+			e.stopPropagation();
+		// also set the cancelBubble property of the original event to true (IE); this runs unconditionally
+		e.cancelBubble = true;
+	},
+	stopImmediatePropagation:function(){
+		this.isImmediatePropagationStopped = returnTrue; // event.handle stops its handler loop on this flag
+		this.stopPropagation();
+	},
+	isDefaultPrevented: returnFalse,
+	isPropagationStopped: returnFalse,
+	isImmediatePropagationStopped: returnFalse
+};
+// Checks if an event happened on an element within another element
+// Used in jQuery.event.special.mouseenter and mouseleave handlers
+var withinElement = function(event) {
+	// Check if mouse(over|out) are still within the same parent element
+	var parent = event.relatedTarget;
+	// Traverse up the tree until we reach this element or run out of ancestors
+	while ( parent && parent != this )
+		try { parent = parent.parentNode; }
+		catch(e) { parent = this; } // parentNode access threw: treat as inside, so the handler is not run
+	
+	if( parent != this ){
+		// set the correct event type (event.data carries the mouseenter/mouseleave name given at bind time)
+		event.type = event.data;
+		// handle event if we actually just moused on to a non sub-element
+		jQuery.event.handle.apply( this, arguments );
+	}
+};
+	
+jQuery.each({ // native event name -> special event implemented on top of it
+	mouseover: 'mouseenter', 
+	mouseout: 'mouseleave'
+}, function( orig, fix ){
+	jQuery.event.special[ fix ] = {
+		setup: function(){
+			jQuery.event.add( this, orig, withinElement, fix ); // fix is passed as handler data; withinElement reads it as event.data
+		},
+		teardown: function(){
+			jQuery.event.remove( this, orig, withinElement );
+		}
+	};			   
+});
+
+jQuery.fn.extend({ // event methods available on every jQuery set
+	bind: function( type, data, fn ) { // data is optional: bind(type, fn) or bind(type, data, fn)
+		return type == "unload" ? this.one(type, data, fn) : this.each(function(){
+			jQuery.event.add( this, type, fn || data, fn && data );
+		});
+	},
+
+	one: function( type, data, fn ) { // like bind, but the handler unbinds itself before it runs
+		var one = jQuery.event.proxy( fn || data, function(event) {
+			jQuery(this).unbind(event, one);
+			return (fn || data).apply( this, arguments );
+		});
+		return this.each(function(){
+			jQuery.event.add( this, type, one, fn && data);
+		});
+	},
+
+	unbind: function( type, fn ) {
+		return this.each(function(){
+			jQuery.event.remove( this, type, fn );
+		});
+	},
+
+	trigger: function( type, data ) {
+		return this.each(function(){
+			jQuery.event.trigger( type, data, this );
+		});
+	},
+
+	triggerHandler: function( type, data ) { // first element only; returns event.result (undefined for an empty set)
+		if( this[0] ){
+			var event = jQuery.Event(type);
+			event.preventDefault(); // marks the default as prevented before triggering
+			event.stopPropagation(); // marks propagation as stopped before triggering
+			jQuery.event.trigger( event, data, this[0] );
+			return event.result;
+		}		
+	},
+
+	toggle: function( fn ) { // cycle through all passed functions on successive clicks
+		// Save reference to arguments for access in closure
+		var args = arguments, i = 1;
+
+		// link all the functions, so any of them can unbind this click handler
+		while( i < args.length )
+			jQuery.event.proxy( fn, args[i++] );
+
+		return this.click( jQuery.event.proxy( fn, function(event) {
+			// Figure out which function to execute (i now equals the number of functions)
+			this.lastToggle = ( this.lastToggle || 0 ) % i;
+
+			// Make sure that clicks stop
+			event.preventDefault();
+
+			// and execute the function
+			return args[ this.lastToggle++ ].apply( this, arguments ) || false;
+		}));
+	},
+
+	hover: function(fnOver, fnOut) {
+		return this.mouseenter(fnOver).mouseleave(fnOut);
+	},
+
+	ready: function(fn) {
+		// Attach the listeners
+		bindReady();
+
+		// If the DOM is already ready
+		if ( jQuery.isReady )
+			// Execute the function immediately
+			fn.call( document, jQuery );
+
+		// Otherwise, remember the function for later
+		else
+			// Add the function to the wait list
+			jQuery.readyList.push( fn );
+
+		return this;
+	},
+	
+	live: function( type, fn ){ // binds on document under the name built by liveConvert(); the selector is passed as handler data
+		var proxy = jQuery.event.proxy( fn );
+		proxy.guid += this.selector + type; // guid made specific to this selector and type; die() rebuilds the same value
+
+		jQuery(document).bind( liveConvert(type, this.selector), this.selector, proxy );
+
+		return this;
+	},
+	
+	die: function( type, fn ){ // without fn, null is passed as the handler to unbind
+		jQuery(document).unbind( liveConvert(type, this.selector), fn ? { guid: fn.guid + this.selector + type } : null );
+		return this;
+	}
+});
+
+function liveHandler( event ){ // dispatches an event to the matching live handlers stored on `this`
+	var check = RegExp("(^|\\.)" + event.type + "(\\.|$)"),
+		stop = true,
+		elems = [];
+
+	jQuery.each(jQuery.data(this, "events").live || [], function(i, fn){ // collect handlers whose selector (fn.data) matches the target or an ancestor
+		if ( check.test(fn.type) ) {
+			var elem = jQuery(event.target).closest(fn.data)[0];
+			if ( elem )
+				elems.push({ elem: elem, fn: fn });
+		}
+	});
+
+	elems.sort(function(a,b) { // ascending by the "closest" value stored in each element's data
+		return jQuery.data(a.elem, "closest") - jQuery.data(b.elem, "closest");
+	});
+	
+	jQuery.each(elems, function(){
+		if ( this.fn.call(this.elem, event, this.fn.data) === false )
+			return (stop = false); // a handler returning false ends the loop and becomes the return value
+	});
+
+	return stop;
+}
+
+function liveConvert(type, selector){ // builds "live.<type>.<selector>" with "." and " " in the selector replaced by "`" and "|"
+	return ["live", type, selector.replace(/\./g, "`").replace(/ /g, "|")].join(".");
+}
+
+jQuery.extend({
+	isReady: false, // set to true by the first jQuery.ready() call
+	readyList: [], // functions queued by jQuery.fn.ready(); set to null after they have run
+	// Handle when the DOM is ready
+	ready: function() {
+		// Make sure that the DOM is not already loaded
+		if ( !jQuery.isReady ) {
+			// Remember that the DOM is ready
+			jQuery.isReady = true;
+
+			// If there are functions bound, to execute
+			if ( jQuery.readyList ) {
+				// Execute all of them (this = document, argument = jQuery)
+				jQuery.each( jQuery.readyList, function(){
+					this.call( document, jQuery );
+				});
+
+				// Reset the list of functions
+				jQuery.readyList = null;
+			}
+
+			// Trigger any bound ready events
+			jQuery(document).triggerHandler("ready");
+		}
+	}
+});
+
+var readyBound = false; // guards bindReady() so the listeners are attached only once
+
+function bindReady(){
+	if ( readyBound ) return;
+	readyBound = true;
+
+	// Mozilla, Opera and webkit nightlies currently support this event
+	if ( document.addEventListener ) {
+		// Use the handy event callback
+		document.addEventListener( "DOMContentLoaded", function(){
+			document.removeEventListener( "DOMContentLoaded", arguments.callee, false );
+			jQuery.ready();
+		}, false );
+
+	// If IE event model is used
+	} else if ( document.attachEvent ) {
+		// ensure firing before onload,
+		// maybe late but safe also for iframes
+		document.attachEvent("onreadystatechange", function(){
+			if ( document.readyState === "complete" ) {
+				document.detachEvent( "onreadystatechange", arguments.callee );
+				jQuery.ready();
+			}
+		});
+
+		// If IE and not an iframe
+		// continually check to see if the document is ready
+		if ( document.documentElement.doScroll && window == window.top ) (function(){
+			if ( jQuery.isReady ) return;
+
+			try {
+				// If IE is used, use the trick by Diego Perini
+				// http://javascript.nwbox.com/IEContentLoaded/
+				document.documentElement.doScroll("left");
+			} catch( error ) {
+				setTimeout( arguments.callee, 0 ); // doScroll threw: retry this check on the next timer tick
+				return;
+			}
+
+			// and execute any waiting functions
+			jQuery.ready();
+		})();
+	}
+
+	// A fallback to window.onload, that will always work
+	jQuery.event.add( window, "load", jQuery.ready );
+}
+
+jQuery.each( ("blur,focus,load,resize,scroll,unload,click,dblclick," +
+	"mousedown,mouseup,mousemove,mouseover,mouseout,mouseenter,mouseleave," +
+	"change,select,submit,keydown,keypress,keyup,error").split(","), function(i, name){
+
+	// Define jQuery.fn[name]: with a function it binds that handler, without one it triggers the event
+	jQuery.fn[name] = function(fn){
+		return fn ? this.bind(name, fn) : this.trigger(name);
+	};
+});
+
+// Prevent memory leaks in IE
+// And prevent errors on refresh with events like mouseover in other browsers
+// Window isn't included so as not to unbind existing unload events
+jQuery( window ).bind( 'unload', function(){ 
+	for ( var id in jQuery.cache )
+		// Skip the window (cache id 1), and entries that have no event handle
+		if ( id != 1 && jQuery.cache[ id ].handle )
+			jQuery.event.remove( jQuery.cache[ id ].handle.elem );
+}); 
+(function(){ // feature-detects browser behaviour once and publishes the results as jQuery.support
+
+	jQuery.support = {};
+
+	var root = document.documentElement,
+		script = document.createElement("script"),
+		div = document.createElement("div"),
+		id = "script" + (new Date).getTime();
+
+	div.style.display = "none";
+	div.innerHTML = '   <link/><table></table><a href="/a" style="color:red;float:left;opacity:.5;">a</a><select><option>text</option></select><object><param/></object>';
+
+	var all = div.getElementsByTagName("*"),
+		a = div.getElementsByTagName("a")[0];
+
+	// Can't get basic test support (jQuery.support stays an empty object)
+	if ( !all || !all.length || !a ) {
+		return;
+	}
+
+	jQuery.support = {
+		// IE strips leading whitespace when .innerHTML is used
+		leadingWhitespace: div.firstChild.nodeType == 3,
+		
+		// Make sure that tbody elements aren't automatically inserted
+		// IE will insert them into empty tables
+		tbody: !div.getElementsByTagName("tbody").length,
+		
+		// Make sure that you can get all elements in an <object> element
+		// IE 7 always returns no results
+		objectAll: !!div.getElementsByTagName("object")[0]
+			.getElementsByTagName("*").length,
+		
+		// Make sure that link elements get serialized correctly by innerHTML
+		// This requires a wrapper element in IE
+		htmlSerialize: !!div.getElementsByTagName("link").length,
+		
+		// Get the style information from getAttribute
+		// (IE uses .cssText instead)
+		style: /red/.test( a.getAttribute("style") ),
+		
+		// Make sure that URLs aren't manipulated
+		// (IE normalizes it by default)
+		hrefNormalized: a.getAttribute("href") === "/a",
+		
+		// Make sure that element opacity exists
+		// (IE uses filter instead)
+		opacity: a.style.opacity === "0.5",
+		
+		// Verify style float existence
+		// (IE uses styleFloat instead of cssFloat)
+		cssFloat: !!a.style.cssFloat,
+
+		// Will be defined later
+		scriptEval: false,
+		noCloneEvent: true,
+		boxModel: null
+	};
+	
+	script.type = "text/javascript";
+	try {
+		script.appendChild( document.createTextNode( "window." + id + "=1;" ) );
+	} catch(e){}
+
+	root.insertBefore( script, root.firstChild );
+	
+	// Make sure that the execution of code works by injecting a script
+	// tag with appendChild/createTextNode
+	// (IE doesn't support this, fails, and uses .text instead)
+	if ( window[ id ] ) {
+		jQuery.support.scriptEval = true;
+		delete window[ id ];
+	}
+
+	root.removeChild( script );
+
+	if ( div.attachEvent && div.fireEvent ) {
+		div.attachEvent("onclick", function(){
+			// Cloning a node shouldn't copy over any
+			// bound event handlers (IE does this)
+			jQuery.support.noCloneEvent = false;
+			div.detachEvent("onclick", arguments.callee);
+		});
+		div.cloneNode(true).fireEvent("onclick"); // the handler above only runs if the clone kept it
+	}
+
+	// Figure out if the W3C box model works as expected
+	// document.body must exist before we can do this
+	jQuery(function(){
+		var div = document.createElement("div");
+		div.style.width = div.style.paddingLeft = "1px";
+
+		document.body.appendChild( div );
+		jQuery.boxModel = jQuery.support.boxModel = div.offsetWidth === 2; // true when offsetWidth is width + padding (1px + 1px)
+		document.body.removeChild( div ).style.display = 'none';
+	});
+})();
+
+var styleFloat = jQuery.support.cssFloat ? "cssFloat" : "styleFloat"; // float style property name chosen by the support test
+
+jQuery.props = { // attribute / style name -> DOM property name
+	"for": "htmlFor",
+	"class": "className",
+	"float": styleFloat,
+	cssFloat: styleFloat,
+	styleFloat: styleFloat,
+	readonly: "readOnly",
+	maxlength: "maxLength",
+	cellspacing: "cellSpacing",
+	rowspan: "rowSpan",
+	tabindex: "tabIndex"
+};
+jQuery.fn.extend({
+	// Keep a copy of the old load
+	_load: jQuery.fn.load,
+
+	load: function( url, params, callback ) {
+		if ( typeof url !== "string" )
+			return this._load( url );
+
+		var off = url.indexOf(" ");
+		if ( off >= 0 ) {
+			var selector = url.slice(off, url.length);
+			url = url.slice(0, off);
+		}
+
+		// Default to a GET request
+		var type = "GET";
+
+		// If the second parameter was provided
+		if ( params )
+			// If it's a function
+			if ( jQuery.isFunction( params ) ) {
+				// We assume that it's the callback
+				callback = params;
+				params = null;
+
+			// Otherwise, build a param string
+			} else if( typeof params === "object" ) {
+				params = jQuery.param( params );
+				type = "POST";
+			}
+
+		var self = this;
+
+		// Request the remote document
+		jQuery.ajax({
+			url: url,
+			type: type,
+			dataType: "html",
+			data: params,
+			complete: function(res, status){
+				// If successful, inject the HTML into all the matched elements
+				if ( status == "success" || status == "notmodified" )
+					// See if a selector was specified
+					self.html( selector ?
+						// Create a dummy div to hold the results
+						jQuery("<div/>")
+							// inject the contents of the document in, removing the scripts
+							// to avoid any 'Permission Denied' errors in IE
+							.append(res.responseText.replace(/<script(.|\s)*?\/script>/g, ""))
+
+							// Locate the specified elements
+							.find(selector) :
+
+						// If not, just inject the full result
+						res.responseText );
+
+				if( callback )
+					self.each( callback, [res.responseText, status, res] );
+			}
+		});
+		return this;
+	},
+
+	serialize: function() {
+		return jQuery.param(this.serializeArray());
+	},
+	serializeArray: function() {
+		return this.map(function(){
+			return this.elements ? jQuery.makeArray(this.elements) : this;
+		})
+		.filter(function(){
+			return this.name && !this.disabled &&
+				(this.checked || /select|textarea/i.test(this.nodeName) ||
+					/text|hidden|password|search/i.test(this.type));
+		})
+		.map(function(i, elem){
+			var val = jQuery(this).val();
+			return val == null ? null :
+				jQuery.isArray(val) ?
+					jQuery.map( val, function(val, i){
+						return {name: elem.name, value: val};
+					}) :
+					{name: elem.name, value: val};
+		}).get();
+	}
+});
+
+// Attach a bunch of functions for handling common AJAX events: each jQuery.fn[name](f) binds f to the event of the same name
+jQuery.each( "ajaxStart,ajaxStop,ajaxComplete,ajaxError,ajaxSuccess,ajaxSend".split(","), function(i,o){
+	jQuery.fn[o] = function(f){
+		return this.bind(o, f);
+	};
+});
+
+var jsc = now(); // counter seeded with the current time; jQuery.ajax appends jsc++ to "jsonp" to name each callback
+
+jQuery.extend({
+  
+	get: function( url, data, callback, type ) { // GET shorthand for jQuery.ajax; type becomes dataType
+		// shift arguments if data argument was omitted
+		if ( jQuery.isFunction( data ) ) {
+			callback = data;
+			data = null;
+		}
+
+		return jQuery.ajax({
+			type: "GET",
+			url: url,
+			data: data,
+			success: callback,
+			dataType: type
+		});
+	},
+
+	getScript: function( url, callback ) { // jQuery.get with no data and dataType "script"
+		return jQuery.get(url, null, callback, "script");
+	},
+
+	getJSON: function( url, data, callback ) { // jQuery.get with dataType "json"
+		return jQuery.get(url, data, callback, "json");
+	},
+
+	post: function( url, data, callback, type ) { // POST shorthand for jQuery.ajax; type becomes dataType
+		if ( jQuery.isFunction( data ) ) { // data omitted: shift arguments and send an empty object
+			callback = data;
+			data = {};
+		}
+
+		return jQuery.ajax({
+			type: "POST",
+			url: url,
+			data: data,
+			success: callback,
+			dataType: type
+		});
+	},
+
+	ajaxSetup: function( settings ) { // merges settings into the shared jQuery.ajaxSettings defaults
+		jQuery.extend( jQuery.ajaxSettings, settings );
+	},
+
+	ajaxSettings: { // defaults that jQuery.ajax merges under each request's own settings
+		url: location.href,
+		global: true,
+		type: "GET",
+		contentType: "application/x-www-form-urlencoded",
+		processData: true,
+		async: true,
+		/*
+		timeout: 0,
+		data: null,
+		username: null,
+		password: null,
+		*/
+		// Create the request object; Microsoft failed to properly
+		// implement the XMLHttpRequest in IE7, so we use the ActiveXObject when it is available
+		// This function can be overridden by calling jQuery.ajaxSetup
+		xhr:function(){
+			return window.ActiveXObject ? new ActiveXObject("Microsoft.XMLHTTP") : new XMLHttpRequest();
+		},
+		accepts: { // Accept header value per dataType; jQuery.ajax falls back to _default
+			xml: "application/xml, text/xml",
+			html: "text/html",
+			script: "text/javascript, application/javascript",
+			json: "application/json, text/javascript",
+			text: "text/plain",
+			_default: "*/*"
+		}
+	},
+
+	// Last-Modified header cache for next request, keyed by URL (written by jQuery.ajax in ifModified mode)
+	lastModified: {},
+
+	ajax: function( s ) {
+		// Extend the settings, but re-extend 's' so that it can be
+		// checked again later (in the test suite, specifically)
+		s = jQuery.extend(true, s, jQuery.extend(true, {}, jQuery.ajaxSettings, s));
+
+		var jsonp, jsre = /=\?(&|$)/g, status, data,
+			type = s.type.toUpperCase();
+
+		// convert data if not already a string
+		if ( s.data && s.processData && typeof s.data !== "string" )
+			s.data = jQuery.param(s.data);
+
+		// Handle JSONP Parameter Callbacks
+		if ( s.dataType == "jsonp" ) {
+			if ( type == "GET" ) {
+				if ( !s.url.match(jsre) )
+					s.url += (s.url.match(/\?/) ? "&" : "?") + (s.jsonp || "callback") + "=?";
+			} else if ( !s.data || !s.data.match(jsre) )
+				s.data = (s.data ? s.data + "&" : "") + (s.jsonp || "callback") + "=?";
+			s.dataType = "json";
+		}
+
+		// Build temporary JSONP function
+		if ( s.dataType == "json" && (s.data && s.data.match(jsre) || s.url.match(jsre)) ) {
+			jsonp = "jsonp" + jsc++;
+
+			// Replace the =? sequence both in the query string and the data
+			if ( s.data )
+				s.data = (s.data + "").replace(jsre, "=" + jsonp + "$1");
+			s.url = s.url.replace(jsre, "=" + jsonp + "$1");
+
+			// We need to make sure
+			// that a JSONP style response is executed properly
+			s.dataType = "script";
+
+			// Handle JSONP-style loading
+			window[ jsonp ] = function(tmp){
+				data = tmp;
+				success();
+				complete();
+				// Garbage collect
+				window[ jsonp ] = undefined;
+				try{ delete window[ jsonp ]; } catch(e){}
+				if ( head )
+					head.removeChild( script );
+			};
+		}
+
+		if ( s.dataType == "script" && s.cache == null )
+			s.cache = false;
+
+		if ( s.cache === false && type == "GET" ) {
+			var ts = now();
+			// try replacing _= if it is there
+			var ret = s.url.replace(/(\?|&)_=.*?(&|$)/, "$1_=" + ts + "$2");
+			// if nothing was replaced, add timestamp to the end
+			s.url = ret + ((ret == s.url) ? (s.url.match(/\?/) ? "&" : "?") + "_=" + ts : "");
+		}
+
+		// If data is available, append data to url for get requests
+		if ( s.data && type == "GET" ) {
+			s.url += (s.url.match(/\?/) ? "&" : "?") + s.data;
+
+			// IE likes to send both get and post data, prevent this
+			s.data = null;
+		}
+
+		// Watch for a new set of requests
+		if ( s.global && ! jQuery.active++ )
+			jQuery.event.trigger( "ajaxStart" );
+
+		// Matches an absolute URL, and saves the domain
+		var parts = /^(\w+:)?\/\/([^\/?#]+)/.exec( s.url );
+
+		// If we're requesting a remote document
+		// and trying to load JSON or Script with a GET
+		if ( s.dataType == "script" && type == "GET" && parts
+			&& ( parts[1] && parts[1] != location.protocol || parts[2] != location.host )){
+
+			var head = document.getElementsByTagName("head")[0];
+			var script = document.createElement("script");
+			script.src = s.url;
+			if (s.scriptCharset)
+				script.charset = s.scriptCharset;
+
+			// Handle Script loading
+			if ( !jsonp ) {
+				var done = false;
+
+				// Attach handlers for all browsers
+				script.onload = script.onreadystatechange = function(){
+					if ( !done && (!this.readyState ||
+							this.readyState == "loaded" || this.readyState == "complete") ) {
+						done = true;
+						success();
+						complete();
+
+						// Handle memory leak in IE
+						script.onload = script.onreadystatechange = null;
+						head.removeChild( script );
+					}
+				};
+			}
+
+			head.appendChild(script);
+
+			// We handle everything using the script element injection
+			return undefined;
+		}
+
+		var requestDone = false;
+
+		// Create the request object
+		var xhr = s.xhr();
+
+		// Open the socket
+		// Passing null username, generates a login popup on Opera (#2865)
+		if( s.username )
+			xhr.open(type, s.url, s.async, s.username, s.password);
+		else
+			xhr.open(type, s.url, s.async);
+
+		// Need an extra try/catch for cross domain requests in Firefox 3
+		try {
+			// Set the correct header, if data is being sent
+			if ( s.data )
+				xhr.setRequestHeader("Content-Type", s.contentType);
+
+			// Set the If-Modified-Since header, if ifModified mode.
+			if ( s.ifModified )
+				xhr.setRequestHeader("If-Modified-Since",
+					jQuery.lastModified[s.url] || "Thu, 01 Jan 1970 00:00:00 GMT" );
+
+			// Set header so the called script knows that it's an XMLHttpRequest
+			xhr.setRequestHeader("X-Requested-With", "XMLHttpRequest");
+
+			// Set the Accepts header for the server, depending on the dataType
+			xhr.setRequestHeader("Accept", s.dataType && s.accepts[ s.dataType ] ?
+				s.accepts[ s.dataType ] + ", */*" :
+				s.accepts._default );
+		} catch(e){}
+
+		// Allow custom headers/mimetypes and early abort
+		if ( s.beforeSend && s.beforeSend(xhr, s) === false ) {
+			// Handle the global AJAX counter
+			if ( s.global && ! --jQuery.active )
+				jQuery.event.trigger( "ajaxStop" );
+			// close opended socket
+			xhr.abort();
+			return false;
+		}
+
+		if ( s.global )
+			jQuery.event.trigger("ajaxSend", [xhr, s]);
+
+		// Wait for a response to come back
+		var onreadystatechange = function(isTimeout){
+			// The request was aborted, clear the interval and decrement jQuery.active
+			if (xhr.readyState == 0) {
+				if (ival) {
+					// clear poll interval
+					clearInterval(ival);
+					ival = null;
+					// Handle the global AJAX counter
+					if ( s.global && ! --jQuery.active )
+						jQuery.event.trigger( "ajaxStop" );
+				}
+			// The transfer is complete and the data is available, or the request timed out
+			} else if ( !requestDone && xhr && (xhr.readyState == 4 || isTimeout == "timeout") ) {
+				requestDone = true;
+
+				// clear poll interval
+				if (ival) {
+					clearInterval(ival);
+					ival = null;
+				}
+
+				status = isTimeout == "timeout" ? "timeout" :
+					!jQuery.httpSuccess( xhr ) ? "error" :
+					s.ifModified && jQuery.httpNotModified( xhr, s.url ) ? "notmodified" :
+					"success";
+
+				if ( status == "success" ) {
+					// Watch for, and catch, XML document parse errors
+					try {
+						// process the data (runs the xml through httpData regardless of callback)
+						data = jQuery.httpData( xhr, s.dataType, s );
+					} catch(e) {
+						status = "parsererror";
+					}
+				}
+
+				// Make sure that the request was successful or notmodified
+				if ( status == "success" ) {
+					// Cache Last-Modified header, if ifModified mode.
+					var modRes;
+					try {
+						modRes = xhr.getResponseHeader("Last-Modified");
+					} catch(e) {} // swallow exception thrown by FF if header is not available
+
+					if ( s.ifModified && modRes )
+						jQuery.lastModified[s.url] = modRes;
+
+					// JSONP handles its own success callback
+					if ( !jsonp )
+						success();
+				} else
+					jQuery.handleError(s, xhr, status);
+
+				// Fire the complete handlers
+				complete();
+
+				if ( isTimeout )
+					xhr.abort();
+
+				// Stop memory leaks
+				if ( s.async )
+					xhr = null;
+			}
+		};
+
+		if ( s.async ) {
+			// don't attach the handler to the request, just poll it instead
+			var ival = setInterval(onreadystatechange, 13);
+
+			// Timeout checker
+			if ( s.timeout > 0 )
+				setTimeout(function(){
+					// Check to see if the request is still happening
+					if ( xhr && !requestDone )
+						onreadystatechange( "timeout" );
+				}, s.timeout);
+		}
+
+		// Send the data
+		try {
+			xhr.send(s.data);
+		} catch(e) {
+			jQuery.handleError(s, xhr, null, e);
+		}
+
+		// firefox 1.5 doesn't fire statechange for sync requests
+		if ( !s.async )
+			onreadystatechange();
+
+		function success(){
+			// If a local callback was specified, fire it and pass it the data
+			if ( s.success )
+				s.success( data, status );
+
+			// Fire the global callback
+			if ( s.global )
+				jQuery.event.trigger( "ajaxSuccess", [xhr, s] );
+		}
+
+		function complete(){
+			// Process result
+			if ( s.complete )
+				s.complete(xhr, status);
+
+			// The request was completed
+			if ( s.global )
+				jQuery.event.trigger( "ajaxComplete", [xhr, s] );
+
+			// Handle the global AJAX counter
+			if ( s.global && ! --jQuery.active )
+				jQuery.event.trigger( "ajaxStop" );
+		}
+
+		// return XMLHttpRequest to allow aborting the request etc.
+		return xhr;
+	},
+
+	handleError: function( s, xhr, status, e ) {
+		// If a local callback was specified, fire it
+		if ( s.error ) s.error( xhr, status, e );
+
+		// Fire the global callback
+		if ( s.global )
+			jQuery.event.trigger( "ajaxError", [xhr, s, e] );
+	},
+
+	// Counter for holding the number of active queries
+	active: 0,
+
+	// Determines if an XMLHttpRequest was successful or not
+	httpSuccess: function( xhr ) {
+		try {
+			// IE error sometimes returns 1223 when it should be 204 so treat it as success, see #1450
+			return !xhr.status && location.protocol == "file:" ||
+				( xhr.status >= 200 && xhr.status < 300 ) || xhr.status == 304 || xhr.status == 1223;
+		} catch(e){}
+		return false;
+	},
+
+	// Determines if an XMLHttpRequest returns NotModified
+	httpNotModified: function( xhr, url ) {
+		try {
+			var xhrRes = xhr.getResponseHeader("Last-Modified");
+
+			// Firefox always returns 200. check Last-Modified date
+			return xhr.status == 304 || xhrRes == jQuery.lastModified[url];
+		} catch(e){}
+		return false;
+	},
+
+	httpData: function( xhr, type, s ) { // xhr: finished request; type: expected dataType ("xml", "script", "json" or falsy); s: optional settings that may carry dataFilter; returns the decoded response
+		var ct = xhr.getResponseHeader("content-type"),
+			xml = type == "xml" || !type && ct && ct.indexOf("xml") >= 0, // XML when asked for explicitly, or when no type was given and the content-type mentions "xml"
+			data = xml ? xhr.responseXML : xhr.responseText;
+
+		if ( xml && data.documentElement.tagName == "parsererror" ) // a <parsererror> root element is reported by throwing the string "parsererror"
+			throw "parsererror";
+			
+		// Allow a pre-filtering function to sanitize the response
+		// s != null is checked to keep backwards compatibility
+		if( s && s.dataFilter )
+			data = s.dataFilter( data, type );
+
+		// The filter can actually parse the response, so the steps below only run while data is still a string
+		if( typeof data === "string" ){
+
+			// If the type is "script", eval it in global context
+			if ( type == "script" )
+				jQuery.globalEval( data );
+
+			// Get the JavaScript object, if JSON is used. NOTE(review): the body is run through eval, so "json" responses must come from a trusted source
+			if ( type == "json" )
+				data = window["eval"]("(" + data + ")");
+		}
+		
+		return data;
+	},
+
+	// Serialize an array of form elements or a set of
+	// key/values into a query string
+	param: function( a ) { // a: array or jQuery set of objects exposing .name/.value, or a plain key/value object; returns "k=v&k2=v2"
+		var s = [ ];
+
+		function add( key, value ){ // appends one URI-encoded "key=value" pair to s
+			s[ s.length ] = encodeURIComponent(key) + '=' + encodeURIComponent(value);
+		};
+
+		// If an array was passed in, assume that it is an array
+		// of form elements
+		if ( jQuery.isArray(a) || a.jquery )
+			// Serialize the form elements
+			jQuery.each( a, function(){
+				add( this.name, this.value );
+			});
+
+		// Otherwise, assume that it's an object of key/value pairs
+		else
+			// Serialize the key/values
+			for ( var j in a )
+				// If the value is an array then the key names need to be repeated
+				if ( jQuery.isArray(a[j]) )
+					jQuery.each( a[j], function(){
+						add( j, this ); // `this` is the current array item
+					});
+				else
+					add( j, jQuery.isFunction(a[j]) ? a[j]() : a[j] ); // function values are called and their result is serialized
+
+		// Join the pairs with "&" and turn every encoded space (%20) into "+"
+		return s.join("&").replace(/%20/g, "+");
+	}
+
+});
+var elemdisplay = {},
+	timerId,
+	fxAttrs = [
+		// height animations
+		[ "height", "marginTop", "marginBottom", "paddingTop", "paddingBottom" ],
+		// width animations
+		[ "width", "marginLeft", "marginRight", "paddingLeft", "paddingRight" ],
+		// opacity animations
+		[ "opacity" ]
+	];
+
+function genFx( type, num ){
+	var obj = {};
+	jQuery.each( fxAttrs.concat.apply([], fxAttrs.slice(0,num)), function(){
+		obj[ this ] = type;
+	});
+	return obj;
+}
+
+jQuery.fn.extend({
+	show: function(speed,callback){
+		if ( speed ) {
+			return this.animate( genFx("show", 3), speed, callback);
+		} else {
+			for ( var i = 0, l = this.length; i < l; i++ ){
+				var old = jQuery.data(this[i], "olddisplay");
+				
+				this[i].style.display = old || "";
+				
+				if ( jQuery.css(this[i], "display") === "none" ) {
+					var tagName = this[i].tagName, display;
+					
+					if ( elemdisplay[ tagName ] ) {
+						display = elemdisplay[ tagName ];
+					} else {
+						var elem = jQuery("<" + tagName + " />").appendTo("body");
+						
+						display = elem.css("display");
+						if ( display === "none" )
+							display = "block";
+						
+						elem.remove();
+						
+						elemdisplay[ tagName ] = display;
+					}
+					
+					jQuery.data(this[i], "olddisplay", display);
+				}
+			}
+
+			// Set the display of the elements in a second loop
+			// to avoid the constant reflow
+			for ( var i = 0, l = this.length; i < l; i++ ){
+				this[i].style.display = jQuery.data(this[i], "olddisplay") || "";
+			}
+			
+			return this;
+		}
+	},
+
+	hide: function(speed,callback){
+		if ( speed ) {
+			return this.animate( genFx("hide", 3), speed, callback);
+		} else {
+			for ( var i = 0, l = this.length; i < l; i++ ){
+				var old = jQuery.data(this[i], "olddisplay");
+				if ( !old && old !== "none" )
+					jQuery.data(this[i], "olddisplay", jQuery.css(this[i], "display"));
+			}
+
+			// Set the display of the elements in a second loop
+			// to avoid the constant reflow
+			for ( var i = 0, l = this.length; i < l; i++ ){
+				this[i].style.display = "none";
+			}
+
+			return this;
+		}
+	},
+
+	// Save the old toggle function
+	_toggle: jQuery.fn.toggle,
+
+	toggle: function( fn, fn2 ){ // three call shapes: (fn, fn2) handler functions, no argument or a boolean, or anything else treated as (speed, callback)
+		var bool = typeof fn === "boolean";
+
+		return jQuery.isFunction(fn) && jQuery.isFunction(fn2) ?
+			this._toggle.apply( this, arguments ) : // two functions: defer to the toggle that was saved as _toggle
+			fn == null || bool ? // nothing or a boolean: show/hide every element without animation
+				this.each(function(){
+					var state = bool ? fn : jQuery(this).is(":hidden"); // an explicit boolean wins; otherwise show what is hidden and hide the rest
+					jQuery(this)[ state ? "show" : "hide" ]();
+				}) :
+				this.animate(genFx("toggle", 3), fn, fn2); // remaining case: forwarded to animate() with a "toggle" value for every fxAttrs property
+	},
+
+	fadeTo: function(speed,to,callback){
+		return this.animate({opacity: to}, speed, callback);
+	},
+
+	animate: function( prop, speed, easing, callback ) {
+		var optall = jQuery.speed(speed, easing, callback);
+
+		return this[ optall.queue === false ? "each" : "queue" ](function(){
+		
+			var opt = jQuery.extend({}, optall), p,
+				hidden = this.nodeType == 1 && jQuery(this).is(":hidden"),
+				self = this;
+	
+			for ( p in prop ) {
+				if ( prop[p] == "hide" && hidden || prop[p] == "show" && !hidden )
+					return opt.complete.call(this);
+
+				if ( ( p == "height" || p == "width" ) && this.style ) {
+					// Store display property
+					opt.display = jQuery.css(this, "display");
+
+					// Make sure that nothing sneaks out
+					opt.overflow = this.style.overflow;
+				}
+			}
+
+			if ( opt.overflow != null )
+				this.style.overflow = "hidden";
+
+			opt.curAnim = jQuery.extend({}, prop);
+
+			jQuery.each( prop, function(name, val){
+				var e = new jQuery.fx( self, opt, name );
+
+				if ( /toggle|show|hide/.test(val) )
+					e[ val == "toggle" ? hidden ? "show" : "hide" : val ]( prop );
+				else {
+					var parts = val.toString().match(/^([+-]=)?([\d+-.]+)(.*)$/),
+						start = e.cur(true) || 0;
+
+					if ( parts ) {
+						var end = parseFloat(parts[2]),
+							unit = parts[3] || "px";
+
+						// We need to compute starting value
+						if ( unit != "px" ) {
+							self.style[ name ] = (end || 1) + unit;
+							start = ((end || 1) / e.cur(true)) * start;
+							self.style[ name ] = start + unit;
+						}
+
+						// If a +=/-= token was provided, we're doing a relative animation
+						if ( parts[1] )
+							end = ((parts[1] == "-=" ? -1 : 1) * end) + start;
+
+						e.custom( start, end, unit );
+					} else
+						e.custom( start, val, "" );
+				}
+			});
+
+			// For JS strict compliance
+			return true;
+		});
+	},
+
+	stop: function(clearQueue, gotoEnd){ // clearQueue: also empty each element's queue; gotoEnd: run the final step of running animations before dropping them; returns this
+		var timers = jQuery.timers;
+
+		if (clearQueue)
+			this.queue([]); // replace the queue with an empty one
+
+		this.each(function(){
+			// go in reverse order so anything added to the queue during the loop is ignored
+			for ( var i = timers.length - 1; i >= 0; i-- )
+				if ( timers[i].elem == this ) { // only timers that belong to this element
+					if (gotoEnd)
+						// force the next step to be the last
+						timers[i](true);
+					timers.splice(i, 1); // drop the timer from the shared jQuery.timers list
+				}
+		});
+
+		// start the next in the queue if the last step wasn't forced
+		if (!gotoEnd)
+			this.dequeue();
+
+		return this;
+	}
+
+});
+
+// Generate shortcuts for custom animations
+jQuery.each({
+	slideDown: genFx("show", 1),
+	slideUp: genFx("hide", 1),
+	slideToggle: genFx("toggle", 1),
+	fadeIn: { opacity: "show" },
+	fadeOut: { opacity: "hide" }
+}, function( name, props ){
+	jQuery.fn[ name ] = function( speed, callback ){
+		return this.animate( props, speed, callback );
+	};
+});
+
+jQuery.extend({
+
+	speed: function(speed, easing, fn) { // normalizes animate()'s (speed, easing, callback) arguments into one options object
+		var opt = typeof speed === "object" ? speed : { // an object passed as speed is used (and modified below) as the options object itself
+			complete: fn || !fn && easing || // callback: fn, else whatever was passed as easing, else speed when speed is a function
+				jQuery.isFunction( speed ) && speed,
+			duration: speed,
+			easing: fn && easing || easing && !jQuery.isFunction(easing) && easing // easing only counts when fn is given or easing is not a function
+		};
+
+		opt.duration = jQuery.fx.off ? 0 : typeof opt.duration === "number" ? opt.duration : // fx.off forces 0; numbers pass through; other values are looked up in fx.speeds
+			jQuery.fx.speeds[opt.duration] || jQuery.fx.speeds._default;
+
+		// Queueing: wrap the caller's callback so completion also advances the element's queue
+		opt.old = opt.complete;
+		opt.complete = function(){
+			if ( opt.queue !== false ) // skipped only when the options explicitly set queue to false
+				jQuery(this).dequeue();
+			if ( jQuery.isFunction( opt.old ) )
+				opt.old.call( this );
+		};
+
+		return opt;
+	},
+
+	easing: {
+		linear: function( p, n, firstNum, diff ) {
+			return firstNum + diff * p;
+		},
+		swing: function( p, n, firstNum, diff ) {
+			return ((-Math.cos(p*Math.PI)/2) + 0.5) * diff + firstNum;
+		}
+	},
+
+	timers: [],
+
+	fx: function( elem, options, prop ){
+		this.options = options;
+		this.elem = elem;
+		this.prop = prop;
+
+		if ( !options.orig )
+			options.orig = {};
+	}
+
+});
+
+jQuery.fx.prototype = {
+
+	// Simple function for setting a style value
+	update: function(){
+		if ( this.options.step )
+			this.options.step.call( this.elem, this.now, this );
+
+		(jQuery.fx.step[this.prop] || jQuery.fx.step._default)( this );
+
+		// Set display property to block for height/width animations
+		if ( ( this.prop == "height" || this.prop == "width" ) && this.elem.style )
+			this.elem.style.display = "block";
+	},
+
+	// Get the current value of the animated property as a number
+	cur: function(force){
+		if ( this.elem[this.prop] != null && (!this.elem.style || this.elem.style[this.prop] == null) ) // the property exists on the object itself and not in its style: return it as is
+			return this.elem[ this.prop ];
+
+		var r = parseFloat(jQuery.css(this.elem, this.prop, force));
+		return r && r > -10000 ? r : parseFloat(jQuery.curCSS(this.elem, this.prop)) || 0; // fall back to curCSS when css() gives 0/NaN or a value of -10000 or less; default to 0
+	},
+
+	// Start an animation from one number to another
+	custom: function(from, to, unit){
+		this.startTime = now();
+		this.start = from;
+		this.end = to;
+		this.unit = unit || this.unit || "px";
+		this.now = this.start;
+		this.pos = this.state = 0;
+
+		var self = this;
+		function t(gotoEnd){
+			return self.step(gotoEnd);
+		}
+
+		t.elem = this.elem;
+
+		if ( t() && jQuery.timers.push(t) && !timerId ) {
+			timerId = setInterval(function(){
+				var timers = jQuery.timers;
+
+				for ( var i = 0; i < timers.length; i++ )
+					if ( !timers[i]() )
+						timers.splice(i--, 1);
+
+				if ( !timers.length ) {
+					clearInterval( timerId );
+					timerId = undefined;
+				}
+			}, 13);
+		}
+	},
+
+	// Simple 'show' function
+	show: function(){
+		// Remember where we started, so that we can go back to it later
+		this.options.orig[this.prop] = jQuery.attr( this.elem.style, this.prop );
+		this.options.show = true;
+
+		// Begin the animation
+		// Make sure that we start at a small width/height to avoid any
+		// flash of content
+		this.custom(this.prop == "width" || this.prop == "height" ? 1 : 0, this.cur());
+
+		// Start by showing the element
+		jQuery(this.elem).show();
+	},
+
+	// Simple 'hide' function
+	hide: function(){
+		// Remember where we started, so that we can go back to it later
+		this.options.orig[this.prop] = jQuery.attr( this.elem.style, this.prop );
+		this.options.hide = true;
+
+		// Begin the animation
+		this.custom(this.cur(), 0);
+	},
+
+	// Each step of an animation
+	step: function(gotoEnd){
+		var t = now();
+
+		if ( gotoEnd || t >= this.options.duration + this.startTime ) {
+			this.now = this.end;
+			this.pos = this.state = 1;
+			this.update();
+
+			this.options.curAnim[ this.prop ] = true;
+
+			var done = true;
+			for ( var i in this.options.curAnim )
+				if ( this.options.curAnim[i] !== true )
+					done = false;
+
+			if ( done ) {
+				if ( this.options.display != null ) {
+					// Reset the overflow
+					this.elem.style.overflow = this.options.overflow;
+
+					// Reset the display
+					this.elem.style.display = this.options.display;
+					if ( jQuery.css(this.elem, "display") == "none" )
+						this.elem.style.display = "block";
+				}
+
+				// Hide the element if the "hide" operation was done
+				if ( this.options.hide )
+					jQuery(this.elem).hide();
+
+				// Reset the properties, if the item has been hidden or shown
+				if ( this.options.hide || this.options.show )
+					for ( var p in this.options.curAnim )
+						jQuery.attr(this.elem.style, p, this.options.orig[p]);
+					
+				// Execute the complete function
+				this.options.complete.call( this.elem );
+			}
+
+			return false;
+		} else {
+			var n = t - this.startTime;
+			this.state = n / this.options.duration;
+
+			// Perform the easing function, defaults to swing
+			this.pos = jQuery.easing[this.options.easing || (jQuery.easing.swing ? "swing" : "linear")](this.state, n, 0, 1, this.options.duration);
+			this.now = this.start + ((this.end - this.start) * this.pos);
+
+			// Perform the next step of the animation
+			this.update();
+		}
+
+		return true;
+	}
+
+};
+
+jQuery.extend( jQuery.fx, {
+	speeds:{
+		slow: 600,
+ 		fast: 200,
+ 		// Default speed
+ 		_default: 400
+	},
+	step: {
+
+		opacity: function(fx){
+			jQuery.attr(fx.elem.style, "opacity", fx.now);
+		},
+
+		_default: function(fx){
+			if ( fx.elem.style && fx.elem.style[ fx.prop ] != null )
+				fx.elem.style[ fx.prop ] = fx.now + fx.unit;
+			else
+				fx.elem[ fx.prop ] = fx.now;
+		}
+	}
+});
+if ( document.documentElement["getBoundingClientRect"] )
+	jQuery.fn.offset = function() {
+		if ( !this[0] ) return { top: 0, left: 0 };
+		if ( this[0] === this[0].ownerDocument.body ) return jQuery.offset.bodyOffset( this[0] );
+		var box  = this[0].getBoundingClientRect(), doc = this[0].ownerDocument, body = doc.body, docElem = doc.documentElement,
+			clientTop = docElem.clientTop || body.clientTop || 0, clientLeft = docElem.clientLeft || body.clientLeft || 0,
+			top  = box.top  + (self.pageYOffset || jQuery.boxModel && docElem.scrollTop  || body.scrollTop ) - clientTop,
+			left = box.left + (self.pageXOffset || jQuery.boxModel && docElem.scrollLeft || body.scrollLeft) - clientLeft;
+		return { top: top, left: left };
+	};
+else 
+	jQuery.fn.offset = function() {
+		if ( !this[0] ) return { top: 0, left: 0 };
+		if ( this[0] === this[0].ownerDocument.body ) return jQuery.offset.bodyOffset( this[0] );
+		jQuery.offset.initialized || jQuery.offset.initialize();
+
+		var elem = this[0], offsetParent = elem.offsetParent, prevOffsetParent = elem,
+			doc = elem.ownerDocument, computedStyle, docElem = doc.documentElement,
+			body = doc.body, defaultView = doc.defaultView,
+			prevComputedStyle = defaultView.getComputedStyle(elem, null),
+			top = elem.offsetTop, left = elem.offsetLeft;
+
+		while ( (elem = elem.parentNode) && elem !== body && elem !== docElem ) {
+			computedStyle = defaultView.getComputedStyle(elem, null);
+			top -= elem.scrollTop, left -= elem.scrollLeft;
+			if ( elem === offsetParent ) {
+				top += elem.offsetTop, left += elem.offsetLeft;
+				if ( jQuery.offset.doesNotAddBorder && !(jQuery.offset.doesAddBorderForTableAndCells && /^t(able|d|h)$/i.test(elem.tagName)) )
+					top  += parseInt( computedStyle.borderTopWidth,  10) || 0,
+					left += parseInt( computedStyle.borderLeftWidth, 10) || 0;
+				prevOffsetParent = offsetParent, offsetParent = elem.offsetParent;
+			}
+			if ( jQuery.offset.subtractsBorderForOverflowNotVisible && computedStyle.overflow !== "visible" )
+				top  += parseInt( computedStyle.borderTopWidth,  10) || 0,
+				left += parseInt( computedStyle.borderLeftWidth, 10) || 0;
+			prevComputedStyle = computedStyle;
+		}
+
+		if ( prevComputedStyle.position === "relative" || prevComputedStyle.position === "static" )
+			top  += body.offsetTop,
+			left += body.offsetLeft;
+
+		if ( prevComputedStyle.position === "fixed" )
+			top  += Math.max(docElem.scrollTop, body.scrollTop),
+			left += Math.max(docElem.scrollLeft, body.scrollLeft);
+
+		return { top: top, left: left };
+	};
+
+jQuery.offset = {
+	initialize: function() {
+		if ( this.initialized ) return;
+		var body = document.body, container = document.createElement('div'), innerDiv, checkDiv, table, td, rules, prop, bodyMarginTop = body.style.marginTop,
+			html = '<div style="position:absolute;top:0;left:0;margin:0;border:5px solid #000;padding:0;width:1px;height:1px;"><div></div></div><table style="position:absolute;top:0;left:0;margin:0;border:5px solid #000;padding:0;width:1px;height:1px;" cellpadding="0" cellspacing="0"><tr><td></td></tr></table>';
+
+		rules = { position: 'absolute', top: 0, left: 0, margin: 0, border: 0, width: '1px', height: '1px', visibility: 'hidden' };
+		for ( prop in rules ) container.style[prop] = rules[prop];
+
+		container.innerHTML = html;
+		body.insertBefore(container, body.firstChild);
+		innerDiv = container.firstChild, checkDiv = innerDiv.firstChild, td = innerDiv.nextSibling.firstChild.firstChild;
+
+		this.doesNotAddBorder = (checkDiv.offsetTop !== 5);
+		this.doesAddBorderForTableAndCells = (td.offsetTop === 5);
+
+		innerDiv.style.overflow = 'hidden', innerDiv.style.position = 'relative';
+		this.subtractsBorderForOverflowNotVisible = (checkDiv.offsetTop === -5);
+
+		body.style.marginTop = '1px';
+		this.doesNotIncludeMarginInBodyOffset = (body.offsetTop === 0);
+		body.style.marginTop = bodyMarginTop;
+
+		body.removeChild(container);
+		this.initialized = true;
+	},
+
+	bodyOffset: function(body) {
+		jQuery.offset.initialized || jQuery.offset.initialize();
+		var top = body.offsetTop, left = body.offsetLeft;
+		if ( jQuery.offset.doesNotIncludeMarginInBodyOffset )
+			top  += parseInt( jQuery.curCSS(body, 'marginTop',  true), 10 ) || 0,
+			left += parseInt( jQuery.curCSS(body, 'marginLeft', true), 10 ) || 0;
+		return { top: top, left: left };
+	}
+};
+
+
+jQuery.fn.extend({
+	position: function() {
+		var left = 0, top = 0, results;
+
+		if ( this[0] ) {
+			// Get *real* offsetParent
+			var offsetParent = this.offsetParent(),
+
+			// Get correct offsets
+			offset       = this.offset(),
+			parentOffset = /^body|html$/i.test(offsetParent[0].tagName) ? { top: 0, left: 0 } : offsetParent.offset();
+
+			// Subtract element margins
+			// note: when an element has margin: auto the offsetLeft and marginLeft 
+			// are the same in Safari causing offset.left to incorrectly be 0
+			offset.top  -= num( this, 'marginTop'  );
+			offset.left -= num( this, 'marginLeft' );
+
+			// Add offsetParent borders
+			parentOffset.top  += num( offsetParent, 'borderTopWidth'  );
+			parentOffset.left += num( offsetParent, 'borderLeftWidth' );
+
+			// Subtract the two offsets
+			results = {
+				top:  offset.top  - parentOffset.top,
+				left: offset.left - parentOffset.left
+			};
+		}
+
+		return results;
+	},
+
+	offsetParent: function() {
+		var offsetParent = this[0].offsetParent || document.body;
+		while ( offsetParent && (!/^body|html$/i.test(offsetParent.tagName) && jQuery.css(offsetParent, 'position') == 'static') )
+			offsetParent = offsetParent.offsetParent;
+		return jQuery(offsetParent);
+	}
+});
+
+
+// Create scrollLeft and scrollTop methods
+jQuery.each( ['Left', 'Top'], function(i, name) {
+	var method = 'scroll' + name;
+	
+	jQuery.fn[ method ] = function(val) {
+		if (!this[0]) return null;
+
+		return val !== undefined ?
+
+			// Set the scroll offset
+			this.each(function() {
+				this == window || this == document ?
+					window.scrollTo(
+						!i ? val : jQuery(window).scrollLeft(),
+						 i ? val : jQuery(window).scrollTop()
+					) :
+					this[ method ] = val;
+			}) :
+
+			// Return the scroll offset
+			this[0] == window || this[0] == document ?
+				self[ i ? 'pageYOffset' : 'pageXOffset' ] ||
+					jQuery.boxModel && document.documentElement[ method ] ||
+					document.body[ method ] :
+				this[0][ method ];
+	};
+});
+// Create innerHeight, innerWidth, outerHeight and outerWidth methods
+jQuery.each([ "Height", "Width" ], function(i, name){
+
+	var tl = i ? "Left"  : "Top",  // top or left
+		br = i ? "Right" : "Bottom", // bottom or right
+		lower = name.toLowerCase();
+
+	// innerHeight and innerWidth
+	jQuery.fn["inner" + name] = function(){
+		return this[0] ?
+			jQuery.css( this[0], lower, false, "padding" ) :
+			null;
+	};
+
+	// outerHeight and outerWidth
+	jQuery.fn["outer" + name] = function(margin) {
+		return this[0] ?
+			jQuery.css( this[0], lower, false, margin ? "margin" : "border" ) :
+			null;
+	};
+	
+	var type = name.toLowerCase();
+
+	jQuery.fn[ type ] = function( size ) {
+		// Get window width or height
+		return this[0] == window ?
+			// Everyone else use document.documentElement or document.body depending on Quirks vs Standards mode
+			document.compatMode == "CSS1Compat" && document.documentElement[ "client" + name ] ||
+			document.body[ "client" + name ] :
+
+			// Get document width or height
+			this[0] == document ?
+				// Either scroll[Width/Height] or offset[Width/Height], whichever is greater
+				Math.max(
+					document.documentElement["client" + name],
+					document.body["scroll" + name], document.documentElement["scroll" + name],
+					document.body["offset" + name], document.documentElement["offset" + name]
+				) :
+
+				// Get or set width or height on the element
+				size === undefined ?
+					// Get width or height on the element
+					(this.length ? jQuery.css( this[0], type ) : null) :
+
+					// Set the width or height on the element (default to pixels if value is unitless)
+					this.css( type, typeof size === "string" ? size : size + "px" );
+	};
+
+});
+})();
diff --git a/main.py b/main.py
new file mode 100644
index 00000000..1ca7dcb2
--- /dev/null
+++ b/main.py
@@ -0,0 +1,309 @@
+#!/usr/bin/env python
+#
+# Copyright 2007 Google Inc.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+
+import os
+import sys
+import logging
+import traceback
+import StringIO
+
+from google.appengine.runtime import DeadlineExceededError
+
+from google.appengine.ext.webapp import template
+from google.appengine.api import users
+from google.appengine.ext import webapp
+from google.appengine.ext.webapp import util
+
+from fanficdownloader.downloader import *
+from fanficdownloader.ffnet import *
+from fanficdownloader.output import *
+from fanficdownloader import twilighted
+
+from google.appengine.ext import db
+
+from fanficdownloader.zipdir import *
+
+from ffstorage import *
+
+
+
+class LoginRequired(webapp.RequestHandler):
+	def get(self):
+		user = users.get_current_user()
+		if user:
+			self.redirect('/')
+		else:
+			logging.debug(users.create_login_url('/'))
+			url = users.create_login_url(self.request.uri)
+			template_values = {'login_url' : url}
+			path = os.path.join(os.path.dirname(__file__), 'index-nonlogin.html')
+			self.response.out.write(template.render(path, template_values))
+
+class MainHandler(webapp.RequestHandler):
+	def get(self):
+		user = users.get_current_user()
+		if user:
+			error = self.request.get('error')
+			template_values = {'nickname' : user.nickname(), 'authorized': True}
+			url = self.request.get('url')
+			template_values['url'] = url
+			
+			if error != None and len(error) > 1:
+				if error == 'login_required':
+					template_values['error_message'] = 'This story (or one of the chapters) requires you to be logged in.'
+				elif error == 'bad_url':
+					template_values['error_message'] = 'Unsupported URL: ' + url
+				elif error == 'custom':
+					template_values['error_message'] = 'Error happened: ' + self.request.get('errtext')
+			
+			filename = self.request.get('file')
+			if len(filename) > 1:
+				template_values['yourfile'] = '''<div id='yourfile'><a href='/file?id=%s'>"%s" by %s</a></div>''' % (filename, self.request.get('name'), self.request.get('author'))
+			
+			self.response.headers['Content-Type'] = 'text/html'
+			path = os.path.join(os.path.dirname(__file__), 'index.html')
+
+			self.response.out.write(template.render(path, template_values))
+		else:
+#			self.redirect(users.create_login_url(self.request.uri))
+#			self.redirect('/login')
+			logging.debug(users.create_login_url('/'))
+			url = users.create_login_url(self.request.uri)
+			template_values = {'login_url' : url, 'authorized': False}
+			path = os.path.join(os.path.dirname(__file__), 'index.html')
+			self.response.out.write(template.render(path, template_values))
+
+
+class FileServer(webapp.RequestHandler):
+	def get(self):
+#		user  = users.get_current_user()
+		fileId = self.request.get('id')
+		
+		if fileId == None or len(fileId) < 3:
+			self.redirect('/')
+		
+		key = db.Key(fileId)
+		fanfic = db.get(key)
+		
+		name = fanfic.name.encode('utf-8')
+		
+		name = makeAcceptableFilename(name)
+		
+		logging.info("Serving file: %s" % name)
+
+		if fanfic.format == 'epub':
+			self.response.headers['Content-Type'] = 'application/epub+zip'
+			self.response.headers['Content-disposition'] = 'attachment; filename=' + name + '.epub'
+		elif fanfic.format == 'html':
+			self.response.headers['Content-Type'] = 'text/html'
+			self.response.headers['Content-disposition'] = 'attachment; filename=' + name + '.html.zip'
+		elif fanfic.format == 'text':
+			self.response.headers['Content-Type'] = 'text/plain'
+			self.response.headers['Content-disposition'] = 'attachment; filename=' +name + '.txt.zip'
+		
+		self.response.out.write(fanfic.blob)
+
+class RecentFilesServer(webapp.RequestHandler):
+	def get(self):
+		user = users.get_current_user()
+		if not user:
+			self.redirect('/login')
+		
+#		fics = db.GqlQuery("Select * From DownloadedFanfic WHERE user = :1 and cleared = :2", user)
+		q = DownloadedFanfic.all()
+		q.filter('user =', user)
+		q.filter('cleared =', False)
+		fics = q.fetch(100)
+		
+		template_values = dict(fics = fics, nickname = user.nickname())
+		path = os.path.join(os.path.dirname(__file__), 'recent.html')
+		self.response.out.write(template.render(path, template_values))
+		
+class RecentAllFilesServer(webapp.RequestHandler):
+	def get(self):
+		user = users.get_current_user()
+		if user.nickname() != 'sigizmund':
+			return
+			
+		fics = db.GqlQuery("Select * From DownloadedFanfic")
+		template_values = dict(fics = fics, nickname = user.nickname())
+		path = os.path.join(os.path.dirname(__file__), 'recent.html')
+		self.response.out.write(template.render(path, template_values))	
+
+class FanfictionDownloader(webapp.RequestHandler):
+	def _printableVersion(self, text):
+		text = removeEntities(text)
+		try:
+			d = text.decode('utf-8')
+		except:
+			d = text
+		return d
+	
+
+	def post(self):
+		logging.getLogger().setLevel(logging.DEBUG)
+		
+		user = users.get_current_user()
+		if not user:
+			self.redirect(users.create_login_url('/'))
+		
+		format = self.request.get('format')
+		url = self.request.get('url')
+		login = self.request.get('login')
+		password = self.request.get('password')
+		
+		logging.info("Downloading: " + url)
+		
+		adapter = None
+		writerClass = None
+
+		download = OneDownload()
+		download.user = user
+		download.url = url
+		download.login = login
+		download.password = password
+		download.format = format
+		logging.info('Creating adapter...')
+		
+		try:
+			if url.find('fictionalley') != -1:
+				adapter = fictionalley.FictionAlley(url)
+			elif url.find('ficwad') != -1:
+				adapter = ficwad.FicWad(url)
+			elif url.find('fanfiction.net') != -1 or url.find('fictionpress.com') != -1:
+				adapter = ffnet.FFNet(url)
+			elif url.find('harrypotterfanfiction.com') != -1:
+				adapter = hpfiction.HPFiction(url)
+			elif url.find('twilighted') != -1 or url.find('potionsandsnitches.net') != -1:
+				adapter = twilighted.Twilighted(url)
+			else:
+				logging.debug("Bad URL detected")
+				self.redirect('/?error=bad_url&url=' + urlEscape(url) )
+				return
+		except Exception, e:
+			logging.exception(e)
+			download.failure = "Adapter was not created: " + str(e)
+			download.put()
+			
+			self.redirect('/?error=custom&url=' + urlEscape(url) + '&errtext=' + urlEscape(str(traceback.format_exc())) )
+			return
+		
+		logging.info('Created an adaper: %s' % adapter)
+		
+		if len(login) > 1:
+			adapter.setLogin(login)
+			adapter.setPassword(password)
+
+		if format == 'epub':
+			writerClass = output.EPubFanficWriter
+		elif format == 'html':
+			writerClass = output.HTMLWriter
+		else:
+			writerClass = output.TextWriter
+		
+		loader = FanficLoader(adapter, writerClass, quiet = True, inmemory=True, compress=False)
+		try:
+			data = loader.download()
+			
+			if format == 'html' or format == 'text':
+				# data is uncompressed hence huge
+				ext = '.html'
+				if format == 'text':
+					ext = '.txt'
+				files = {makeAcceptableFilename(str(adapter.getStoryName())) + ext : StringIO.StringIO(data.decode('utf-8')) }
+				d = inMemoryZip(files)
+				data = d.getvalue()
+			
+		
+		except LoginRequiredException, e:
+			logging.exception(e)
+			download.failure = 'Login problem detected'
+			download.put()
+			
+			self.redirect('/?error=login_required&url=' + urlEscape(url))
+			return
+		except:
+			e = sys.exc_info()[0]
+			
+			logging.exception(e)
+			download.failure = 'Some exception happened in downloader: ' + str(e)
+			download.put()
+			
+			self.redirect('/?error=custom&url=' + urlEscape(url) + '&errtext=' + urlEscape(str(traceback.format_exc())) )
+			return
+			
+		if data == None:
+			if loader.badLogin:
+				logging.debug("Bad login detected")
+				
+				download.failure = 'Login problem detected'
+				download.put()
+				
+				self.redirect('/?error=login_required&url=' + urlEscape(url))
+		else:
+			fic = DownloadedFanfic()
+			fic.user = user
+			fic.url = url
+			fic.format = format
+			fic.name = self._printableVersion(adapter.getStoryName())
+			fic.author = self._printableVersion(adapter.getAuthorName())
+			fic.blob = data
+			
+			try:
+				fic.put()
+				
+				key = fic.key()
+				
+				download.put()
+				self.redirect('/?file='+str(key)+'&name=' + urlEscape(fic.name) + '&author=' + urlEscape(fic.author))
+				
+				logging.info("Download finished OK")
+			except Exception, e:
+				logging.exception(e)
+				# it was too large, won't save it
+				name = str(makeAcceptableFilename(adapter.getStoryName()))
+				if format == 'epub':
+					self.response.headers['Content-Type'] = 'application/epub+zip'
+					self.response.headers['Content-disposition'] = 'attachment; filename=' + name + '.epub'
+				elif format == 'html':
+					self.response.headers['Content-Type'] = 'application/zip'
+					self.response.headers['Content-disposition'] = 'attachment; filename=' + name + '.html.zip'
+				elif format == 'text':
+					self.response.headers['Content-Type'] = 'application/zip'
+					self.response.headers['Content-disposition'] = 'attachment; filename=' + name + '.txt.zip'
+				
+				self.response.out.write(data)
+				
+def toPercentDecimal(match): 
+	"Return the %decimal number for the character for url escaping"
+	s = match.group(1)
+	return "%%%02x" % ord(s)
+
+def urlEscape(data):
+	"Escape text, including unicode, for use in URLs"
+	p = re.compile(r'([^\w])')
+	return p.sub(toPercentDecimal, data.encode("utf-8"))
+
+def main():
+  application = webapp.WSGIApplication([('/', MainHandler), ('/fdown', FanfictionDownloader), ('/file', FileServer), ('/recent', RecentFilesServer), ('/r2d2', RecentAllFilesServer), ('/login', LoginRequired)],
+                                       debug=False)
+  util.run_wsgi_app(application)
+
+
+if __name__ == '__main__':  # only when the file is run as a script, not when it is imported
+	logging.getLogger().setLevel(logging.DEBUG)  # let the root logger pass everything from DEBUG upwards
+	main()
diff --git a/queue.yaml b/queue.yaml
new file mode 100644
index 00000000..0bfb85d0
--- /dev/null
+++ b/queue.yaml
@@ -0,0 +1,5 @@
+queue:
+- name: default
+  rate: 1/s
+- name: download
+  rate: 10/s
\ No newline at end of file
diff --git a/recent.html b/recent.html
new file mode 100644
index 00000000..1b199e5e
--- /dev/null
+++ b/recent.html
@@ -0,0 +1,69 @@
+<!DOCTYPE html PUBLIC "-//W3C//DTD HTML 4.01//EN">
+<html>
+	<head>
+		<link href="css/index.css" rel="stylesheet" type="text/css">
+		<title>Fanfiction Downloader (fanfiction.net, fanficauthors, fictionalley, ficwad to epub and HTML)</title>
+		<meta http-equiv="Content-Type" content="text/html; charset=UTF-8">
+	</head>
+	<body>
+		<div id='main'>
+			<h1>
+				<a href="/" style="text-decoration: none; color: black;">FanFiction Downloader</a>
+			</h1>
+			
+			
+			<script type="text/javascript"><!--
+			google_ad_client = "pub-2027714004231956";
+			/* 468x60, created 6/9/10 */
+			google_ad_slot = "8817097473";
+			google_ad_width = 468;
+			google_ad_height = 60;
+			//-->
+			</script>
+			<script type="text/javascript"
+			src="http://pagead2.googlesyndication.com/pagead/show_ads.js">
+			</script>			
+			
+			
+			
+<!--			<div id='yourfile'> -->
+			{{yourfile}}
+<!--			</div> -->
+			
+				<div id='urlbox'>
+					<div id='greeting'>
+						Hi, {{ nickname }}! These are the fanfics you've downloaded previously.
+					</div>
+				</div>
+				
+				<div id='helpbox'>
+					{% for fic in fics %}
+					<p> <a href="/file?id={{ fic.key }}">{{ fic.name }}</a> by {{ fic.author }} ({{ fic.format }})<br/><small><a href="{{ fic.url }}">{{ fic.url }}</a></small></p>
+					{% endfor %}
+				</div>
+				
+				<script type="text/javascript"><!--
+				google_ad_client = "pub-2027714004231956";
+				/* 468x60, created 6/9/10 */
+				google_ad_slot = "2009456648";
+				google_ad_width = 468;
+				google_ad_height = 60;
+				//-->
+				</script>
+				<script type="text/javascript"
+				src="http://pagead2.googlesyndication.com/pagead/show_ads.js">
+				</script>
+				
+				
+		</div>
+		<script type="text/javascript">
+		var gaJsHost = (("https:" == document.location.protocol) ? "https://ssl." : "http://www.");
+		document.write(unescape("%3Cscript src='" + gaJsHost + "google-analytics.com/ga.js' type='text/javascript'%3E%3C/script%3E"));
+		</script>
+		<script type="text/javascript">
+		try {
+		var pageTracker = _gat._getTracker("UA-12136939-1");
+		pageTracker._trackPageview();
+		} catch(err) {}</script>
+	</body>
+</html>
diff --git a/simplejson/__init__.py b/simplejson/__init__.py
new file mode 100644
index 00000000..d5b4d399
--- /dev/null
+++ b/simplejson/__init__.py
@@ -0,0 +1,318 @@
+r"""JSON (JavaScript Object Notation) <http://json.org> is a subset of
+JavaScript syntax (ECMA-262 3rd edition) used as a lightweight data
+interchange format.
+
+:mod:`simplejson` exposes an API familiar to users of the standard library
+:mod:`marshal` and :mod:`pickle` modules. It is the externally maintained
+version of the :mod:`json` library contained in Python 2.6, but maintains
+compatibility with Python 2.4 and Python 2.5 and (currently) has
+significant performance advantages, even without using the optional C
+extension for speedups.
+
+Encoding basic Python object hierarchies::
+
+    >>> import simplejson as json
+    >>> json.dumps(['foo', {'bar': ('baz', None, 1.0, 2)}])
+    '["foo", {"bar": ["baz", null, 1.0, 2]}]'
+    >>> print json.dumps("\"foo\bar")
+    "\"foo\bar"
+    >>> print json.dumps(u'\u1234')
+    "\u1234"
+    >>> print json.dumps('\\')
+    "\\"
+    >>> print json.dumps({"c": 0, "b": 0, "a": 0}, sort_keys=True)
+    {"a": 0, "b": 0, "c": 0}
+    >>> from StringIO import StringIO
+    >>> io = StringIO()
+    >>> json.dump(['streaming API'], io)
+    >>> io.getvalue()
+    '["streaming API"]'
+
+Compact encoding::
+
+    >>> import simplejson as json
+    >>> json.dumps([1,2,3,{'4': 5, '6': 7}], separators=(',',':'))
+    '[1,2,3,{"4":5,"6":7}]'
+
+Pretty printing::
+
+    >>> import simplejson as json
+    >>> s = json.dumps({'4': 5, '6': 7}, sort_keys=True, indent=4)
+    >>> print '\n'.join([l.rstrip() for l in  s.splitlines()])
+    {
+        "4": 5,
+        "6": 7
+    }
+
+Decoding JSON::
+
+    >>> import simplejson as json
+    >>> obj = [u'foo', {u'bar': [u'baz', None, 1.0, 2]}]
+    >>> json.loads('["foo", {"bar":["baz", null, 1.0, 2]}]') == obj
+    True
+    >>> json.loads('"\\"foo\\bar"') == u'"foo\x08ar'
+    True
+    >>> from StringIO import StringIO
+    >>> io = StringIO('["streaming API"]')
+    >>> json.load(io)[0] == 'streaming API'
+    True
+
+Specializing JSON object decoding::
+
+    >>> import simplejson as json
+    >>> def as_complex(dct):
+    ...     if '__complex__' in dct:
+    ...         return complex(dct['real'], dct['imag'])
+    ...     return dct
+    ...
+    >>> json.loads('{"__complex__": true, "real": 1, "imag": 2}',
+    ...     object_hook=as_complex)
+    (1+2j)
+    >>> import decimal
+    >>> json.loads('1.1', parse_float=decimal.Decimal) == decimal.Decimal('1.1')
+    True
+
+Specializing JSON object encoding::
+
+    >>> import simplejson as json
+    >>> def encode_complex(obj):
+    ...     if isinstance(obj, complex):
+    ...         return [obj.real, obj.imag]
+    ...     raise TypeError(repr(obj) + " is not JSON serializable")
+    ...
+    >>> json.dumps(2 + 1j, default=encode_complex)
+    '[2.0, 1.0]'
+    >>> json.JSONEncoder(default=encode_complex).encode(2 + 1j)
+    '[2.0, 1.0]'
+    >>> ''.join(json.JSONEncoder(default=encode_complex).iterencode(2 + 1j))
+    '[2.0, 1.0]'
+
+
+Using simplejson.tool from the shell to validate and pretty-print::
+
+    $ echo '{"json":"obj"}' | python -m simplejson.tool
+    {
+        "json": "obj"
+    }
+    $ echo '{ 1.2:3.4}' | python -m simplejson.tool
+    Expecting property name: line 1 column 2 (char 2)
+"""
+__version__ = '2.0.9'
+__all__ = [
+    'dump', 'dumps', 'load', 'loads',
+    'JSONDecoder', 'JSONEncoder',
+]
+
+__author__ = 'Bob Ippolito <bob@redivi.com>'
+
+from decoder import JSONDecoder
+from encoder import JSONEncoder
+
+_default_encoder = JSONEncoder(
+    skipkeys=False,
+    ensure_ascii=True,
+    check_circular=True,
+    allow_nan=True,
+    indent=None,
+    separators=None,
+    encoding='utf-8',
+    default=None,
+)
+
+def dump(obj, fp, skipkeys=False, ensure_ascii=True, check_circular=True,
+        allow_nan=True, cls=None, indent=None, separators=None,
+        encoding='utf-8', default=None, **kw):
+    """Serialize ``obj`` as a JSON formatted stream to ``fp`` (a
+    ``.write()``-supporting file-like object).
+
+    If ``skipkeys`` is true then ``dict`` keys that are not basic types
+    (``str``, ``unicode``, ``int``, ``long``, ``float``, ``bool``, ``None``)
+    will be skipped instead of raising a ``TypeError``.
+
+    If ``ensure_ascii`` is false, then some chunks written to ``fp``
+    may be ``unicode`` instances, subject to normal Python ``str`` to
+    ``unicode`` coercion rules. Unless ``fp.write()`` explicitly
+    understands ``unicode`` (as in ``codecs.getwriter()``) this is likely
+    to cause an error.
+
+    If ``check_circular`` is false, then the circular reference check
+    for container types will be skipped and a circular reference will
+    result in an ``OverflowError`` (or worse).
+
+    If ``allow_nan`` is false, then it will be a ``ValueError`` to
+    serialize out of range ``float`` values (``nan``, ``inf``, ``-inf``)
+    in strict compliance of the JSON specification, instead of using the
+    JavaScript equivalents (``NaN``, ``Infinity``, ``-Infinity``).
+
+    If ``indent`` is a non-negative integer, then JSON array elements and object
+    members will be pretty-printed with that indent level. An indent level
+    of 0 will only insert newlines. ``None`` is the most compact representation.
+
+    If ``separators`` is an ``(item_separator, dict_separator)`` tuple
+    then it will be used instead of the default ``(', ', ': ')`` separators.
+    ``(',', ':')`` is the most compact JSON representation.
+
+    ``encoding`` is the character encoding for str instances, default is UTF-8.
+
+    ``default(obj)`` is a function that should return a serializable version
+    of obj or raise TypeError. The default simply raises TypeError.
+
+    To use a custom ``JSONEncoder`` subclass (e.g. one that overrides the
+    ``.default()`` method to serialize additional types), specify it with
+    the ``cls`` kwarg.
+
+    """
+    # cached encoder
+    if (not skipkeys and ensure_ascii and
+        check_circular and allow_nan and
+        cls is None and indent is None and separators is None and
+        encoding == 'utf-8' and default is None and not kw):
+        iterable = _default_encoder.iterencode(obj)
+    else:
+        if cls is None:
+            cls = JSONEncoder
+        iterable = cls(skipkeys=skipkeys, ensure_ascii=ensure_ascii,
+            check_circular=check_circular, allow_nan=allow_nan, indent=indent,
+            separators=separators, encoding=encoding,
+            default=default, **kw).iterencode(obj)
+    # could accelerate with writelines in some versions of Python, at
+    # a debuggability cost
+    for chunk in iterable:
+        fp.write(chunk)
+
+
+def dumps(obj, skipkeys=False, ensure_ascii=True, check_circular=True,
+        allow_nan=True, cls=None, indent=None, separators=None,
+        encoding='utf-8', default=None, **kw):
+    """Serialize ``obj`` to a JSON formatted ``str``.
+
+    If ``skipkeys`` is true then ``dict`` keys that are not basic types
+    (``str``, ``unicode``, ``int``, ``long``, ``float``, ``bool``, ``None``)
+    will be skipped instead of raising a ``TypeError``.
+
+    If ``ensure_ascii`` is false, then the return value will be a
+    ``unicode`` instance subject to normal Python ``str`` to ``unicode``
+    coercion rules instead of being escaped to an ASCII ``str``.
+
+    If ``check_circular`` is false, then the circular reference check
+    for container types will be skipped and a circular reference will
+    result in an ``OverflowError`` (or worse).
+
+    If ``allow_nan`` is false, then it will be a ``ValueError`` to
+    serialize out of range ``float`` values (``nan``, ``inf``, ``-inf``) in
+    strict compliance of the JSON specification, instead of using the
+    JavaScript equivalents (``NaN``, ``Infinity``, ``-Infinity``).
+
+    If ``indent`` is a non-negative integer, then JSON array elements and
+    object members will be pretty-printed with that indent level. An indent
+    level of 0 will only insert newlines. ``None`` is the most compact
+    representation.
+
+    If ``separators`` is an ``(item_separator, dict_separator)`` tuple
+    then it will be used instead of the default ``(', ', ': ')`` separators.
+    ``(',', ':')`` is the most compact JSON representation.
+
+    ``encoding`` is the character encoding for str instances, default is UTF-8.
+
+    ``default(obj)`` is a function that should return a serializable version
+    of obj or raise TypeError. The default simply raises TypeError.
+
+    To use a custom ``JSONEncoder`` subclass (e.g. one that overrides the
+    ``.default()`` method to serialize additional types), specify it with
+    the ``cls`` kwarg.
+
+    """
+    # cached encoder
+    if (not skipkeys and ensure_ascii and
+        check_circular and allow_nan and
+        cls is None and indent is None and separators is None and
+        encoding == 'utf-8' and default is None and not kw):
+        return _default_encoder.encode(obj)
+    if cls is None:
+        cls = JSONEncoder
+    return cls(
+        skipkeys=skipkeys, ensure_ascii=ensure_ascii,
+        check_circular=check_circular, allow_nan=allow_nan, indent=indent,
+        separators=separators, encoding=encoding, default=default,
+        **kw).encode(obj)
+
+
+_default_decoder = JSONDecoder(encoding=None, object_hook=None)
+
+
+def load(fp, encoding=None, cls=None, object_hook=None, parse_float=None,
+        parse_int=None, parse_constant=None, **kw):
+    """Deserialize ``fp`` (a ``.read()``-supporting file-like object containing
+    a JSON document) to a Python object.
+
+    If the contents of ``fp`` is encoded with an ASCII based encoding other
+    than utf-8 (e.g. latin-1), then an appropriate ``encoding`` name must
+    be specified. Encodings that are not ASCII based (such as UCS-2) are
+    not allowed, and should be wrapped with
+    ``codecs.getreader(encoding)(fp)``, or simply decoded to a ``unicode``
+    object and passed to ``loads()``.
+
+    ``object_hook`` is an optional function that will be called with the
+    result of any object literal decode (a ``dict``). The return value of
+    ``object_hook`` will be used instead of the ``dict``. This feature
+    can be used to implement custom decoders (e.g. JSON-RPC class hinting).
+
+    To use a custom ``JSONDecoder`` subclass, specify it with the ``cls``
+    kwarg.
+
+    """
+    return loads(fp.read(),
+        encoding=encoding, cls=cls, object_hook=object_hook,
+        parse_float=parse_float, parse_int=parse_int,
+        parse_constant=parse_constant, **kw)
+
+
+def loads(s, encoding=None, cls=None, object_hook=None, parse_float=None,
+        parse_int=None, parse_constant=None, **kw):
+    """Deserialize ``s`` (a ``str`` or ``unicode`` instance containing a JSON
+    document) to a Python object.
+
+    If ``s`` is a ``str`` instance and is encoded with an ASCII based encoding
+    other than utf-8 (e.g. latin-1) then an appropriate ``encoding`` name
+    must be specified. Encodings that are not ASCII based (such as UCS-2)
+    are not allowed and should be decoded to ``unicode`` first.
+
+    ``object_hook`` is an optional function that will be called with the
+    result of any object literal decode (a ``dict``). The return value of
+    ``object_hook`` will be used instead of the ``dict``. This feature
+    can be used to implement custom decoders (e.g. JSON-RPC class hinting).
+
+    ``parse_float``, if specified, will be called with the string
+    of every JSON float to be decoded. By default this is equivalent to
+    float(num_str). This can be used to use another datatype or parser
+    for JSON floats (e.g. decimal.Decimal).
+
+    ``parse_int``, if specified, will be called with the string
+    of every JSON int to be decoded. By default this is equivalent to
+    int(num_str). This can be used to use another datatype or parser
+    for JSON integers (e.g. float).
+
+    ``parse_constant``, if specified, will be called with one of the
+    following strings: -Infinity, Infinity, NaN, null, true, false.
+    This can be used to raise an exception if invalid JSON numbers
+    are encountered.
+
+    To use a custom ``JSONDecoder`` subclass, specify it with the ``cls``
+    kwarg.
+
+    """
+    if (cls is None and encoding is None and object_hook is None and
+            parse_int is None and parse_float is None and
+            parse_constant is None and not kw):
+        return _default_decoder.decode(s)  # all defaults: reuse the shared module-level decoder
+    if cls is None:
+        cls = JSONDecoder
+    if object_hook is not None:  # forward only the hooks that were given; omitted ones are left to cls
+        kw['object_hook'] = object_hook
+    if parse_float is not None:
+        kw['parse_float'] = parse_float
+    if parse_int is not None:
+        kw['parse_int'] = parse_int
+    if parse_constant is not None:
+        kw['parse_constant'] = parse_constant
+    return cls(encoding=encoding, **kw).decode(s)
diff --git a/simplejson/__init__.pyc b/simplejson/__init__.pyc
new file mode 100644
index 0000000000000000000000000000000000000000..f01003d4f81d37513d0f8a2a5fb857b8448ae2bd
GIT binary patch
literal 12071
zcmeHNL37+jc5aXoC5<V`wpPhnPEuV{TLC6J1Wiho9hRuFEorN`sg+zqX}5}`Y6b)J
za3Ep;7!8P|C7!%jANIcgVlVj{xu+`sAvx?Z`QGaWW`?31S@tGXTb4L8Xmt1M?$@v1
z`@RSK=|3;Ge(}dYZiT}ByN2J-@X<FMAtE7m@a>2lM??!ES`^Va5uF#&l87#d{Ux!3
zn-|3n?q3p7OB|dN$$7DJUN}^KM;t7P<bv3_ARKi;M9V^56wzg&P<MsDuk!c1BDx`>
z_xSsL5nU6}&*=IaadGDz>Vo#>kD8f3w86!7@%u|+hsD0O&EIev42oGpIC}l95x%f<
zrIyx+#l_FX@3E|_XH|W`RXp2m??ckj2g^eIdi&8s>HRu*9&Cq2oR{*^@R<rr`7kSk
zGS1SDyfZG#d}DR>na)x_EB5coSj#}_YN%Byvr%iNvp!DC;7EE8?)~QTmG#@}@@5f9
z6~#tUrBx&Y>YT*;<ML3^w~T@^XvJx%if|mH`$~?oViJ^otF<x7qK$!$CwZc1^np}I
zd8QR4r1JAGx8x|8#7P_!vdkoe7aG%%<yc8w25A&v>?9r*L2+zFO@cy?gJgjIku=it
zI6O$yKw_vWQQDVVC9RKys3XiN4U*(oP6A929~HHpV;JbA9?3{Cv$KQAFtd$ioXRhc
z%Q2d-`?tGtSe1<^-3qfw4jm7%gz{J(#^re0_!dvG>H9Gky|5|@m6pkIM~(yC((!&8
zkK!;$OPQ;J^_GT82GMie3ig%mO7&c&EIY&4m5$SWUR##amIR5s*P>;nyd(&aI#(*H
zat-xANW(0m4#PmlVLi9Z*vB|lP;7`Fy|K}1N&LHe7p5`Ev!ayKJ)`|5?KCaejG}6i
zYj4*bWtrQRFWg~JxEs>L@7E|l%u>~rYyL-Fx!yT>+Tp(LZX2!JXx&EZ_J-WW@7E}&
zRg%=LpPoE*o00MYo5q9tX1w+uiP)p=M&`_o*Y~R2y=ra!<}J7G!=?7?JGgs$P20Wi
zX!oKWVi{OuduV?H`aS7N4ITCm)Un=tTvW=8`=ZUYGp)JzNi&a8kxk@wiAC>kJ*qdN
zE;p^>Ol~%<JR_PmuGtpsiY^O<lZBnfA#<O0Wt>eL#+kpb%I85+Dcc=8GuNYyJ!st{
z<Axtm)`;HTNY=XR-J9JP?k!lz$6e{(#_uO5n3Yy}Py}UG=uOY<;{S%*G4phHZKw9F
z_QuEE_U-ltdSF&x7OKQqW6Qw$zTc!YG}ov}d#7h~dfTA3G{R}!yfsyxF-dnXb^T{q
zoO-*7UqE+p?sdrR$%H(H)V|K)6B76v?RBjEzu+yTb4H7TCZ=U9PkzG1lUD1#vZt0j
z`}bQQjy9IKTh+(1vgZ<aUOkvNYK>8`R+21;w0HWLzV4KE<mRTtfGmTo{7hl(J#%FF
z%(~pCa`_M+ee@}O#;d*G<`kS^z|$>j*5=_9?0)o==6&jfOlQ&B&Q%x(N&GdP9*(Wn
zUq*IYzTb{SY6J(`r$~{gBQFZe&IXU>`#zb1j7QS#*Y*9rOZJ0S^Npw>48JN;gr-K)
zu8UKi(D6oxT{oTt`>wUMTDt9o`g&0QZTyAZ@)zxyDZmy>Y$yB_iAQM-mn0mQ>nE-;
z+j;<_oc=h=4mPLjG|KnZe!2c^x(_z8K#vfXoH>s*e+|(CPC={w2y-hpZEGKgf_kw5
zox10_)Xj{;cKG@|d^=x8d&oUiy-yyN{pvo(2+o9CLPho6daF(~oY~7=H1kQxT{=iU
z>DU~}TDwIMYb75a=juUGWQA9#yzsJ){H1IY#!0i%m?)4F+iWmQl#PrKF|T41LD$iD
z4Rgbqf+{ID=htPF=<cpl<VN_OiN$=1=sY~2c%TaJH4=Oy(K7>mhd|eQ&^Hzw1I*0}
zKSO$}^@JhP6u<aomL-zC3IofrN)m#b2!Jt=E5H_@WX@q_g}r-yz<(iCIL@T|qD@n5
zZ?v&T?GsnNl(|8KE0Y<R#KW-0XZ*bBD7h!snPA^YhK|=aZu+<0K<a}dIHr=EQeI@h
ziU@*fFi{%-$f=TRFt((c0HsO~AiMzVYU%T!2-r#gpUZQ&qWv%F78?TJqSMc}*bS8L
zppteNXN`8aDcc>_e~<bvvZ36{^9<1~lXr&M@UsH!;CbxBFWrs*8~;4;HqoOI%@qw<
zUc{F^h;xEOB}j_^V66((4|EvE<rUlr$0|JNhj9^BNl=uRa0|daJM5=G!b>QbSX{Pn
zImHbun2iFO;RRRaXyw!L0$N!E4QW|4!u$CA3qJbK_<Fe@mb0&f^KwyS&+v0jWFdae
zi);@+pqDN2?4rmXp#bJ+3SXcA0%-~#qW~W1h-V8T^H6BjH6Nnz4y0cbPU(nvLA(^=
z8%LZhi}Wd~8rdz>FN%{Tkvir!S~ADQoIrCiB`{sg2xOP$a6!=E7X^)aNnkh(@~yZy
zEC1+2@p4(*e|k-vTox}eHl$ppv7N8}UHlFc-}Xou`VUagwsjdw4hAsn0VoymI*xdT
zzm?#61{TtB84N}_8hHWR@nGN|7C4YzXE0dN6%3+a+Z@G-T1nyqMGg)2+5rn8hqpC?
zfZ6~ch6oyB3^AD$HBlUvxJ%Z7TR|y<La}!<#HEA-)GWt?l(HBMy69A;G1;jpfGC)Y
zBun?r6$cP=IfM%^SHw&P1LHUjV|aogxF!rU$70EQs~{p`NRF4zT7YpH_lrf(tY+4N
z&5A}rq7gQEP3&s2iIU;CN)NOoZGojtHOb4F1jjUinYHjFD1?CdfuJ*!hxSuq)Je_Y
ztP&v1ZbqXDxB;+mVz-4M!%tFhVvP|-`E<vKg(q<cfO^aVD!^QzSU5szIThx?BmhSS
z1JZM-i8k=A7qsmiEEL;_KiY3A2~!ON5P3LNsVHR4YHa?9pRKdn0RZld*xi!`;Td?I
z1h8vrj+6me1(@;tCXzP~<QZb9AxkNgM&zS~VUmNvBjf{MDu*0lF)0s&9D<UlIooY~
z(W}#r%VrW}F25yWRSUB_RL5r=3y^rWFUpf(R|w=lB(pIsVcu|e#!};SWG+_t%9t!B
zO>6_SjB#L0mQp7&_~?TDhn!KM>;Ms%#-y9n0V`o9<)gl;VvG->!xMNIJT&8OrK31S
zV#Cg2TAWjiamz+40qitgN!31*BF_~DFV(&(?1|v%1w{dqSBaYNaI{&*QShWDYBHo8
zP`#(KQ5olx6D;f=%%CzsZY1&L=P8CFqGoQeDCqbjBPUCd{(&A4&}6C(nUncYz3~Kf
zs%VmFqf?^11hbTeKu(~|n(#F8*cFond2oc2ep3Z-g$<gPaaLqm0siyE*gMRa45!p)
zwuu~vja(!eaG3r!q)TF&F_7IMx5^E;o~y~LqWj!hSnX#nXfUV)r&$YiCF}qVsG_0$
z%xYnCY)aNK)$_x6Pagkj<x{I6_;G_O86H~&$x)R8x4<Lu&gpShB~eXg0<36?T&2y-
z)f))QkT{H|K(H?#&!~uT-mz(;r%2h(=rLy%$sbg@L~>;?Aaz(gL;9?SVG_VUddlDT
zC1Qh_Wrmp)aRm1QrC3e-_2OtFCJH&hh`f2d0Jyx!q)FkY*)?_G!TB`8{K!R=<Jtf)
zk1){?b8r|G`*yBV^wJ}^(<2DeBiz&@EYu_1)1&C!Bly(2jIW0tV=IDMWX$Eexaiwi
z_IYn%^VDyOoO|4ZzD)QgTm%pz1aw_4;CGatH99xJl+T(4cRM&_Bt`=f2Vqdjk<Wun
z!C(3_T&+HVzVzxrT)-P=&sXmQ%MP=n)%$dkvwU?F!0CjCYPdQD@T>hk`JsN_&yRZ~
z?rVJX-_cd~s&mD0owjpr;j+_m-pBuC=lbFWvE+obaMD);`~D3DfTHCr1Ka{=8{-G)
zFTfAb-wu9&wG6oX4GIlT`wWE!1KvadFwDTde?$Rj%=GyHg%+g0HxK)^8QnFKE$BOM
zKp$=c^x@gYB11pGH9$XrK0rT!K7PnSLj&|-On^SdeY2p?0=hrLVzyrabg<4>0G)*n
zb3V=Da&urA#E{vOXZ!2KWi~0oF}H~|HLjhaA9BhZU*7<SL03&jKIQW`jGd>2mP19r
zQt2=t%t?EMM<LtywzeRHvF+^M`~;bP2xNlVc{BdXAQP|2z$OHu9|oCN7UL*_k#7x|
zSj?Fy!!W-l(Qlj#1Mi<;lVOuT!6tsX{C^0W2r=~t`t+{ii?d4xE-^gf97&I0!&y+M
z_cN+E1C8~rqvFSgJCsZNSA6u(@g@GLhCA;$1b3DIcHVccI-IC8{(uwlAwfq%j<h<?
zczuG466gm|&=KG88x@2)z9ZqpIj3)(rEQOd=^PmGJ}8j^>&#qDHV8qBGT71omI$hO
zJ7ORE3JXl4EUbtMBAGy7#Xc@KYnjGDW+r$f&zuo%%I2a#Kg_mSYS;u)WQ`D7xsGCO
zhW-VQ3JQ`+&JbF}pMc?|D{Fx2jCfER<dk2<I*}QkV@Q;3l@ss?mPBbIL$y`p%Ln!u
z>8b3M3F~Gyp02_%<=CFw+g@4kP=<>IQ4XJz3o7aY3LxcX7!n3JEHD|%d%5jwB8HTX
zEc__%c=bX-Oz<E9ZvfEy7RO+bl(sPt15265CpLW0fH??|X*L*eBAE8Fc1<&8)wu5F
z)q{CzSF`pI%dxX==#$O4VDEzT*iwGvjfgHJcA`ivVwMJRb_~gz18R6r#Zcb)Db=H%
z#iMI+Bn`$gQUM;J8MWh;3(CB4FPI*`p+bgOGex63<RT0+B-*&r`|_SNba9N-1}v*i
zggiczX4*75)K=5XR|p~L2a9Gh$g7(rgofy`yZM05FOiv<M`N5KH)YI*bLggo3>g8}
z(jz|C!@(7t?B`QTUZF>?Se+8yyFvHpouVEQtG|dZqv`w?KAI*Wu3u%c*7z#&$?U5Z
z;qxdDzQhT5qGj+@ra-i8u`UoT<K#Hy>4}yxX`%wrGH@r;hiKV_*U_?O7)#3*3@tNb
zToTz8bOtp81#`q5CURyFTLr#`ss&qRCS$8W;!w3{tITX{l}YEHvsIV^+B($yTj4a>
zeCv1r15|z9?^4=;PYQDdI_@(^yGhc_xLdeYvR*c?H*>e(A@;08wi%}3LgX;s(C_ky
z?0aG6ukpKY=5|>Uxn9oJ{}8v!lIn*G*6p71x-)KbR<olR8FCwv_=yRgZg8}<s>1tZ
z^&43~xy3qq%(yFxO?cO#37Xx8d7p|GoZz-70r3Kfq2ky+mZD@i0R=d2yGy?Of&v{s
z%Z4q%GRZibgf<%Uj&qvbODkk)%YuUonw<&(2nDbNW3Ti^Bjxbuc<~wxe4ytKoKIzW
zb!@;?=+y)t{+?e^XpE$B&OgH1;o{$F<>>b#t{c)QqhGI_)ldh)!C*f8yxF2D<%(TK
z95fr1(KBBHZN%B}NOwc7)DIrIa(ab_6!m+9=3Ny|TbZOd$NE#7YjVhNLh2|~d``(2
z;}kidI5K+*>!61ZjfWsqRnbeW0C>ip|3YD&g8S+COF7<$Uc*!7Q@h6Y3+656+B|Nj
zxQZvvh_L?;(VcL{6%4Nb0T-g}Iyao_j^Qbnk))mdJoMf}6MjbD?;|Aj`;2Y+eVhMB
znMg;!4+o8F;##<_kZ~_;mDK<*o7*x3R>d^E{VRGF%eaSL37V2UP9XP4Nj;iqufa$j
zN<TJzW2AG(yqJ79gnWGqUrWx?!m_ixxU}%D^X>vlbN??bUIMMVdWXMnUth%ajb-P5
E0OpUxq5uE@

literal 0
HcmV?d00001

diff --git a/simplejson/_speedups.c b/simplejson/_speedups.c
new file mode 100644
index 00000000..23b5f4a6
--- /dev/null
+++ b/simplejson/_speedups.c
@@ -0,0 +1,2329 @@
+#include "Python.h"
+#include "structmember.h"
+#if PY_VERSION_HEX < 0x02060000 && !defined(Py_TYPE)
+#define Py_TYPE(ob)     (((PyObject*)(ob))->ob_type)
+#endif
+#if PY_VERSION_HEX < 0x02050000 && !defined(PY_SSIZE_T_MIN)
+typedef int Py_ssize_t;
+#define PY_SSIZE_T_MAX INT_MAX
+#define PY_SSIZE_T_MIN INT_MIN
+#define PyInt_FromSsize_t PyInt_FromLong
+#define PyInt_AsSsize_t PyInt_AsLong
+#endif
+#ifndef Py_IS_FINITE
+#define Py_IS_FINITE(X) (!Py_IS_INFINITY(X) && !Py_IS_NAN(X))
+#endif
+
+#ifdef __GNUC__
+#define UNUSED __attribute__((__unused__))
+#else
+#define UNUSED
+#endif
+
+#define DEFAULT_ENCODING "utf-8"
+
+#define PyScanner_Check(op) PyObject_TypeCheck(op, &PyScannerType)
+#define PyScanner_CheckExact(op) (Py_TYPE(op) == &PyScannerType)
+#define PyEncoder_Check(op) PyObject_TypeCheck(op, &PyEncoderType)
+#define PyEncoder_CheckExact(op) (Py_TYPE(op) == &PyEncoderType)
+
+static PyTypeObject PyScannerType;
+static PyTypeObject PyEncoderType;
+
+typedef struct _PyScannerObject {
+    PyObject_HEAD
+    PyObject *encoding;
+    PyObject *strict;
+    PyObject *object_hook;
+    PyObject *parse_float;
+    PyObject *parse_int;
+    PyObject *parse_constant;
+} PyScannerObject;
+
+static PyMemberDef scanner_members[] = {
+    {"encoding", T_OBJECT, offsetof(PyScannerObject, encoding), READONLY, "encoding"},
+    {"strict", T_OBJECT, offsetof(PyScannerObject, strict), READONLY, "strict"},
+    {"object_hook", T_OBJECT, offsetof(PyScannerObject, object_hook), READONLY, "object_hook"},
+    {"parse_float", T_OBJECT, offsetof(PyScannerObject, parse_float), READONLY, "parse_float"},
+    {"parse_int", T_OBJECT, offsetof(PyScannerObject, parse_int), READONLY, "parse_int"},
+    {"parse_constant", T_OBJECT, offsetof(PyScannerObject, parse_constant), READONLY, "parse_constant"},
+    {NULL}
+};
+
+typedef struct _PyEncoderObject {
+    PyObject_HEAD
+    PyObject *markers;
+    PyObject *defaultfn;
+    PyObject *encoder;
+    PyObject *indent;
+    PyObject *key_separator;
+    PyObject *item_separator;
+    PyObject *sort_keys;
+    PyObject *skipkeys;
+    int fast_encode;
+    int allow_nan;
+} PyEncoderObject;
+
+static PyMemberDef encoder_members[] = {
+    {"markers", T_OBJECT, offsetof(PyEncoderObject, markers), READONLY, "markers"},
+    {"default", T_OBJECT, offsetof(PyEncoderObject, defaultfn), READONLY, "default"},
+    {"encoder", T_OBJECT, offsetof(PyEncoderObject, encoder), READONLY, "encoder"},
+    {"indent", T_OBJECT, offsetof(PyEncoderObject, indent), READONLY, "indent"},
+    {"key_separator", T_OBJECT, offsetof(PyEncoderObject, key_separator), READONLY, "key_separator"},
+    {"item_separator", T_OBJECT, offsetof(PyEncoderObject, item_separator), READONLY, "item_separator"},
+    {"sort_keys", T_OBJECT, offsetof(PyEncoderObject, sort_keys), READONLY, "sort_keys"},
+    {"skipkeys", T_OBJECT, offsetof(PyEncoderObject, skipkeys), READONLY, "skipkeys"},
+    {NULL}
+};
+
+static Py_ssize_t
+ascii_escape_char(Py_UNICODE c, char *output, Py_ssize_t chars);
+static PyObject *
+ascii_escape_unicode(PyObject *pystr);
+static PyObject *
+ascii_escape_str(PyObject *pystr);
+static PyObject *
+py_encode_basestring_ascii(PyObject* self UNUSED, PyObject *pystr);
+void init_speedups(void);
+static PyObject *
+scan_once_str(PyScannerObject *s, PyObject *pystr, Py_ssize_t idx, Py_ssize_t *next_idx_ptr);
+static PyObject *
+scan_once_unicode(PyScannerObject *s, PyObject *pystr, Py_ssize_t idx, Py_ssize_t *next_idx_ptr);
+static PyObject *
+_build_rval_index_tuple(PyObject *rval, Py_ssize_t idx);
+static PyObject *
+scanner_new(PyTypeObject *type, PyObject *args, PyObject *kwds);
+static int
+scanner_init(PyObject *self, PyObject *args, PyObject *kwds);
+static void
+scanner_dealloc(PyObject *self);
+static int
+scanner_clear(PyObject *self);
+static PyObject *
+encoder_new(PyTypeObject *type, PyObject *args, PyObject *kwds);
+static int
+encoder_init(PyObject *self, PyObject *args, PyObject *kwds);
+static void
+encoder_dealloc(PyObject *self);
+static int
+encoder_clear(PyObject *self);
+static int
+encoder_listencode_list(PyEncoderObject *s, PyObject *rval, PyObject *seq, Py_ssize_t indent_level);
+static int
+encoder_listencode_obj(PyEncoderObject *s, PyObject *rval, PyObject *obj, Py_ssize_t indent_level);
+static int
+encoder_listencode_dict(PyEncoderObject *s, PyObject *rval, PyObject *dct, Py_ssize_t indent_level);
+static PyObject *
+_encoded_const(PyObject *const);
+static void
+raise_errmsg(char *msg, PyObject *s, Py_ssize_t end);
+static PyObject *
+encoder_encode_string(PyEncoderObject *s, PyObject *obj);
+static int
+_convertPyInt_AsSsize_t(PyObject *o, Py_ssize_t *size_ptr);
+static PyObject *
+_convertPyInt_FromSsize_t(Py_ssize_t *size_ptr);
+static PyObject *
+encoder_encode_float(PyEncoderObject *s, PyObject *obj);
+
+#define S_CHAR(c) (((c) >= ' ') && ((c) <= '~') && ((c) != '\\') && ((c) != '"'))
+#define IS_WHITESPACE(c) (((c) == ' ') || ((c) == '\t') || ((c) == '\n') || ((c) == '\r'))
+
+#define MIN_EXPANSION 6
+#ifdef Py_UNICODE_WIDE
+#define MAX_EXPANSION (2 * MIN_EXPANSION)
+#else
+#define MAX_EXPANSION MIN_EXPANSION
+#endif
+
+static int
+_convertPyInt_AsSsize_t(PyObject *o, Py_ssize_t *size_ptr)
+{
+    /* "O&"-style converter, PyObject -> Py_ssize_t: returns 1 on success, 0 (exception set) on failure */
+    *size_ptr = PyInt_AsSsize_t(o);
+    if (*size_ptr == -1 && PyErr_Occurred())
+        return 0;
+    return 1;
+}
+
+static PyObject *
+_convertPyInt_FromSsize_t(Py_ssize_t *size_ptr)
+{
+    /* Py_ssize_t to PyObject converter: wraps *size_ptr in a Python int (raise_errmsg passes it as an "O&" converter) */
+    return PyInt_FromSsize_t(*size_ptr);
+}
+
+static Py_ssize_t
+ascii_escape_char(Py_UNICODE c, char *output, Py_ssize_t chars)
+{
+    /* Escape unicode code point c to ASCII escape sequences in char *output,
+    starting at offset chars; returns the new offset. output must have at least
+    12 bytes unused to accommodate an escaped surrogate pair "\uXXXX\uXXXX" */
+    output[chars++] = '\\';
+    switch (c) {
+        case '\\': output[chars++] = (char)c; break;
+        case '"': output[chars++] = (char)c; break;
+        case '\b': output[chars++] = 'b'; break;
+        case '\f': output[chars++] = 'f'; break;
+        case '\n': output[chars++] = 'n'; break;
+        case '\r': output[chars++] = 'r'; break;
+        case '\t': output[chars++] = 't'; break;
+        default:
+#ifdef Py_UNICODE_WIDE
+            if (c >= 0x10000) {
+                /* UTF-16 surrogate pair: emit the high surrogate here, then fall through to emit the low one */
+                Py_UNICODE v = c - 0x10000;
+                c = 0xd800 | ((v >> 10) & 0x3ff);
+                output[chars++] = 'u';
+                output[chars++] = "0123456789abcdef"[(c >> 12) & 0xf];
+                output[chars++] = "0123456789abcdef"[(c >>  8) & 0xf];
+                output[chars++] = "0123456789abcdef"[(c >>  4) & 0xf];
+                output[chars++] = "0123456789abcdef"[(c      ) & 0xf];
+                c = 0xdc00 | (v & 0x3ff);
+                output[chars++] = '\\';
+            }
+#endif
+            output[chars++] = 'u';
+            output[chars++] = "0123456789abcdef"[(c >> 12) & 0xf];
+            output[chars++] = "0123456789abcdef"[(c >>  8) & 0xf];
+            output[chars++] = "0123456789abcdef"[(c >>  4) & 0xf];
+            output[chars++] = "0123456789abcdef"[(c      ) & 0xf];
+    }
+    return chars;
+}
+
+static PyObject *
+ascii_escape_unicode(PyObject *pystr)
+{
+    /* Take a PyUnicode pystr and return a new ASCII-only escaped PyString, wrapped in double quotes (NULL on failure) */
+    Py_ssize_t i;
+    Py_ssize_t input_chars;
+    Py_ssize_t output_size;
+    Py_ssize_t max_output_size;
+    Py_ssize_t chars;
+    PyObject *rval;
+    char *output;
+    Py_UNICODE *input_unicode;
+
+    input_chars = PyUnicode_GET_SIZE(pystr);
+    input_unicode = PyUnicode_AS_UNICODE(pystr);
+
+    /* One char input can be up to 6 chars output, estimate 4 of these */
+    output_size = 2 + (MIN_EXPANSION * 4) + input_chars;
+    max_output_size = 2 + (input_chars * MAX_EXPANSION);
+    rval = PyString_FromStringAndSize(NULL, output_size);
+    if (rval == NULL) {
+        return NULL;
+    }
+    output = PyString_AS_STRING(rval);
+    chars = 0;
+    output[chars++] = '"';
+    for (i = 0; i < input_chars; i++) {
+        Py_UNICODE c = input_unicode[i];
+        if (S_CHAR(c)) {
+            output[chars++] = (char)c;
+        }
+        else {
+            chars = ascii_escape_char(c, output, chars);
+        }
+        if (output_size - chars < (1 + MAX_EXPANSION)) {
+            /* Less room left than one worst-case escape plus one byte: more than four escapes, so resize by a lot */
+            Py_ssize_t new_output_size = output_size * 2;
+            /* This is an upper bound */
+            if (new_output_size > max_output_size) {
+                new_output_size = max_output_size;
+            }
+            /* Make sure that the output size changed before resizing */
+            if (new_output_size != output_size) {
+                output_size = new_output_size;
+                if (_PyString_Resize(&rval, output_size) == -1) {
+                    return NULL;
+                }
+                output = PyString_AS_STRING(rval);
+            }
+        }
+    }
+    output[chars++] = '"';
+    if (_PyString_Resize(&rval, chars) == -1) {
+        return NULL;
+    }
+    return rval;
+}
+
+static PyObject *
+ascii_escape_str(PyObject *pystr)
+{
+    /* Take a PyString pystr and return a new ASCII-only escaped PyString (NULL on failure); non-ASCII input is decoded as strict UTF-8 */
+    Py_ssize_t i;
+    Py_ssize_t input_chars;
+    Py_ssize_t output_size;
+    Py_ssize_t chars;
+    PyObject *rval;
+    char *output;
+    char *input_str;
+
+    input_chars = PyString_GET_SIZE(pystr);
+    input_str = PyString_AS_STRING(pystr);
+
+    /* Fast path for a string that's already ASCII */
+    for (i = 0; i < input_chars; i++) {
+        Py_UNICODE c = (Py_UNICODE)(unsigned char)input_str[i];
+        if (!S_CHAR(c)) {
+            /* If we have to escape something, scan the string for unicode */
+            Py_ssize_t j;
+            for (j = i; j < input_chars; j++) {
+                c = (Py_UNICODE)(unsigned char)input_str[j];
+                if (c > 0x7f) {
+                    /* We hit a non-ASCII character, bail to unicode mode */
+                    PyObject *uni;
+                    uni = PyUnicode_DecodeUTF8(input_str, input_chars, "strict");
+                    if (uni == NULL) {
+                        return NULL;
+                    }
+                    rval = ascii_escape_unicode(uni);
+                    Py_DECREF(uni);
+                    return rval;
+                }
+            }
+            break;
+        }
+    }
+
+    if (i == input_chars) {
+        /* Input is already ASCII */
+        output_size = 2 + input_chars;
+    }
+    else {
+        /* One char input can be up to 6 chars output, estimate 4 of these */
+        output_size = 2 + (MIN_EXPANSION * 4) + input_chars;
+    }
+    rval = PyString_FromStringAndSize(NULL, output_size);
+    if (rval == NULL) {
+        return NULL;
+    }
+    output = PyString_AS_STRING(rval);
+    output[0] = '"';
+
+    /* We know that everything up to i is ASCII already, so copy it verbatim after the opening quote */
+    chars = i + 1;
+    memcpy(&output[1], input_str, i);
+
+    for (; i < input_chars; i++) {
+        Py_UNICODE c = (Py_UNICODE)(unsigned char)input_str[i];
+        if (S_CHAR(c)) {
+            output[chars++] = (char)c;
+        }
+        else {
+            chars = ascii_escape_char(c, output, chars);
+        }
+        /* An ASCII char can't possibly expand to a surrogate! */
+        if (output_size - chars < (1 + MIN_EXPANSION)) {
+            /* There's more than four, so let's resize by a lot */
+            output_size *= 2;
+            if (output_size > 2 + (input_chars * MIN_EXPANSION)) {
+                output_size = 2 + (input_chars * MIN_EXPANSION);
+            }
+            if (_PyString_Resize(&rval, output_size) == -1) {
+                return NULL;
+            }
+            output = PyString_AS_STRING(rval);
+        }
+    }
+    output[chars++] = '"';
+    if (_PyString_Resize(&rval, chars) == -1) {
+        return NULL;
+    }
+    return rval;
+}
+
+static void
+raise_errmsg(char *msg, PyObject *s, Py_ssize_t end)
+{
+    /* Set a ValueError whose message is produced by the Python function
+    simplejson.decoder.errmsg(msg, s, end).
+
+    The function object is looked up on first use and cached for later
+    calls. If the import, the attribute lookup or the call itself fails,
+    no ValueError is set here and the function simply returns. */
+    static PyObject *errmsg_fn = NULL;
+    PyObject *text;
+
+    if (!errmsg_fn) {
+        PyObject *mod = PyImport_ImportModule("simplejson.decoder");
+        if (!mod) {
+            return;
+        }
+        errmsg_fn = PyObject_GetAttrString(mod, "errmsg");
+        Py_DECREF(mod);
+        if (!errmsg_fn) {
+            return;
+        }
+    }
+
+    text = PyObject_CallFunction(errmsg_fn, "(zOO&)", msg, s, _convertPyInt_FromSsize_t, &end);
+    if (text == NULL) {
+        return;
+    }
+    PyErr_SetObject(PyExc_ValueError, text);
+    Py_DECREF(text);
+}
+
+static PyObject *
+join_list_unicode(PyObject *lst)
+{
+    /* Equivalent of u''.join(lst).
+    The bound join method of an empty unicode object is created on the
+    first call and cached in a static for later calls.
+    Returns a new reference, or NULL on failure. */
+    static PyObject *joinfn = NULL;
+
+    if (!joinfn) {
+        PyObject *empty = PyUnicode_FromUnicode(NULL, 0);
+        if (!empty) {
+            return NULL;
+        }
+        joinfn = PyObject_GetAttrString(empty, "join");
+        Py_DECREF(empty);
+        if (!joinfn) {
+            return NULL;
+        }
+    }
+
+    return PyObject_CallFunctionObjArgs(joinfn, lst, NULL);
+}
+
+static PyObject *
+join_list_string(PyObject *lst)
+{
+    /* Equivalent of ''.join(lst).
+    The bound join method of an empty PyString is created on the first
+    call and cached in a static for later calls.
+    Returns a new reference, or NULL on failure. */
+    static PyObject *joinfn = NULL;
+
+    if (!joinfn) {
+        PyObject *empty = PyString_FromStringAndSize(NULL, 0);
+        if (!empty) {
+            return NULL;
+        }
+        joinfn = PyObject_GetAttrString(empty, "join");
+        Py_DECREF(empty);
+        if (!joinfn) {
+            return NULL;
+        }
+    }
+
+    return PyObject_CallFunctionObjArgs(joinfn, lst, NULL);
+}
+
+static PyObject *
+_build_rval_index_tuple(PyObject *rval, Py_ssize_t idx) {
+    /* Build and return the tuple (rval, idx).
+    The reference to rval is stolen: it ends up owned by the tuple, or is
+    released if the tuple cannot be built. A NULL rval is passed straight
+    through as NULL so a failed call can be wrapped directly. */
+    PyObject *pair;
+    PyObject *pos;
+
+    if (rval == NULL) {
+        return NULL;
+    }
+
+    pos = PyInt_FromSsize_t(idx);
+    /* only try to allocate the tuple once the index object exists */
+    pair = (pos != NULL) ? PyTuple_New(2) : NULL;
+    if (pair == NULL) {
+        Py_XDECREF(pos);
+        Py_DECREF(rval);
+        return NULL;
+    }
+
+    PyTuple_SET_ITEM(pair, 0, rval);
+    PyTuple_SET_ITEM(pair, 1, pos);
+    return pair;
+}
+
+static PyObject *
+scanstring_str(PyObject *pystr, Py_ssize_t end, char *encoding, int strict, Py_ssize_t *next_end_ptr)
+{
+    /* Read the JSON string from PyString pystr.
+    end is the index of the first character after the quote.
+    encoding is the encoding of pystr (must be an ASCII superset)
+    if strict is zero then literal control characters are allowed
+    *next_end_ptr is a return-by-reference index of the character
+        after the end quote
+
+    Return value is a new PyString (if ASCII-only) or PyUnicode.
+    On failure an exception is set, *next_end_ptr is set to -1 and
+    NULL is returned.
+    */
+    PyObject *rval;
+    Py_ssize_t len = PyString_GET_SIZE(pystr);
+    Py_ssize_t begin = end - 1;
+    Py_ssize_t next = begin;
+    /* Sticky flag: once a byte or escape above 0x7f has been seen, every
+    later chunk is produced as unicode */
+    int has_unicode = 0;
+    char *buf = PyString_AS_STRING(pystr);
+    /* Decoded pieces are collected here and joined at the end */
+    PyObject *chunks = PyList_New(0);
+    if (chunks == NULL) {
+        goto bail;
+    }
+    if (end < 0 || len <= end) {
+        PyErr_SetString(PyExc_ValueError, "end is out of bounds");
+        goto bail;
+    }
+    while (1) {
+        /* Find the end of the string or the next escape */
+        Py_UNICODE c = 0;
+        PyObject *chunk = NULL;
+        for (next = end; next < len; next++) {
+            c = (unsigned char)buf[next];
+            if (c == '"' || c == '\\') {
+                break;
+            }
+            else if (strict && c <= 0x1f) {
+                raise_errmsg("Invalid control character at", pystr, next);
+                goto bail;
+            }
+            else if (c > 0x7f) {
+                has_unicode = 1;
+            }
+        }
+        /* Ran off the end of the buffer without a terminator */
+        if (!(c == '"' || c == '\\')) {
+            raise_errmsg("Unterminated string starting at", pystr, begin);
+            goto bail;
+        }
+        /* Pick up this chunk if it's not zero length */
+        if (next != end) {
+            PyObject *strchunk = PyString_FromStringAndSize(&buf[end], next - end);
+            if (strchunk == NULL) {
+                goto bail;
+            }
+            if (has_unicode) {
+                /* Decode the raw bytes with the caller-supplied encoding */
+                chunk = PyUnicode_FromEncodedObject(strchunk, encoding, NULL);
+                Py_DECREF(strchunk);
+                if (chunk == NULL) {
+                    goto bail;
+                }
+            }
+            else {
+                chunk = strchunk;
+            }
+            if (PyList_Append(chunks, chunk)) {
+                Py_DECREF(chunk);
+                goto bail;
+            }
+            /* The list holds its own reference now */
+            Py_DECREF(chunk);
+        }
+        /* Step over the quote or backslash that stopped the scan */
+        next++;
+        if (c == '"') {
+            end = next;
+            break;
+        }
+        if (next == len) {
+            raise_errmsg("Unterminated string starting at", pystr, begin);
+            goto bail;
+        }
+        c = buf[next];
+        if (c != 'u') {
+            /* Non-unicode backslash escapes */
+            end = next + 1;
+            switch (c) {
+                case '"': break;
+                case '\\': break;
+                case '/': break;
+                case 'b': c = '\b'; break;
+                case 'f': c = '\f'; break;
+                case 'n': c = '\n'; break;
+                case 'r': c = '\r'; break;
+                case 't': c = '\t'; break;
+                default: c = 0;
+            }
+            /* 0 marks an unrecognised escape character */
+            if (c == 0) {
+                raise_errmsg("Invalid \\escape", pystr, end - 2);
+                goto bail;
+            }
+        }
+        else {
+            c = 0;
+            next++;
+            end = next + 4;
+            /* The four hex digits plus at least one more character (the
+            closing quote at the earliest) must still fit in the buffer */
+            if (end >= len) {
+                raise_errmsg("Invalid \\uXXXX escape", pystr, next - 1);
+                goto bail;
+            }
+            /* Decode 4 hex digits */
+            for (; next < end; next++) {
+                Py_UNICODE digit = buf[next];
+                c <<= 4;
+                switch (digit) {
+                    case '0': case '1': case '2': case '3': case '4':
+                    case '5': case '6': case '7': case '8': case '9':
+                        c |= (digit - '0'); break;
+                    case 'a': case 'b': case 'c': case 'd': case 'e':
+                    case 'f':
+                        c |= (digit - 'a' + 10); break;
+                    case 'A': case 'B': case 'C': case 'D': case 'E':
+                    case 'F':
+                        c |= (digit - 'A' + 10); break;
+                    default:
+                        raise_errmsg("Invalid \\uXXXX escape", pystr, end - 5);
+                        goto bail;
+                }
+            }
+#ifdef Py_UNICODE_WIDE
+            /* Surrogate pair: a high surrogate must be followed directly by
+            a \uXXXX low surrogate; the two are merged into one code point */
+            if ((c & 0xfc00) == 0xd800) {
+                Py_UNICODE c2 = 0;
+                if (end + 6 >= len) {
+                    raise_errmsg("Unpaired high surrogate", pystr, end - 5);
+                    goto bail;
+                }
+                if (buf[next++] != '\\' || buf[next++] != 'u') {
+                    raise_errmsg("Unpaired high surrogate", pystr, end - 5);
+                    goto bail;
+                }
+                end += 6;
+                /* Decode 4 hex digits */
+                for (; next < end; next++) {
+                    /* Declaration first: C89 forbids declarations after
+                    statements, and this matches the first hex loop */
+                    Py_UNICODE digit = buf[next];
+                    c2 <<= 4;
+                    switch (digit) {
+                        case '0': case '1': case '2': case '3': case '4':
+                        case '5': case '6': case '7': case '8': case '9':
+                            c2 |= (digit - '0'); break;
+                        case 'a': case 'b': case 'c': case 'd': case 'e':
+                        case 'f':
+                            c2 |= (digit - 'a' + 10); break;
+                        case 'A': case 'B': case 'C': case 'D': case 'E':
+                        case 'F':
+                            c2 |= (digit - 'A' + 10); break;
+                        default:
+                            raise_errmsg("Invalid \\uXXXX escape", pystr, end - 5);
+                            goto bail;
+                    }
+                }
+                if ((c2 & 0xfc00) != 0xdc00) {
+                    raise_errmsg("Unpaired high surrogate", pystr, end - 5);
+                    goto bail;
+                }
+                c = 0x10000 + (((c - 0xd800) << 10) | (c2 - 0xdc00));
+            }
+            else if ((c & 0xfc00) == 0xdc00) {
+                raise_errmsg("Unpaired low surrogate", pystr, end - 5);
+                goto bail;
+            }
+#endif
+        }
+        if (c > 0x7f) {
+            has_unicode = 1;
+        }
+        /* Append the single decoded character in the current mode */
+        if (has_unicode) {
+            chunk = PyUnicode_FromUnicode(&c, 1);
+            if (chunk == NULL) {
+                goto bail;
+            }
+        }
+        else {
+            char c_char = Py_CHARMASK(c);
+            chunk = PyString_FromStringAndSize(&c_char, 1);
+            if (chunk == NULL) {
+                goto bail;
+            }
+        }
+        if (PyList_Append(chunks, chunk)) {
+            Py_DECREF(chunk);
+            goto bail;
+        }
+        Py_DECREF(chunk);
+    }
+
+    /* ''.join(chunks) */
+    rval = join_list_string(chunks);
+    if (rval == NULL) {
+        goto bail;
+    }
+    Py_CLEAR(chunks);
+    *next_end_ptr = end;
+    return rval;
+bail:
+    *next_end_ptr = -1;
+    Py_XDECREF(chunks);
+    return NULL;
+}
+
+
+static PyObject *
+scanstring_unicode(PyObject *pystr, Py_ssize_t end, int strict, Py_ssize_t *next_end_ptr)
+{
+    /* Read the JSON string from PyUnicode pystr.
+    end is the index of the first character after the quote.
+    if strict is zero then literal control characters are allowed
+    *next_end_ptr is a return-by-reference index of the character
+        after the end quote
+
+    Return value is a new PyUnicode.
+    On failure an exception is set, *next_end_ptr is set to -1 and
+    NULL is returned.
+    */
+    PyObject *rval;
+    Py_ssize_t len = PyUnicode_GET_SIZE(pystr);
+    Py_ssize_t begin = end - 1;
+    Py_ssize_t next = begin;
+    const Py_UNICODE *buf = PyUnicode_AS_UNICODE(pystr);
+    /* Decoded pieces are collected here and joined at the end */
+    PyObject *chunks = PyList_New(0);
+    if (chunks == NULL) {
+        goto bail;
+    }
+    if (end < 0 || len <= end) {
+        PyErr_SetString(PyExc_ValueError, "end is out of bounds");
+        goto bail;
+    }
+    while (1) {
+        /* Find the end of the string or the next escape */
+        Py_UNICODE c = 0;
+        PyObject *chunk = NULL;
+        for (next = end; next < len; next++) {
+            c = buf[next];
+            if (c == '"' || c == '\\') {
+                break;
+            }
+            else if (strict && c <= 0x1f) {
+                raise_errmsg("Invalid control character at", pystr, next);
+                goto bail;
+            }
+        }
+        /* Ran off the end of the buffer without a terminator */
+        if (!(c == '"' || c == '\\')) {
+            raise_errmsg("Unterminated string starting at", pystr, begin);
+            goto bail;
+        }
+        /* Pick up this chunk if it's not zero length */
+        if (next != end) {
+            chunk = PyUnicode_FromUnicode(&buf[end], next - end);
+            if (chunk == NULL) {
+                goto bail;
+            }
+            if (PyList_Append(chunks, chunk)) {
+                Py_DECREF(chunk);
+                goto bail;
+            }
+            /* The list holds its own reference now */
+            Py_DECREF(chunk);
+        }
+        /* Step over the quote or backslash that stopped the scan */
+        next++;
+        if (c == '"') {
+            end = next;
+            break;
+        }
+        if (next == len) {
+            raise_errmsg("Unterminated string starting at", pystr, begin);
+            goto bail;
+        }
+        c = buf[next];
+        if (c != 'u') {
+            /* Non-unicode backslash escapes */
+            end = next + 1;
+            switch (c) {
+                case '"': break;
+                case '\\': break;
+                case '/': break;
+                case 'b': c = '\b'; break;
+                case 'f': c = '\f'; break;
+                case 'n': c = '\n'; break;
+                case 'r': c = '\r'; break;
+                case 't': c = '\t'; break;
+                default: c = 0;
+            }
+            /* 0 marks an unrecognised escape character */
+            if (c == 0) {
+                raise_errmsg("Invalid \\escape", pystr, end - 2);
+                goto bail;
+            }
+        }
+        else {
+            c = 0;
+            next++;
+            end = next + 4;
+            /* The four hex digits plus at least one more character (the
+            closing quote at the earliest) must still fit in the buffer */
+            if (end >= len) {
+                raise_errmsg("Invalid \\uXXXX escape", pystr, next - 1);
+                goto bail;
+            }
+            /* Decode 4 hex digits */
+            for (; next < end; next++) {
+                Py_UNICODE digit = buf[next];
+                c <<= 4;
+                switch (digit) {
+                    case '0': case '1': case '2': case '3': case '4':
+                    case '5': case '6': case '7': case '8': case '9':
+                        c |= (digit - '0'); break;
+                    case 'a': case 'b': case 'c': case 'd': case 'e':
+                    case 'f':
+                        c |= (digit - 'a' + 10); break;
+                    case 'A': case 'B': case 'C': case 'D': case 'E':
+                    case 'F':
+                        c |= (digit - 'A' + 10); break;
+                    default:
+                        raise_errmsg("Invalid \\uXXXX escape", pystr, end - 5);
+                        goto bail;
+                }
+            }
+#ifdef Py_UNICODE_WIDE
+            /* Surrogate pair: a high surrogate must be followed directly by
+            a \uXXXX low surrogate; the two are merged into one code point */
+            if ((c & 0xfc00) == 0xd800) {
+                Py_UNICODE c2 = 0;
+                if (end + 6 >= len) {
+                    raise_errmsg("Unpaired high surrogate", pystr, end - 5);
+                    goto bail;
+                }
+                if (buf[next++] != '\\' || buf[next++] != 'u') {
+                    raise_errmsg("Unpaired high surrogate", pystr, end - 5);
+                    goto bail;
+                }
+                end += 6;
+                /* Decode 4 hex digits */
+                for (; next < end; next++) {
+                    /* Declaration first: C89 forbids declarations after
+                    statements, and this matches the first hex loop */
+                    Py_UNICODE digit = buf[next];
+                    c2 <<= 4;
+                    switch (digit) {
+                        case '0': case '1': case '2': case '3': case '4':
+                        case '5': case '6': case '7': case '8': case '9':
+                            c2 |= (digit - '0'); break;
+                        case 'a': case 'b': case 'c': case 'd': case 'e':
+                        case 'f':
+                            c2 |= (digit - 'a' + 10); break;
+                        case 'A': case 'B': case 'C': case 'D': case 'E':
+                        case 'F':
+                            c2 |= (digit - 'A' + 10); break;
+                        default:
+                            raise_errmsg("Invalid \\uXXXX escape", pystr, end - 5);
+                            goto bail;
+                    }
+                }
+                if ((c2 & 0xfc00) != 0xdc00) {
+                    raise_errmsg("Unpaired high surrogate", pystr, end - 5);
+                    goto bail;
+                }
+                c = 0x10000 + (((c - 0xd800) << 10) | (c2 - 0xdc00));
+            }
+            else if ((c & 0xfc00) == 0xdc00) {
+                raise_errmsg("Unpaired low surrogate", pystr, end - 5);
+                goto bail;
+            }
+#endif
+        }
+        /* Append the single decoded character */
+        chunk = PyUnicode_FromUnicode(&c, 1);
+        if (chunk == NULL) {
+            goto bail;
+        }
+        if (PyList_Append(chunks, chunk)) {
+            Py_DECREF(chunk);
+            goto bail;
+        }
+        Py_DECREF(chunk);
+    }
+
+    /* u''.join(chunks) */
+    rval = join_list_unicode(chunks);
+    if (rval == NULL) {
+        goto bail;
+    }
+    Py_DECREF(chunks);
+    *next_end_ptr = end;
+    return rval;
+bail:
+    *next_end_ptr = -1;
+    Py_XDECREF(chunks);
+    return NULL;
+}
+
+PyDoc_STRVAR(pydoc_scanstring,
+    "scanstring(basestring, end, encoding, strict=True) -> (str, end)\n"
+    "\n"
+    "Scan the string s for a JSON string. End is the index of the\n"
+    "character in s after the quote that started the JSON string.\n"
+    "Unescapes all valid JSON string escape sequences and raises ValueError\n"
+    "on attempt to decode an invalid string. If strict is False then literal\n"
+    "control characters are allowed in the string.\n"
+    "\n"
+    "Returns a tuple of the decoded string and the index of the character in s\n"
+    "after the end quote."
+);
+
+static PyObject *
+py_scanstring(PyObject* self UNUSED, PyObject *args)
+{
+    /* Python-callable wrapper: parse (pystr, end[, encoding[, strict]]),
+    dispatch on the type of pystr to scanstring_str or scanstring_unicode,
+    and return the (decoded, next_end) tuple. A missing or None encoding
+    falls back to DEFAULT_ENCODING. Raises TypeError when pystr is
+    neither a str nor a unicode object. */
+    PyObject *pystr;
+    PyObject *decoded;
+    Py_ssize_t end;
+    Py_ssize_t after = -1;
+    char *encoding = NULL;
+    int strict = 1;
+
+    if (!PyArg_ParseTuple(args, "OO&|zi:scanstring", &pystr, _convertPyInt_AsSsize_t, &end, &encoding, &strict)) {
+        return NULL;
+    }
+
+    if (PyString_Check(pystr)) {
+        /* the encoding is only consulted for byte strings */
+        decoded = scanstring_str(pystr, end,
+                                 (encoding != NULL) ? encoding : DEFAULT_ENCODING,
+                                 strict, &after);
+    }
+    else if (PyUnicode_Check(pystr)) {
+        decoded = scanstring_unicode(pystr, end, strict, &after);
+    }
+    else {
+        PyErr_Format(PyExc_TypeError,
+                     "first argument must be a string, not %.80s",
+                     Py_TYPE(pystr)->tp_name);
+        return NULL;
+    }
+
+    /* passes a NULL result through unchanged */
+    return _build_rval_index_tuple(decoded, after);
+}
+
+PyDoc_STRVAR(pydoc_encode_basestring_ascii,
+    "encode_basestring_ascii(basestring) -> str\n"
+    "\n"
+    "Return an ASCII-only JSON representation of a Python string"
+);
+
+static PyObject *
+py_encode_basestring_ascii(PyObject* self UNUSED, PyObject *pystr)
+{
+    /* METH_O entry point: return the ASCII-only JSON representation of
+    pystr, which must be a str or unicode object; anything else raises
+    TypeError. */
+    if (PyString_Check(pystr)) {
+        return ascii_escape_str(pystr);
+    }
+    if (PyUnicode_Check(pystr)) {
+        return ascii_escape_unicode(pystr);
+    }
+
+    PyErr_Format(PyExc_TypeError,
+                 "first argument must be a string, not %.80s",
+                 Py_TYPE(pystr)->tp_name);
+    return NULL;
+}
+
+static void
+scanner_dealloc(PyObject *self)
+{
+    /* Deallocate scanner object.
+
+    The object is removed from the cyclic garbage collector's tracking
+    before its references are dropped, as the C API requires of the
+    deallocator of a GC-enabled type: dropping references can run
+    arbitrary code, and the collector must not traverse a scanner that
+    is partly torn down.
+
+    NOTE(review): assumes the scanner type is declared with
+    Py_TPFLAGS_HAVE_GC (it supplies scanner_traverse/scanner_clear) --
+    confirm at the type definition. */
+    PyObject_GC_UnTrack(self);
+    scanner_clear(self);
+    Py_TYPE(self)->tp_free(self);
+}
+
+static int
+scanner_traverse(PyObject *self, visitproc visit, void *arg)
+{
+    /* Visit every object reference held by the scanner.
+    Py_VISIT returns early from this function if the visitor reports a
+    non-zero result; otherwise 0 is returned. */
+    PyScannerObject *scanner = (PyScannerObject *)self;
+
+    assert(PyScanner_Check(self));
+    Py_VISIT(scanner->encoding);
+    Py_VISIT(scanner->strict);
+    Py_VISIT(scanner->object_hook);
+    Py_VISIT(scanner->parse_float);
+    Py_VISIT(scanner->parse_int);
+    Py_VISIT(scanner->parse_constant);
+    return 0;
+}
+
+static int
+scanner_clear(PyObject *self)
+{
+    /* Drop every object reference held by the scanner, leaving each
+    field NULL. Always returns 0. */
+    PyScannerObject *scanner = (PyScannerObject *)self;
+
+    assert(PyScanner_Check(self));
+    Py_CLEAR(scanner->encoding);
+    Py_CLEAR(scanner->strict);
+    Py_CLEAR(scanner->object_hook);
+    Py_CLEAR(scanner->parse_float);
+    Py_CLEAR(scanner->parse_int);
+    Py_CLEAR(scanner->parse_constant);
+    return 0;
+}
+
+static PyObject *
+_parse_object_str(PyScannerObject *s, PyObject *pystr, Py_ssize_t idx, Py_ssize_t *next_idx_ptr) {
+    /* Parse a JSON object out of the PyString pystr.
+    idx points at the first character following the opening curly brace.
+    On success *next_idx_ptr receives the index of the first character
+        following the closing curly brace.
+
+    Returns a new reference: the dict of members, or whatever
+    s->object_hook returns for that dict when the hook is not None.
+    Returns NULL with an exception set on failure.
+    */
+    char *text = PyString_AS_STRING(pystr);
+    Py_ssize_t last = PyString_GET_SIZE(pystr) - 1;
+    PyObject *members = PyDict_New();
+    PyObject *name = NULL;
+    PyObject *value = NULL;
+    char *encoding = PyString_AS_STRING(s->encoding);
+    int strict = PyObject_IsTrue(s->strict);
+    Py_ssize_t after;
+    if (members == NULL)
+        return NULL;
+
+    /* leading whitespace inside the braces */
+    while (idx <= last && IS_WHITESPACE(text[idx])) {
+        idx++;
+    }
+
+    /* an immediately closed object has no members to read */
+    if (idx <= last && text[idx] != '}') {
+        while (idx <= last) {
+            /* member name: must be a quoted string */
+            if (text[idx] != '"') {
+                raise_errmsg("Expecting property name", pystr, idx);
+                goto bail;
+            }
+            name = scanstring_str(pystr, idx + 1, encoding, strict, &after);
+            if (name == NULL)
+                goto bail;
+            idx = after;
+
+            /* whitespace, the ':' separator, whitespace */
+            while (idx <= last && IS_WHITESPACE(text[idx])) {
+                idx++;
+            }
+            if (!(idx <= last && text[idx] == ':')) {
+                raise_errmsg("Expecting : delimiter", pystr, idx);
+                goto bail;
+            }
+            idx++;
+            while (idx <= last && IS_WHITESPACE(text[idx])) {
+                idx++;
+            }
+
+            /* member value: any JSON term */
+            value = scan_once_str(s, pystr, idx, &after);
+            if (value == NULL)
+                goto bail;
+
+            if (PyDict_SetItem(members, name, value) == -1)
+                goto bail;
+
+            /* the dict owns its own references now */
+            Py_CLEAR(name);
+            Py_CLEAR(value);
+            idx = after;
+
+            /* whitespace ahead of '}' or ',' */
+            while (idx <= last && IS_WHITESPACE(text[idx])) {
+                idx++;
+            }
+
+            /* stop at end of input or at the closing brace */
+            if (idx > last || text[idx] == '}')
+                break;
+            if (text[idx] != ',') {
+                raise_errmsg("Expecting , delimiter", pystr, idx);
+                goto bail;
+            }
+            idx++;
+
+            /* whitespace following the ',' */
+            while (idx <= last && IS_WHITESPACE(text[idx])) {
+                idx++;
+            }
+        }
+    }
+    /* we must now be sitting on the closing '}' */
+    if (!(idx <= last && text[idx] == '}')) {
+        raise_errmsg("Expecting object", pystr, last);
+        goto bail;
+    }
+    /* if object_hook is not None: result = object_hook(members) */
+    if (s->object_hook != Py_None) {
+        PyObject *hooked = PyObject_CallFunctionObjArgs(s->object_hook, members, NULL);
+        if (hooked == NULL)
+            goto bail;
+        Py_DECREF(members);
+        members = hooked;
+    }
+    *next_idx_ptr = idx + 1;
+    return members;
+bail:
+    Py_XDECREF(name);
+    Py_XDECREF(value);
+    Py_DECREF(members);
+    return NULL;
+}
+
+static PyObject *
+_parse_object_unicode(PyScannerObject *s, PyObject *pystr, Py_ssize_t idx, Py_ssize_t *next_idx_ptr) {
+    /* Parse a JSON object out of the PyUnicode pystr.
+    idx points at the first character following the opening curly brace.
+    On success *next_idx_ptr receives the index of the first character
+        following the closing curly brace.
+
+    Returns a new reference: the dict of members, or whatever
+    s->object_hook returns for that dict when the hook is not None.
+    Returns NULL with an exception set on failure.
+    */
+    Py_UNICODE *text = PyUnicode_AS_UNICODE(pystr);
+    Py_ssize_t last = PyUnicode_GET_SIZE(pystr) - 1;
+    PyObject *value = NULL;
+    PyObject *members = PyDict_New();
+    PyObject *name = NULL;
+    int strict = PyObject_IsTrue(s->strict);
+    Py_ssize_t after;
+    if (members == NULL)
+        return NULL;
+
+    /* leading whitespace inside the braces */
+    while (idx <= last && IS_WHITESPACE(text[idx])) {
+        idx++;
+    }
+
+    /* an immediately closed object has no members to read */
+    if (idx <= last && text[idx] != '}') {
+        while (idx <= last) {
+            /* member name: must be a quoted string */
+            if (text[idx] != '"') {
+                raise_errmsg("Expecting property name", pystr, idx);
+                goto bail;
+            }
+            name = scanstring_unicode(pystr, idx + 1, strict, &after);
+            if (name == NULL)
+                goto bail;
+            idx = after;
+
+            /* whitespace, the ':' separator, whitespace */
+            while (idx <= last && IS_WHITESPACE(text[idx])) {
+                idx++;
+            }
+            if (!(idx <= last && text[idx] == ':')) {
+                raise_errmsg("Expecting : delimiter", pystr, idx);
+                goto bail;
+            }
+            idx++;
+            while (idx <= last && IS_WHITESPACE(text[idx])) {
+                idx++;
+            }
+
+            /* member value: any JSON term */
+            value = scan_once_unicode(s, pystr, idx, &after);
+            if (value == NULL)
+                goto bail;
+
+            if (PyDict_SetItem(members, name, value) == -1)
+                goto bail;
+
+            /* the dict owns its own references now */
+            Py_CLEAR(name);
+            Py_CLEAR(value);
+            idx = after;
+
+            /* whitespace ahead of '}' or ',' */
+            while (idx <= last && IS_WHITESPACE(text[idx])) {
+                idx++;
+            }
+
+            /* stop at end of input or at the closing brace */
+            if (idx > last || text[idx] == '}')
+                break;
+            if (text[idx] != ',') {
+                raise_errmsg("Expecting , delimiter", pystr, idx);
+                goto bail;
+            }
+            idx++;
+
+            /* whitespace following the ',' */
+            while (idx <= last && IS_WHITESPACE(text[idx])) {
+                idx++;
+            }
+        }
+    }
+
+    /* we must now be sitting on the closing '}' */
+    if (!(idx <= last && text[idx] == '}')) {
+        raise_errmsg("Expecting object", pystr, last);
+        goto bail;
+    }
+
+    /* if object_hook is not None: result = object_hook(members) */
+    if (s->object_hook != Py_None) {
+        PyObject *hooked = PyObject_CallFunctionObjArgs(s->object_hook, members, NULL);
+        if (hooked == NULL)
+            goto bail;
+        Py_DECREF(members);
+        members = hooked;
+    }
+    *next_idx_ptr = idx + 1;
+    return members;
+bail:
+    Py_XDECREF(name);
+    Py_XDECREF(value);
+    Py_DECREF(members);
+    return NULL;
+}
+
+static PyObject *
+_parse_array_str(PyScannerObject *s, PyObject *pystr, Py_ssize_t idx, Py_ssize_t *next_idx_ptr) {
+    /* Parse a JSON array out of the PyString pystr.
+    idx points at the first character following the opening bracket.
+    On success *next_idx_ptr receives the index of the first character
+        following the closing bracket.
+
+    Returns a new PyList, or NULL with an exception set on failure.
+    */
+    char *text = PyString_AS_STRING(pystr);
+    Py_ssize_t last = PyString_GET_SIZE(pystr) - 1;
+    PyObject *item = NULL;
+    PyObject *items = PyList_New(0);
+    Py_ssize_t after;
+    if (items == NULL)
+        return NULL;
+
+    /* leading whitespace inside the brackets */
+    while (idx <= last && IS_WHITESPACE(text[idx])) {
+        idx++;
+    }
+
+    /* an immediately closed array has no elements to read */
+    if (idx <= last && text[idx] != ']') {
+        while (idx <= last) {
+
+            /* element: any JSON term */
+            item = scan_once_str(s, pystr, idx, &after);
+            if (item == NULL)
+                goto bail;
+
+            if (PyList_Append(items, item) == -1)
+                goto bail;
+
+            /* the list owns its own reference now */
+            Py_CLEAR(item);
+            idx = after;
+
+            /* whitespace ahead of ']' or ',' */
+            while (idx <= last && IS_WHITESPACE(text[idx])) {
+                idx++;
+            }
+
+            /* stop at end of input or at the closing bracket */
+            if (idx > last || text[idx] == ']')
+                break;
+            if (text[idx] != ',') {
+                raise_errmsg("Expecting , delimiter", pystr, idx);
+                goto bail;
+            }
+            idx++;
+
+            /* whitespace following the ',' */
+            while (idx <= last && IS_WHITESPACE(text[idx])) {
+                idx++;
+            }
+        }
+    }
+
+    /* we must now be sitting on the closing ']' */
+    if (!(idx <= last && text[idx] == ']')) {
+        raise_errmsg("Expecting object", pystr, last);
+        goto bail;
+    }
+    *next_idx_ptr = idx + 1;
+    return items;
+bail:
+    Py_XDECREF(item);
+    Py_DECREF(items);
+    return NULL;
+}
+
+static PyObject *
+_parse_array_unicode(PyScannerObject *s, PyObject *pystr, Py_ssize_t idx, Py_ssize_t *next_idx_ptr) {
+    /* Parse a JSON array out of the PyUnicode pystr.
+    idx points at the first character following the opening bracket.
+    On success *next_idx_ptr receives the index of the first character
+        following the closing bracket.
+
+    Returns a new PyList, or NULL with an exception set on failure.
+    */
+    Py_UNICODE *text = PyUnicode_AS_UNICODE(pystr);
+    Py_ssize_t last = PyUnicode_GET_SIZE(pystr) - 1;
+    PyObject *item = NULL;
+    PyObject *items = PyList_New(0);
+    Py_ssize_t after;
+    if (items == NULL)
+        return NULL;
+
+    /* leading whitespace inside the brackets */
+    while (idx <= last && IS_WHITESPACE(text[idx])) {
+        idx++;
+    }
+
+    /* an immediately closed array has no elements to read */
+    if (idx <= last && text[idx] != ']') {
+        while (idx <= last) {
+
+            /* element: any JSON term */
+            item = scan_once_unicode(s, pystr, idx, &after);
+            if (item == NULL)
+                goto bail;
+
+            if (PyList_Append(items, item) == -1)
+                goto bail;
+
+            /* the list owns its own reference now */
+            Py_CLEAR(item);
+            idx = after;
+
+            /* whitespace ahead of ']' or ',' */
+            while (idx <= last && IS_WHITESPACE(text[idx])) {
+                idx++;
+            }
+
+            /* stop at end of input or at the closing bracket */
+            if (idx > last || text[idx] == ']')
+                break;
+            if (text[idx] != ',') {
+                raise_errmsg("Expecting , delimiter", pystr, idx);
+                goto bail;
+            }
+            idx++;
+
+            /* whitespace following the ',' */
+            while (idx <= last && IS_WHITESPACE(text[idx])) {
+                idx++;
+            }
+        }
+    }
+
+    /* we must now be sitting on the closing ']' */
+    if (!(idx <= last && text[idx] == ']')) {
+        raise_errmsg("Expecting object", pystr, last);
+        goto bail;
+    }
+    *next_idx_ptr = idx + 1;
+    return items;
+bail:
+    Py_XDECREF(item);
+    Py_DECREF(items);
+    return NULL;
+}
+
+static PyObject *
+_parse_constant(PyScannerObject *s, char *constant, Py_ssize_t idx, Py_ssize_t *next_idx_ptr) {
+    /* Hand a JSON constant to the scanner's parse_constant callable.
+    constant is the text of the constant that was recognised
+        ("NaN", "Infinity", "-Infinity").
+    idx is the index of the first character of the constant.
+    *next_idx_ptr receives idx plus the length of the constant, i.e. the
+        index of the first character after it; it is written whether or
+        not the callable succeeds.
+
+    Returns whatever parse_constant returns (NULL if it raised), or NULL
+    if the constant could not be turned into an interned string.
+    */
+    PyObject *result;
+    PyObject *name = PyString_InternFromString(constant);
+    if (name == NULL)
+        return NULL;
+
+    /* result = parse_constant(name) */
+    result = PyObject_CallFunctionObjArgs(s->parse_constant, name, NULL);
+    *next_idx_ptr = idx + PyString_GET_SIZE(name);
+    Py_DECREF(name);
+    return result;
+}
+
+static PyObject *
+_match_number_str(PyScannerObject *s, PyObject *pystr, Py_ssize_t start, Py_ssize_t *next_idx_ptr) {
+    /* Read a JSON number from PyString pystr.
+    start is the index of the first character of the number
+    *next_idx_ptr is a return-by-reference index to the first character after
+        the number; it is left untouched when no number is found.
+    Sets StopIteration and returns NULL when no number begins at start.
+    Returns a new PyObject representation of that number:
+        PyInt, PyLong, or PyFloat.
+        May return other types if parse_int or parse_float are set
+    */
+    char *str = PyString_AS_STRING(pystr);
+    Py_ssize_t end_idx = PyString_GET_SIZE(pystr) - 1;    /* index of the last valid character */
+    Py_ssize_t idx = start;
+    int is_float = 0;
+    PyObject *rval;
+    PyObject *numstr;
+
+    /* read a sign if it's there, make sure it's not the end of the string */
+    if (str[idx] == '-') {
+        idx++;
+        if (idx > end_idx) {
+            PyErr_SetNone(PyExc_StopIteration);
+            return NULL;
+        }
+    }
+
+    /* read as many integer digits as we find as long as it doesn't start with 0 */
+    if (str[idx] >= '1' && str[idx] <= '9') {
+        idx++;
+        while (idx <= end_idx && str[idx] >= '0' && str[idx] <= '9') idx++;
+    }
+    /* if it starts with 0 we only expect one integer digit */
+    else if (str[idx] == '0') {
+        idx++;
+    }
+    /* no integer digits, error */
+    else {
+        PyErr_SetNone(PyExc_StopIteration);
+        return NULL;
+    }
+
+    /* if the next char is '.' followed by a digit then read all float digits */
+    if (idx < end_idx && str[idx] == '.' && str[idx + 1] >= '0' && str[idx + 1] <= '9') {
+        is_float = 1;
+        idx += 2;
+        while (idx <= end_idx && str[idx] >= '0' && str[idx] <= '9') idx++;
+    }
+
+    /* if the next char is 'e' or 'E' then maybe read the exponent (or backtrack) */
+    if (idx < end_idx && (str[idx] == 'e' || str[idx] == 'E')) {
+
+        /* save the index of the 'e' or 'E' just in case we need to backtrack */
+        Py_ssize_t e_start = idx;
+        idx++;
+
+        /* read an exponent sign if present */
+        if (idx < end_idx && (str[idx] == '-' || str[idx] == '+')) idx++;
+
+        /* read all digits */
+        while (idx <= end_idx && str[idx] >= '0' && str[idx] <= '9') idx++;
+
+        /* if we got a digit, then parse as float. if not, backtrack */
+        if (str[idx - 1] >= '0' && str[idx - 1] <= '9') {
+            is_float = 1;
+        }
+        else {
+            idx = e_start;    /* the 'e' is not part of this number */
+        }
+    }
+
+    /* copy the section we determined to be a number */
+    numstr = PyString_FromStringAndSize(&str[start], idx - start);
+    if (numstr == NULL)
+        return NULL;
+    if (is_float) {
+        /* parse as a float using a fast path if available, otherwise call user defined method */
+        if (s->parse_float != (PyObject *)&PyFloat_Type) {
+            rval = PyObject_CallFunctionObjArgs(s->parse_float, numstr, NULL);
+        }
+        else {
+            rval = PyFloat_FromDouble(PyOS_ascii_atof(PyString_AS_STRING(numstr)));
+        }
+    }
+    else {
+        /* parse as an int using a fast path if available, otherwise call user defined method */
+        if (s->parse_int != (PyObject *)&PyInt_Type) {
+            rval = PyObject_CallFunctionObjArgs(s->parse_int, numstr, NULL);
+        }
+        else {
+            rval = PyInt_FromString(PyString_AS_STRING(numstr), NULL, 10);
+        }
+    }
+    Py_DECREF(numstr);
+    *next_idx_ptr = idx;    /* written even if the conversion above returned NULL */
+    return rval;
+}
+
+static PyObject *
+_match_number_unicode(PyScannerObject *s, PyObject *pystr, Py_ssize_t start, Py_ssize_t *next_idx_ptr) {
+    /* Read a JSON number from PyUnicode pystr.
+    start is the index of the first character of the number
+    *next_idx_ptr is a return-by-reference index to the first character after
+        the number; it is left untouched when no number is found.
+    Sets StopIteration and returns NULL when no number begins at start.
+    Returns a new PyObject representation of that number:
+        PyInt, PyLong, or PyFloat.
+        May return other types if parse_int or parse_float are set
+    */
+    Py_UNICODE *str = PyUnicode_AS_UNICODE(pystr);
+    Py_ssize_t end_idx = PyUnicode_GET_SIZE(pystr) - 1;    /* index of the last valid character */
+    Py_ssize_t idx = start;
+    int is_float = 0;
+    PyObject *rval;
+    PyObject *numstr;
+
+    /* read a sign if it's there, make sure it's not the end of the string */
+    if (str[idx] == '-') {
+        idx++;
+        if (idx > end_idx) {
+            PyErr_SetNone(PyExc_StopIteration);
+            return NULL;
+        }
+    }
+
+    /* read as many integer digits as we find as long as it doesn't start with 0 */
+    if (str[idx] >= '1' && str[idx] <= '9') {
+        idx++;
+        while (idx <= end_idx && str[idx] >= '0' && str[idx] <= '9') idx++;
+    }
+    /* if it starts with 0 we only expect one integer digit */
+    else if (str[idx] == '0') {
+        idx++;
+    }
+    /* no integer digits, error */
+    else {
+        PyErr_SetNone(PyExc_StopIteration);
+        return NULL;
+    }
+
+    /* if the next char is '.' followed by a digit then read all float digits,
+       including one sitting at end_idx (the loop bound must be inclusive) */
+    if (idx < end_idx && str[idx] == '.' && str[idx + 1] >= '0' && str[idx + 1] <= '9') {
+        is_float = 1;
+        idx += 2;
+        while (idx <= end_idx && str[idx] >= '0' && str[idx] <= '9') idx++;
+    }
+
+    /* if the next char is 'e' or 'E' then maybe read the exponent (or backtrack) */
+    if (idx < end_idx && (str[idx] == 'e' || str[idx] == 'E')) {
+        Py_ssize_t e_start = idx;    /* remembered in case we need to backtrack */
+        idx++;
+
+        /* read an exponent sign if present */
+        if (idx < end_idx && (str[idx] == '-' || str[idx] == '+')) idx++;
+
+        /* read all digits */
+        while (idx <= end_idx && str[idx] >= '0' && str[idx] <= '9') idx++;
+
+        /* if we got a digit, then parse as float. if not, backtrack */
+        if (str[idx - 1] >= '0' && str[idx - 1] <= '9') {
+            is_float = 1;
+        }
+        else {
+            idx = e_start;
+        }
+    }
+
+    /* copy the section we determined to be a number */
+    numstr = PyUnicode_FromUnicode(&str[start], idx - start);
+    if (numstr == NULL)
+        return NULL;
+    if (is_float) {
+        /* parse as a float using a fast path if available, otherwise call user defined method */
+        if (s->parse_float != (PyObject *)&PyFloat_Type) {
+            rval = PyObject_CallFunctionObjArgs(s->parse_float, numstr, NULL);
+        }
+        else {
+            rval = PyFloat_FromString(numstr, NULL);
+        }
+    }
+    else {
+        /* no fast path for unicode -> int, just call */
+        rval = PyObject_CallFunctionObjArgs(s->parse_int, numstr, NULL);
+    }
+    Py_DECREF(numstr);
+    *next_idx_ptr = idx;    /* written even if the conversion above returned NULL */
+    return rval;
+}
+
+static PyObject *
+scan_once_str(PyScannerObject *s, PyObject *pystr, Py_ssize_t idx, Py_ssize_t *next_idx_ptr)
+{
+    /* Read one JSON term (of any kind) from PyString pystr.
+    idx is the index of the first character of the term
+    *next_idx_ptr is a return-by-reference index to the first character after
+        the term.
+    An idx outside [0, length) sets StopIteration and returns NULL.
+    Returns a new PyObject representation of the term.
+    */
+    char *str = PyString_AS_STRING(pystr);
+    Py_ssize_t length = PyString_GET_SIZE(pystr);
+    if (idx < 0 || idx >= length) {    /* a negative idx would read before the buffer */
+        PyErr_SetNone(PyExc_StopIteration);
+        return NULL;
+    }
+    switch (str[idx]) {
+        case '"':
+            /* string */
+            return scanstring_str(pystr, idx + 1,
+                PyString_AS_STRING(s->encoding),
+                PyObject_IsTrue(s->strict),
+                next_idx_ptr);
+        case '{':
+            /* object */
+            return _parse_object_str(s, pystr, idx + 1, next_idx_ptr);
+        case '[':
+            /* array */
+            return _parse_array_str(s, pystr, idx + 1, next_idx_ptr);
+        case 'n':
+            /* null */
+            if ((idx + 3 < length) && str[idx + 1] == 'u' && str[idx + 2] == 'l' && str[idx + 3] == 'l') {
+                Py_INCREF(Py_None);
+                *next_idx_ptr = idx + 4;
+                return Py_None;
+            }
+            break;
+        case 't':
+            /* true */
+            if ((idx + 3 < length) && str[idx + 1] == 'r' && str[idx + 2] == 'u' && str[idx + 3] == 'e') {
+                Py_INCREF(Py_True);
+                *next_idx_ptr = idx + 4;
+                return Py_True;
+            }
+            break;
+        case 'f':
+            /* false */
+            if ((idx + 4 < length) && str[idx + 1] == 'a' && str[idx + 2] == 'l' && str[idx + 3] == 's' && str[idx + 4] == 'e') {
+                Py_INCREF(Py_False);
+                *next_idx_ptr = idx + 5;
+                return Py_False;
+            }
+            break;
+        case 'N':
+            /* NaN */
+            if ((idx + 2 < length) && str[idx + 1] == 'a' && str[idx + 2] == 'N') {
+                return _parse_constant(s, "NaN", idx, next_idx_ptr);
+            }
+            break;
+        case 'I':
+            /* Infinity */
+            if ((idx + 7 < length) && str[idx + 1] == 'n' && str[idx + 2] == 'f' && str[idx + 3] == 'i' && str[idx + 4] == 'n' && str[idx + 5] == 'i' && str[idx + 6] == 't' && str[idx + 7] == 'y') {
+                return _parse_constant(s, "Infinity", idx, next_idx_ptr);
+            }
+            break;
+        case '-':
+            /* -Infinity; any other '-' falls through to the number matcher below */
+            if ((idx + 8 < length) && str[idx + 1] == 'I' && str[idx + 2] == 'n' && str[idx + 3] == 'f' && str[idx + 4] == 'i' && str[idx + 5] == 'n' && str[idx + 6] == 'i' && str[idx + 7] == 't' && str[idx + 8] == 'y') {
+                return _parse_constant(s, "-Infinity", idx, next_idx_ptr);
+            }
+            break;
+    }
+    /* Didn't find a string, object, array, or named constant. Look for a number. */
+    return _match_number_str(s, pystr, idx, next_idx_ptr);
+}
+
+static PyObject *
+scan_once_unicode(PyScannerObject *s, PyObject *pystr, Py_ssize_t idx, Py_ssize_t *next_idx_ptr)
+{
+    /* Read one JSON term (of any kind) from PyUnicode pystr.
+    idx is the index of the first character of the term
+    *next_idx_ptr is a return-by-reference index to the first character after
+        the term.
+    An idx outside [0, length) sets StopIteration and returns NULL.
+    Returns a new PyObject representation of the term.
+    */
+    Py_UNICODE *str = PyUnicode_AS_UNICODE(pystr);
+    Py_ssize_t length = PyUnicode_GET_SIZE(pystr);
+    if (idx < 0 || idx >= length) {    /* a negative idx would read before the buffer */
+        PyErr_SetNone(PyExc_StopIteration);
+        return NULL;
+    }
+    switch (str[idx]) {
+        case '"':
+            /* string */
+            return scanstring_unicode(pystr, idx + 1,
+                PyObject_IsTrue(s->strict),
+                next_idx_ptr);
+        case '{':
+            /* object */
+            return _parse_object_unicode(s, pystr, idx + 1, next_idx_ptr);
+        case '[':
+            /* array */
+            return _parse_array_unicode(s, pystr, idx + 1, next_idx_ptr);
+        case 'n':
+            /* null */
+            if ((idx + 3 < length) && str[idx + 1] == 'u' && str[idx + 2] == 'l' && str[idx + 3] == 'l') {
+                Py_INCREF(Py_None);
+                *next_idx_ptr = idx + 4;
+                return Py_None;
+            }
+            break;
+        case 't':
+            /* true */
+            if ((idx + 3 < length) && str[idx + 1] == 'r' && str[idx + 2] == 'u' && str[idx + 3] == 'e') {
+                Py_INCREF(Py_True);
+                *next_idx_ptr = idx + 4;
+                return Py_True;
+            }
+            break;
+        case 'f':
+            /* false */
+            if ((idx + 4 < length) && str[idx + 1] == 'a' && str[idx + 2] == 'l' && str[idx + 3] == 's' && str[idx + 4] == 'e') {
+                Py_INCREF(Py_False);
+                *next_idx_ptr = idx + 5;
+                return Py_False;
+            }
+            break;
+        case 'N':
+            /* NaN */
+            if ((idx + 2 < length) && str[idx + 1] == 'a' && str[idx + 2] == 'N') {
+                return _parse_constant(s, "NaN", idx, next_idx_ptr);
+            }
+            break;
+        case 'I':
+            /* Infinity */
+            if ((idx + 7 < length) && str[idx + 1] == 'n' && str[idx + 2] == 'f' && str[idx + 3] == 'i' && str[idx + 4] == 'n' && str[idx + 5] == 'i' && str[idx + 6] == 't' && str[idx + 7] == 'y') {
+                return _parse_constant(s, "Infinity", idx, next_idx_ptr);
+            }
+            break;
+        case '-':
+            /* -Infinity; any other '-' falls through to the number matcher below */
+            if ((idx + 8 < length) && str[idx + 1] == 'I' && str[idx + 2] == 'n' && str[idx + 3] == 'f' && str[idx + 4] == 'i' && str[idx + 5] == 'n' && str[idx + 6] == 'i' && str[idx + 7] == 't' && str[idx + 8] == 'y') {
+                return _parse_constant(s, "-Infinity", idx, next_idx_ptr);
+            }
+            break;
+    }
+    /* Didn't find a string, object, array, or named constant. Look for a number. */
+    return _match_number_unicode(s, pystr, idx, next_idx_ptr);
+}
+
+static PyObject *
+scanner_call(PyObject *self, PyObject *args, PyObject *kwds)
+{
+    /* Python callable interface to scan_once_{str,unicode}: scanner(string, idx) */
+    PyObject *pystr;
+    PyObject *rval;
+    Py_ssize_t idx;
+    Py_ssize_t next_idx = -1;    /* stays -1 unless the scan stores an end index */
+    static char *kwlist[] = {"string", "idx", NULL};
+    PyScannerObject *s;
+    assert(PyScanner_Check(self));
+    s = (PyScannerObject *)self;
+    if (!PyArg_ParseTupleAndKeywords(args, kwds, "OO&:scan_once", kwlist, &pystr, _convertPyInt_AsSsize_t, &idx))
+        return NULL;
+
+    if (PyString_Check(pystr)) {
+        rval = scan_once_str(s, pystr, idx, &next_idx);
+    }
+    else if (PyUnicode_Check(pystr)) {
+        rval = scan_once_unicode(s, pystr, idx, &next_idx);
+    }
+    else {
+        PyErr_Format(PyExc_TypeError,
+                 "first argument must be a string, not %.80s",
+                 Py_TYPE(pystr)->tp_name);
+        return NULL;
+    }
+    return _build_rval_index_tuple(rval, next_idx);    /* rval may be NULL here -- NOTE(review): confirm the helper propagates the error */
+}
+
+static PyObject *
+scanner_new(PyTypeObject *type, PyObject *args, PyObject *kwds)
+{
+    PyScannerObject *s;    /* tp_new: allocate a Scanner with every object field NULL; args/kwds are unused here */
+    s = (PyScannerObject *)type->tp_alloc(type, 0);
+    if (s != NULL) {
+        s->encoding = NULL;
+        s->strict = NULL;
+        s->object_hook = NULL;
+        s->parse_float = NULL;
+        s->parse_int = NULL;
+        s->parse_constant = NULL;
+    }
+    return (PyObject *)s;    /* NULL when tp_alloc failed */
+}
+
+static int
+scanner_init(PyObject *self, PyObject *args, PyObject *kwds)
+{
+    /* Initialize Scanner object from the attributes of a context object */
+    PyObject *ctx;
+    static char *kwlist[] = {"context", NULL};
+    PyScannerObject *s;
+
+    assert(PyScanner_Check(self));
+    s = (PyScannerObject *)self;
+
+    if (!PyArg_ParseTupleAndKeywords(args, kwds, "O:make_scanner", kwlist, &ctx))
+        return -1;
+
+    /* PyString_AS_STRING is used on encoding, so it must end up a PyString */
+    s->encoding = PyObject_GetAttrString(ctx, "encoding");
+    if (s->encoding == Py_None) {
+        Py_DECREF(Py_None);
+        s->encoding = PyString_InternFromString(DEFAULT_ENCODING);
+    }
+    else if (s->encoding != NULL && PyUnicode_Check(s->encoding)) {
+        PyObject *tmp = PyUnicode_AsEncodedString(s->encoding, NULL, NULL);
+        Py_DECREF(s->encoding);
+        s->encoding = tmp;
+    }
+    if (s->encoding == NULL || !PyString_Check(s->encoding))
+        goto bail;
+
+    /* Fetch the remaining settings; a failed attribute lookup aborts initialization */
+    s->strict = PyObject_GetAttrString(ctx, "strict");
+    if (s->strict == NULL)
+        goto bail;
+    s->object_hook = PyObject_GetAttrString(ctx, "object_hook");
+    if (s->object_hook == NULL)
+        goto bail;
+    s->parse_float = PyObject_GetAttrString(ctx, "parse_float");
+    if (s->parse_float == NULL)
+        goto bail;
+    s->parse_int = PyObject_GetAttrString(ctx, "parse_int");
+    if (s->parse_int == NULL)
+        goto bail;
+    s->parse_constant = PyObject_GetAttrString(ctx, "parse_constant");
+    if (s->parse_constant == NULL)
+        goto bail;
+
+    return 0;
+
+bail:
+    Py_CLEAR(s->encoding);    /* Py_CLEAR tolerates fields that are still NULL */
+    Py_CLEAR(s->strict);
+    Py_CLEAR(s->object_hook);
+    Py_CLEAR(s->parse_float);
+    Py_CLEAR(s->parse_int);
+    Py_CLEAR(s->parse_constant);
+    return -1;
+}
+
+PyDoc_STRVAR(scanner_doc, "JSON scanner object");
+
+static
+PyTypeObject PyScannerType = {
+    PyObject_HEAD_INIT(NULL)
+    0,                    /* ob_size */
+    "simplejson._speedups.Scanner",       /* tp_name */
+    sizeof(PyScannerObject), /* tp_basicsize */
+    0,                    /* tp_itemsize */
+    scanner_dealloc, /* tp_dealloc */
+    0,                    /* tp_print */
+    0,                    /* tp_getattr */
+    0,                    /* tp_setattr */
+    0,                    /* tp_compare */
+    0,                    /* tp_repr */
+    0,                    /* tp_as_number */
+    0,                    /* tp_as_sequence */
+    0,                    /* tp_as_mapping */
+    0,                    /* tp_hash */
+    scanner_call,         /* tp_call */
+    0,                    /* tp_str */
+    0,/* PyObject_GenericGetAttr, */                    /* tp_getattro */
+    0,/* PyObject_GenericSetAttr, */                    /* tp_setattro */
+    0,                    /* tp_as_buffer */
+    Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,   /* tp_flags */
+    scanner_doc,          /* tp_doc */
+    scanner_traverse,                    /* tp_traverse */
+    scanner_clear,                    /* tp_clear */
+    0,                    /* tp_richcompare */
+    0,                    /* tp_weaklistoffset */
+    0,                    /* tp_iter */
+    0,                    /* tp_iternext */
+    0,                    /* tp_methods */
+    scanner_members,                    /* tp_members */
+    0,                    /* tp_getset */
+    0,                    /* tp_base */
+    0,                    /* tp_dict */
+    0,                    /* tp_descr_get */
+    0,                    /* tp_descr_set */
+    0,                    /* tp_dictoffset */
+    scanner_init,                    /* tp_init */
+    0,/* PyType_GenericAlloc, */        /* tp_alloc */
+    scanner_new,          /* tp_new (init_speedups overwrites this with PyType_GenericNew) */
+    0,/* PyObject_GC_Del, */              /* tp_free */
+};
+
+static PyObject *
+encoder_new(PyTypeObject *type, PyObject *args, PyObject *kwds)
+{
+    PyEncoderObject *s;    /* tp_new: allocate an Encoder with every object field NULL; args/kwds are unused here */
+    s = (PyEncoderObject *)type->tp_alloc(type, 0);
+    if (s != NULL) {
+        s->markers = NULL;
+        s->defaultfn = NULL;
+        s->encoder = NULL;
+        s->indent = NULL;
+        s->key_separator = NULL;
+        s->item_separator = NULL;
+        s->sort_keys = NULL;
+        s->skipkeys = NULL;
+    }
+    return (PyObject *)s;    /* NULL when tp_alloc failed */
+}
+
+static int
+encoder_init(PyObject *self, PyObject *args, PyObject *kwds)
+{
+    /* Initialize Encoder object. Arguments are parsed into locals because "O" yields
+       borrowed references; s only ever stores references that it owns. */
+    static char *kwlist[] = {"markers", "default", "encoder", "indent", "key_separator", "item_separator", "sort_keys", "skipkeys", "allow_nan", NULL};
+    PyEncoderObject *s;
+    PyObject *markers, *defaultfn, *encoder, *indent, *key_separator;
+    PyObject *item_separator, *sort_keys, *skipkeys, *allow_nan;
+
+    assert(PyEncoder_Check(self));
+    s = (PyEncoderObject *)self;
+    if (!PyArg_ParseTupleAndKeywords(args, kwds, "OOOOOOOOO:make_encoder", kwlist,
+        &markers, &defaultfn, &encoder, &indent, &key_separator, &item_separator, &sort_keys, &skipkeys, &allow_nan))
+        return -1;    /* s is untouched, so encoder_clear will not release unowned objects */
+
+    Py_INCREF(markers); s->markers = markers;
+    Py_INCREF(defaultfn); s->defaultfn = defaultfn;
+    Py_INCREF(encoder); s->encoder = encoder;
+    Py_INCREF(indent); s->indent = indent;
+    Py_INCREF(key_separator); s->key_separator = key_separator;
+    Py_INCREF(item_separator); s->item_separator = item_separator;
+    Py_INCREF(sort_keys); s->sort_keys = sort_keys;
+    Py_INCREF(skipkeys); s->skipkeys = skipkeys;
+    s->fast_encode = (PyCFunction_Check(s->encoder) && PyCFunction_GetFunction(s->encoder) == (PyCFunction)py_encode_basestring_ascii);
+    s->allow_nan = PyObject_IsTrue(allow_nan);
+    return 0;
+}
+
+static PyObject *
+encoder_call(PyObject *self, PyObject *args, PyObject *kwds)
+{
+    /* Python callable interface to encoder_listencode_obj; returns a new list of output chunks */
+    static char *kwlist[] = {"obj", "_current_indent_level", NULL};
+    PyObject *obj;
+    PyObject *rval;
+    Py_ssize_t indent_level;
+    PyEncoderObject *s;
+    assert(PyEncoder_Check(self));
+    s = (PyEncoderObject *)self;
+    if (!PyArg_ParseTupleAndKeywords(args, kwds, "OO&:_iterencode", kwlist,
+        &obj, _convertPyInt_AsSsize_t, &indent_level))
+        return NULL;
+    rval = PyList_New(0);    /* accumulator the encoder appends string pieces to */
+    if (rval == NULL)
+        return NULL;
+    if (encoder_listencode_obj(s, rval, obj, indent_level)) {    /* nonzero means failure */
+        Py_DECREF(rval);
+        return NULL;
+    }
+    return rval;
+}
+
+static PyObject *
+_encoded_const(PyObject *obj)
+{
+    /* Return a new reference to the JSON text of None, True, False (cached interned strings); NULL with an error set otherwise */
+    if (obj == Py_None) {
+        static PyObject *s_null = NULL;
+        if (s_null == NULL) {
+            s_null = PyString_InternFromString("null");
+        }
+        Py_XINCREF(s_null);    /* X variant: interning may have failed and left NULL */
+        return s_null;
+    }
+    else if (obj == Py_True) {
+        static PyObject *s_true = NULL;
+        if (s_true == NULL) {
+            s_true = PyString_InternFromString("true");
+        }
+        Py_XINCREF(s_true);
+        return s_true;
+    }
+    else if (obj == Py_False) {
+        static PyObject *s_false = NULL;
+        if (s_false == NULL) {
+            s_false = PyString_InternFromString("false");
+        }
+        Py_XINCREF(s_false);
+        return s_false;
+    }
+    else {
+        PyErr_SetString(PyExc_ValueError, "not a const");
+        return NULL;
+    }
+}
+
+static PyObject *
+encoder_encode_float(PyEncoderObject *s, PyObject *obj)
+{
+    /* Return the JSON representation of a PyFloat; non-finite values raise ValueError unless s->allow_nan */
+    double i = PyFloat_AS_DOUBLE(obj);
+    if (!Py_IS_FINITE(i)) {
+        if (!s->allow_nan) {
+            PyErr_SetString(PyExc_ValueError, "Out of range float values are not JSON compliant");
+            return NULL;
+        }
+        if (i > 0) {
+            return PyString_FromString("Infinity");
+        }
+        else if (i < 0) {
+            return PyString_FromString("-Infinity");
+        }
+        else {
+            return PyString_FromString("NaN");    /* non-finite and neither > 0 nor < 0 */
+        }
+    }
+    /* Use a better float format here? */
+    return PyObject_Repr(obj);
+}
+
+static PyObject *
+encoder_encode_string(PyEncoderObject *s, PyObject *obj)
+{
+    /* Encode obj as a JSON string: call s->encoder, unless the fast_encode flag
+       says py_encode_basestring_ascii can be invoked directly */
+    if (!s->fast_encode)
+        return PyObject_CallFunctionObjArgs(s->encoder, obj, NULL);
+    return py_encode_basestring_ascii(NULL, obj);
+}
+
+static int
+_steal_list_append(PyObject *lst, PyObject *stolen)
+{
+    /* PyList_Append that always consumes the caller's reference to stolen */
+    int status = PyList_Append(lst, stolen);
+    Py_DECREF(stolen);
+    return status;
+}
+
+static int
+encoder_listencode_obj(PyEncoderObject *s, PyObject *rval, PyObject *obj, Py_ssize_t indent_level)
+{
+    /* Encode Python object obj to a JSON term, rval is a PyList; returns 0 on success, nonzero on error */
+    PyObject *newobj;
+    int rv;
+
+    if (obj == Py_None || obj == Py_True || obj == Py_False) {
+        PyObject *cstr = _encoded_const(obj);
+        if (cstr == NULL)
+            return -1;
+        return _steal_list_append(rval, cstr);
+    }
+    else if (PyString_Check(obj) || PyUnicode_Check(obj))
+    {
+        PyObject *encoded = encoder_encode_string(s, obj);
+        if (encoded == NULL)
+            return -1;
+        return _steal_list_append(rval, encoded);
+    }
+    else if (PyInt_Check(obj) || PyLong_Check(obj)) {
+        PyObject *encoded = PyObject_Str(obj);
+        if (encoded == NULL)
+            return -1;
+        return _steal_list_append(rval, encoded);
+    }
+    else if (PyFloat_Check(obj)) {
+        PyObject *encoded = encoder_encode_float(s, obj);
+        if (encoded == NULL)
+            return -1;
+        return _steal_list_append(rval, encoded);
+    }
+    else if (PyList_Check(obj) || PyTuple_Check(obj)) {
+        return encoder_listencode_list(s, rval, obj, indent_level);
+    }
+    else if (PyDict_Check(obj)) {
+        return encoder_listencode_dict(s, rval, obj, indent_level);
+    }
+    else {
+        PyObject *ident = NULL;    /* key for obj in s->markers; stays NULL when markers is None */
+        if (s->markers != Py_None) {
+            int has_key;
+            ident = PyLong_FromVoidPtr(obj);    /* the object's address serves as its identity */
+            if (ident == NULL)
+                return -1;
+            has_key = PyDict_Contains(s->markers, ident);
+            if (has_key) {    /* 1: already being encoded, -1: lookup failed */
+                if (has_key != -1)
+                    PyErr_SetString(PyExc_ValueError, "Circular reference detected");
+                Py_DECREF(ident);
+                return -1;
+            }
+            if (PyDict_SetItem(s->markers, ident, obj)) {
+                Py_DECREF(ident);
+                return -1;
+            }
+        }
+        newobj = PyObject_CallFunctionObjArgs(s->defaultfn, obj, NULL);    /* ask default() for a replacement object */
+        if (newobj == NULL) {
+            Py_XDECREF(ident);
+            return -1;
+        }
+        rv = encoder_listencode_obj(s, rval, newobj, indent_level);    /* recurse on the replacement */
+        Py_DECREF(newobj);
+        if (rv) {
+            Py_XDECREF(ident);
+            return -1;
+        }
+        if (ident != NULL) {
+            if (PyDict_DelItem(s->markers, ident)) {    /* done with obj: drop its marker */
+                Py_XDECREF(ident);
+                return -1;
+            }
+            Py_XDECREF(ident);
+        }
+        return rv;
+    }
+}
+
+static int
+encoder_listencode_dict(PyEncoderObject *s, PyObject *rval, PyObject *dct, Py_ssize_t indent_level)
+{
+    /* Encode Python dict dct to a JSON term, rval is a PyList; returns 0 on success, -1 on error */
+    static PyObject *open_dict = NULL;
+    static PyObject *close_dict = NULL;
+    static PyObject *empty_dict = NULL;
+    PyObject *kstr = NULL;    /* owned string form of the current key */
+    PyObject *ident = NULL;    /* key for dct in s->markers; stays NULL when markers is None */
+    PyObject *key, *value;
+    Py_ssize_t pos;
+    int skipkeys;
+    Py_ssize_t idx;    /* number of items emitted so far */
+
+    if (open_dict == NULL || close_dict == NULL || empty_dict == NULL) {
+        open_dict = PyString_InternFromString("{");
+        close_dict = PyString_InternFromString("}");
+        empty_dict = PyString_InternFromString("{}");
+        if (open_dict == NULL || close_dict == NULL || empty_dict == NULL)
+            return -1;
+    }
+    if (PyDict_Size(dct) == 0)
+        return PyList_Append(rval, empty_dict);
+
+    if (s->markers != Py_None) {
+        int has_key;
+        ident = PyLong_FromVoidPtr(dct);    /* the dict's address serves as its identity */
+        if (ident == NULL)
+            goto bail;
+        has_key = PyDict_Contains(s->markers, ident);
+        if (has_key) {    /* 1: already being encoded, -1: lookup failed */
+            if (has_key != -1)
+                PyErr_SetString(PyExc_ValueError, "Circular reference detected");
+            goto bail;
+        }
+        if (PyDict_SetItem(s->markers, ident, dct)) {
+            goto bail;
+        }
+    }
+
+    if (PyList_Append(rval, open_dict))
+        goto bail;
+
+    if (s->indent != Py_None) {
+        /* TODO: DOES NOT RUN -- no indentation is emitted here, only the level changes */
+        indent_level += 1;
+        /*
+            newline_indent = '\n' + (' ' * (_indent * _current_indent_level))
+            separator = _item_separator + newline_indent
+            buf += newline_indent
+        */
+    }
+
+    /* TODO: C speedup not implemented for sort_keys */
+
+    pos = 0;
+    skipkeys = PyObject_IsTrue(s->skipkeys);
+    idx = 0;
+    while (PyDict_Next(dct, &pos, &key, &value)) {
+        PyObject *encoded;
+
+        if (PyString_Check(key) || PyUnicode_Check(key)) {
+            Py_INCREF(key);    /* kstr must be an owned reference in every branch */
+            kstr = key;
+        }
+        else if (PyFloat_Check(key)) {
+            kstr = encoder_encode_float(s, key);
+            if (kstr == NULL)
+                goto bail;
+        }
+        else if (PyInt_Check(key) || PyLong_Check(key)) {
+            kstr = PyObject_Str(key);
+            if (kstr == NULL)
+                goto bail;
+        }
+        else if (key == Py_True || key == Py_False || key == Py_None) {
+            kstr = _encoded_const(key);
+            if (kstr == NULL)
+                goto bail;
+        }
+        else if (skipkeys) {
+            continue;    /* silently drop keys of unsupported types */
+        }
+        else {
+            /* TODO: include repr of key */
+            PyErr_SetString(PyExc_ValueError, "keys must be a string");
+            goto bail;
+        }
+
+        if (idx) {
+            if (PyList_Append(rval, s->item_separator))
+                goto bail;
+        }
+
+        encoded = encoder_encode_string(s, kstr);
+        Py_CLEAR(kstr);    /* release now so bail never sees a stale pointer */
+        if (encoded == NULL)
+            goto bail;
+        if (PyList_Append(rval, encoded)) {
+            Py_DECREF(encoded);
+            goto bail;
+        }
+        Py_DECREF(encoded);
+        if (PyList_Append(rval, s->key_separator))
+            goto bail;
+        if (encoder_listencode_obj(s, rval, value, indent_level))
+            goto bail;
+        idx += 1;
+    }
+    if (ident != NULL) {
+        if (PyDict_DelItem(s->markers, ident))    /* done with dct: drop its marker */
+            goto bail;
+        Py_CLEAR(ident);
+    }
+    if (s->indent != Py_None) {
+        /* TODO: DOES NOT RUN -- no indentation is emitted here, only the level changes */
+        indent_level -= 1;
+        /*
+            yield '\n' + (' ' * (_indent * _current_indent_level))
+        */
+    }
+    if (PyList_Append(rval, close_dict))
+        goto bail;
+    return 0;
+
+bail:
+    Py_XDECREF(kstr);
+    Py_XDECREF(ident);
+    return -1;
+}
+
+
+static int
+encoder_listencode_list(PyEncoderObject *s, PyObject *rval, PyObject *seq, Py_ssize_t indent_level)
+{
+    /* Encode Python list seq to a JSON term, rval is a PyList; returns 0 on success, -1 on error */
+    static PyObject *open_array = NULL;
+    static PyObject *close_array = NULL;
+    static PyObject *empty_array = NULL;
+    PyObject *ident = NULL;    /* key for seq in s->markers; stays NULL when markers is None */
+    PyObject *s_fast = NULL;    /* PySequence_Fast result for seq, released on every exit path */
+    Py_ssize_t num_items;
+    PyObject **seq_items;
+    Py_ssize_t i;
+
+    if (open_array == NULL || close_array == NULL || empty_array == NULL) {
+        open_array = PyString_InternFromString("[");
+        close_array = PyString_InternFromString("]");
+        empty_array = PyString_InternFromString("[]");
+        if (open_array == NULL || close_array == NULL || empty_array == NULL)
+            return -1;
+    }
+    ident = NULL;
+    s_fast = PySequence_Fast(seq, "_iterencode_list needs a sequence");
+    if (s_fast == NULL)
+        return -1;
+    num_items = PySequence_Fast_GET_SIZE(s_fast);
+    if (num_items == 0) {
+        Py_DECREF(s_fast);
+        return PyList_Append(rval, empty_array);
+    }
+
+    if (s->markers != Py_None) {
+        int has_key;
+        ident = PyLong_FromVoidPtr(seq);    /* the sequence's address serves as its identity */
+        if (ident == NULL)
+            goto bail;
+        has_key = PyDict_Contains(s->markers, ident);
+        if (has_key) {    /* 1: already being encoded, -1: lookup failed */
+            if (has_key != -1)
+                PyErr_SetString(PyExc_ValueError, "Circular reference detected");
+            goto bail;
+        }
+        if (PyDict_SetItem(s->markers, ident, seq)) {
+            goto bail;
+        }
+    }
+
+    seq_items = PySequence_Fast_ITEMS(s_fast);
+    if (PyList_Append(rval, open_array))
+        goto bail;
+    if (s->indent != Py_None) {
+        /* TODO: DOES NOT RUN -- no indentation is emitted here, only the level changes */
+        indent_level += 1;
+        /*
+            newline_indent = '\n' + (' ' * (_indent * _current_indent_level))
+            separator = _item_separator + newline_indent
+            buf += newline_indent
+        */
+    }
+    for (i = 0; i < num_items; i++) {
+        PyObject *obj = seq_items[i];
+        if (i) {    /* separator goes before every item except the first */
+            if (PyList_Append(rval, s->item_separator))
+                goto bail;
+        }
+        if (encoder_listencode_obj(s, rval, obj, indent_level))
+            goto bail;
+    }
+    if (ident != NULL) {
+        if (PyDict_DelItem(s->markers, ident))    /* done with seq: drop its marker */
+            goto bail;
+        Py_CLEAR(ident);
+    }
+    if (s->indent != Py_None) {
+        /* TODO: DOES NOT RUN -- no indentation is emitted here, only the level changes */
+        indent_level -= 1;
+        /*
+            yield '\n' + (' ' * (_indent * _current_indent_level))
+        */
+    }
+    if (PyList_Append(rval, close_array))
+        goto bail;
+    Py_DECREF(s_fast);
+    return 0;
+
+bail:
+    Py_XDECREF(ident);
+    Py_DECREF(s_fast);
+    return -1;
+}
+
+static void
+encoder_dealloc(PyObject *self)
+{
+    PyObject_GC_UnTrack(self);    /* Deallocate Encoder: a GC-enabled object is untracked before its fields are cleared */
+    encoder_clear(self);
+    Py_TYPE(self)->tp_free(self);
+}
+
+static int
+encoder_traverse(PyObject *self, visitproc visit, void *arg)
+{
+    PyEncoderObject *s;    /* tp_traverse: visit every PyObject field the Encoder holds */
+    assert(PyEncoder_Check(self));
+    s = (PyEncoderObject *)self;
+    Py_VISIT(s->markers);
+    Py_VISIT(s->defaultfn);
+    Py_VISIT(s->encoder);
+    Py_VISIT(s->indent);
+    Py_VISIT(s->key_separator);
+    Py_VISIT(s->item_separator);
+    Py_VISIT(s->sort_keys);
+    Py_VISIT(s->skipkeys);
+    return 0;
+}
+
+static int
+encoder_clear(PyObject *self)
+{
+    /* tp_clear: release every object reference held by the Encoder (also called from encoder_dealloc) */
+    PyEncoderObject *s;
+    assert(PyEncoder_Check(self));
+    s = (PyEncoderObject *)self;
+    Py_CLEAR(s->markers);
+    Py_CLEAR(s->defaultfn);
+    Py_CLEAR(s->encoder);
+    Py_CLEAR(s->indent);
+    Py_CLEAR(s->key_separator);
+    Py_CLEAR(s->item_separator);
+    Py_CLEAR(s->sort_keys);
+    Py_CLEAR(s->skipkeys);
+    return 0;
+}
+
+PyDoc_STRVAR(encoder_doc, "_iterencode(obj, _current_indent_level) -> iterable");
+
+static
+PyTypeObject PyEncoderType = {
+    PyObject_HEAD_INIT(NULL)
+    0,                    /* ob_size */
+    "simplejson._speedups.Encoder",       /* tp_name */
+    sizeof(PyEncoderObject), /* tp_basicsize */
+    0,                    /* tp_itemsize */
+    encoder_dealloc, /* tp_dealloc */
+    0,                    /* tp_print */
+    0,                    /* tp_getattr */
+    0,                    /* tp_setattr */
+    0,                    /* tp_compare */
+    0,                    /* tp_repr */
+    0,                    /* tp_as_number */
+    0,                    /* tp_as_sequence */
+    0,                    /* tp_as_mapping */
+    0,                    /* tp_hash */
+    encoder_call,         /* tp_call */
+    0,                    /* tp_str */
+    0,                    /* tp_getattro */
+    0,                    /* tp_setattro */
+    0,                    /* tp_as_buffer */
+    Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,   /* tp_flags */
+    encoder_doc,          /* tp_doc */
+    encoder_traverse,     /* tp_traverse */
+    encoder_clear,        /* tp_clear */
+    0,                    /* tp_richcompare */
+    0,                    /* tp_weaklistoffset */
+    0,                    /* tp_iter */
+    0,                    /* tp_iternext */
+    0,                    /* tp_methods */
+    encoder_members,      /* tp_members */
+    0,                    /* tp_getset */
+    0,                    /* tp_base */
+    0,                    /* tp_dict */
+    0,                    /* tp_descr_get */
+    0,                    /* tp_descr_set */
+    0,                    /* tp_dictoffset */
+    encoder_init,         /* tp_init */
+    0,                    /* tp_alloc */
+    encoder_new,          /* tp_new (init_speedups overwrites this with PyType_GenericNew) */
+    0,                    /* tp_free */
+};
+
+static PyMethodDef speedups_methods[] = {    /* module-level functions exported by _speedups */
+    {"encode_basestring_ascii",
+        (PyCFunction)py_encode_basestring_ascii,
+        METH_O,
+        pydoc_encode_basestring_ascii},
+    {"scanstring",
+        (PyCFunction)py_scanstring,
+        METH_VARARGS,
+        pydoc_scanstring},
+    {NULL, NULL, 0, NULL}    /* sentinel terminating the table */
+};
+
+PyDoc_STRVAR(module_doc,
+"simplejson speedups\n");
+
+void
+init_speedups(void)
+{
+    PyObject *m;    /* the _speedups module; NULL if it could not be created */
+    PyScannerType.tp_new = PyType_GenericNew;
+    PyEncoderType.tp_new = PyType_GenericNew;
+    if (PyType_Ready(&PyScannerType) < 0 || PyType_Ready(&PyEncoderType) < 0)
+        return;
+    m = Py_InitModule3("_speedups", speedups_methods, module_doc);
+    if (m == NULL)
+        return;    /* creation failed: do not hand NULL to PyModule_AddObject */
+    Py_INCREF((PyObject*)&PyScannerType);
+    PyModule_AddObject(m, "make_scanner", (PyObject*)&PyScannerType);
+    Py_INCREF((PyObject*)&PyEncoderType);
+    PyModule_AddObject(m, "make_encoder", (PyObject*)&PyEncoderType);
+}
diff --git a/simplejson/decoder.py b/simplejson/decoder.py
new file mode 100644
index 00000000..b769ea48
--- /dev/null
+++ b/simplejson/decoder.py
@@ -0,0 +1,354 @@
+"""Implementation of JSONDecoder
+"""
+import re
+import sys
+import struct
+
+from simplejson.scanner import make_scanner
+try:
+    from simplejson._speedups import scanstring as c_scanstring
+except ImportError:
+    c_scanstring = None
+
+__all__ = ['JSONDecoder']
+
+FLAGS = re.VERBOSE | re.MULTILINE | re.DOTALL
+
+def _floatconstants():  # returns (nan, inf, -inf) unpacked from raw bytes
+    _BYTES = '7FF80000000000007FF0000000000000'.decode('hex')  # 16 bytes = two 8-byte doubles, spelled big-endian
+    if sys.byteorder != 'big':
+        _BYTES = _BYTES[:8][::-1] + _BYTES[8:][::-1]  # reverse each 8-byte half separately for non-big-endian hosts
+    nan, inf = struct.unpack('dd', _BYTES)  # 'dd' reads two doubles in native byte order
+    return nan, inf, -inf
+
+NaN, PosInf, NegInf = _floatconstants()
+
+
+def linecol(doc, pos):
+    lineno = doc.count('\n', 0, pos) + 1
+    if lineno == 1:
+        colno = pos
+    else:
+        colno = pos - doc.rindex('\n', 0, pos)
+    return lineno, colno
+
+
+def errmsg(msg, doc, pos, end=None):
+    """Return msg followed by the line/column/char position of pos (and of end, if given) in doc.  Also called from _speedups."""
+    lineno, colno = linecol(doc, pos)
+    if end is None:
+        # Only a start offset was given, so report a single position
+        # rather than a range.
+        fmt = '%s: line %d column %d (char %d)'
+        return fmt % (msg, lineno, colno, pos)
+    endlineno, endcolno = linecol(doc, end)
+    # Both offsets are known: report the start and the end position,
+    # each as line/column, followed by the raw character offsets.
+    fmt = '%s: line %d column %d - line %d column %d (char %d - %d)'
+    return fmt % (msg, lineno, colno, endlineno, endcolno, pos, end)
+
+
+_CONSTANTS = {  # lookup table behind JSONDecoder's default parse_constant
+    '-Infinity': NegInf,
+    'Infinity': PosInf,
+    'NaN': NaN,
+}
+
+STRINGCHUNK = re.compile(r'(.*?)(["\\\x00-\x1f])', FLAGS)  # groups: (content, terminator); terminator is a quote, a backslash or a control char
+BACKSLASH = {  # single-character escapes: char after the backslash -> decoded char
+    '"': u'"', '\\': u'\\', '/': u'/',
+    'b': u'\b', 'f': u'\f', 'n': u'\n', 'r': u'\r', 't': u'\t',
+}
+
+DEFAULT_ENCODING = "utf-8"  # used by py_scanstring when encoding is None
+
+def py_scanstring(s, end, encoding=None, strict=True, _b=BACKSLASH, _m=STRINGCHUNK.match):
+    """Scan the string s for a JSON string. End is the index of the
+    character in s after the quote that started the JSON string.
+    Unescapes all valid JSON string escape sequences and raises ValueError
+    on attempt to decode an invalid string. If strict is False then literal
+    control characters are allowed in the string.
+    
+    Returns a tuple of the decoded string and the index of the character in s
+    after the end quote."""
+    if encoding is None:
+        encoding = DEFAULT_ENCODING
+    chunks = []
+    _append = chunks.append
+    begin = end - 1  # index of the opening quote, used in error messages
+    while 1:
+        chunk = _m(s, end)
+        if chunk is None:
+            raise ValueError(
+                errmsg("Unterminated string starting at", s, begin))
+        end = chunk.end()
+        content, terminator = chunk.groups()
+        # Content contains zero or more unescaped string characters
+        if content:
+            if not isinstance(content, unicode):
+                content = unicode(content, encoding)
+            _append(content)
+        # Terminator is the end of string, a literal control character,
+        # or a backslash denoting that an escape sequence follows
+        if terminator == '"':
+            break
+        elif terminator != '\\':
+            if strict:
+                msg = "Invalid control character %r at" % (terminator,)
+                # Literal control characters are only tolerated when strict is false
+                raise ValueError(errmsg(msg, s, end))
+            else:
+                _append(terminator)
+                continue
+        try:
+            esc = s[end]
+        except IndexError:
+            raise ValueError(
+                errmsg("Unterminated string starting at", s, begin))
+        # If not a unicode escape sequence, must be in the lookup table
+        if esc != 'u':
+            try:
+                char = _b[esc]
+            except KeyError:
+                msg = "Invalid \\escape: " + repr(esc)
+                raise ValueError(errmsg(msg, s, end))
+            end += 1
+        else:
+            # Unicode escape sequence
+            esc = s[end + 1:end + 5]
+            next_end = end + 5
+            if len(esc) != 4:
+                msg = "Invalid \\uXXXX escape"
+                raise ValueError(errmsg(msg, s, end))
+            uni = int(esc, 16)  # NOTE(review): non-hex digits raise int()'s own ValueError, without position info
+            # Check for surrogate pair on UCS-4 systems
+            if 0xd800 <= uni <= 0xdbff and sys.maxunicode > 65535:
+                msg = "Invalid \\uXXXX\\uXXXX surrogate pair"
+                if not s[end + 5:end + 7] == '\\u':
+                    raise ValueError(errmsg(msg, s, end))
+                esc2 = s[end + 7:end + 11]
+                if len(esc2) != 4:
+                    raise ValueError(errmsg(msg, s, end))
+                uni2 = int(esc2, 16)  # NOTE(review): not range-checked as a low surrogate (0xdc00-0xdfff)
+                uni = 0x10000 + (((uni - 0xd800) << 10) | (uni2 - 0xdc00))
+                next_end += 6
+            char = unichr(uni)
+            end = next_end
+        # Append the unescaped character
+        _append(char)
+    return u''.join(chunks), end
+
+
+# Prefer the C scanstring from _speedups; fall back to the pure-Python one
+scanstring = c_scanstring or py_scanstring
+
+WHITESPACE = re.compile(r'[ \t\n\r]*', FLAGS)  # matches a (possibly empty) run of space/tab/LF/CR
+WHITESPACE_STR = ' \t\n\r'  # the same four characters, for cheap ``in`` tests
+
+def JSONObject((s, end), encoding, strict, scan_once, object_hook, _w=WHITESPACE.match, _ws=WHITESPACE_STR):
+    """Parse a JSON object body starting at s[end] (presumably just past '{'); return (result, index after '}')."""
+    pairs = {}
+    # Slice rather than index: an empty remainder yields '' and reaches the specific ValueError below
+    nextchar = s[end:end + 1]
+    # Normally we expect nextchar == '"'
+    if nextchar != '"':
+        if nextchar in _ws:
+            end = _w(s, end).end()
+            nextchar = s[end:end + 1]
+        # Trivial empty object
+        if nextchar == '}':
+            return pairs, end + 1
+        elif nextchar != '"':
+            raise ValueError(errmsg("Expecting property name", s, end))
+    end += 1
+    while True:
+        key, end = scanstring(s, end, encoding, strict)
+
+        # To skip some function call overhead we optimize the fast paths where
+        # the JSON key separator is ": " or just ":".
+        if s[end:end + 1] != ':':
+            end = _w(s, end).end()
+            if s[end:end + 1] != ':':
+                raise ValueError(errmsg("Expecting : delimiter", s, end))
+
+        end += 1
+        # Skip whitespace after ':'; the regex is only used from the second whitespace char on
+        try:
+            if s[end] in _ws:
+                end += 1
+                if s[end] in _ws:
+                    end = _w(s, end + 1).end()
+        except IndexError:
+            pass
+        # Decode the value; scan_once raises StopIteration when nothing parseable starts here
+        try:
+            value, end = scan_once(s, end)
+        except StopIteration:
+            raise ValueError(errmsg("Expecting object", s, end))
+        pairs[key] = value
+        # Fetch the next non-whitespace character ('' at end of input) and step past it
+        try:
+            nextchar = s[end]
+            if nextchar in _ws:
+                end = _w(s, end + 1).end()
+                nextchar = s[end]
+        except IndexError:
+            nextchar = ''
+        end += 1
+
+        if nextchar == '}':
+            break
+        elif nextchar != ',':
+            raise ValueError(errmsg("Expecting , delimiter", s, end - 1))
+        # After ',': skip whitespace, then require the opening quote of the next key
+        try:
+            nextchar = s[end]
+            if nextchar in _ws:
+                end += 1
+                nextchar = s[end]
+                if nextchar in _ws:
+                    end = _w(s, end + 1).end()
+                    nextchar = s[end]
+        except IndexError:
+            nextchar = ''
+
+        end += 1
+        if nextchar != '"':
+            raise ValueError(errmsg("Expecting property name", s, end - 1))
+
+    if object_hook is not None:
+        pairs = object_hook(pairs)
+    return pairs, end
+
+def JSONArray((s, end), scan_once, _w=WHITESPACE.match, _ws=WHITESPACE_STR):
+    values = []
+    nextchar = s[end:end + 1]
+    if nextchar in _ws:
+        end = _w(s, end + 1).end()
+        nextchar = s[end:end + 1]
+    # Look-ahead for trivial empty array
+    if nextchar == ']':
+        return values, end + 1
+    _append = values.append
+    while True:
+        try:
+            value, end = scan_once(s, end)
+        except StopIteration:
+            raise ValueError(errmsg("Expecting object", s, end))
+        _append(value)
+        nextchar = s[end:end + 1]
+        if nextchar in _ws:
+            end = _w(s, end + 1).end()
+            nextchar = s[end:end + 1]
+        end += 1
+        if nextchar == ']':
+            break
+        elif nextchar != ',':
+            raise ValueError(errmsg("Expecting , delimiter", s, end))
+
+        try:
+            if s[end] in _ws:
+                end += 1
+                if s[end] in _ws:
+                    end = _w(s, end + 1).end()
+        except IndexError:
+            pass
+
+    return values, end
+
+class JSONDecoder(object):
+    """Simple JSON <http://json.org> decoder
+
+    Performs the following translations in decoding by default:
+
+    +---------------+-------------------+
+    | JSON          | Python            |
+    +===============+===================+
+    | object        | dict              |
+    +---------------+-------------------+
+    | array         | list              |
+    +---------------+-------------------+
+    | string        | unicode           |
+    +---------------+-------------------+
+    | number (int)  | int, long         |
+    +---------------+-------------------+
+    | number (real) | float             |
+    +---------------+-------------------+
+    | true          | True              |
+    +---------------+-------------------+
+    | false         | False             |
+    +---------------+-------------------+
+    | null          | None              |
+    +---------------+-------------------+
+
+    It also understands ``NaN``, ``Infinity``, and ``-Infinity`` as
+    their corresponding ``float`` values, which is outside the JSON spec.
+
+    """
+
+    def __init__(self, encoding=None, object_hook=None, parse_float=None,
+            parse_int=None, parse_constant=None, strict=True):
+        """``encoding`` determines the encoding used to interpret any ``str``
+        objects decoded by this instance (utf-8 by default).  It has no
+        effect when decoding ``unicode`` objects.
+
+        Note that currently only encodings that are a superset of ASCII work,
+        strings of other encodings should be passed in as ``unicode``.
+
+        ``object_hook``, if specified, will be called with the result
+        of every JSON object decoded and its return value will be used in
+        place of the given ``dict``.  This can be used to provide custom
+        deserializations (e.g. to support JSON-RPC class hinting).
+
+        ``parse_float``, if specified, will be called with the string
+        of every JSON float to be decoded. By default this is equivalent to
+        float(num_str). This can be used to use another datatype or parser
+        for JSON floats (e.g. decimal.Decimal).
+
+        ``parse_int``, if specified, will be called with the string
+        of every JSON int to be decoded. By default this is equivalent to
+        int(num_str). This can be used to use another datatype or parser
+        for JSON integers (e.g. float).
+
+        ``parse_constant``, if specified, will be called with one of the
+        following strings: -Infinity, Infinity, NaN.  This can be used to
+        raise an exception if invalid JSON numbers are encountered.
+
+        ``strict``, if false, allows literal control characters in strings.
+        """
+        self.encoding = encoding
+        self.object_hook = object_hook
+        self.parse_float = parse_float or float
+        self.parse_int = parse_int or int
+        self.parse_constant = parse_constant or _CONSTANTS.__getitem__
+        self.strict = strict
+        self.parse_object = JSONObject
+        self.parse_array = JSONArray
+        self.parse_string = scanstring
+        self.scan_once = make_scanner(self)  # built last: it is handed this fully configured instance
+
+    def decode(self, s, _w=WHITESPACE.match):
+        """Return the Python representation of ``s`` (a ``str`` or ``unicode``
+        instance containing a JSON document).  Surrounding whitespace is
+        skipped; any other trailing data raises ``ValueError``.
+        """
+        obj, end = self.raw_decode(s, idx=_w(s, 0).end())
+        end = _w(s, end).end()
+        if end != len(s):
+            raise ValueError(errmsg("Extra data", s, end, len(s)))
+        return obj
+
+    def raw_decode(self, s, idx=0):
+        """Decode a JSON document from ``s`` (a ``str`` or ``unicode`` beginning
+        with a JSON document) and return a 2-tuple of the Python
+        representation and the index in ``s`` where the document ended.
+
+        This can be used to decode a JSON document from a string that may
+        have extraneous data at the end.
+
+        """
+        try:
+            obj, end = self.scan_once(s, idx)
+        except StopIteration:
+            raise ValueError("No JSON object could be decoded")
+        return obj, end
diff --git a/simplejson/decoder.pyc b/simplejson/decoder.pyc
new file mode 100644
index 0000000000000000000000000000000000000000..2ae9b3591ee9c6400d5cd09eb0a05999ef680bdc
GIT binary patch
literal 11292
zcmcIq&2tmkcE2sjACi&37_iM}!weOf0h^grg(*VjJp*RO4@U6XFwFBak=p8(-B{|D
zyIWwr$eTbG*{8C4o2;@-Ro*I9S){Vde~_xAD%-5H%x3cYo!i}#{XArtI09eY&vVZ`
z=iKvk^}GKnmp=LJZ`T?s`IPbfbNogBXei|<wSm%5PEPF_Y6BHr&#8@ETF<MEywvk*
zx1d@hYGXthy^o};pms-9YfNp7E8~T~pbBnLy(+1otPFer6$5@w8Q(c0Y8x9&DA!Ql
zDJje99vhSD-o})2M%6nYGp*cd^;W4(Y&xShX4S@N<&4P?HUvuJ>K(wGQ9BBIomM%g
zsO}crSyW1_%%C!%?rxlw9p;pSt)|pl;4v>toH8a%Vx}{N$}}rnGRq2~eZ<NcRL-(8
zhsr!F3#go9<vc1E0DnO_7uCi&qU4@e?t*gXm3Kiom(;t0+PJ9Pan&g(!^Nbr6qU;<
zDwmXFstq(RagBRfIaky>plA;DT$P?H3UqU?swTMdF{uF3{A%N4Zo6Ljgj~FYVy)e2
zxoy{v?br)^GiaK>SbtJ|;5Gus4NKnl_*5(4wu(=oXxqDPEo#`l?}oa!L_p|>;?VQA
z;|Vl}0Epz|(Km*_`<&WE0Xgwd=G0q59RM<#;7(q>%B$d(GWr-RC=>F<|0C)z@@hf%
zT|U$|hqb<;j5x2n0)+sRz^%=kIsn|9>Km$$GN&e*c^sK2RAUq6?S~J)xHa@ad#H8m
z762-><L=A%mbdMVqb;O}bEr8^WdvXGDC<HfnHcq=xQMQ;UhD=Ts3#LZmu@4LYS-`B
zjok`?OS^XOSI<`0Wvy@f^6mM}3Wk*w(a%s@ejd4Dw7lzuUaJ+nUVab;ovmPh`GNb|
zZ3Ug>rtLSq#v6BQIr7NLS5e?EYplYhPA{GUj9Rl5*l{BOldw-TgRY2tQ^u4rZQL^E
zjRwzEz#k7Ld|F2Z^dz6;R)d&tag+0Ej+E8x%Bi3Pc7fP=<)4!pmtg+Tl6ef04SCh1
z;Bk{`M1d*+w#>$HxqZyN8$s9C)PguU?!L?y(l|jwzB@rA)N6UZ>j%lAmLHrj-6$>G
zq7k&tqnglb!6+N0+=9{IG01F6hR|ytl^7%wnM<UwpbkcOa7gW|aTQ!r1_*NiITcau
z7gQg^In^wvv+E+rdVM~X;xTnF&TDdX$(ZVor!*bIS`n#gbQvgIi|&|2+q~wOK)u`c
zS*tX5>=2d3=!+kmbMrmx%$r;+T(Zvcpu)w#cPpfUu%#VsTeE0br_&zScdU=tb0+O+
zwqv;=7)iKC@}UJxPn?0goo*NcuTM~mCQ+!|8KayZg}k3Z84>rJYq&nX7x!YKk~Mfo
zt9CUa>XoJIKU=K)`s(K9=Kif)H#he`Yrb6UQi88SbD@;_rpWZB)R(1yS?c3b-;(+%
zsW+uwlDaSTveZMV7o{FYybRsAdGm_~4??0+wTh_y9N6&&&Wlvx24V>=B_(KECBg!Q
zdH^wzt2hrS+W+qyg-rwu(s@u+{bCB?f~ZjN6r#o%<Gkrm&3|qPOic7fXgr`*Ss!J6
z6EI5ZU_$j_us;I;Y*tbrB7k>JqYVKq5le1X(r{!7;2OlVKOq_)Dg+L}Q~!zXDTobN
zK?9~>5%&c+Ptby$Jvc=<1Csqy=`m6y_pTU5AHXMww6XVxvRiL5nYM6HRxkWdRRN+$
z@8Ys}7aG<v2d2N#FVmXP8g0N?0U+#JRtpD{0QAQIR1!eT+D#c#FnSoq-gECkQXCo0
zkJ})m{}MP0H=q*c*gvl3t^n1fdN4(UtHHueAud-z4v_qZ=^!cu5P&^M0lH7qh3QYL
zLjIK@su~^)YCt7t1pfjiO)3xG)1-P;P{BU{{1m|_XaOJMG7Yrg=DY%1GdcNv76?c6
zaj<~vW_g?$Im8TUlN{oIfe{1!nH2q51-A<5;}G+3uD<M}<BXcWH;04uf%jQ;8)TAG
zqXVuVt^t^ZLqJd=50j}pz!&posC6*|xQQKFz-@~D9`|>>Vf$vh<C@xoF(b1Xgr+TS
zP|~+#uKJGYMKVpy68$8sDVg|Cx7v-^4NcF-YP-oQ0q%8!*hS5b0mlww*O6|zM=4+d
z@Z5LdL3LcLZMDqTcFS{ycQ^H@8M%91*KcqdunBE1LiJm_)pb|HFbD+{JUBa!-F7E7
z<G|Ez0Hy;o4OX9V$y{p+2921fdT6&I;_3P@0YKhv>2n2s90sky`LJ>5635^Tj)KDu
zsJ0|4q_Et$8~T`Q#$EU$38fNToaEqg1TG(@=3pnGq(B=`6J|nFbO{ayct>mZ+y}aC
z&$mh2lz${OTu~6hGC7g6H)Z--LIrq2hfii+1IJ_0yj^jR(wUo@_IFHZK=>*&dtwu^
z@$Pr{BpmXlIY<2~itqo8#rK%~G5QYA-qdTNF1WT0%*~Ds=Z^kHL^o)&>rvCgIf7eE
zFU?c`j)GQzzO$-U#LUj28gs)3s}EP6KYmtQt=@m~V6FO<I7fD;1A0MGDK(G~>mr&K
z1z+ZDhe5X!$s8~8#5ZiX(Bs(0_vrr1&>Fok5iqfkkKCSakQAZY3B~xg5I^M6;rX#e
zJ1Q&N_I?UTkO$D6P&|iMf#+AmPY_OOl(Z{=eHlh@0r?5fnKY?w>94j7G<LfFZX}r2
zl7o^vTkbaY7blVvWSpD^Zh}uLDnV$?6GtKp_6kP4!*V_!UVn|G<0#OVQOx>WD(LvU
zf`JqC&lys8dJ<D<0bW5z)Zr#Y_?pJ3QAC-Cr(Q<6V4N~$b7Sz@PaBi@vN3|*F{7Nj
zkSpOkZ%pD}-Z+=zT-K+Ji<ox?5KaTq1!F3=B;OZ|Gw4CvIEPuMj8Uu*7x&lZX1wWd
zhA*#2<gi&Rl^YZZqDjy1KK`P=2612|=mUt0x&z+;4h2*$tUf$eShOoJ`fvbXU}?JE
z!l0uKn>wn3>uA8N%WPOF2>M&B$I7GY#i#%V0z<e7vsi{rG<d4;z26DcWD6P=LqSXs
zIwr6){{RyOmaM%^Z|LuGU~uraIRk7>_SKGiK~6RC`}n{U;Yq&vQOGBg2ROmu*XPY}
z`pP(hQ}36_oP~r=cd=E5v0k1IT^z!K)E*||-rs1*FZ|PRRe&{oo-uJ%#0BXsFd|8?
z(ZTX5o>sd^;LyND(&Pl*hf&v_4EzLe1L>09y%cZF@&x-ocn^xnVG_SkQa=fzN$O`@
zd`5A_1{BC7K^(><z(<dEjm(VskTSs*RGB~I#rC$3Mf347ME(iq*gKmSc7DKF^vxJx
zo(ke2%=i8Y4lVv(zy);>MHW>s4U93jDDF;Cd)9I<#I2#}sEUCU<0mHVAfmBY-S4;!
zF^nCg5RjednZDh2WyT#bYJ(YfV6IzUo6bN)8#5RQwq5}W0$nIjD(@RdR^Aw_tWcwi
zZnv(pM(ZP5^jX+-EiSf}*hST{9tWK@x*kkISwy$OZqfQnx2)T!TMS(#e1x;)*8+G#
zl5Nr$)pmklR~v~pqPuHvBI}R1Oza)40?llcDS6TORPwuSPmBf}q^^6y%ANL??%orj
z+Fzj+?W4%6qA{AEfzB;M51+yJENUk8yc#pk7Z9H!Mm2M#T;7;L?~HK`T6zSn1$<vb
z1|pB%GFr1}PoS+WftmD|lF_pqg=Huk*DzyRXDx^mgJIF+{|PoEnp~0<N&E=;f`%SR
zG`ZFQ(85sOymp8ZWx`?2g9S&IiP9YtBakR?=s^vY!Yad~%okB5KR3X>;2XoBhJrE{
zU{GwdGDRj*w1xs20}WMR(g^k;nVc$Dt)XC1<dVpBIkDpi`nQ?a$qpv^h*k|fI)J6(
z*SMurIjoDI>g9L~P{pJwRs8_)p&_dJA0qhPKPRew?=PY1weHrc9v#MaEM7nz1GMM{
zI#pUX$kly$?A5j&Vb*&tHJt%{sTWy$%;Fms*&UZ#U7?s+RTfWJ{E~&mVsI&mkKDS*
zdd88vEWSl?!ncrl9^S&0FtmIBfkt!>g<L{hEnXvi1&eb1vP+hZ$z`IWb>Yx;Eae)2
zA|KL(AfpE;T)ade+(ijr1WX<J??Q<i>fI<GL0kyFNYFbxNx;Y<OIVQSiK4RBE8_p2
zg9o-QNnITd-rb4g&Yk6Drg)cvaQn+7s0vFGDm`^WM6PWer8WbGX$*tn5Xt$LDAtH^
zl>~(x*y^F)w7aeNjt21Q&BLFgZH|5_TlF<UjDF?QH=p+69R#04pT5le^iK|dj<z|P
z!ql2P1<^Mhxc_NOe<v^xqj~dvc-rK72BePwH~K%rOajdWYTrzvoNO1<{BS(|ZhH%9
zg9;*;MXU#-;u~fw0Gra!Plp-0c54wZ<rN?WC*L0q6R#QW07T!UEg!U5`*4^|$v>n}
z`bj<_ZT~cweix~f?9(@^NLFV}seA~YBFbwqavxCucH?b_FDXuB*6YX;*XuV>Npr_+
zF+o$WXSwBi-LxZtfs}_AA~7F^Zqx~U#=4j&jKL(W3~!ikb`UBvGZS><$a5q&qi<XU
zA8twCRtd|fc^DvzF^3@+%ZYdy70Kn+U`X@wnh4{H@tW95zAiHGL0jx%2Sx+t1Nw+v
zu$%HeQ7bZzXU~MB@lYu%qzu`E>?Bfdh}-}lO{DA$yzLN^s0m-IUPq!zB6*w&i3CZ~
zAX~+ZPdZ|DBPPTGin<$iLKo!qd!PocSG_LOBA>KUh!R!jP;13IAWfREFe{QJAJS%v
zOQs24?bwm&2N@i<*@WW?(jv>1sla+Yxw}9!*(jkdx2|UCy9RPKNF%g*X5gbpkH7;V
zxhGjMGwQ;rj&KU323OYaudSJHf^hdnhJe-@;AztgK!<P$O0*MnTR0k1K@q6}H4W^C
zup7dvUe}n4$4g=JkjsNucumiBAUk*_B%}uNbb$26i+6<V5IAW13>#p92gI<a#VXOf
zI$!9B_<C_<f+tAjX|c=z3)?(DgVbr+jV#Nz?Y#zl>vgK`dL4{-Mqa^RCrT;95r4d<
zR5!X&9JDh)j*FL0582P(B*v=ZE^RMSLO|M15XOS*P3!4>v(W;b%pFJ$F3{p3;&f~<
zK|gr@c;aZ@WSAT#j#isM14l?Gv}E4PjAtT_k%{!IhZ_tz0nQmLSzUp8uVE92=5Yi8
zVL)>&6^@OU_+AGT4IvFUi%#rP9+{Vx<gvhvOidr4<hAYA(gXc{95q0v6QTtmks&{c
z5?Fh}bO1zm8<#GjgplR9^QSN0KaL2r6p#Si(E$@PZz{RPcg#$=-!N0nf5U_^(3x<u
z>o`tJ)*iez-Tj8!kzZWk`g%!TT9~Un0c|b_hT4S+2k+u;=sH8fo@9b0IDQJ%D`Bh<
zK?38Un_zv;Vfw+k6NHnLXzl)!>iV;l>a%rOQLAmcF@pYftp+`xPEM&O0l4*okoZ#&
z4M}Sb3qJ(nGg#UyUYCUULsK>B7z5~-Kz@)R34zFMHFb>7V_2IkUb3jOVBCMg5dkw3
zwHn`jYqcu~fg`?Ct4l@XTBjwq${PPQm?2>DfQD9#?4O|mlZUJ&U%6oZU{_I*hfYMY
zZ)p<^#;kdD023>t2=<tvlTmgeG?ac=Pv#V_!TQS6CL>uu92$O$m4k;^{)z=Lfr@^E
zLcg<!Zcm(VrsJVQhknWfV+zYwu~Vx`r7~nyGWpJoDf8tv=mNJSc>%-EF1q}A(4zJ_
zD3Ow1@tl3o0Jt#FTir*LVN!MJU&gR6wBOXUy42y~XXqOQi89YZl#~R7j1L7a1WM+g
zEXOVK?-%4WQBxz=CI5ZRkRxPFX4EB2{u-6ug#n+z#v~IVTz%nRM!XH?ArpbOZhXK`
z$U?#@$y<t}C1JOCMUSyJG&EjSjuO^vhC!PQdLO5taq+l8zGOTT%YKweV!9KvZJVFp
zJoE&o#Uul8L|o{z(m&HLa_~SjN^qE<fH;s!0<@8HNDm#S=rre#KdYTS)rt4iwtE>$
zJN9cRI|`HU23<IPkSILN$@bWFNcYKmUNt!6zCcH6FG_Fj$j@SQ`XS3u9F@B!IBo5)
zV4m=Vg>D-lpJzf>%;Ujj5?O_+Bu69@S*tMz3w2Aetkv3q(`~Uyajn%r@mfu?p*qik
z)PjCmd-3%eemVAZ<^HPZ{5F2vwId>Kam&Feq;?WNBeN*P`Sd8G7e;eMW41CiA-^NE
zc8M2fgswdQSv*b5XUf5E(w3OD#jgfM|Hss~Lt`~Ku&#sG$brph3_Xd7Wx)>>;RDL!
zqmU$_5!~E_Uf-@-_nxe;ikbTcFQRLY*Q%@XVEEw4vz5n>g;Wn8uY9#`@kenMACP7E
zX%NALOSS55qbk2~(yyg|%1Pu#BWQQLmQFdZKeO=AdjIR^)km`1y_Nfq)*r8|e{GTA
znpbVszGBfrA?9?zwHhFZCDn$LdM7cYq~iYr|Dtigy{pCROHoL7(J_jbKm5y0<F)W3
s$rTrKbGhQ!Y`$1LHB}G`IFX+<3dVV3IX{}4ua<MOcq^QJH2cZ_08a|RG5`Po

literal 0
HcmV?d00001

diff --git a/simplejson/encoder.py b/simplejson/encoder.py
new file mode 100644
index 00000000..cf582903
--- /dev/null
+++ b/simplejson/encoder.py
@@ -0,0 +1,440 @@
+"""Implementation of JSONEncoder
+"""
+import re
+
+try:
+    from simplejson._speedups import encode_basestring_ascii as c_encode_basestring_ascii
+except ImportError:
+    c_encode_basestring_ascii = None
+try:
+    from simplejson._speedups import make_encoder as c_make_encoder
+except ImportError:
+    c_make_encoder = None
+
+ESCAPE = re.compile(r'[\x00-\x1f\\"\b\f\n\r\t]')  # characters encode_basestring must escape
+ESCAPE_ASCII = re.compile(r'([\\"]|[^\ -~])')  # backslash, double quote, or anything outside ' '..'~'
+HAS_UTF8 = re.compile(r'[\x80-\xff]')  # any byte with the high bit set
+ESCAPE_DCT = {  # character -> its JSON escape sequence
+    '\\': '\\\\',
+    '"': '\\"',
+    '\b': '\\b',
+    '\f': '\\f',
+    '\n': '\\n',
+    '\r': '\\r',
+    '\t': '\\t',
+}
+for i in range(0x20):
+    # Control characters without a short escape above get a 4-hex-digit unicode escape
+    ESCAPE_DCT.setdefault(chr(i), '\\u%04x' % (i,))
+
+# Assume this produces an infinity on all machines (probably not guaranteed)
+INFINITY = float('1e66666')
+FLOAT_REPR = repr  # default float formatter picked up by JSONEncoder.iterencode
+
+def encode_basestring(s):
+    """Return a JSON representation of a Python string: ``s`` wrapped in
+    double quotes, with every match of ESCAPE replaced via ESCAPE_DCT.
+    """
+    def replace(match):
+        return ESCAPE_DCT[match.group(0)]
+    return '"' + ESCAPE.sub(replace, s) + '"'
+
+
+def py_encode_basestring_ascii(s):
+    """Return an ASCII-only JSON representation of a Python string.
+    A ``str`` containing bytes >= 0x80 is first decoded as UTF-8.
+    """
+    if isinstance(s, str) and HAS_UTF8.search(s) is not None:
+        s = s.decode('utf-8')
+    def replace(match):
+        s = match.group(0)
+        try:
+            return ESCAPE_DCT[s]
+        except KeyError:
+            n = ord(s)
+            if n < 0x10000:
+                # Fits in four hex digits: emit a single unicode escape
+                return '\\u%04x' % (n,)
+            else:
+                # surrogate pair
+                n -= 0x10000
+                s1 = 0xd800 | ((n >> 10) & 0x3ff)
+                s2 = 0xdc00 | (n & 0x3ff)
+                # Emit the high surrogate (s1) followed by the low surrogate (s2)
+                return '\\u%04x\\u%04x' % (s1, s2)
+    return '"' + str(ESCAPE_ASCII.sub(replace, s)) + '"'
+
+
+encode_basestring_ascii = c_encode_basestring_ascii or py_encode_basestring_ascii
+
+class JSONEncoder(object):
+    """Extensible JSON <http://json.org> encoder for Python data structures.
+
+    Supports the following objects and types by default:
+
+    +-------------------+---------------+
+    | Python            | JSON          |
+    +===================+===============+
+    | dict              | object        |
+    +-------------------+---------------+
+    | list, tuple       | array         |
+    +-------------------+---------------+
+    | str, unicode      | string        |
+    +-------------------+---------------+
+    | int, long, float  | number        |
+    +-------------------+---------------+
+    | True              | true          |
+    +-------------------+---------------+
+    | False             | false         |
+    +-------------------+---------------+
+    | None              | null          |
+    +-------------------+---------------+
+
+    To extend this to recognize other objects, subclass and implement a
+    ``.default()`` method with another method that returns a serializable
+    object for ``o`` if possible, otherwise it should call the superclass
+    implementation (to raise ``TypeError``).
+
+    """
+    item_separator = ', '
+    key_separator = ': '
+    def __init__(self, skipkeys=False, ensure_ascii=True,
+            check_circular=True, allow_nan=True, sort_keys=False,
+            indent=None, separators=None, encoding='utf-8', default=None):
+        """Constructor for JSONEncoder, with sensible defaults.
+
+        If skipkeys is false, then it is a TypeError to attempt
+        encoding of keys that are not str, int, long, float or None.  If
+        skipkeys is True, such items are simply skipped.
+
+        If ensure_ascii is true, the output is guaranteed to be str
+        objects with all incoming unicode characters escaped.  If
+        ensure_ascii is false, the output will be unicode object.
+
+        If check_circular is true, then lists, dicts, and custom encoded
+        objects will be checked for circular references during encoding to
+        prevent an infinite recursion (which would cause an OverflowError).
+        Otherwise, no such check takes place.
+
+        If allow_nan is true, then NaN, Infinity, and -Infinity will be
+        encoded as such.  This behavior is not JSON specification compliant,
+        but is consistent with most JavaScript based encoders and decoders.
+        Otherwise, it will be a ValueError to encode such floats.
+
+        If sort_keys is true, then the output of dictionaries will be
+        sorted by key; this is useful for regression tests to ensure
+        that JSON serializations can be compared on a day-to-day basis.
+
+        If indent is a non-negative integer, then JSON array
+        elements and object members will be pretty-printed with that
+        indent level.  An indent level of 0 will only insert newlines.
+        None is the most compact representation.
+
+        If specified, separators should be a (item_separator, key_separator)
+        tuple.  The default is (', ', ': ').  To get the most compact JSON
+        representation you should specify (',', ':') to eliminate whitespace.
+
+        If specified, default is a function that gets called for objects
+        that can't otherwise be serialized.  It should return a JSON encodable
+        version of the object or raise a ``TypeError``.
+
+        If encoding is not None, then all input strings will be
+        transformed into unicode using that encoding prior to JSON-encoding.
+        The default is UTF-8.
+
+        """
+
+        self.skipkeys = skipkeys
+        self.ensure_ascii = ensure_ascii
+        self.check_circular = check_circular
+        self.allow_nan = allow_nan
+        self.sort_keys = sort_keys
+        self.indent = indent
+        if separators is not None:
+            self.item_separator, self.key_separator = separators
+        if default is not None:
+            self.default = default
+        self.encoding = encoding
+
+    def default(self, o):
+        """Implement this method in a subclass such that it returns
+        a serializable object for ``o``, or calls the base implementation
+        (to raise a ``TypeError``).
+
+        For example, to support arbitrary iterators, you could
+        implement default like this::
+
+            def default(self, o):
+                try:
+                    iterable = iter(o)
+                except TypeError:
+                    pass
+                else:
+                    return list(iterable)
+                return JSONEncoder.default(self, o)
+
+        """
+        raise TypeError(repr(o) + " is not JSON serializable")
+
+    def encode(self, o):
+        """Return a JSON string representation of a Python data structure.
+
+        >>> JSONEncoder().encode({"foo": ["bar", "baz"]})
+        '{"foo": ["bar", "baz"]}'
+
+        """
+        # This is for extremely simple cases and benchmarks.
+        if isinstance(o, basestring):
+            if isinstance(o, str):
+                _encoding = self.encoding
+                if (_encoding is not None
+                        and not (_encoding == 'utf-8')):
+                    o = o.decode(_encoding)
+            if self.ensure_ascii:
+                return encode_basestring_ascii(o)
+            else:
+                return encode_basestring(o)
+        # This doesn't pass the iterator directly to ''.join() because the
+        # exceptions aren't as detailed.  The list call should be roughly
+        # equivalent to the PySequence_Fast that ''.join() would do.
+        chunks = self.iterencode(o, _one_shot=True)
+        if not isinstance(chunks, (list, tuple)):
+            chunks = list(chunks)
+        return ''.join(chunks)
+
+    def iterencode(self, o, _one_shot=False):
+        """Encode the given object and yield each string
+        representation as available.
+
+        For example::
+
+            for chunk in JSONEncoder().iterencode(bigobject):
+                mysocket.write(chunk)
+
+        """
+        if self.check_circular:
+            markers = {}
+        else:
+            markers = None
+        if self.ensure_ascii:
+            _encoder = encode_basestring_ascii
+        else:
+            _encoder = encode_basestring
+        if self.encoding != 'utf-8':
+            def _encoder(o, _orig_encoder=_encoder, _encoding=self.encoding):
+                if isinstance(o, str):
+                    o = o.decode(_encoding)
+                return _orig_encoder(o)
+
+        def floatstr(o, allow_nan=self.allow_nan, _repr=FLOAT_REPR, _inf=INFINITY, _neginf=-INFINITY):
+            # Check for specials.  Note that this type of test is processor- and/or
+            # platform-specific, so do tests which don't depend on the internals.
+
+            if o != o:
+                text = 'NaN'
+            elif o == _inf:
+                text = 'Infinity'
+            elif o == _neginf:
+                text = '-Infinity'
+            else:
+                return _repr(o)
+
+            if not allow_nan:
+                raise ValueError(
+                    "Out of range float values are not JSON compliant: " +
+                    repr(o))
+
+            return text
+
+
+        if _one_shot and c_make_encoder is not None and not self.indent and not self.sort_keys:
+            _iterencode = c_make_encoder(
+                markers, self.default, _encoder, self.indent,
+                self.key_separator, self.item_separator, self.sort_keys,
+                self.skipkeys, self.allow_nan)
+        else:
+            _iterencode = _make_iterencode(
+                markers, self.default, _encoder, self.indent, floatstr,
+                self.key_separator, self.item_separator, self.sort_keys,
+                self.skipkeys, _one_shot)
+        return _iterencode(o, 0)
+
+def _make_iterencode(markers, _default, _encoder, _indent, _floatstr, _key_separator, _item_separator, _sort_keys, _skipkeys, _one_shot,
+        ## HACK: hand-optimized bytecode; turn globals into locals
+        False=False,
+        True=True,
+        ValueError=ValueError,
+        basestring=basestring,
+        dict=dict,
+        float=float,
+        id=id,
+        int=int,
+        isinstance=isinstance,
+        list=list,
+        long=long,
+        str=str,
+        tuple=tuple,
+    ):
+
+    def _iterencode_list(lst, _current_indent_level):
+        if not lst:
+            yield '[]'
+            return
+        if markers is not None:
+            markerid = id(lst)
+            if markerid in markers:
+                raise ValueError("Circular reference detected")
+            markers[markerid] = lst
+        buf = '['
+        if _indent is not None:
+            _current_indent_level += 1
+            newline_indent = '\n' + (' ' * (_indent * _current_indent_level))
+            separator = _item_separator + newline_indent
+            buf += newline_indent
+        else:
+            newline_indent = None
+            separator = _item_separator
+        first = True
+        for value in lst:
+            if first:
+                first = False
+            else:
+                buf = separator
+            if isinstance(value, basestring):
+                yield buf + _encoder(value)
+            elif value is None:
+                yield buf + 'null'
+            elif value is True:
+                yield buf + 'true'
+            elif value is False:
+                yield buf + 'false'
+            elif isinstance(value, (int, long)):
+                yield buf + str(value)
+            elif isinstance(value, float):
+                yield buf + _floatstr(value)
+            else:
+                yield buf
+                if isinstance(value, (list, tuple)):
+                    chunks = _iterencode_list(value, _current_indent_level)
+                elif isinstance(value, dict):
+                    chunks = _iterencode_dict(value, _current_indent_level)
+                else:
+                    chunks = _iterencode(value, _current_indent_level)
+                for chunk in chunks:
+                    yield chunk
+        if newline_indent is not None:
+            _current_indent_level -= 1
+            yield '\n' + (' ' * (_indent * _current_indent_level))
+        yield ']'
+        if markers is not None:
+            del markers[markerid]
+
+    def _iterencode_dict(dct, _current_indent_level):  # generator: yields the JSON text for dct piece by piece
+        if not dct:
+            yield '{}'
+            return
+        if markers is not None:  # markers maps id() -> container that is currently being encoded
+            markerid = id(dct)
+            if markerid in markers:
+                raise ValueError("Circular reference detected")
+            markers[markerid] = dct
+        yield '{'
+        if _indent is not None:  # indented output: each item starts on its own line
+            _current_indent_level += 1
+            newline_indent = '\n' + (' ' * (_indent * _current_indent_level))
+            item_separator = _item_separator + newline_indent
+            yield newline_indent
+        else:
+            newline_indent = None
+            item_separator = _item_separator
+        first = True
+        if _sort_keys:
+            items = dct.items()
+            items.sort(key=lambda kv: kv[0])  # sorts the raw keys, before they are converted to strings below
+        else:
+            items = dct.iteritems()
+        for key, value in items:
+            if isinstance(key, basestring):
+                pass
+            # JavaScript is weakly typed for these, so it makes sense to
+            # also allow them.  Many encoders seem to do something like this.
+            elif isinstance(key, float):
+                key = _floatstr(key)
+            elif key is True:
+                key = 'true'
+            elif key is False:
+                key = 'false'
+            elif key is None:
+                key = 'null'
+            elif isinstance(key, (int, long)):
+                key = str(key)
+            elif _skipkeys:
+                continue  # unsupported key type: drop the whole item without emitting anything
+            else:
+                raise TypeError("key " + repr(key) + " is not a string")
+            if first:
+                first = False
+            else:
+                yield item_separator
+            yield _encoder(key)
+            yield _key_separator
+            if isinstance(value, basestring):
+                yield _encoder(value)
+            elif value is None:
+                yield 'null'
+            elif value is True:
+                yield 'true'
+            elif value is False:
+                yield 'false'
+            elif isinstance(value, (int, long)):
+                yield str(value)
+            elif isinstance(value, float):
+                yield _floatstr(value)
+            else:  # containers and unknown types are delegated to the matching sub-generator
+                if isinstance(value, (list, tuple)):
+                    chunks = _iterencode_list(value, _current_indent_level)
+                elif isinstance(value, dict):
+                    chunks = _iterencode_dict(value, _current_indent_level)
+                else:
+                    chunks = _iterencode(value, _current_indent_level)
+                for chunk in chunks:
+                    yield chunk
+        if newline_indent is not None:
+            _current_indent_level -= 1
+            yield '\n' + (' ' * (_indent * _current_indent_level))  # closing brace goes back to the outer indent
+        yield '}'
+        if markers is not None:
+            del markers[markerid]  # dct is finished, so it may legitimately appear again elsewhere
+
+    def _iterencode(o, _current_indent_level):  # generator: dispatches on the type of o and yields JSON text chunks
+        if isinstance(o, basestring):
+            yield _encoder(o)
+        elif o is None:
+            yield 'null'
+        elif o is True:
+            yield 'true'
+        elif o is False:
+            yield 'false'
+        elif isinstance(o, (int, long)):
+            yield str(o)
+        elif isinstance(o, float):
+            yield _floatstr(o)
+        elif isinstance(o, (list, tuple)):
+            for chunk in _iterencode_list(o, _current_indent_level):
+                yield chunk
+        elif isinstance(o, dict):
+            for chunk in _iterencode_dict(o, _current_indent_level):
+                yield chunk
+        else:  # any other type: convert it with _default and encode whatever that returns
+            if markers is not None:
+                markerid = id(o)
+                if markerid in markers:  # _default produced something that leads back to o
+                    raise ValueError("Circular reference detected")
+                markers[markerid] = o
+            o = _default(o)
+            for chunk in _iterencode(o, _current_indent_level):
+                yield chunk
+            if markers is not None:
+                del markers[markerid]  # markerid still refers to the original o, not the converted value
+
+    return _iterencode
diff --git a/simplejson/encoder.pyc b/simplejson/encoder.pyc
new file mode 100644
index 0000000000000000000000000000000000000000..e59d372a7ab88749c287a7a2a77dfad41ebd616b
GIT binary patch
literal 13938
zcmcgz%WoV<das@tK4$ooM3ItguUoX&8m>u6UVGPCtt?yCBhuPSIZfHJC2EJw=^C=d
zVfU!JM<i`B*u+A}<Q6131Tc_W@&{}V0dmVN2yzdC9C8T|Ag2Vm<dV(r_f>b#3`xaN
zKxe3_sjlZ&Rp0mf9@YBQzmHU2|K^)Jb(MZj<M#u6<3F^N@|1dj)KXqSty$`UrM4#I
zv8dJxs##PIO3Jz)oK_{>ryf^SIHD|k&>9s%L0O-t?Mu>rKs^|IUi(4QUR%m9E3Z#|
zjp-^Xee9RVq3m%$9*5PcQYCLt6}+;#Qt~Ru3^6l|%m_21$c!;Fj?6J;jw5q|nF(Z0
zsw)ph)aF}Ck1B7HW8Qf5ntCv%^oa7ul|H8Q7)!k=W*U~7{2EJo@^9+CKCZk|Lc|HB
zC)9(J$~&!|VY4QccSbVkQc^AKj-FBvipqOQ=~EoSdzsZ=EA_>L(@LLF8Wk@q{fg4x
zQy5jhs<f^2S*53yeog7umHxi+UQy3R)Ppy83JcZm@o<>jS#LG<x(*UI@x#Cl8}`o@
z?#|x~>Y=BjivMeT=BqeFl}sVgQeInjV;v`vAFR~exbFL=!7v)EyKA~;T1D|G6g*tq
zym)bLar3Rl;^Oq;@?v8#Sd12vNAVacs}E85X#3$W7VWv;dNdOcnGToOq0x907x28e
z7<2kX^Dv$8VcI+_OU<BpXvo8`c?jg8Vjd!S7%>ltJd}MK!^Hg@xc&W$?`$Rm$iAh2
z%uk(DaOx7i*YS<dA_4zm&v%526Qz7hZQ~zKp`fO)rBe&lBAfmQiKCNt6xgn8r5)*3
zq~q=#cI{8Ll2z=s*~3c3#z$u5%p7KcLmfkcnJ@<?!}MUH(+gD+Ht!=*l1(be-CVeS
z?US3e8`tk8eRy1n!gkA?2_M(pq`q23MoALCkKBb%V;#j8*8IqCHp8bEZbV^gIo!N(
zLqFBcuyvu~1`WTyp_ebjJ~`xZ90nKCb3NbMlI_C6nr>acf#GCtmF18)Ll(Ezkd?^3
zw3kgeR~S3o?IWg$yLEs)r#TysQI*Pt{9L&y*IBcK#OyHG3I`d^C@U!_zbFTbO)sg(
zWfh)K77w8>J%k;l0!tB}QidohbWi$~KhWU`9M+UqBwKK{_!^RoEdu-6!u30M=E9)4
z^+GHXbEtOGn7brP;S;~YEPsp)i4;b~<Y3gTVbTRIJ-u*0h*b$IBf72#y5dw&!-fU5
zT_7ktRw^9BvQSYFoLYGD2Uxh&T|z5t1|Ry=`(D5L;KLo@5!Q<mc`7Mj=r;P6RHL9K
z7X-IG5LYdOGQ+SS&gvFAU;RBOCIkDw29x;eAF)$J5hIf(t@8LBuG3*I8AS4t-ntn@
zVI-^-MxN}kLzZ(mnqWkL<zl$E%+C*xmfM7Z-{Sa_NR%~Z6|G@w6yK4;Sg~Rqw?+#h
z4D(geD?;kWeh?>aP}fExl1SEa``SY7(|flrfqyWZcBA@g!iCO<ftE5)6N?k>ODgBW
zJ`VR)WJ=cjU5L~f%+T6O;rsyTzlqwIt5c;ntP@swJRy8{X^%SV_~Ds+h;O`zL_@(r
zvXFvxpq{}-qUfRfb$|8`qBbc1P>W1SJu6e|gZZAJBUF38WT4v7azH)9I77-YycWZ1
zP&YRd9mM`}QyU4pvYI5V%NH&X$Ige*%2hiBGrJK+8610V;u4eFb>O#-&l_M~Xt!Em
zwb)KpHCh8MH=y|JaQU&Wqtp#NJK1XK*k0bUJ>78I&E&G_`R3fg&;GJE1^l-&5~vB%
z&$gjFd$hNu<(uyv{Om8w#`OGpl6RNPc1m_unvQvp%(>^$+4SRN)=t{c3F#o)wi`w6
zRyJft=L?L9EuXd9flod+!)&LjF&p&7>GT7T*$jh~S-a5;UF^fQ9kkb%b@YE9^Ip`>
z7M%{VZG&67%3hq#TW&M%8UW*N+l`*G7ax<*k*(7Fa_!A#r|d<>6t=q;+L|H-USIVg
z3L(szdbkq!UurvqU__Zb%-V5#x!!bRBN<{m(7d!=8E0wfd@3W=nWZIrUBeFY><vFz
zg&>)M(z0X~hZcz?g`sSiE56(GzjPteGLn%$5#Oby5M%ibyA{SF^RtGg4If+UCw9CV
zwws<^cd-Q&;<(+?k<ch3<un=-xXQ)3?7Fmc4}vY4W@%|Ag#$5luu5u|%XXJaCd%;(
zO=hf%Um{~{#2PYCvr5&VkHxsC;Su^2C3x(U3?BO>gU10vBTbJ<Xy5_0XgWjPq62&!
zSRdN}LDK}@5*}DnHZ{=0c&M=6n2Yg6!1VPH+K12vyd&my0rjjo0NAJoG1C*u0FZ2R
zr(wryerru{#Wv1gI216jssnB?N?beND{_aMBznD-$o{gwpsm1W!<Iqhc-=_bICTp9
ztbIUYK_of(JZH}b>ZXG7NPerYf(X41A~2rVt6M^COMB^|rAxp90qn+SA<-0GS%n?8
zlU7?6veI@VH%PPwtB3Y7227%S_6+n5!-AcBI7I7QR|a48RdlZ>Fs^MK*Ikm(L;rpf
zIy;%sumOvl^JXKOIeQmUU)A-sTHTN8?WP;`EG4iB(ebQJ^v4hNQ@tH0;d-j_yhB!F
zW|UE}Zn8%{cBC6R!tp`Dd2PCUowH2Bd?>g$PesbX5AYlUoCgu29mVu2s~f964rwD5
z!!~5g4eYy5bp&kQ5CMaD@sRkrOFW_M&Vo72@d{;j0_QTe#p&qX4hVL*Q426;_n`*%
zygNT@-!b%TnXQ=19>Mdn>U>&b5O}s5%bYm2dxW}Wz3M*ou_MTnS1C7k+|qR)4w69(
zut2NngK1{-!Ilj()gg2^4epGv%z7AO1ox@CP>=jpV$+fKGE>ALrZM*-2%p)Fp8bHV
zW$fYFpSjJpK__ymA>VA5XuSR63mc}E$#2g1fdFF4{c!%tG&nIg^0CwVcPPdXAQyHH
z#`&qy1lScEXQSN|u8H&t3@17B1Q7yJ6o%vT)rjDmP0S#jGsb}DfNamrgdBS|_{Oz8
zcWW*Q=kUY5^7pOD4?J!yXmD{h!CatMa3W6u`Vin14Nwt;lG(&a$*IsL=wY@zRVC}1
z=0Uz}8$6vPTXQWiJ(n#9Nb2)J(&?M@nZYjC$ooQ&lrWZZ(d?mkda(X=l-PmZX!-%I
z%j|qbU1JSYO~N3u1u)%uBL}@KpK_q~0Du}B<^tEjxJJ`q8(q6fOswUVvplrU<4iui
z*mA<{I<sH7qt$b>Hve6=&&{wlv{!U;kVfupK2$Hk_Ey-=C^F=3aa0-f+>G#S(+7CE
zzzP5a7^a1A!gH6IY9({pjdmc63W8uJfHLw=vx#FOc%?9%(<P0-U+0o8!+_A9a-ad}
z+)yx92ewccM+7T3J9ucoEn#sSFwZPyAIxja2DjI6=v|PEMij*s6Ha*eDVx$f@dK(M
zs2nuOIkB@2Xr>qoT*o@WlwqzT+VCw`%wFUZfNwz(8gUhKS#gK$?t%2KJ%tZCcd3ik
z`6}HxaZxj!D?Vtq0!v2Gq*oUubW3wQmM6l7Adk4SMns&G9Gu;IxilF;Q4ga^s41mW
zsL57R6<43Ga;%#Tht8_=5|fviyuyS5PUlr5;(+I(5Ie82g2ADq4GRc;wHno5tp-Oo
z4G)|zTb;iVYtkCQU!4XdzeRknvn^MEXq1WBATk5{Z3;iXgB(M)Y!|<d9(l+X2M#Vu
z?PZ^EncLoC6baiyWu#Vg&PHgLK`$NTlz%BWVoAe#hW^JH8c3p!vU_dhe58)8ypQQK
zYnkG53&ZJ6mtjP3IyJgD)Uei;{UmauEn05|z-9$A>a-K`Ir6D<Zf*K&TGoC!b+kDP
zKVXxrQI$-AmCRhu2QqDJSbbXu3t1^-a7W&gY&GnFWY$-2);08YZtEUCPz&zQfoU}y
zy~CTQctg95pdArx4o;o6qBP$$;rZN^%GPSa4x}~a4NQhH0%P4rK5t^N6xDns5_BSf
zo0!t;WJU&S!=n`uk-9&{xZ*&m<01wWVtz#o{stKaWf4*}LD?q=%9`hb1ZjT?hX=S(
z%tDtYNP8Bg5>a|wP{R_k#U&72DfE$O=#z)a62}Q$`&BrKK_y&^+Jz^-jVHKG5)fU;
zTEVFj(F1sVZCQwSk_x0l3P6Y;Cj!Q;adaGFDJLnKxNuSVBWY0@{rxj6$?3TiFbKa-
z!_#8O?*@8<QC+}%_3G7b=dC((UJy}NznX4@;q+zu;q<Z_P0!l+`EvTvPKT4uJ*UOF
zF1}%)RYJ@H-8E>Z8jOkrOGikuO2BsHUV`9DWH1YHj<e!5CIoheQBecN$S6lN344&c
z4Yk5<bl@aI)|aabF-D~5ap(so_DfcDW{?<?GW-{9QeSNcYw^*ts0?hV{1s*uTvmhQ
z);Lgn1VP>@tAg<EXz3)7eB7!R(T4XKT%<6t4Y47ELUt<3TE(Ri7-ImD^*-iUgPR7_
zAPl^N3r^Hv!N{>j?id~yjpLse;ijP=ZRz-<Rlfr7f?@G*2=V%7=q{WdE@3RW_+;#0
z!8EQw9B!NJ5VG${6BC8-htntog76#{Y>RYMQgAi$W0K<Lw5)deRd5-d$I}o-PiF~X
z9Nr&-QekICHy}?X%FRMmqTLAptDAylVo0sPbjKB>1Xjgw-SRc!Hrj>nX!tA#)qR#G
zd^R{$ev`=AB`RH-XTPeTwiD)oA+=AOI!sz!_E!u!hp3VDtvIZ&>E!%IgdSBHZ00aY
z5)L7k@GF-!bI1@(1Y)rr*$tCi#Slr%4HLEtO$bnOnKv&cfQX-wH%gf)6X~GoR0|`2
zCA)xie#i#+9^u8`ASW@x5&aYLa)+uQ2PdpLv4iJID3^5-HLwEwBTIwjVbXw8gP#aH
zf(L=sQVi}!@w6!ho~OkS5EKugSOQ?&3G7Mh47d>YTqQA;WP?&WNszk_+eJ#|<(dT{
z0I|w4w?8hUDh~q0+@ZU$xPiQ|tyd7>mtgTzy4K*SG(IH?H23l^+eUp7&^kW2!;KcU
z7OWBjR3NQJUKL1#Vb~CJwgyL)d2UpKxaxOsMkWN1ME{H_<RV^`Mu1!Cw@@hz;L56K
zO%woAM0SF@v780K#gJx=V7Ebbn$%)Q-}?COwR<(^<|mHX+WA{|=I`A5!gvF<?pFZB
z_%>!Zt!?Kl6Pt+`yW_~2_FXbZEOm0scYc6J*|c>xT7%=|{FwDuSxUsMb@jyK(Q&#%
zA^kgi<2N{NrD9bI{n$aK<JM%~>61Ue{vF5PWT9xC#P66jU*#>GY)TE`sC8Yd$%fTx
z>!H_f@{y~n)x5A?tC@}9mI$B7O@MPAk4A@bTCtX#cbFqN9X^rVQQYJ^G!$>)8&ie%
zzua$`zp{1mQhB0$rq0(s_+>i+Sp2U@cJZ&Ec8hAaq;`kYZok?cP`iU_x2$$6YPV1A
zj;P&HwR=qM9#^|3)b51ZJ*jpl)$Wwq#Vag$)x}c3tJLqI3#zQH(a<*^4YQa5F~x8;
z=6Khz-D94jo5V3O@BctvPTSaX#=*NuMH%Om+B*d-p^(mtnM#50$M<b~<1gTe0oYmy
zzhf<*SspNt__K$baNr&E@4I-Ah&~ZrpdEFOVSB=8+{4R4Vwu9bOYKcm0_Lvp2?W4W
z*c;DAdItz7s`FjGe*zn!pOq+@n3#g$um?-Eq^4*C$OZhnG&o2XOb@9=&E5!g@aE^V
zA8tJQ#M*)J3sQi|d&fkz!wkVi1gFI?18Q$jY;C^!fFdkaUYDBs%zE;dD8l^&);K7y
zYM~xiu$>yr)KxRsU309vrkvHJ6IyDolA6_`4>9eD-f7c@VtHpxu;3obia3h2-Ep;t
z7q0Twdswlt_@QlZiSjm<Zk9TfEp-p}P<Im^)I?9wCP*5@1`eqmY<d}!J^4@TKKA53
zP9Qz^SF_W)bnvu36CVU`nSsi@0~DM&{P*PW`O*ZTZC+fYhmT@{@%1d$pU30j=_a^=
z)}FX&5Alu=xROal3T)9Xy!JC{hNd>vqFgvgi$`Kr2-uid3dOq#L!26*hS)t!^#nSL
zA<deEGzHlV4*Q;{*X4FYU_Xs&rmaobCksoOY5gcQ@kO^flp(1QyQwNlhsZ9YBDQ5Z
zQ5hSnKhtN<bu=<A2!kgeLzGBI3)JXKII|pzub5FkbVWgBFL*618AiJg^k<=g;h%7-
ziyTQ%JB?i3X6Xec;`H1=?X5u;7v5aVTJlr>=WS%Xm8c&`LXXB5~>1%6x{5QEbL
zsvoV4QaXX!&fg?VGMHtBKDa3+H)gRlTU4O1`tU2TMqbNd?KYU;P*@wz*qg8hArZSP
zg|*=v*6>Q>eprJ{bzlu_56jKq<AqF4x=;<18&rezi(gHA1HwRVQb3am!Wv*pU@d$N
z<A4+3yaVsV&wzskNWz;V&p;(!cVb^QftxN(Hm3>zzZ;Ln3X8yk0m1>18mI?XAGRmn
zxD5UR%QR)^g)(9RND;6>m*9^uBsv&KqiG8d3B^06ctVhl#qfPl+>l}}9H7Z!00@fj
z=93hNyD3<4s>!aY@Kze&J_JHP`4<(u1nU>jftR}ky`WsCypb$Y2nZKUpAgHrAG4MS
zHNYw%99ilrE(}XHi^V%%tOwq+3Nu*9r<9h3(!4ZXElUOZOj|%CSH)7|8b?Sc=w1}3
z!J@jRNgJ8%Wi__<VD(9=fi4tBn8rkEaB{ftCW@QYjOHi~r?tBYw{xneh$vn*C=SQh
z5M8(r!tYa=8SXp`#WU_qQGAqJnac%HTzI{M;shXr;$Q9juTcD}E);iuhTZ~)h=<n+
z?EDh+7VwofufWrw7B7XeMhtmDB6*be-qxO)0#vJ`uoguDTxq)N%bt7HB~Ec<=VK;6
zXYvsedEpW?+cBXz3qrc73ooi?r%J#vmjF~s1nF2HnU@8E_(XImcFwUW*I{lX08q*U
zM1R8K-(<r5aBL=@GFf3#XYv`7x0&2WQsw)|j*CQ87Ox~a_hHWGto(w>117&<B2Ljm
z<`$WV=RwWlJYsSki81f<8x99=dMIa!74$P}+0Ds5ed63^v+qiWaQcsVHouR|K^;Qe
zH#(#YSB8HB&@WSkVQ7b8XpB;kp{~?XlwXFq2CRX?8PPO-)(~{ZINY5P35YQ$R)&rl
zV_D%_bWI5q@ykPrzX6dn!H^njlOQ1KN1!P9(jsb89#eQBKn0$ZrdB3Fr@+#AQ#ziv
z6`gU(5*rT_z`87FFv4k$ry2}hPvnh^t;lML(-|uM1CNHtV_gO%l+NZqD5D6WvY;Wv
zC=@dv82Gp9e(+a$M+3C%^5>$~1V{FF`7d<YLzmnv?C~E!5Hw$p|A0uE+zxg54@KiY
z5QmI@R%-KQv7-;2@`-i7GhJ$h7F7qoB#a_5-4XF`!!ZFLV^s2>O)x}cl`<#-Tb*D|
zq-mejQKa@uod}$WV@J3K(XN(W3jV*!)(uSjCzLG)AQ<*KR0<dv7E23~#NR^4f`f#i
zgfc@!Q&qaw#-<IJlT9H+85CM$PQa$g+&U8mL=1pPtU!!Z*(2E=K`?<V*;+v`0UFss
zu~=!*n#oUdD49|w+IJX-L0~WXIYL!_ERHNei0qKY*#vYC1HGfrNzR9up`T|$u29E5
z`q90g-+r|!TH`lRAc_!|XJoq0e`Yve!z&5eYqw&Dy%KIk{duoCOQZ?cuFy^LvXTkV
zU`pj&W9I>O#(OJ%Q#&NWkyAav9A!X!83`|n^7BP$#5&1twW-nStC7(@AFvmX$9bO#
zjdSM|61kNy!DxxuJf8)={q$wa3=3f7qjO*61g@A^*Hv07@jWE{)-WPu6L4RK7;)rp
mVGM#ZW|bfaoxh>Ni0Ut#Ee>1#g>t!kdZaM<*Njmf_V?dj3=-%7

literal 0
HcmV?d00001

diff --git a/simplejson/scanner.py b/simplejson/scanner.py
new file mode 100644
index 00000000..adbc6ec9
--- /dev/null
+++ b/simplejson/scanner.py
@@ -0,0 +1,65 @@
+"""JSON token scanner
+"""
+import re
+try:
+    from simplejson._speedups import make_scanner as c_make_scanner
+except ImportError:
+    c_make_scanner = None
+
+__all__ = ['make_scanner']
+
+NUMBER_RE = re.compile(
+    r'(-?(?:0|[1-9]\d*))(\.\d+)?([eE][-+]?\d+)?',
+    (re.VERBOSE | re.MULTILINE | re.DOTALL))
+
+def py_make_scanner(context):  # builds and returns a _scan_once(string, idx) closure configured from context
+    parse_object = context.parse_object  # context attributes are copied into locals used by the closure
+    parse_array = context.parse_array
+    parse_string = context.parse_string
+    match_number = NUMBER_RE.match
+    encoding = context.encoding
+    strict = context.strict
+    parse_float = context.parse_float
+    parse_int = context.parse_int
+    parse_constant = context.parse_constant
+    object_hook = context.object_hook
+
+    def _scan_once(string, idx):  # literal and number branches return (value, index just past the token)
+        try:
+            nextchar = string[idx]
+        except IndexError:
+            raise StopIteration  # idx is past the end of string: nothing to scan
+
+        if nextchar == '"':
+            return parse_string(string, idx + 1, encoding, strict)
+        elif nextchar == '{':
+            return parse_object((string, idx + 1), encoding, strict, _scan_once, object_hook)
+        elif nextchar == '[':
+            return parse_array((string, idx + 1), _scan_once)
+        elif nextchar == 'n' and string[idx:idx + 4] == 'null':
+            return None, idx + 4
+        elif nextchar == 't' and string[idx:idx + 4] == 'true':
+            return True, idx + 4
+        elif nextchar == 'f' and string[idx:idx + 5] == 'false':
+            return False, idx + 5
+
+        m = match_number(string, idx)  # numbers are tried before the NaN/Infinity constants
+        if m is not None:
+            integer, frac, exp = m.groups()
+            if frac or exp:  # a fraction or exponent part makes it a float, otherwise an int
+                res = parse_float(integer + (frac or '') + (exp or ''))
+            else:
+                res = parse_int(integer)
+            return res, m.end()
+        elif nextchar == 'N' and string[idx:idx + 3] == 'NaN':
+            return parse_constant('NaN'), idx + 3
+        elif nextchar == 'I' and string[idx:idx + 8] == 'Infinity':
+            return parse_constant('Infinity'), idx + 8
+        elif nextchar == '-' and string[idx:idx + 9] == '-Infinity':
+            return parse_constant('-Infinity'), idx + 9
+        else:
+            raise StopIteration  # no JSON value starts at idx
+
+    return _scan_once
+
+make_scanner = c_make_scanner or py_make_scanner
diff --git a/simplejson/scanner.pyc b/simplejson/scanner.pyc
new file mode 100644
index 0000000000000000000000000000000000000000..30d94445f0a0c941ee46b6c4fa3bd255e662f6ef
GIT binary patch
literal 2340
zcmb_dUvC>l5T8B&cj6S1v}wr$X-SKd%5~uhP(>h$k&IGTvRgn&D(iB$PA@s%o$fXz
z5y=AtVOzZO)Mvf`?|cM43}2x9X3kDsMZDG4&dtuw@3*rvb9;aNTPd%;dewAj{43%4
z6-F|IaEW#x6}c82DcVtVx+v2O9a-dOXeUeR``{L3b&d|p6jnX8C{7O5ZHEFAz?
zAg#zNlA9ByB(hAKY@MOa3jk)x&C{>gutGXZ5r}n#b~3zmr&{2M79hUuJZY_%@JI(M
ziDL(Wj?3O_{909oRWl3Gw~uspyx7K^k~N5GZKJyJ#ly4RPimh(-*ea3)~b6C_T2kx
z8`WLic)nY^|9nHH4ioX1!N_1FzeAi6c|@aBQ8X%x#iCJ>OoqHHjk03N(I_WMo<=26
z3N*4rDbh%ZQle2_lroJnG|16F(ZHfXi3VjFWN83no(4pN0u74Po8grIhTRJ^EFc*c
z;%PZ7ix_-l&P?(LET?l!e5UBuxkXYKLsNw@ihfaPVa_aOJ+vrXCN-4f0ET2Qq42{D
zU1X^fye7qd8Sz_%UvW&&em#p)*I|i<dAi5}@J|ZJUJ^@I#>5OL5o+BD{!IPQGzefF
z6A7CA^0ai@Er@-d6dG`B1h^A~DXjQEu+jvEl1#%sOJU`!uo>QM_7a9@5dw^|o5F#m
zm@p#hbC9APk<Su^9w<@w99<CYW#~Lh=Q%n@S#uN>u$HIr9^j}vIAKFOyA@i3eWG3{
zIxkRwH)e>o$Wl5#EAS>B(n%yi{GG-=Cow+6<T6v&IQI9%eiI}G!UQCI0xSvm=M?<@
zRq#B67pB1r6EKzpyp@6%uY#{L_{KE&#srKd0V4-#vmsxd>Js|1g*nk3Pu^1&KZ#*i
zWPmpauP=+>*!RU|WNPALEz=&74Hp(Y+fOta8&f7~dHkB9=1}c)n<nlWm{>G}o)>uL
zR9tHw-){+v+GIg47gH8jSD!TEIE+mN(~b$FrqQu&yfBbpT4A6?dCF07DBnmZd1wc5
zcpN1Xg$~@R?9cYZ#9nY9cF#SLkOF;ToELU1A@vPkZeC#YfsTc|7u!zCa}voj)=8Cb
zBLVBc30-F7Lqv9*=q|v9*V9?g4{c*6TRYQBb{yNM<4Y0|bc5smJ~m}+xPPb}(|r+!
zM`rGl%L#+T*r4ZICZ$guC0}yOcEiBYQ|sw@tMI2}1ET&c(Q#5g@?y{T!<Y4~IE?ng
zllqo^sr@jj_iPl%`BCrJ6R#in`Y;KD`uO^O5S_M}X_?6$L6FL*Is9j=idt3`wTiK<
z?yC98u&%*!9Uk|rS+xl3&B?GNh3$_)(*B6W8iXXV_3ZIxqup&cq@sNrnQ4E>9(P#W
zX0gKJ9*esW>9>Z<hWr>5Q%*a@zrvmZWcT(e3t<!r_Lkk#4LF#0ktuTxMA2z?`uoSG
z<R%2E($&9JTdi`fr31TNH*~sP!{3!yn?*d{6y!lSiL`dn;POS44sqVvNt&qHkMQou
z8`PeELu~s#h|_%aBhS~Of7fVlKIt^11dpF>KW%O|TMg;kttU^v-rjDngP~o6NYe`?
n)!s$2k|Nk1^+WgA*I)9HlN%6uHH!vYlm;tVdFUTlrBD9@kb}!4

literal 0
HcmV?d00001

diff --git a/simplejson/tests/__init__.py b/simplejson/tests/__init__.py
new file mode 100644
index 00000000..17c97963
--- /dev/null
+++ b/simplejson/tests/__init__.py
@@ -0,0 +1,23 @@
+import unittest
+import doctest
+
+def additional_tests():
+    """Collect the package doctests and the index.rst doc file into one suite."""
+    import simplejson
+    import simplejson.encoder
+    import simplejson.decoder
+    doctested = (simplejson, simplejson.encoder, simplejson.decoder)
+    bundle = unittest.TestSuite([doctest.DocTestSuite(m) for m in doctested])
+    bundle.addTest(doctest.DocFileSuite('../../index.rst'))
+    return bundle
+
+def main():
+    """Run the suite built by additional_tests() with a text runner."""
+    all_tests = additional_tests()
+    unittest.TextTestRunner().run(all_tests)
+
+if __name__ == '__main__':  # only when this file is executed directly as a script
+    import os
+    import sys
+    sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.dirname(os.path.abspath(__file__)))))  # three levels up from this file
+    main()
diff --git a/simplejson/tests/test_check_circular.py b/simplejson/tests/test_check_circular.py
new file mode 100644
index 00000000..af6463d6
--- /dev/null
+++ b/simplejson/tests/test_check_circular.py
@@ -0,0 +1,30 @@
+from unittest import TestCase
+import simplejson as json
+
+def default_iterable(obj):  # used as the default= hook in the tests below
+    return list(obj)  # turn any iterable (the tests pass a set) into a list
+
+class TestCheckCircular(TestCase):
+    """Self-referencing containers must raise; default= hooks must still work."""
+    def test_circular_dict(self):
+        loop = {}
+        loop['a'] = loop
+        self.assertRaises(ValueError, json.dumps, loop)
+
+    def test_circular_list(self):
+        ring = []
+        ring.append(ring)
+        self.assertRaises(ValueError, json.dumps, ring)
+
+    def test_circular_composite(self):
+        outer = {'a': []}
+        outer['a'].append(outer)
+        self.assertRaises(ValueError, json.dumps, outer)
+
+    def test_circular_default(self):
+        json.dumps([set()], default=default_iterable)
+        self.assertRaises(TypeError, json.dumps, [set()])
+
+    def test_circular_off_default(self):
+        json.dumps([set()], default=default_iterable, check_circular=False)
+        self.assertRaises(TypeError, json.dumps, [set()], check_circular=False)
diff --git a/simplejson/tests/test_decode.py b/simplejson/tests/test_decode.py
new file mode 100644
index 00000000..1cd701d4
--- /dev/null
+++ b/simplejson/tests/test_decode.py
@@ -0,0 +1,22 @@
+import decimal
+from unittest import TestCase
+
+import simplejson as json
+
+class TestDecode(TestCase):
+    def test_decimal(self):
+        parsed = json.loads('1.1', parse_float=decimal.Decimal)
+        self.assertTrue(isinstance(parsed, decimal.Decimal))
+        self.assertEqual(parsed, decimal.Decimal('1.1'))
+
+    def test_float(self):
+        parsed = json.loads('1', parse_int=float)
+        self.assertTrue(isinstance(parsed, float))
+        self.assertEqual(parsed, 1.0)
+
+    def test_decoder_optimizations(self):
+        # The decoder has fast paths that bypass the whitespace regex;
+        # the generous padding below is meant to exercise the less
+        # common branches. (The array cases are covered elsewhere.)
+        expected = {"key":"value", "k":"v"}
+        self.assertEqual(json.loads('{   "key"    :    "value"    ,  "k":"v"    }'), expected)
diff --git a/simplejson/tests/test_default.py b/simplejson/tests/test_default.py
new file mode 100644
index 00000000..139e42bf
--- /dev/null
+++ b/simplejson/tests/test_default.py
@@ -0,0 +1,9 @@
+from unittest import TestCase
+
+import simplejson as json
+
+class TestDefault(TestCase):
+    def test_default(self):
+        # with default=repr, dumps(type) must equal dumps of repr(type)
+        via_hook, direct = json.dumps(type, default=repr), json.dumps(repr(type))
+        self.assertEqual(via_hook, direct)
diff --git a/simplejson/tests/test_dump.py b/simplejson/tests/test_dump.py
new file mode 100644
index 00000000..4de37cf4
--- /dev/null
+++ b/simplejson/tests/test_dump.py
@@ -0,0 +1,21 @@
+from unittest import TestCase
+from cStringIO import StringIO
+
+import simplejson as json
+
+class TestDump(TestCase):
+    def test_dump(self):
+        buf = StringIO()
+        json.dump({}, buf)
+        self.assertEqual(buf.getvalue(), '{}')
+
+    def test_dumps(self):
+        self.assertEqual(json.dumps({}), '{}')
+
+    def test_encode_truefalse(self):
+        # bool, int, long and float keys must come out as JSON strings
+        bools = {True: False, False: True}
+        self.assertEqual(json.dumps(bools, sort_keys=True), '{"false": true, "true": false}')
+        mixed = {2: 3.0, 4.0: 5L, False: 1, 6L: True, "7": 0}
+        self.assertEqual(json.dumps(mixed, sort_keys=True),
+                         '{"false": 1, "2": 3.0, "4.0": 5, "6": true, "7": 0}')
diff --git a/simplejson/tests/test_encode_basestring_ascii.py b/simplejson/tests/test_encode_basestring_ascii.py
new file mode 100644
index 00000000..7128495f
--- /dev/null
+++ b/simplejson/tests/test_encode_basestring_ascii.py
@@ -0,0 +1,38 @@
+from unittest import TestCase
+
+import simplejson.encoder
+
+CASES = [
+    (u'/\\"\ucafe\ubabe\uab98\ufcde\ubcda\uef4a\x08\x0c\n\r\t`1~!@#$%^&*()_+-=[]{}|;:\',./<>?', '"/\\\\\\"\\ucafe\\ubabe\\uab98\\ufcde\\ubcda\\uef4a\\b\\f\\n\\r\\t`1~!@#$%^&*()_+-=[]{}|;:\',./<>?"'),
+    (u'\u0123\u4567\u89ab\ucdef\uabcd\uef4a', '"\\u0123\\u4567\\u89ab\\ucdef\\uabcd\\uef4a"'),
+    (u'controls', '"controls"'),
+    (u'\x08\x0c\n\r\t', '"\\b\\f\\n\\r\\t"'),
+    (u'{"object with 1 member":["array with 1 element"]}', '"{\\"object with 1 member\\":[\\"array with 1 element\\"]}"'),
+    (u' s p a c e d ', '" s p a c e d "'),
+    (u'\U0001d120', '"\\ud834\\udd20"'),
+    (u'\u03b1\u03a9', '"\\u03b1\\u03a9"'),
+    ('\xce\xb1\xce\xa9', '"\\u03b1\\u03a9"'),
+    (u'\u03b1\u03a9', '"\\u03b1\\u03a9"'),
+    ('\xce\xb1\xce\xa9', '"\\u03b1\\u03a9"'),
+    (u'\u03b1\u03a9', '"\\u03b1\\u03a9"'),
+    (u'\u03b1\u03a9', '"\\u03b1\\u03a9"'),
+    (u"`1~!@#$%^&*()_+-={':[,]}|;.</>?", '"`1~!@#$%^&*()_+-={\':[,]}|;.</>?"'),
+    (u'\x08\x0c\n\r\t', '"\\b\\f\\n\\r\\t"'),
+    (u'\u0123\u4567\u89ab\ucdef\uabcd\uef4a', '"\\u0123\\u4567\\u89ab\\ucdef\\uabcd\\uef4a"'),
+]
+
+class TestEncodeBaseStringAscii(TestCase):
+    def test_py_encode_basestring_ascii(self):
+        self._test_encode_basestring_ascii(simplejson.encoder.py_encode_basestring_ascii)
+
+    def test_c_encode_basestring_ascii(self):
+        c_impl = simplejson.encoder.c_encode_basestring_ascii
+        if c_impl:  # nothing to check when the C implementation is unavailable
+            self._test_encode_basestring_ascii(c_impl)
+
+    def _test_encode_basestring_ascii(self, encode_basestring_ascii):
+        fname = encode_basestring_ascii.__name__
+        for raw, wanted in CASES:
+            got = encode_basestring_ascii(raw)
+            failure = '%r != %r for %s(%r)' % (got, wanted, fname, raw)
+            self.assertEqual(got, wanted, failure)
diff --git a/simplejson/tests/test_fail.py b/simplejson/tests/test_fail.py
new file mode 100644
index 00000000..002eea08
--- /dev/null
+++ b/simplejson/tests/test_fail.py
@@ -0,0 +1,76 @@
+from unittest import TestCase
+
+import simplejson as json
+
+# Fri Dec 30 18:57:26 2005
+JSONDOCS = [
+    # http://json.org/JSON_checker/test/fail1.json
+    '"A JSON payload should be an object or array, not a string."',
+    # http://json.org/JSON_checker/test/fail2.json
+    '["Unclosed array"',
+    # http://json.org/JSON_checker/test/fail3.json
+    '{unquoted_key: "keys must be quoted}',
+    # http://json.org/JSON_checker/test/fail4.json
+    '["extra comma",]',
+    # http://json.org/JSON_checker/test/fail5.json
+    '["double extra comma",,]',
+    # http://json.org/JSON_checker/test/fail6.json
+    '[   , "<-- missing value"]',
+    # http://json.org/JSON_checker/test/fail7.json
+    '["Comma after the close"],',
+    # http://json.org/JSON_checker/test/fail8.json
+    '["Extra close"]]',
+    # http://json.org/JSON_checker/test/fail9.json
+    '{"Extra comma": true,}',
+    # http://json.org/JSON_checker/test/fail10.json
+    '{"Extra value after close": true} "misplaced quoted value"',
+    # http://json.org/JSON_checker/test/fail11.json
+    '{"Illegal expression": 1 + 2}',
+    # http://json.org/JSON_checker/test/fail12.json
+    '{"Illegal invocation": alert()}',
+    # http://json.org/JSON_checker/test/fail13.json
+    '{"Numbers cannot have leading zeroes": 013}',
+    # http://json.org/JSON_checker/test/fail14.json
+    '{"Numbers cannot be hex": 0x14}',
+    # http://json.org/JSON_checker/test/fail15.json
+    '["Illegal backslash escape: \\x15"]',
+    # http://json.org/JSON_checker/test/fail16.json
+    '["Illegal backslash escape: \\\'"]',
+    # http://json.org/JSON_checker/test/fail17.json
+    '["Illegal backslash escape: \\017"]',
+    # http://json.org/JSON_checker/test/fail18.json
+    '[[[[[[[[[[[[[[[[[[[["Too deep"]]]]]]]]]]]]]]]]]]]]',
+    # http://json.org/JSON_checker/test/fail19.json
+    '{"Missing colon" null}',
+    # http://json.org/JSON_checker/test/fail20.json
+    '{"Double colon":: null}',
+    # http://json.org/JSON_checker/test/fail21.json
+    '{"Comma instead of colon", null}',
+    # http://json.org/JSON_checker/test/fail22.json
+    '["Colon instead of comma": false]',
+    # http://json.org/JSON_checker/test/fail23.json
+    '["Bad value", truth]',
+    # http://json.org/JSON_checker/test/fail24.json
+    "['single quote']",
+    # http://code.google.com/p/simplejson/issues/detail?id=3
+    u'["A\u001FZ control characters in string"]',
+]
+
+SKIPS = {
+    1: "why not have a string payload?",
+    18: "spec doesn't specify any nesting limitations",
+}
+
+class TestFail(TestCase):
+    def test_failures(self):
+        # Documents are numbered from 1, the same numbering SKIPS uses.
+        for pos, doc in enumerate(JSONDOCS):
+            num = pos + 1
+            if num in SKIPS:
+                json.loads(doc)  # deliberately accepted: must parse without raising
+                continue
+            try:
+                json.loads(doc)
+            except ValueError:
+                continue
+            self.fail("Expected failure for fail%d.json: %r" % (num, doc))
diff --git a/simplejson/tests/test_float.py b/simplejson/tests/test_float.py
new file mode 100644
index 00000000..1a2b98a2
--- /dev/null
+++ b/simplejson/tests/test_float.py
@@ -0,0 +1,15 @@
+import math
+from unittest import TestCase
+
+import simplejson as json
+
+class TestFloat(TestCase):
+    def test_floats(self):
+        for value in (1617161771.7650001, math.pi, math.pi**100, math.pi**-100, 3.1):
+            self.assertEqual(float(json.dumps(value)), value)  # text parses back to the same float
+            self.assertEqual(json.loads(json.dumps(value)), value)  # and so does a full round trip
+
+    def test_ints(self):
+        for value in (1, 1L, 1<<32, 1<<64):
+            self.assertEqual(json.dumps(value), str(value))  # same digits as str() gives
+            self.assertEqual(int(json.dumps(value)), value)
diff --git a/simplejson/tests/test_indent.py b/simplejson/tests/test_indent.py
new file mode 100644
index 00000000..66e19b9e
--- /dev/null
+++ b/simplejson/tests/test_indent.py
@@ -0,0 +1,41 @@
+from unittest import TestCase
+
+import simplejson as json
+import textwrap
+
+class TestIndent(TestCase):
+    def test_indent(self):
+        # Compact and indented output must both decode back to the input,
+        # and the indented text must match the expected layout exactly.
+        data = [['blorpie'], ['whoops'], [], 'd-shtaeou', 'd-nthiouh', 'i-vhbjkhnth',
+                {'nifty': 87}, {'field': 'yes', 'morefield': False}]
+        expect = textwrap.dedent("""\
+        [
+          [
+            "blorpie"
+          ],
+          [
+            "whoops"
+          ],
+          [],
+          "d-shtaeou",
+          "d-nthiouh",
+          "i-vhbjkhnth",
+          {
+            "nifty": 87
+          },
+          {
+            "field": "yes",
+            "morefield": false
+          }
+        ]""")
+
+        compact = json.dumps(data)
+        pretty = json.dumps(data, indent=2, sort_keys=True, separators=(',', ': '))
+
+        from_compact = json.loads(compact)
+        from_pretty = json.loads(pretty)
+
+        self.assertEqual(from_compact, data)
+        self.assertEqual(from_pretty, data)
+        self.assertEqual(pretty, expect)
diff --git a/simplejson/tests/test_pass1.py b/simplejson/tests/test_pass1.py
new file mode 100644
index 00000000..c3d6302d
--- /dev/null
+++ b/simplejson/tests/test_pass1.py
@@ -0,0 +1,76 @@
+from unittest import TestCase
+
+import simplejson as json
+
+# from http://json.org/JSON_checker/test/pass1.json
+JSON = r'''
+[
+    "JSON Test Pattern pass1",
+    {"object with 1 member":["array with 1 element"]},
+    {},
+    [],
+    -42,
+    true,
+    false,
+    null,
+    {
+        "integer": 1234567890,
+        "real": -9876.543210,
+        "e": 0.123456789e-12,
+        "E": 1.234567890E+34,
+        "":  23456789012E666,
+        "zero": 0,
+        "one": 1,
+        "space": " ",
+        "quote": "\"",
+        "backslash": "\\",
+        "controls": "\b\f\n\r\t",
+        "slash": "/ & \/",
+        "alpha": "abcdefghijklmnopqrstuvwyz",
+        "ALPHA": "ABCDEFGHIJKLMNOPQRSTUVWYZ",
+        "digit": "0123456789",
+        "special": "`1~!@#$%^&*()_+-={':[,]}|;.</>?",
+        "hex": "\u0123\u4567\u89AB\uCDEF\uabcd\uef4A",
+        "true": true,
+        "false": false,
+        "null": null,
+        "array":[  ],
+        "object":{  },
+        "address": "50 St. James Street",
+        "url": "http://www.JSON.org/",
+        "comment": "// /* <!-- --",
+        "# -- --> */": " ",
+        " s p a c e d " :[1,2 , 3
+
+,
+
+4 , 5        ,          6           ,7        ],
+        "compact": [1,2,3,4,5,6,7],
+        "jsontext": "{\"object with 1 member\":[\"array with 1 element\"]}",
+        "quotes": "&#34; \u0022 %22 0x22 034 &#x22;",
+        "\/\\\"\uCAFE\uBABE\uAB98\uFCDE\ubcda\uef4A\b\f\n\r\t`1~!@#$%^&*()_+-=[]{}|;:',./<>?"
+: "A key can be any string"
+    },
+    0.5 ,98.6
+,
+99.44
+,
+
+1066
+
+
+,"rosebud"]
+'''
+
+class TestPass1(TestCase):
+    def test_parse(self):
+        # Decoding, re-encoding and decoding again must give an equal value.
+        decoded = json.loads(JSON)
+        reencoded = json.dumps(decoded)
+        self.assertEqual(decoded, json.loads(reencoded))
+        # The 23456789012E666 entry must be rejected once allow_nan is off.
+        try:
+            json.dumps(decoded, allow_nan=False)
+        except ValueError:
+            return
+        self.fail("23456789012E666 should be out of range")
diff --git a/simplejson/tests/test_pass2.py b/simplejson/tests/test_pass2.py
new file mode 100644
index 00000000..de4ee00b
--- /dev/null
+++ b/simplejson/tests/test_pass2.py
@@ -0,0 +1,14 @@
+from unittest import TestCase
+import simplejson as json
+
+# from http://json.org/JSON_checker/test/pass2.json
+JSON = r'''
+[[[[[[[[[[[[[[[[[[["Not too deep"]]]]]]]]]]]]]]]]]]]
+'''
+
+class TestPass2(TestCase):
+    def test_parse(self):
+        # The nested-array document must survive a
+        # decode -> encode -> decode round trip unchanged.
+        decoded = json.loads(JSON)
+        self.assertEqual(decoded, json.loads(json.dumps(decoded)))
diff --git a/simplejson/tests/test_pass3.py b/simplejson/tests/test_pass3.py
new file mode 100644
index 00000000..f591aba9
--- /dev/null
+++ b/simplejson/tests/test_pass3.py
@@ -0,0 +1,20 @@
+from unittest import TestCase
+
+import simplejson as json
+
+# from http://json.org/JSON_checker/test/pass3.json
+JSON = r'''
+{
+    "JSON Test Pattern pass3": {
+        "The outermost value": "must be an object or array.",
+        "In this test": "It is an object."
+    }
+}
+'''
+
+class TestPass3(TestCase):
+    def test_parse(self):
+        # The object-rooted document must survive a
+        # decode -> encode -> decode round trip unchanged.
+        decoded = json.loads(JSON)
+        self.assertEqual(decoded, json.loads(json.dumps(decoded)))
diff --git a/simplejson/tests/test_recursion.py b/simplejson/tests/test_recursion.py
new file mode 100644
index 00000000..97422a66
--- /dev/null
+++ b/simplejson/tests/test_recursion.py
@@ -0,0 +1,67 @@
+from unittest import TestCase
+
+import simplejson as json
+
+class JSONTestObject:
+    """Sentinel; the class object itself is what the tests encode."""
+
+
+class RecursiveJSONEncoder(json.JSONEncoder):
+    """Encoder whose default() can return a list holding its own argument."""
+    recurse = False
+    def default(self, o):
+        if o is JSONTestObject:
+            if self.recurse:
+                return [JSONTestObject]
+            return 'JSONTestObject'
+        return json.JSONEncoder.default(self, o)
+
+
+class TestRecursion(TestCase):
+    """Circular structures must make the encoder raise ValueError."""
+    def test_listrecursion(self):
+        """Self-containing lists are rejected; a repeated child is not."""
+        x = []
+        x.append(x)
+        try:
+            json.dumps(x)
+        except ValueError:
+            pass
+        else:
+            self.fail("didn't raise ValueError on list recursion")
+        x = []
+        x.append([x])
+        try:
+            json.dumps(x)
+        except ValueError:
+            pass
+        else:
+            self.fail("didn't raise ValueError on alternating list recursion")
+        y = []
+        # ensure that the marker is cleared: y appears twice but is no cycle
+        json.dumps([y, y])
+
+    def test_dictrecursion(self):
+        """Self-containing dicts are rejected; a repeated child is not."""
+        x = {}
+        x["test"] = x
+        try:
+            json.dumps(x)
+        except ValueError:
+            pass
+        else:
+            self.fail("didn't raise ValueError on dict recursion")
+        x = {}
+        # ensure that the marker is cleared: x appears twice but is no cycle
+        json.dumps({"a": x, "b": x})
+
+    def test_defaultrecursion(self):
+        """A default() that keeps returning its argument must be detected."""
+        enc = RecursiveJSONEncoder()
+        self.assertEquals(enc.encode(JSONTestObject), '"JSONTestObject"')
+        enc.recurse = True
+        try:
+            enc.encode(JSONTestObject)
+        except ValueError:
+            return
+        self.fail("didn't raise ValueError on default recursion")
diff --git a/simplejson/tests/test_scanstring.py b/simplejson/tests/test_scanstring.py
new file mode 100644
index 00000000..b08dec71
--- /dev/null
+++ b/simplejson/tests/test_scanstring.py
@@ -0,0 +1,111 @@
+import sys
+import decimal
+from unittest import TestCase
+
+import simplejson as json
+import simplejson.decoder
+
+class TestScanString(TestCase):
+    def test_py_scanstring(self):
+        self._test_scanstring(simplejson.decoder.py_scanstring)
+
+    def test_c_scanstring(self):
+        if not simplejson.decoder.c_scanstring:
+            return
+        self._test_scanstring(simplejson.decoder.c_scanstring)
+    # Shared assertions, run by the two tests above for each implementation.
+    def _test_scanstring(self, scanstring):
+        self.assertEquals(
+            scanstring('"z\\ud834\\udd20x"', 1, None, True),
+            (u'z\U0001d120x', 16))
+        # A raw astral character is two code units on narrow (UCS-2) builds.
+        if sys.maxunicode == 65535:
+            self.assertEquals(
+                scanstring(u'"z\U0001d120x"', 1, None, True),
+                (u'z\U0001d120x', 6))
+        else:
+            self.assertEquals(
+                scanstring(u'"z\U0001d120x"', 1, None, True),
+                (u'z\U0001d120x', 5))
+        # Results pair the decoded text with the index after the closing quote.
+        self.assertEquals(
+            scanstring('"\\u007b"', 1, None, True),
+            (u'{', 8))
+        # Below, only the string literal at the given index is scanned.
+        self.assertEquals(
+            scanstring('"A JSON payload should be an object or array, not a string."', 1, None, True),
+            (u'A JSON payload should be an object or array, not a string.', 60))
+
+        self.assertEquals(
+            scanstring('["Unclosed array"', 2, None, True),
+            (u'Unclosed array', 17))
+
+        self.assertEquals(
+            scanstring('["extra comma",]', 2, None, True),
+            (u'extra comma', 14))
+
+        self.assertEquals(
+            scanstring('["double extra comma",,]', 2, None, True),
+            (u'double extra comma', 21))
+
+        self.assertEquals(
+            scanstring('["Comma after the close"],', 2, None, True),
+            (u'Comma after the close', 24))
+
+        self.assertEquals(
+            scanstring('["Extra close"]]', 2, None, True),
+            (u'Extra close', 14))
+
+        self.assertEquals(
+            scanstring('{"Extra comma": true,}', 2, None, True),
+            (u'Extra comma', 14))
+
+        self.assertEquals(
+            scanstring('{"Extra value after close": true} "misplaced quoted value"', 2, None, True),
+            (u'Extra value after close', 26))
+
+        self.assertEquals(
+            scanstring('{"Illegal expression": 1 + 2}', 2, None, True),
+            (u'Illegal expression', 21))
+
+        self.assertEquals(
+            scanstring('{"Illegal invocation": alert()}', 2, None, True),
+            (u'Illegal invocation', 21))
+
+        self.assertEquals(
+            scanstring('{"Numbers cannot have leading zeroes": 013}', 2, None, True),
+            (u'Numbers cannot have leading zeroes', 37))
+
+        self.assertEquals(
+            scanstring('{"Numbers cannot be hex": 0x14}', 2, None, True),
+            (u'Numbers cannot be hex', 24))
+
+        self.assertEquals(
+            scanstring('[[[[[[[[[[[[[[[[[[[["Too deep"]]]]]]]]]]]]]]]]]]]]', 21, None, True),
+            (u'Too deep', 30))
+
+        self.assertEquals(
+            scanstring('{"Missing colon" null}', 2, None, True),
+            (u'Missing colon', 16))
+
+        self.assertEquals(
+            scanstring('{"Double colon":: null}', 2, None, True),
+            (u'Double colon', 15))
+
+        self.assertEquals(
+            scanstring('{"Comma instead of colon", null}', 2, None, True),
+            (u'Comma instead of colon', 25))
+
+        self.assertEquals(
+            scanstring('["Colon instead of comma": false]', 2, None, True),
+            (u'Colon instead of comma', 25))
+
+        self.assertEquals(
+            scanstring('["Bad value", truth]', 2, None, True),
+            (u'Bad value', 12))
+    # Regression test; presumably named after CPython issue 3623 -- confirm.
+    def test_issue3623(self):
+        self.assertRaises(ValueError, json.decoder.scanstring, "xxx", 1,
+                          "xxx")
+        self.assertRaises(UnicodeDecodeError,
+                          json.encoder.encode_basestring_ascii, "xx\xff")
diff --git a/simplejson/tests/test_separators.py b/simplejson/tests/test_separators.py
new file mode 100644
index 00000000..8fa0dac6
--- /dev/null
+++ b/simplejson/tests/test_separators.py
@@ -0,0 +1,42 @@
+import textwrap
+from unittest import TestCase
+
+import simplejson as json
+
+
+class TestSeparators(TestCase):
+    def test_separators(self):
+        """Padded separators round-trip and give the expected layout."""
+        data = [['blorpie'], ['whoops'], [], 'd-shtaeou', 'd-nthiouh',
+                'i-vhbjkhnth', {'nifty': 87}, {'field': 'yes', 'morefield': False}]
+
+        expected = textwrap.dedent("""\
+        [
+          [
+            "blorpie"
+          ] ,
+          [
+            "whoops"
+          ] ,
+          [] ,
+          "d-shtaeou" ,
+          "d-nthiouh" ,
+          "i-vhbjkhnth" ,
+          {
+            "nifty" : 87
+          } ,
+          {
+            "field" : "yes" ,
+            "morefield" : false
+          }
+        ]""")
+
+        compact = json.dumps(data)
+        padded = json.dumps(data, indent=2, sort_keys=True,
+                            separators=(' ,', ' : '))
+        from_compact = json.loads(compact)
+        from_padded = json.loads(padded)
+
+        self.assertEquals(from_compact, data)
+        self.assertEquals(from_padded, data)
+        self.assertEquals(padded, expected)
diff --git a/simplejson/tests/test_unicode.py b/simplejson/tests/test_unicode.py
new file mode 100644
index 00000000..6f4384a5
--- /dev/null
+++ b/simplejson/tests/test_unicode.py
@@ -0,0 +1,64 @@
+from unittest import TestCase
+
+import simplejson as json
+
+class TestUnicode(TestCase):
+    def test_encoding1(self):
+        """JSONEncoder gives the same output for unicode and UTF-8 bytes."""
+        text = u'\N{GREEK SMALL LETTER ALPHA}\N{GREEK CAPITAL LETTER OMEGA}'
+        raw = text.encode('utf-8')
+        enc = json.JSONEncoder(encoding='utf-8')
+        from_text, from_raw = enc.encode(text), enc.encode(raw)
+        self.assertEquals(from_text, from_raw)
+
+    def test_encoding2(self):
+        """dumps() gives the same output for unicode and UTF-8 bytes."""
+        text = u'\N{GREEK SMALL LETTER ALPHA}\N{GREEK CAPITAL LETTER OMEGA}'
+        from_text = json.dumps(text, encoding='utf-8')
+        from_raw = json.dumps(text.encode('utf-8'), encoding='utf-8')
+        self.assertEquals(from_text, from_raw)
+
+    def test_encoding3(self):
+        """By default non-ASCII text is written as ASCII escapes."""
+        text = u'\N{GREEK SMALL LETTER ALPHA}\N{GREEK CAPITAL LETTER OMEGA}'
+        self.assertEquals(json.dumps(text), '"\\u03b1\\u03a9"')
+
+    def test_encoding4(self):
+        """Escaping also applies to a string nested in a list."""
+        text = u'\N{GREEK SMALL LETTER ALPHA}\N{GREEK CAPITAL LETTER OMEGA}'
+        self.assertEquals(json.dumps([text]), '["\\u03b1\\u03a9"]')
+
+    def test_encoding5(self):
+        text = u'\N{GREEK SMALL LETTER ALPHA}\N{GREEK CAPITAL LETTER OMEGA}'
+        kept = json.dumps(text, ensure_ascii=False)  # no escaping requested
+        self.assertEquals(kept, u'"%s"' % (text,))
+
+    def test_encoding6(self):
+        text = u'\N{GREEK SMALL LETTER ALPHA}\N{GREEK CAPITAL LETTER OMEGA}'
+        kept = json.dumps([text], ensure_ascii=False)  # same, inside a list
+        self.assertEquals(kept, u'["%s"]' % (text,))
+
+    def test_big_unicode_encode(self):
+        big = u'\U0001d120'  # outside the BMP: escaped as a surrogate pair
+        self.assertEquals(json.dumps(big), '"\\ud834\\udd20"')
+        self.assertEquals(json.dumps(big, ensure_ascii=False), u'"\U0001d120"')
+
+    def test_big_unicode_decode(self):
+        """Raw and surrogate-escaped astral characters decode the same."""
+        self.assertEquals(json.loads(u'"z\U0001d120x"'), u'z\U0001d120x')
+        self.assertEquals(json.loads('"z\\ud834\\udd20x"'), u'z\U0001d120x')
+
+    def test_unicode_decode(self):
+        """Each code point below 0xd7ff decodes from its four-digit escape."""
+        for code in range(0, 0xd7ff):
+            escaped = '"\\u%04x"' % (code,)
+            self.assertEquals(json.loads(escaped), unichr(code))
+
+    def test_default_encoding(self):
+        payload = u'{"a": "\xe9"}'.encode('utf-8')  # bytes are read as UTF-8
+        self.assertEquals(json.loads(payload), {'a': u'\xe9'})
+
+    def test_unicode_preservation(self):
+        for source in (u'""', u'"a"'):  # unicode in, unicode out
+            self.assertEquals(type(json.loads(source)), unicode)
+        self.assertEquals(type(json.loads(u'["a"]')[0]), unicode)
\ No newline at end of file
diff --git a/simplejson/tool.py b/simplejson/tool.py
new file mode 100644
index 00000000..90443317
--- /dev/null
+++ b/simplejson/tool.py
@@ -0,0 +1,48 @@
+r"""Command-line tool to validate and pretty-print JSON
+
+Usage::
+
+    $ echo '{"json":"obj"}' | python -m simplejson.tool
+    {
+        "json": "obj"
+    }
+    $ echo '{ 1.2:3.4}' | python -m simplejson.tool
+    Expecting property name: line 1 column 2 (char 2)
+
+"""
+import sys
+import simplejson
+
+def main():
+    """Validate JSON from a file or stdin and pretty-print it.
+
+    Reads ``sys.argv[1]`` (default: stdin) and writes to ``sys.argv[2]``
+    (default: stdout).  Exits through SystemExit with the decoder's message
+    when the input is not valid JSON, or with a usage line when more than
+    two arguments are given.
+    """
+    if len(sys.argv) > 3:
+        raise SystemExit(sys.argv[0] + " [infile [outfile]]")
+    infile, outfile = sys.stdin, sys.stdout
+    opened = []
+    try:
+        if len(sys.argv) > 1:
+            infile = open(sys.argv[1], 'rb')
+            opened.append(infile)
+        if len(sys.argv) > 2:
+            outfile = open(sys.argv[2], 'wb')
+            opened.append(outfile)
+        try:
+            obj = simplejson.load(infile)
+        except ValueError, e:
+            raise SystemExit(e)
+        simplejson.dump(obj, outfile, sort_keys=True, indent=4)
+        outfile.write('\n')
+    finally:
+        # Close only what was opened here; stdin/stdout are left alone.
+        for handle in opened:
+            handle.close()
+
+
+if __name__ == '__main__':
+    main()
diff --git a/static/ajax-loader.gif b/static/ajax-loader.gif
new file mode 100644
index 0000000000000000000000000000000000000000..f16ebf7cbd4f28620c0daba2f4a36ae0196b3d4c
GIT binary patch
literal 10819
zcmb`NXHZjX->;L91QJksO9Fy4X^NnNiVC_BuprxlbVKhX^w84?z4u<FS4FB|0BI2r
z>7CGf5evn_!Tr3?d(NECJ2Pu0AJ)uTvu54bx_-a^t*&`j>8i;TfD`Z)060EAmb_Eg
z)wf#RL@#+W)ka%x?pW*}*_fIC+&j2FF}pLjxVO0SWp(}A+xH6{y(=4A-?w-72Szu)
zd^`O1{b+b%YyaTK$DxhUsqNjpgDLv%hfiy@)VYJh9~E^o`Bf9b$IM!4PoLaT)mD=~
zFUJ4`006?j5qF#|Ok6F@g*<Frt%Xc%O>p)Y6Z7*nj+PjJ@F5rmKRHY0<N*A+NdV+n
zNGQVGCd0b8+<v1OEA!FSVHQ`u<Fj*2&BAJcnV{r6=WhFJnf-;X_saAu#!B6<u~ma1
zq_*92B*wHVuc_&}+0L&izcj{nkoCA7>xC_AA8$W@FCrO7u?zADA-VZ`x<p1J2}EcZ
zJ|a0PAl4Oa2{D#7GUwptgTr&mLC8GBYo<3$NOP>?tC|{EeZ$+PS}L}+>0Lu3YulS{
zT4!^6L+^W9RZs87mhra9j_Iz!%2vK2CI%TW6b5HzImN~dVJ!O2!OQxY?dQ)g-}ZOc
zHbx@}1$YJ+?K<v)uqp|_zU|%BpV3C-hG@O#>z}{t&;P~OkgsY^BS?Vr*pM7Zz+VGy
zGfn8J#m3_yoX+b#a<TCrb(B1oHxD@r`?FU<W|XfHRzJQ}Pd_3{JuU9ddKP=Ly<xEU
zQ=xu=^YB`{?ej!wCX_BfbwySm`$RA4{%9-F9c$HHc75N`xQYAVdwZ(Kg%|JqPmQV>
zDpjI8oCMB@qx33`Xw_VU0cm=BragGsS+$bevLq%hnO&KCcBH=3mDfvuPp-Rdj{6&R
zHa8Kz$xJs|?B}2IQQUsp?)jr!!0=#iu`;qPU^}gDYqibg#q;S@SNLF|EZL!#x_2<U
z1j!tYLT^re+v?4Xtnl;mYTlg=t-X+0_xtCsCHEIbE4V-qjtkonGHF?P5s(66ai?ct
z*tNR!16WNpvcbKYNy34>db)8GULs#w(5+~toZv=1YdVas3W&uFU4AzBgx@vEBz#;l
z-pu9tZ)?LyrFGoG)7w(&W-(&|Hk`4;RUNspd=I*5q2ess%;1CmgIS<4v~VcVWaPQH
zANrnVeu}B%aK0|an0w{9^-)|O9DS)D9?uwbcai9O^ScC@pw(ezOGyY?wF-n!Sm#Ke
zZy3)y(6~018z!}0`0yn?_&rY+<>YT(f~^#{5m)wlacRx^dP!x6)JAFbi0ww11o>n&
z{9EsPXXod0%vV-{ohI1IX%fgQW4U^o;-lR1D2o$i=iuqZ>VxzPB9Jhr87P6lwqYLL
zzAmxh0lsOW7;-|8F98?s9psNE+IvPo(qi06Ws!-wc9~e{KMO$+^=Bn?AdpZ9E6B?F
z1A=K_u-m%NuW@h!26eF-W1SeBa_##tKQP?qva-5}9POT49d`BGnqS=b_~meVq;S`!
zgb_=kIvvv?GI&6n9GF3ujY-D@NP@D-pFf91Cy^u1oI&?!IJb}(xK)nDnXbl&f}s>;
z;#;8si@QnEH<n9nIF~!)gv54TZC)*WOqbQ1XE}<td>k&J3gSNcYVjbRBW<Eu>RIc(
zvKzVb5N~!MFj(-4jL_9=*-X>+JQKFctTLloj<B`(gsg2ci^t*WW%2Os*+zaa>)kA>
z9G&XPD<bDp=P=*pjr>ujY_f!g_$c1eN~62X^~Q5s<^MdWux&z|6ZtNq_x%Nv)pIs%
z<@aqc7|CWG#B)lO2<M5Bz}Tf7V4J(*rC&s;9PG~X<w$3u2}fU6;5YAOW>7spFDxV{
zdYr!DyZ`O|<bBM>uSUbIfsI>M$}+#ezuJX`W_;eY)V^^4y_63+2J*_W0U<oPIw?>%
zepJ^$z`V=Il-pRMH-O)ERX<>)`;978*j-52{u7^zX^6D`^EA)}O5Ge(0N%+LbVWZ3
z7{O(%Xc&Ih8OP#|MC*!1{kR+_8YV)k6N#2`rwV(Ym*O{JWIvY#0x~KwnK+*jILrpH
zgsEGa3u@KiQ+VRWO+tOg#nRJmpN$nKR4-XirTUoGoH4@A*S|=2kmW7Na^0?<&XIR7
zOh~8kdrd<lW+Vxo1&4|F#B+E_OJ^3UdJ;%lGSRf?HqkQ89pSDm6}n$kJnv0{T+M=%
zAei)VmF`g}HyOm2ze9vyd8He7o|U$<iP@U4EAPMhWAoUm;~v_M^7=fb7~FOGN6}v<
zH&;cfJAE{k!t<|Q1%};}*PM&nnNXUyLTISGq`=UXrNQ6M>pif%1ohd7+!_eVX}T-u
z5(Z#qmf?p!n&=XXnBierie$(vu4-qu#{&x`ScFc29Zax*vO;;4wG^3Ly>pi2dQBUe
zbn0P&ztrG*zPEG!kCk45uPjJ2c}{EBa&mFKYwyEbh)Y9wN5z&wFSW8F5PKN_dY3b9
z;`7C$R?X?Lu(C_}IaUiLI}_}`M=#WHpaA=gENGdp>e$%g{UTdV>#4Ev@4p1+=Eh|Y
zro1mdCCr%)mL1?cSM=v5Lq9Hsj%wJ?9j;^ro<BmY<~{kO#$H%Zezaa%yM44#*?IoQ
zX7#AwZKi(@7lDj6IHoJsU-1iAzKJbW;fF73PvL5nqgB3eqU>=bC<80f*9MQpkSM;v
zL4@!y?`T^T#xa7`-zO=YObN=sCp&rsK!P*uQ*+WYZ3q>q-g%jJaSkZK)98~=ryUBy
z2k%0_Pmlq!a)q!m4GqDWdi$e#2Zx7ykyeufGs7^bb-%U6(h%L%cXMWRWg-Z<_=RaD
z#O82mXO+I86OmbWX%C*m%p0DiNZOz0kJ1LV0C>PqrE_SsDg%>{>IpYgh~2Rqg2z5A
zl6$I}Fc>=JX*Y)`iIH17<*mx=<%c2iX8DHQdzM=1%E1)FU8;FN(#6;jGWN^Mz6`Zg
z&<)Aqf{`qahF9kBr`Ecq!X-Ie#WAW3V6YsIbQW-t+~{$LdQAb4@DSW*OFC&20rFy&
z2lu6B?cSk=GAiD6KiHjZ_Y_mQlBneTpfipWpo2P4u;}B|Sh(zvl(O1bEWwtawu#vs
zDoxa*pm3GTgXO|jcs36RP#Groh?);nb#dXA(O`Z1h~(A`%ekL<(?k`t@zKbxR*vAa
ze{vyYUvs+mw~hW<#_t);DWKTB-sc_>zRKTrezuR!80~y^%k=lqqYE7S#8-7r8!^k*
zu@c*hu!cZ3ZM2|$xRF&72sAaU>RIVf`2g2N9%~6ACNs@m=ChA#32CY?oRJsOQZWma
zc%1tn;!=!N3wm^FY!rGnMkz1+0<F$0_=XNoZiLKj{*237I>{;Ffh|Fz;WC!gr9iD1
zMbiLDHYx$kZmpCK5pN38^<Hk5%(ix&u_*AOy-hfi#(|eug|c+jrdaOk1+I`@341N&
zP_}JmEv7WB9!GA-M!oQK&!`K_jD|{CV?9Cej7Yes_A1FbM+MKoQr$gGtp3C~9diBd
zK{oWF9$-0y#r0rH{s02oG^Z(d3YLrLvz5AylHKhXG0+X0V-xX<p&PGnnMxCCIvvF`
zD(Y?rZQkLwwsSNokTocO9joTer&i}Yx()-gNlC{w=;f*;h&oE1mj^IQibH9xo}%$M
zS<eUZ#*g{Ub7A)n#X>Ko=!}~{zBHD+P|(rL2v)lL1JiZcvF1V8IYn<d2i=@B`iDJ^
zDS7+-6gj|UHc@LJlo8!v;7I|=e!ZD8aOl!s;0xD%d0+jiL@o#TR}R#lUn>36ul$2*
zPXmQA!6NM!`ns)A&3bQWMdGq~84qeH)gynuzVDvLTL$P*=d`W^bhACum14kqbeDh~
zp_|ifzbq4R#1?r$S+!ur`v(`>1h<z<VaoQn;mG^ESJfK3@Hgq6F_VY}A`&<AQZp5!
z*f1TD*{l>n)7e!bfAk@|=b<uQ___O@7o+?~M1Jn|DDM3H(yxBu*Vm!vm|x%iRS^la
zlH271r@9_>Iq{*e2U%I=tP_;ClNTT5apGYplxKjaubZEPcYqHo($AKNbHXsNM!Sbn
zpuPlK5683&f*%7Glan49m06IMkdz#S^YTh8!&k>)Q5LLLGDaR42)y$IEGJ~K4n6_P
zAQODB*FVbU)6jIUwO{nq^e7bh(SKoaEM{_GXoP8VZhQJOY<a>Ky0duT_T$K{jZrJ6
zfw0{Fa!$S6Q1uq;)Ke8XJcRIsl`4m)RxJ=gjG{p(&pB06gdp>A&;ucY1u;hA@7ub&
z=)8wX@>Vws`(G7+)8uU?3}IYiq!ez$5SjI=<^Du*7r}U{i|A0&xq$EHhYH0#xytqD
zzomRr?TY89xoC~Y<JC?>I5bFd*^bjJG7If(LTG|fBTfvJ%7Y=zzH|H1k()r@ou!h>
z^c2FBs_5;*M>-Ul@f1okzm#+hBjTc!zu%o>fp8Xr<zPtsvmcv$yVjT@;W{H#p=>gZ
zb5XdTUO|K~2l0yP-o+uH3!TxU&-#3XzQP71v?a<DZC%%RYGS?pln<TfdpQk1miypb
zPR+c2^oZV!JY01zQmoBy_L*Kd+TzXh9Dc|!>&Cg6fBP7-@|Vyo7}s6H2Sq;U2fEjE
zkDvm0ep{%LSKY)_pu9H|@MIe5iAgYjPT~W35#u0~vye{i^DsWa#1<&+X<|=^;C5lQ
zvC7R3vpc9)xY6LLX${jrkI!8K%G_r?vWb#kb?{IwdLZh)@Jt)k!<`T;XvQ36!|x(V
zi?#Ip6kOet_Q75*--oAbZC)NW6`Yh@Sd?4<hV1Px`**GBol3!)p0kR4#h<?n_BtAq
zNDk&$&&mERb}+)g?kZ`-$dWcTeo5Ia%QkpUwt&}3rpR`#_@z!_j>ao}73o;S*{qpj
zdE1rZ@Zr1()!az|g|P~%@v5CXO^{^wIxodG^0?|%->BW?r@++ABGReRtzteY-tnA{
zqd+k@7@MV1m^)G@97TuKCtcQDW)hApI2*O&|3fM@EF2k?v=R7oyFjHyjE2ZICx8BC
z?*5$vD%<A1cFw~5)=e8xXvGn8UYNjB)T2(B0c!^<ju&0?4H7JJ>_%g2AuT}riLuc<
z#TDg;X0vJ@E_Km@`d`2|0+puvSj8QxKo3Mhz5?&)bGr2ku-sVsc$fL%W%-zkrwSl<
zHeNm$8jpY2H@p-tP+oyKvQkx(#ybswbIwySsZ2k~MU_I6Ni5HdOqI@bAp~`ma%jS*
ztH6w0g7yo-tx|--@k4~tnBoOv<AqOJJXh8I#t7w`mvcq*9q3o2b~%?nt!>qrN16SW
zg<g34T6NtYMu#w~+YA3gmY<)yo}XCD|3{WFEB}AhTCAv&-tg3FuRF_1GrK^qba5oh
zX=T6NG11?6cMlIwXIq#bi~&OmqXhbeV!fa~uKpGzay+ZQT?i_L?2HeJj!p4-8JryM
z5ov>W4D&i&oMCH@wLn4s<b8KmRwyeR(S`Vc?1+M$u;m0TgT21_exF9BVSV{Q9n&LY
zQDcjv(5kBbfuR|?-PG>L>_qU_#o5H|HKzTHwb0SPzB<=lHsSRr_%;GihDqkEyKoD`
zNyxD^)TZOfkwRjILv>ZLWU$1oV|{xSc@Yvw_(_QQ_@3CkI0;TezVVX)6oq#;Ew$m0
z=wiI2DSrUtSfM4bC4hdtR<P+#Rq>R%JpNSTapC<NIbTJxlc6AX?`Ne#=oWG<R^n%o
z;;B26b=bePN-RIh8rQ>qPq(L<I9_gsLl@HR9umyjvCNF_VQ4+mccEgg3#kAX^QJYS
zmEld@Hsep6@cSxvWyhD^6%UT90f1X@(8g1p13O>~#UJK=Y{Zsyo(kuYdH+TQb>O(<
zlqymlin{i7`BlJ$PUA-{ov{8{`3uIqUq8R&tlRl^Uihl<nk%WzEi*$|d1oS*H`DU)
z2Y6D7&XZ=eYEcQa2p7{qAA{lqzK=O$_*chF%3<1c!b{0qA$vxh4g~1LPzcU*nn84V
zM3BZ=SB?}b;~@SXUXwtdVX?D;m&-jwO!!7t$Dsah+I++j>R5|EJ3kg^z+A^@#CYa!
zQj!Ntzarvlw}!R_4x<+Q!1HOj#=QEugnA$Yn--geg{2oX17fHD`T@uwL=hO5vemwv
zJg>L%GEK5UEeB^VZYHSm&{;AO{9#w|p_Nwa8%ufn0T?e{l0KsD{m8u^$PoMRFuGvg
z6TWU7NL!IC%8XH$4Ek7h#N%{^M-Nyur|B`4J52DfD&f4QR9u=b&sS>JR<6HkIi!Kz
zi2hR4$qW71Y*l)k+c|f%QPjA1?@azVYkdItQJ>N@S!yDA0?M~)vk=tW7X*wJ+SWaP
zFHTE(KDs-)c(nXhvs!U|P<_IALv`qAO7q3$wW8oMO_*o|du}T5T|YvpA{SWFxZTmY
z?Jdd7pn=ANeD{7x5FPYjGnwIU(x!T_g81S%{qLIA8R*Bsg3v1$(!^3Qt&p!?N<W4%
z&gv^cgqN7xj9(LXmD8<<cu=wy0mON3tLXH#pL@2KPe06ru$2KQV73P;gxKol3HyqA
zak&e_2TcyL(DRSg31jaGVPAk;yUfq&>{gm}IRq=E{aKwWGg%&?lZQ5u8=5M0ZLcR}
zml9LnJ$$VI$(s4)xf(X<TR7_k1B6Xz*bDy&IgUTJ>i(pkxBJ^acK&NECv1`US2+@K
z!jbFm1H!$Ugs;zF`-Gab#;#&WcaE2pH}SUSP_j411qlldfsuT?ph3a0;kYPrG^<-!
zLVyoLN@{$P&*?08+pvf{EB~-!R7O$^-aUfi?Gj?Ij{6TvTu7|te^AoX!-VXP3x?2`
zMn?OyLt)*cGvh_E(=#Leb45doOP@k*yW#8ojc!A`i&NQ!$hFVV)IruEVXA~|s)~#K
zW|#=0))OED2eeX%PM9Du;|2fYD2#s`MN-vFJ<?zFSX9WfWl@ufMKH|p>YgeoQSM1`
z-njF^horN>V0+ImOX?}2_jzu>o{HU1d|<JimrND!%hgoV|0U_R(qH!X9r1}nJoPU$
z-^D`iN;Gk@mUFYPjmon<8UOw5@EfEef!c&s=z3F-C5NtaX6G`_r&k)Zz~~oAqjj>g
z@gsXTU!(Y5E4HPv-`7phyJOMpBzEqK!^h9ymf{MNLhbC$zx>ZKhm!3~hyhk0k1s}S
zdg)~NTVGDrh^g{`rI4mx_sJi!U+o&iL^CVXD&MSOyl-77Z<%x&8f7-PerpP2JlH7v
zbpJ+_vn!-^>vm?^^d=kx71ajXz_P@Xyh3Ef0mm<RP#VcM`0Q1Ttm3M4lE^+5l`W>d
ze3o=dp2bKK#@)s`Qi16&r8%&GD^>`!)PkD}i6r12dWu}LI_n<l5T!~%n(hlw9Nn~Y
zEpJ%TGvNSZIUzrmsID9XT(GW|^-!>@2;uKNu^1b9`B*AwFL-4nvG<aKcsNg1^0JE2
zk$6VJNLC%eqKQ9Q-}T%pvDuJ}maY`=-#Usb))(Oo;uwbxp4=pd-j&J3n0DRK7)ijn
zVaP<)m}w{rS0dVd$ag}uP}taIs^Ez}UMlI;GitG$UvEHK-V}GixToj3W|~*%oP=s<
z1`(lGIi7rEQ<xl{l8NcKl1hI)v?VcpT$XXvVQ-wLg_nc_c(R5gy#x>GQJ0!6bA#Xq
zK^qYUHL0p@cdyhD^vOm_6_EE6p)J0v2^*=DWBG(d11~rQlYT@~FKq~z>q?1KiGkWT
z_EXg5!b&dpAX{3*HL7Z5ScC`w#)IyPI1W@)RuEZybk(ZiqV{qoCmM@y4=Z|*?jw6&
zXAEEdkgeK=ha<!#A@_!L3QgeWRhLqDn4Y-dwaGxBwevlJ>Xram+vgt!jDlU<%oXf=
zjd?VxL3|vAs)Qk0@Or6x9Y<{?h(R0+fNcFrwGQF#ku92mTo50adK*xj5Z3TZKq)EY
zK2^yuC{jv>?nzt0%}0NftyG?2zoUE5>$rA9$|puKgZgf<2YLVov3$A0VX#>KWBVVD
zJazs1{h##nha(mLO+T4zpnt7S2>`XUNnY<e{m7)v5d%e4i)8p!a^jSyg%nu?J&~Rk
zK0a1{?l>Y0<9(Xq9~MKjgeF7<$9SOvtb;r}VNMCor~N%bb0QN13qnG$C3!*FF;$er
z0!O5}1<J%&njt5R74HdUMVvIRACTR|fj@FGI>rS1^rm}!Y!W|U4;q<e>UYmtTUqT6
zaah`#bPO5(0u3$PU+F*kzTB*uDjGgpi`^Le=7KK317RoatDME=Z9y39{{aeDGM(5F
zAqYGU7qxK~xpx8-v|;e)#Sck*oTWWubg>?@YgQ?nhkGIq(`9`-SnfS;)y_O~Az~5s
zY*|a0H7LhiTWEz=pva8sPY%St2SQ~`bwmG@C!F)Nbo@#xs201T)ulbUZP4W8meIzX
zR8F>obJYG~=6hrcL2z)6d{AtWhcJmMjBF?wEcQAd3f>LV16tP;71XtSyej&J$4(Mf
zc=l}w%<?%KU!`iEsVn!qev;f2vBsT)$Y2}=sNb7+O1_?Hkal(19v;J5a6a92d9iiH
z{aps1^5-v{Ns4Vc#`VT)?}StRXMaxEo|;&4tj*AKbKjrWt4T4hFH$*qGEV{H#}**2
zj!~mXRZE1M(~ScIOHNQi3zSW~MxTTbucYJoAB&&$=5UN6P*CSdIU!DN{i*>dQ+f{(
zPSwy0?^F8H6Ee5eE=*xxR~n_f6y_O+UKH%k4Md=|(QroNEIJV>*PmzDZDO4X)q89`
z7T()cAci)&+rg5=q9S4FY$qS9l6uq*kx;lP4oHNwe@<TZ`mlO+DhwmIJRi=n_$ED*
zGSg{^YY!&(W+NBXP?<c`LyN409Er8;j}L-d2|Cm9X<>!5E)^H{d*TF05y$AXVu6<2
zf}g~IJ}?`oRcly2j+Zd2U^f=AFBT}BD6VQeo4OfXmcl4qO!Eq)9{ap6vQ0MX%&=-H
z4f!Rp4r6o=XfXl-))vh!6eB01jKwV%8%NbB!eO-o8phH5EREBYE8D5L4aYTO>(rWZ
zyUf6=6SR`3m(!zip_})DDzR;F@wq1O26Ed>D#ET6z`=x7f#8-5R-2PALXGls)fxf$
ztrlJY3WK=5OCCq5yO^KV<CRH#^qQeWkCI)D3Zsvgw2i^@lq;`|<;>i-&0Ge06oP}-
zG~e`&j`7ueaPjq;HdRnRVF}+eEERY`{rQXbF<QGJ_166pmb?pTs+{o|^l+=|hD6Lv
zGx$9x%(+XjVaWme(^63U<b<nN#2HjQ{d+O=V9EK#4WWxm6tjlnSw7Rh2!NK-@b^6b
z)4n=h|5Kg(4^aNEnEad7NdU2p&W}Y|U#hRPX;ifQdi4fQbo=1_c+{1H8}3LP5ry)x
z^(S}`y(nfjr`=%0Ff7F{DkcnP8EEDg<4KN64k395`ax4X!;3RZ+(SdXE3;TJAQ-E~
zABMo7=+m!A5LN_&iAF=V#l^z9n1)A~S{poBhen56;~Y-BWIWzsakMqoae;Maw*U3V
zo!yQ3xV4e}P~y?&P0;T<yALK)30`o%s6UN~2?u2^TIKK7KQkO#!(F;cJDBUjNxb>2
zss<AhI}UoU!2x23m5`3G@4hJ39;cw$`~ddKN-LZN?xTFDu<#*UIP`WQ|C5&kS!Z^#
zeDtZ7?eVgSi2EwklUano#UM3&_5=mOIZ&LA?MxxsqCb_VM`f2y+JYAQ-Z1kLh;Lm6
ziBDCMO7)uT80~}%6NKig-NfEngzZ<MVIw@xPou_n7TXBp;@Xu-awb%ljffhG$;I_I
z#TTCz3T1D=L5%L2es&IbAk3V2=1wRpu${`oBYN)qoX74PTJm!ZX=U8kM)QIa$W37{
zlbKibnCE?sl};=3jTb7u|H7g7HWSlX1)9E^p4uL4ljv={>TI7ci6=Nnu?bOc=Sj9@
z9s{y1Dpm0x((Ve_=f-!=Lc4}7CVV-ZzYCGeEe?cDdad!oRwY%8yc7Xfz$9tEJFo@H
zpQV9NV3)$?;CPhy&_w^<;T+26GF>xUZjdG#4(56S4Biu?;zRB9RM;_aTcIVgtr34V
z(V)-brMXy40u{8TCubSlYfl9vCQ6bPOs(Kn5^8(#tK#t=%k;u6Bb*8>vAEl7EDXai
zb@mAVl!N>fQpD8)pTd`cR=Eh7U=YyFa6HLgmXgBb32c2vD4a4{IaT=a?@p?hqa-~;
zU$$8)JxX8<&RSBvoRVk26(F@)l3yiJ0&b<;+l=hgk1DOmXlLYbYinJ9etfyN{+wai
z2jA!6`4X2TxuEn<tHPL34ogQ{5wDuDhRMT1z52_0t7b*(BloidUT!7ngxW_N$ms2A
z0kEL5=vBRzs1_!RW;+2x9)I2uW;vtW-up@5--yk#tr-Nyau|b#5EaPHBm+!&rjKs{
ze%ecTo@3MWbHRjoZIaOYvOCN&k9_a@VtB-x%{?Get42Q2cJD!Qsf@(EX#4itMi%-{
z5)sy!w#G%@^d?o0oXyOWyPe~ozp}KvBaJ6Kro9r>PA}Oa78s3HJU(R(V$|Lh?CMGC
zsG4<=l)!dze4Vz%ve;wm=p1anG36pPyq+Jz88yliqFE7XkTE6{`ucoKi3KitJigp=
z=0@teVqPw2CIj%U`h+KSEC11wKRo&0>g0d5<X`5A_AU#`y1Hdf(tc)Fr1RpV>(EHD
zUnYI16H34#y~)1*1R^UX%+Ji-BNRr7^&>=`Bp!yKM4S&984(3d4uDzN;qCH$66}Is
zdd3DsRE0QsK^V;c!3l_i^>hm61Sm|1-d-d$yBgVj5_6bZQap#pMkcV;(=#n$7}&zt
z(p=XGPCj`Jtc`9Au5Rxv?PY@w7eCz&$YG3}y-H*X;s3)Epb4CduP#fSs0NEgsEl<v
zsS+4?I1S(Ks)%%kGYcN$-}5=&>5fJ6E7xf#wA@dUw=)&B*)yj_$#CwHVJ#y4QFl!8
z!IB(ny|Gtq^dG?8#5+Pb3Z28Go=Ma6U`$F}St`pA7CyGT@N@svB?=E-<<k+A8tg*I
zTb=#X$+wsleS_3pjB!2kZ1Kxb-d%7s;%xq#@6^hfQ%s@;gZ+G!^sdos8}V6n6`)U8
z3AKnqzHi`qj!mK#`mk(@nOjPOt&vD2Ks>lhO5|E@f1c-g)%4-6as`B$nM3B0$`o#9
zb+F`&Vnn)Q({ktR-3z}2cE4=5a%=Sa8F?)?z%P}0uuS{@+>6Mqh(LKZyVZ@gkMe@P
zTvcqr#eDuV6Xvk41Va0!0#!i~O$h+I50y2lIInn~7v@OBx#xfV9KLJ<jR+5#la~m=
z2?zK7#dQ`f;?)@jLb|J%nV#9ZykNpBA8TTX{B30jRc<ZR0iA0eCPZkMu9^k>?N^8=
zO3Eb##*8pg@t!>BYJUImx^FMgr!0BQl9wOiqZP~tmeZUtt^EAPR+MB*a$2&@l#647
zm6etMdi^-w`K(8phTIhrK5<fZf-ZkM;SiPeQ4ef&!_tc<H41?~AxpPz9@TvP+3sR2
zX1EiPQ@nog!eg=0168(jF_E`~r7kcW#I4Q5ThYA7y;*+kyOg12Pg%n{n3lp5t=7l!
zqxjf#=-ChRYFF7iMoxW#tJ0;DWi*EuIT<PdK@N03Z_q=*gd`6{2Xd6O3k%9^Qg7~(
zF;Z)_Fam8SKzEXPmK!H*_;owi!J79PRo|BCcxK``3z8O7ew;2@Fx%d)HE&~mN7?Zf
zmtWiMJUE|P4x|2&6o_<`b;-w*Ik9ICy*s<F!Z}2t<l2QE$^6bWLtt<izxx_kg}F;6
zZ^THy+Vb<^Pl+Lg*H^wJmenBKypXP5MG!MqCP`=fy8WoHV&K+y^#0{PlJZGeHsEdp
z{EQJ~UdFM-&h#%;Kk#gj10;}vC%y4pi3b33_jJb2O!y<}`hxMJ4|UXzZ~EBVT`^D2
zE3H(}6tB+P{Y^7m#^>D30>|ExHJ)F*LH{s)GCcloUGk?r`F~>0e}+8&W_xm?DZA%b
zl_IKzw|2R%>>e!llzR&Xzx9i_a&XLmgCRZ1C|`d+0x5tL=w?qKhr=T6@x-`De=}%k
z7#8N57?K<tA7p2f=@n6wRNxgDjK_dHEs!S-?1`g*PIj8S^CqJ~2pWxv2?-^CA~*I9
z_kQ$B9vbO=mmS*xnwo}^X6F`|W(HtgYwe%HAgpU+pSQm3EX{fzE_~no>14nQKXb#5
zPjnMOB?9Ci%zQ$BCdKWc9D<krneZ?&av1j1REcy(a{P6iUyW1E)r??KF@3wbCq|2h
zaahXO$me%u!VLB{S6xJVvn4)<vFHyjc81*bXeQGYSnp;(G3%>VvbH8c5qNg%b1FcF
z2of7wB}+xM|DUiU^q6qD7DVq$k5Uz#wB_SkoJNlB=r`Ika$cG0DML4TZ<LpPPr|-{
zIi}iZuy~ehoC-opN65_W%+f+H)~bbhZCkv_QuB!L)@vQ(2A`I}%e9O*!Z~HYyffZy
zN)VnUeWCJg#km<+8neX7$oOl&eE?+EZrXKW(J8U>%}kAxBAwhl`K(e;;AnS&v+`X@
zdgZn62e02{+TFOabTrw%GV(`LfDG&^m4suntv6y+7hemV3=$h{lt+Q9Reh3pSoM+$
z<=5>HRuCi>3cp}B&0?`*)wj&H6uVuA_73;un>XgqI~bK0hX&;s^z8DPG75CXFZjgy
zYUnbu6Yrwo(6iR;!8sSRP)<*XBUu0)4oi0L-$jEjBQtIE9)i4r6;&Da$_sm-X3#P5
zB!noH>N@nMJ`9R=ELe^kD|(H`;nsuk^6p2HiE1ehl+`TU`9zD$K^>CMlM%|nL;^EY
zLb46)sfwtNfZT4*<+Fzxc}0EE`nIluet|QEpQo32aJl7hyYSi$HEGv4UkPAzeKXC@
zfQQ{6ue>CHr})+TS2P_`>$wf-<C1J)X;o~$>10^G#G<$^B*<YzC$ij$Z=+tmoCnz`
zAs8(1_9pGRL)ckkrR;D!o_Z6{g3muTqL;4(l~=fGR+@$*57u`gdF9`VN1#AH+fl41
zg%&fz`>#~F5=j1-v#5l53iNE7nvvm)zSL3YcQq`!7K5@OdZe^d>PEMBXgo8Sj2hPG
z6GL8=rq~emG*JoanRhRBKVUEv8@f^wU_L<W4rl@DU^@EYXfpVf8U0j&^uV~ob;EZo
zJ$(5ZTzQFuwyhn#(^IY@9{A}YJzl=)bq%)t3crfl3^}KgLn$bM;Jz_q*SWv%(*-+U
z8}e0Es}Pb8O)$UBrCn<%y|N*^3%Gz5scQf4Rue5XUbUe=E$shj%73r|69xdT|JjoH
H&+q>L_7_0j

literal 0
HcmV?d00001

diff --git a/static/favicon.ico b/static/favicon.ico
new file mode 100644
index 0000000000000000000000000000000000000000..ad4ca66a17637746a5c33e5a1cfc46e35754fac8
GIT binary patch
literal 21792
zcmeHv2UwKH^Z&l}`q2ag8^(eim7pLN>;*+)iBgRs8VhO=>2e36#%@FrrA3LTNz^C?
zMVis5!2-qxh=LspNE9QSl>5!zduQcPN%`ja|Jlb6yKmXq*?DJoXJ_X`h(HX&i9lw^
zR0pBYq1?SYcl~91gciU(Gc)eGgC0V8RtPn1%3U88z{|rC($!VJPa|~L5up{14#Oov
zQz1N+j2tm!9Da(yXCZU--ZcXu>CKTt22SuNN@KlNyG}GYm1E;K!?)^yTPKTIXI70F
z^-UgWI-;%qFFH>@xo^Dm*I#wEMnyGESP^15Y<JO$GTk*H-FpyALRz;S_H_sTH2<Ww
z;l1~-39}RJDLqo^>*rhCJl^uU$&5n}va?G{O1zYr(Iwf}wglz$%P9+ZT$XV*-Ln6V
zJ59|HF@_vyId}UqME4|UyB2nKQHa!a=)Y|+A{;4Q-S%=69x?X5t{u9B=x~7<x_QT-
z53P%=5HXeH+gU5ZrBF@MSglbc|6MKlmJEBUw=4Hi%J>k&z{q>evb`!UXIQN-_%iw8
z9Odkvo%bbmujyp)N5?-motgMJGPpe8uIrlgq?i(GbmX$4m$%Cr;^1(DIYSWfqh93>
zqtux>eqIK)hc2~UoL(I5u>0_$!gZ52Jesv|?!6IL61Et08`Cmr$4uM1?6CAhi7{To
z$0ZabPS1(!*NZoJ3*SuM)6*lvqOj_Rn1UxufAK3lYMI?4bN-=)MFE)$bDv!ZanBkn
zJUXU2Cxt4ru6S6G-EXE>TF)Yf{xPl>oJ+i(4+^%v=q>%iIwr{ZbfToyk=emDEsE~X
zO7tAv*G*O%y23!`n%|s7cMK*iz4ap7>4;Z)`N4o6;+1J*g7Z#1$n^+(eEE|9ow6Q<
z%CaU?nlIY>lLsjk^!(9sx*cja`qJ66`?CyczbL%up8rK^aiQXQO8A5P6@wM@?IAt}
z%Lo5n=v+W=vrd^8?;GHxo9ulm&3JtUJGVks<50Y>N^YN9`t^gv;U2fmb55R2PubJ=
z`mAQR){N7$Lpw&D%F6bi)U5Nds$P2!&dJKx3o86-zRtES^Ib-YTy7Sm>`VQ0k#!1H
zn&q(gme;MTeTuX5OKO(gNRK`caVnzQm}1{<IybL+WdxpJi?bJ>9kRY)=GYq(zV-~>
z;YNFw#LSMLar>8<<~v(mO}bDyywm3EpLNVGxV$I!(6r#2p(n2$ij2xGSn2LkR$~(#
zn|Wuu?%uR(%bOhvU+~L!vDLOyPu2QP`|5b<&{CecYt8+O`=2~&clFjDePFxYs9`^J
zUgKZ6WA}@qj9k;QiXN3uO3&yW4PVGpese26wVQb>UY_HcdC#6YUi0_rlu`MOWAKct
zzKYVL1K6^awksd5D+xYo$r~SdxqWPWf=x5!s1b<R*uA6g)^k^OM5I3I{2;F4vS*87
zll3Ne9ZH|mHSdH#@q!-k=-M;U{wFsw^8BZLzpG_R#;)Kj>8DQ(+s#U-h@Nlp{eZNf
zy&-2ty~s{G-uk@NgX0fad#4d*C+?V@J3|;}6h4~ld?o8}+O4bMvF4&kS4X4J8pH9~
zEfiiJ&mS4*pNiZZerxO8<!R<W**57t<>7Hj)wpW=c|lnx{TGfAL{*xYoo^Nz*?sO(
zof*4#7g^oQn6=N!Gh&LR;5(O<rw=(Pf^Hu%8sA3#^S2?9T`c!KOFkA<aA82L^W45O
zrsmt9yG_fSI`r@VxcW*`+e=Bk#PotIiN4mMclQKG9yR#tv9V(R&l9RHeLK6APT?if
z;{7qSuANP}_pm=Z+26R^wAF!#C6+B(jI|wnc$-Je&US5&jy$U0en*0R@=&*|okW=%
zllS|*@B9925T;z*`{ZJm!Id|v$?6mRgZ(EO4NIWf$Pv5Dd!p%qHFFM1=Ew$nCndW}
zXa1I|RDShDv1e~r<QI4S_fKPXBy9{4n8`!3BvbpB<;KpRRDQj%Y<s7heN&&zw;tSI
zY~B2N?Y--R%2zdCH1%wT^%t=wXS*3q@6d*z9Z&vvwqo}m(cMg%r9X(PP5ttRySf9G
z#d|-wAC_@-Ug-7K)@zZGW5>&UvctqaMt<$D&U};<YktLO?0L_=d91&GF;TMNM%IZI
z2a?V{4@HBWfQth&67%<MH>%DXk?A%%>v6eDEfZ4HEwNv`8}d1=5T>S`Pdn=PIm!R_
z$1VFqPWY7Uxos({nU(4G<HY15*YI<;Rk4}5iV|D0WbKW$zpS;JTRKHiVe0c~*2Q1+
z?a-3DHs`O5M)R9TD=y}~@bWoZ6j;`s`6+8@*Vx7VZr%znHT?00Zeo&E+&-3|e=?oG
zyLxZb+MAQSB?IRVyt9t5;6J{Qol+7+Df4Zz%b&t<xO*mRd&@odg9^$|p}{6kPsxo_
z7c441CjG8*T(Nb|nc<+@7UrvhK0Ua}|4CSoNzwG)wK1&*6)znyOSXFK^9$@nX*{YR
z#qkQKL%*g~$vpY-+3WV)cv?PbTJT}3Y!4g3Pdvx$w3r_02Mqh=bsJUv<*wkA%Mbe2
z&RA{H(tDQdkyXnxBjx?%-uLdVzCUr!-J;UtJCm1JtW}ntj{n0yrYhe=FWlcepVGCE
zhaAgEt$4mU^F`3ShzghfF1r^Gh^G%Gr=?%9j=S)C`g4!gH3!f2J>E`^mYqr6Xn&^j
z!BU~`9wxe*j-qqs!{p?gH9?uB3y1z0CrU5cVnLiut@X{H_T&qX=X*W6wV3U2E_0m0
z{jJZ&Rm5dW!tFA`d(S@?G;8i=okQ0hCu9UJ>d=2yMf2VVhWr?HtTr!i&H$;mU(5KS
z&i8jXCAI(?tNZjDo~|*A{VEyT;L5xQFCr(+Nd4hUpI@uiD3%XQW-@~|Tg)qXc-*Mq
zLhln(%Z!JQ3oOn!d2Le3h0O8ugnir!(lU~1-J@5ZTAa9GA-=gXr|PQ3*xW72D5l`c
z0g~jD88cCdb<voZ>RCTMWQ$iF8XsI9QnhkH)o1H>=DmntJ6+*E9Dhj^v~g}(e`Vav
zIltY0zOwW{LB#V%R>iqq<&O_snXsx=d49SgbGqO2(FHld!&9Hktcfa5$STZlR@^e+
zyB>bI_8n_m7u7}=Ou5G1zS~xgMn!FQKKJ=PLfoc}$L)m63$NNZOue0G;<D(}4{dH2
zFWX)d=sv;ymsClzcX7nhgn(&P0e|eCG%fJq-An$JPGz!%W)o^p<Sg-PGdZKexXD1p
zk)8Po)dq!2no2LXT6`%b_o_=^vAgV;!;RFU+()wD-&2+r6<+iVP0lX1Fpo(t2r^%1
zU2!tiHz8+Waa?l#^K&`Q`z!iHUfwaVup0vdcjc#DN`8&?D@^%gY5!Ac`)aPGp5Eu2
zRIqtT-s7O_`4)=W!y8=3rkW(X6g4@z+Wu6zNk+BR07dkul3%~Ix;xFa()P}tp-(4!
zlZ9)GM->h|GHDR$dm+;%%GkOve&$!h`kTr16TKXlBO~Yjt>?@3Y@1be&q5IsyzkE!
zPg{8{{N_;8#a>qIqIn*QbkEcCV9M(~C`~6cDM}uD$y1K#31CxSK5NjMUX93a#b#!s
z5y3Z)Ki^u8b`gBOfgL)QW$wc_L$eWijMkMecq(W?^5v#-d3S;~iwPdI9ICO6)fz?e
zAJmc?%J9^Atxc-V1jC*ejU4JQWbdFa!a6`1HrMD20N!zHOG>2@HKI`ljXKb%1OE#h
zP$(4Wui%A3K>{cZfEK~w1*K4Y6i9d<psN4DJpC_Z_MSFLcuoOu{@%G=CX=DRf|c@6
z<Mp9o=79F=Lc`jI%Vj*7>}zqTe3Q9czOlVrmE&@Kh-fR9uWK%oFA>UQfxr(&Fp|qd
zNx3|X=J=Bnb@8cfUHgFhBz~tQLZJf@Iz9lQj6Mkc0=GILq(2NHm*WUIWpKGOlqVn4
zj!8!mnwWx+!)}CZ*MZ;K73i1(a3TPl>sxjC<{y@2QA5CESrXTqpwnbexM53Wm|-(z
zph0V;xq!7{`9s|GB|DTllJAuIlATIjNg@E}^<jrnSNxr-j*fU!nMCM+SitW$m1Tu|
zjz2zC7oTtT=EJW*C@T36=S$+eB}P^AB?ixCi;bVQq|m2`w3#Sk*H`h`b>%{K!wUiX
zO_hM%P^}#sl>#<ODd5Edwp0t*$Z8?)Tcv>6@RX(|Za{>{062pt3H&YomZaf-6kn3y
zD=|_olo-62CvK`RqrhuV+B%8ZNF|@$SSbX)SSBEcriKO3)aWHNHA+TP_MrgzD>$xX
zDAzb1voM*@tiC5;p&#t}XHd5mml@hA8dQi6B7<{}zb9$<AIX<&TcqaSOWd@gl}i47
zCX3mP!2dTDLUyx~p`5mGt!itZfNx3h2qZEhiOvozJ$o<Lhlol6i?LNnk%Jd<G$=~l
zgTM4GUgLken*S=`zY_Qd`D6Y!0sk9-|0v+!8RUn*J<Wq0cqKrN1n{8&31ti}5roJH
z`Wz)-W8gb%Pzcy9H9TfTDM6TY<=#`t0q8YcpFWO%mssEosxWH)ar+vcRXJSKaOQ>k
zhjaWgU&^Ds(gkcZ^kE&y0rZG+*~;~hd*|QdAIl#nN~6Efm->>r4}@tq;QdblyRk~h
zZmr=nVRs1Bv?Is2HeIZb?yF}XCx7P{t|q0K$MM{S`=AEa0}WL7;1SnXmiG7o>p#q8
z&+#{)i6M(PS}Z=bY;gLE{A0egCG|7aIH5?Q<8U?qFc&A(GSswPoSwb>mfGmld;cHg
zU)?U|A18q>pIP?|<{?-=wkUZ_@MVMy+i}lc8}l%rpaKJ+KLjvYu=ssE|9`;z^S1uf
zCx4E$mw!o`r52u2t#7J6tg9f%_Jg^{G^`1KEe++1qyItvp`QfFQcls_T)Gx?C?3{=
zo|8DPS)oP`j7ZwDFDqQpn-v7wutK>tD_jf+(SpVBj;uE;40IFep7-I_ud2D+`c>Eb
z-%$Chz7wp|VFES|#_;MgA-l7dBKyu%^Dn|WfXm%k!Q3z%W91^Lp)yEnr1S&$zXt*E
ze38TuYzLM7Q1kcm&y4|^8tN<L`2R!5O9c53TEOwo2ww8f@Mnign<{-IhSh<<j~~GQ
z0|4*;3;d4=!gD9cU(NqeUp4=HJXUeJ1I<pJBQ_}dLZo-zQ>2&gA=0}tU8I+*4e&e<
zaCx4%$<u#M{@hwXQ)5@W;(sT$g}gQLhg_v&LV`4IPB8;bDB9YTqHO_v-h;mI+{RI$
zlcX8Hpg-E|pTD60B#d8|SUi5Q`~_@cElJvXa{RL*E^qkXVgKy>1B_7&OZ)tW=YFsy
zo@2X|B)d;g^Z#-U#(G2(gb*NjA1HW-0V9zl2-co2Nz}-{9{aNa@_)I0>G9dMU;}M}
zy}+g#0lVr6Nw(?7@vpJtK3@Ksd3VGs`@cT>`6Kw(*u*OPfh5U}BRJWE9nFiag+0y*
z2-Y&@I9Bx$S0L4(Ab&5Qu4=8uG+_Vo-G|GcR?XFTO?qXoY3#Pwb4;1D^%#1(%6=2D
zYs!VZ1hAneZNg7MUH;PA3;l$D2z{XZKgNCrx_F;}h1$Xr@1X^-9|jv5_F)^IkVH2J
z{7l0?2!g`8{4v1ege3?Gi~}C%|IYWz-!+btH;ebMU^-#hV*61ATn6C%Er!O%=IgNZ
z{7h_na^p5m$<lL=AjFfvJE}bnN0aMKL;nuriDTZ+zq5MZ^wQ>4eLHoV>hh~w1fl;4
z-fQtyd#?zEkllo3|0hXw8o||h#XrbVSD&Q18hjkOG$E;OP_MHCU%E%bzxMeb%OCFz
z1rTG2=WHxPo>&dI7U&R!PBW4)?M{=nU-D?5OqDN%-3WW%h)N+ZPDxV^Uvs>_w3$^M
zZb!4@W{3^Wd43$u;yTmC2B#N@o0Q@8*GFPd{VxAlcALR}5|YPI6C?0Go}ng3!QOl;
z_DQG#W%unY?Ue%i!yMpOHOC8h>tW6WpAg>n(r()k;zQpx`*zjXQ}N%G5qJbijcWp=
z##I2ESAQr1;awl8;fwhaqZbP#1{Jf!O`m}O!4mvelf>Y&;<M}j6tWTEyV?kIH|AwC
zK$GLL2KZjIQpm<s3wWDhuNzq-WVeC;YHcY^ja!5FFr4hMze1H>DqByXj)&Z!g;Lf)
zENRk0xwJ`3Wq6Zj%Ebm|%8o*|5B47#sQiZsN<EeD5PXAhtsURNvjhO-qU}nlc>P_8
zaNdtXzV&35<*EFXEGwX){En{^dSe3)*T{wfoB@#?5ZVNYXp7JWpw|L|eg`5n_7LD8
zLXMDQsIIl-4#^1F??q@JjPovwVSTa(I-oDAgk`Q?H@G=leP5M@fd4#57Sdn@L)}-9
zAxuvuUnY{v)-`(z&EZ-L)|$#?EA+6>Tqg4Y_yIz&|C|E<IaQzk9L@*`^;rQvFK7sG
z{kQSna|ftX*E^UFt;PqPU#QQH)Mq}Lv!B0|<Fg;2htGmO79V$Zgn8E@hsOJL>qnzp
z8s*Zc1An6qyuOw-mK!DTu@V5g3z-4z0EDUpg*sB>I#;K?^RLfkYJ2H@@hzH|8XOM;
z@2cz|ZSgeq#?1Un-yPeE*lv8UJnM=fdHdd~&`{IJuq8cLhlV!C&qC!J+lI=wb`6zp
z>GCF`I?3hh;hg}mxBbE1*4Wx$!>i+J-sY)}q4CZw2v(S5hfuaLLTW#;T|C61WC4DI
z7?jsA=>$TflMu364SRXDPmqhN&=7sQ{kmc}-o7_PthXwpNps~$ss2X%Oeze!q$}C3
z+TY=rl2_OT_YMH|Dy5<&xdOiBSO`mbV~_WC`x?IL%lojxCEjojF@Pt6enHP@A2|Pt
zsAj0oH&SGu>95dl7ERiR@tD91LSDR*&nzz{2!qzI`-K|PzAY<Ux)9Da?0BNJT>HMK
z!S|{pi1x6rd^eHAC$>EBQQ*Bj_!_=_{f)n~eUj)gk@JtK{AX&v8Fvm&5?viIkKl8t
zB#_uh!^7X(zQt!6x^L#3Pl(4X&IMm1oNx4=qIs^ZeF8e74R8*)tS<SJgtqo^YXkwl
zl2zE(!qD#9-q*h7d0n{;E0BMD``F)VIT?Qg9^;>_p<7q~q2DB&clOi<@JYrtq<w-g
zv*y}gSz2HF;LzZ^3H7qI;Y*Q0af8}NMi73s34B=_Ycyl9uKt7KiUQ&6QyYBY47FkH
z8@A=z-&9*)`{47YyE1%FZTL(eO>R*8M9WWc`+R17WqtD3Jkyr<Vg!K=Y5(OMz=Yk<
z(5_4V_!-Cm$2!yr7=K@XeES4RlOscL|5<7-#6ogOOZzYcUix6)DQla5wU2-G{6qVl
zgZ677#!jwo{vCS&--iZYKkRv@4DD-~f9jlnRX$mQXlIA@9`_&O#5&j4zUG;>9M-?E
zy5tY*&!D>M5JYPmSOd>ve=_*N(_Vk)ZTZ8Yi*O)MyrDig3w3|{N@Dl|*56f_7LQ&8
z=cf_X5K9?Bk=9dR0k6MfmhzZ@^W6Ho`VW$5hJSW~zo{y{-M%i%Gg@ubN?9M4<9Jr^
zOWRBJw{Z4H=tW)ecBRhSP{p(ESKA-UuM7CLE-XvD&;Ag1LnyI6SRk~k2SPtc5mK*X
zgA*VQIQv~-n`{jDj(e?zDQ$?l%PM_Pm*3GpxlBeZlgo8J1WROcK4*VMnumtQ^aS(>
z4UK*U`Bn?L{F_!>ytJRn-z$^JU)r9y?%VSJhps=^{>J+Wb<95AW7G?H7yEV9`;RKv
zf7FHgWA^`{{{CBX{ePw%&3O3#HOGDu_|I%qzsYO#le~YQu5H}br#}=Tc$N%*K|fZq
znol4hN%V4p*uyO}^%=z1k6+7B<5n}&XR9C<-=BcERzh_ijwxzlZM0HXt!E4(bex2e
z%sJwwB{~Gsr>JS$MEIPRje|4t1f`I-9f0%i;k<VT*g+n92qZPpO7+zP4Sn$hfh5IK
zY<yQrARUTwje^(#ID5C3QDiT7ysv__cM44o_2)4@Cxy5Tdg@M&j3#d4B~eUMvkrr)
zhYv9c>E{AT+Dx(WL*QSRqNc>bS+f!m&0slvGhrKsM`N2}6T~}Wy9Xy6L!dnYeepzr
zBz1<^_yO<_^xdN|eXxz-=QR}6#jyuCW{D5+2YA0^K2*ql4}EZo;;6pt1GdRD`$HTX
zgv%rg^2huG{fC@<++#TUX1%!jn(xTjg9MToK}^669P<k?8LhZ?wEtD}f8<^IZTfJv
zxV<)KKH@tx5AXN!zMmw_dTS_yjm6U?$hJBJX$EMmhM56Db#W3(PXPV<YWb-7|HOu?
ztKlDCac$Am@IcTfpx<%0hCal8boCJFUvm=bo`gMIj*C$5w5w3>oU2ejd%jrznTN>e
zmM-Wg3Gx@I<X;zkPSz01Izz-uf<3#1qlUf-Nm~a?jg|8yO)7AFD)?e*aGWRPwZ4)j
z%4s5_8$cgIR@}F~k3LP=dJ2I)#2vk)Ps6Y8bxEq74oS5Je4<8c1Cs9g;qu{Paqw6c
z^7a7zF8It|lQep-xmM-St_Y7Wtp9K7Po3WvXwZCyc81txh#4f>^nHUEH?}nGyc}Pk
z{~G<o`u`sNl$!AAup-dWB7!i+O9W0h$OFfgYvRx;br}W_p$qz-{@VBg`kS#|>aFpG
zV|(!U>M~l$?uPN@7LTtrI>nXW{rj5!KjP$r=Lfu>G41m9+XT_3ACHk2aQ+@kC+<1T
z7ZIe%1c6TKIDt;`c!5p|;IJAg69l?P=8E-8K|gPD`subs1pL#KTO3U~EK`AUTmio^
z_@2)!DT3b{z#QtL=ADam)FY_&GSE%X&zi-Mt5F*QWr*Xc4UjfbdWZ}$eHbQKKcm4X
z76oxk_%~Jf_dIbBXS1zVz-)n7zR8<4bCIThcz@J}V#a(zG4_DbZ-O1&o@U0GQG9#w
zVUPsbb3CjmYjJ!yO^pdx{l1H|52eU{vk8RfRMi*;9l_HXm$a>GjrTd5KqIIBN{$C5
z4!$x2{Fm)EU=Jsio`D_2#~0?b(9J=>+fERztOQKRRhVb4@tLK!0JkBQGKC<F+T-`2
znri;S1$+hbq$)1D2P5&BCgS}Haf>5`Ok_0$YZ0DrX=;c+p9#$sFkcrzY#RP;r6y_W
z3-ApKMzX+F$fiR5;R0sKEugH9+f=R31fTi(HbaeFs;P|UIVj_GUW)JaWF)>*gzQlq
zHz{DSPgBPfOaY)Fg`*L$XQ<KG_kSLj)#;t~-Gyu>*Z%T{FxFLcIU0BXcNm6a+BNZY
z{aMkf86y2Vu%`a*Ce%3xcHW=PLiP|%cD4szp}r8S0wk^<U?X+m{5?7<8?PI~pJ6YM
zBo5<Cq6hH>>s^F~7hHtw5sK_I3S<TKar`At+}cYJ&AVg!3hWeBf8fCz{C8o*bKHb%
z2G{@B>vMJ(*k$AS%&NzlenDI=4?{qZs&8V+N&-0fbq4vZC;=aZ>OTH$Am)Oh++xAE
za{`y4VF->UBqSmrNSADa?}7aNUVXo1_ra_I`;F5TEIWu-1iPV^3x2mH#SHcZpRSk0
zupEBR3%S7`{!&w=yO5Vk6CFn3I9?tde2GVg<nox%>v$f97};1{7vw=p2(ndgMi5}h
z2o_i|LSL}s=UXwNfc6yp-<j~6KWt}#Uw=D8Pfdj1%EnVf*D)L~96$f-`IGBM!~gyt
D$c9dJ

literal 0
HcmV?d00001

diff --git a/utils/remover.py b/utils/remover.py
new file mode 100644
index 00000000..327db984
--- /dev/null
+++ b/utils/remover.py
@@ -0,0 +1,53 @@
+#!/usr/bin/env python
+# encoding: utf-8
+"""
+remover.py
+
+Created by Roman on 2010-06-20.
+Copyright (c) 2010 __MyCompanyName__. All rights reserved.
+"""
+
+import datetime
+import logging
+
+from google.appengine.ext.webapp import util
+from google.appengine.ext import webapp
+from google.appengine.api import users
+
+from ffstorage import *
+
+class Remover(webapp.RequestHandler):
+	def get(self):
+		logging.debug("Starting r3m0v3r")
+		user = users.get_current_user()
+		logging.debug("Working as user %s" % user)
+		theDate = datetime.date.today() - datetime.timedelta(days=2)
+		logging.debug("Will delete stuff older than %s" % theDate)
+
+		fics = DownloadedFanfic.all()
+		fics.order("date")
+		
+		results = fics.fetch(50)
+		
+		
+		logging.debug([x.name for x in results])
+		                        
+		num = 0
+		for d in results:
+#			d.blob = None
+#			d.cleared = True
+			d.delete()
+			num = num + 1
+		logging.info('Deleted instances: %d' % num)
+		self.response.out.write('Deleted instances: %d' % num)
+		
+
+def main():
+	application = webapp.WSGIApplication([('/r3m0v3r', Remover)],
+                                               debug=False)
+	util.run_wsgi_app(application)
+
+
+if __name__ == '__main__':
+	logging.getLogger().setLevel(logging.DEBUG)
+	main()
\ No newline at end of file

From 348786f0734272bb94533440d0d0e61d49b02a11 Mon Sep 17 00:00:00 2001
From: sigizmund <sigizmund@gmail.com>
Date: Mon, 22 Nov 2010 07:06:29 +0000
Subject: [PATCH 77/94] creating a special tag so we can quickly restore to
 previous version


From dd483db783e30574dde166c88cf21d7705b6c65b Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Mon, 22 Nov 2010 13:24:50 -0600
Subject: [PATCH 78/94] Move books directory down into sub dir next to CLI.

---
 {books => fanficdownloader/books}/place holder.txt | 0
 1 file changed, 0 insertions(+), 0 deletions(-)
 rename {books => fanficdownloader/books}/place holder.txt (100%)

diff --git a/books/place holder.txt b/fanficdownloader/books/place holder.txt
similarity index 100%
rename from books/place holder.txt
rename to fanficdownloader/books/place holder.txt

From ecdeef4b3b81a2965ef5032191321120a8c641a0 Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Mon, 22 Nov 2010 15:00:00 -0600
Subject: [PATCH 79/94] Add new adapters to main.py, update verbiage on index,
 replace a couple prints with logging.debug.

---
 fanficdownloader/fictionalley.py |   2 +-
 fanficdownloader/ficwad.py       |   2 +-
 index.html                       | 103 ++++++++++++++++++-------------
 main.py                          |  10 ++-
 4 files changed, 69 insertions(+), 48 deletions(-)

diff --git a/fanficdownloader/fictionalley.py b/fanficdownloader/fictionalley.py
index 332a08af..68cd36e4 100644
--- a/fanficdownloader/fictionalley.py
+++ b/fanficdownloader/fictionalley.py
@@ -249,7 +249,7 @@ class FictionAlley(FanfictionSiteAdapter):
 					logging.debug('li chapterlink not found!  li=%s' % li)
 					
 
-		print('Story "%s" by %s' % (self.storyName, self.authorName))
+		logging.debug('Story "%s" by %s' % (self.storyName, self.authorName))
 		
 		return result
 	
diff --git a/fanficdownloader/ficwad.py b/fanficdownloader/ficwad.py
index 13e7a45d..058528bc 100644
--- a/fanficdownloader/ficwad.py
+++ b/fanficdownloader/ficwad.py
@@ -170,7 +170,7 @@ class FicWad(FanfictionSiteAdapter):
 						logging.debug('self.numWords=%s' % self.numWords)
 					
 		
-		print('Story "%s" by %s' % (self.storyName, self.authorName))
+		logging.debug('Story "%s" by %s' % (self.storyName, self.authorName))
 		
 		result = []
 		ii = 1
diff --git a/index.html b/index.html
index 4987804d..f5736129 100644
--- a/index.html
+++ b/index.html
@@ -2,7 +2,7 @@
 <html>
 	<head>
 		<link href="css/index.css" rel="stylesheet" type="text/css">
-		<title>Fanfiction Downloader &mdash; twilighted.net, fanfiction.net, fictionpress.com, fictionalley.org, ficwad.com, potionsandsnitches.net, harrypotterfanfiction.com to epub and HTML to Stanza, Kindle, Nook, Sony Reader</title>
+		<title>Fanfiction Downloader &mdash; twilighted.net, fanfiction.net, fictionpress.com, fictionalley.org, ficwad.com, potionsandsnitches.net, harrypotterfanfiction.com, mediaminer.org to epub and HTML to Stanza, Kindle, Nook, Sony Reader</title>
 		<meta http-equiv="Content-Type" content="text/html; charset=UTF-8">
 		<meta name="google-site-verification" content="kCFc-G4bka_pJN6Rv8CapPBcwmq0hbAUZPkKWqRsAYU" />
 	</head>
@@ -33,23 +33,11 @@
 			<form action="/fdown" method="post">
 				<div id='urlbox'>
 					<div id='greeting'>
-					  Hi, {{ nickname }}! This is a fan fiction downloader, which makes reading stories from various websites
-					  much easier. 
-					  <ul>
-					    <li>
-					      For fictionalley.org, please paste the URL of the story's chapter list in the box, such as
-					      <a href="http://www.fictionalley.org/authors/drt/DA.html">this</a>.  Or the story text URL for
-					      fictionalley.org one-shots, such
-					      as <a href="http://www.fictionalley.org/authors/drt/JOTP01a.html">this</a>.
-					    </li>
-					    <li>
-					      For all other supported sites, please paste the URL of the <em>first chapter</em> in the box.  For
-					      one-shots, the first chapter is the whole story.
-					    </li>
-					    <li>
-					      Alternatively, see your personal list of <a href="/recent">previously downloaded fanfics</a>.
-					    </li>
-					  </ul>	
+					  <p>Hi, {{ nickname }}! This is a fan fiction downloader, which makes reading stories from various websites
+					  much easier. </p>
+					  <p>To support new features, such as including story summaries,
+					    the URL you need to use for some sites has changed.  See below for example URLs for each site.  </p>
+					  <p>Or see your personal list of <a href="/recent">previously downloaded fanfics</a>.</p>
 					</div>
 					<div id='error'>
 					{{ error_message }}
@@ -66,23 +54,24 @@
 					</div>
 				</div>
 				
-				<h3>Login and Password</h3>
-				<div id='logpassword'>
-				  
-					If the story requires a login and password to download (e.g. marked as Mature on FFA), you may need to provide
-					your credentials to download it, otherwise just leave it empty
-				</div>
 				<div id='logpasswordtable'>
-					<div class='fieldandlabel'>
-						<div class='label'>Login</div>
-						<div class='field'><input type='text' name='login' size='50'></div>
-					</div>
-					
-					<div class='fieldandlabel'>
-						<div class='label'>Password</div>
-						<div class='field'><input type='password' name='password' size='50'></div>
-					</div>
+				  <h3>Login and Password</h3>
+				  <div id='logpassword'>
+				    
+				    If the story requires a login and password to download (e.g. marked as Mature on FFA), you may need to provide
+				    your credentials to download it, otherwise just leave it empty
+				  </div>
+				  <div class='fieldandlabel'>
+				    <div class='label'>Login</div>
+				    <div class='field'><input type='text' name='login' size='50'></div>
+				  </div>
+				  
+				  <div class='fieldandlabel'>
+				    <div class='label'>Password</div>
+				    <div class='field'><input type='password' name='password' size='50'></div>
+				  </div>
 				</div>
+				
 				<div id='submitbtn'>
 					<input type="submit" value="Download">
 				</div>
@@ -100,7 +89,41 @@
 			{% endif %}
 			
 				<div id='helpbox'>
-				Few things to know, which will make your life substantially easier:
+				  <dl>
+				    <dt>fictionalley.org
+				    <dd>Use the URL of the story's chapter list, such as
+				      <br /><a href="http://www.fictionalley.org/authors/drt/DA.html">http://www.fictionalley.org/authors/drt/DA.html</a>.  Or the story text URL for
+				      fictionalley.org one-shots, such as
+				      <br /><a href="http://www.fictionalley.org/authors/drt/JOTP01a.html">http://www.fictionalley.org/authors/drt/JOTP01a.html</a>.
+				    <dt>fanfiction.net
+				    <dd>Use the URL of any story chapter, with or without story title such as
+				      <br /><a href="http://www.fanfiction.net/s/5192986/1/A_Fox_in_Tokyo">http://www.fanfiction.net/s/5192986/1/A_Fox_in_Tokyo</a> or 
+				      <br /><a href="http://www.fanfiction.net/s/5192986/5/">http://www.fanfiction.net/s/5192986/5/</a>.
+				    <dt>fictionpress.com
+				    <dd>Use the URL of any story chapter, such as
+				      <br /><a href="http://www.fictionpress.com/s/2851771/1/Untouchable_Love">http://www.fictionpress.com/s/2851771/1/Untouchable_Love</a> or 
+				      <br /><a href="http://www.fictionpress.com/s/2847338/6/">http://www.fictionpress.com/s/2847338/6/</a>.
+				    <dt>twilighted.net
+				    <dd>Use the URL of the start of the story, such as
+				      <br /><a href="http://twilighted.net/viewstory.php?sid=8422">http://twilighted.net/viewstory.php?sid=8422</a>.
+				    <dt>ficwad.com
+				    <dd>Use the URL of any story chapter, such as
+				      <br /><a href="http://www.ficwad.com/story/75246">http://www.ficwad.com/story/75246</a>.
+				    <dt>harrypotterfanfiction.com
+				    <dd>Use the URL of the story's chapter list, such as
+				      <br /><a href="http://www.harrypotterfanfiction.com/viewstory.php?psid=289208">http://www.harrypotterfanfiction.com/viewstory.php?psid=289208</a>.
+				    <dt>potionsandsnitches.net
+				    <dd>Use the URL of the story's chapter list, such as
+				      <br /><a href="http://potionsandsnitches.net/fanfiction/viewstory.php?sid=2332">http://potionsandsnitches.net/fanfiction/viewstory.php?sid=2332</a>.
+				    <dt>mediaminer.org
+				    <dd>Use the URL of the story's chapter list, such as
+				      <br /><a href="http://www.mediaminer.org/fanfic/view_st.php/166653">http://www.mediaminer.org/fanfic/view_st.php/166653</a>.
+				      Or the story URL for one-shots, such as
+				      <br /><a href="http://www.mediaminer.org/fanfic/view_st.php/167618">http://www.mediaminer.org/fanfic/view_st.php/167618</a>.
+				  </dl>	
+
+				  
+				A few additional things to know, which will make your life substantially easier:
 				<ol>
 				  <li>
 				    First thing to know: I do not use your login and password. In fact, all I know about it is your ID &ndash; password
@@ -111,20 +134,12 @@
 				    &mdash; how to read fiction in Stanza or any other ebook reader.
 				  </li>
 				  <li>
-				    Currently we support fanfiction.net, fictionpress.com, ficwad.com, fictionalley.org, harrypotterfanfiction.com, potionsandsnitches.net, and twilighted.net.
-				    (fanficauthors.net withdrawn as they offer native ePub functionality now.)
+				    Currently we support fanfiction.net, fictionpress.com, ficwad.com, fictionalley.org, harrypotterfanfiction.com, potionsandsnitches.net, mediaminer.org and twilighted.net.
+				    fanficauthors.net and tthfanfic.org offer native ePub functionality.
 				  </li>
 				  <li>
 				    You can download fanfiction directly from your iPhone, Kindle or (possibly) other ebook reader.
 				  </li>
-				  <li>
-				    Paste a URL of the first chapter of the fanfic, not the index page, except for fictionalley.org.
-				  </li>
-				  <li>
-				    For fictionalley.org, you need to use the URL of the story's chapter list, such as
-				    <a href="http://www.fictionalley.org/authors/drt/DA.html">this</a>.  Or the story text URL for fictionalley.org
-				    one-shots, such as <a href="http://www.fictionalley.org/authors/drt/JOTP01a.html">this</a>.
-				  </li>
 				  <li>
 				    One-shots, fics with a single chapter, <em>are</em> now supported.
 				  </li>
diff --git a/main.py b/main.py
index 1ca7dcb2..1ae0ac99 100644
--- a/main.py
+++ b/main.py
@@ -184,12 +184,18 @@ class FanfictionDownloader(webapp.RequestHandler):
 				adapter = fictionalley.FictionAlley(url)
 			elif url.find('ficwad') != -1:
 				adapter = ficwad.FicWad(url)
-			elif url.find('fanfiction.net') != -1 or url.find('fictionpress.com') != -1:
+			elif url.find('fanfiction.net') != -1:
 				adapter = ffnet.FFNet(url)
+			elif url.find('fictionpress.com') != -1:
+				adapter = fpcom.FPCom(url)
 			elif url.find('harrypotterfanfiction.com') != -1:
 				adapter = hpfiction.HPFiction(url)
-			elif url.find('twilighted') != -1 or url.find('potionsandsnitches.net') != -1:
+			elif url.find('twilighted.net') != -1:
 				adapter = twilighted.Twilighted(url)
+			elif url.find('potionsandsnitches.net') != -1:
+				adapter = potionsNsnitches.PotionsNSnitches(url)
+			elif url.find('mediaminer.org') != -1:
+				adapter = mediaminer.MediaMiner(url)
 			else:
 				logging.debug("Bad URL detected")
 				self.redirect('/?error=bad_url&url=' + urlEscape(url) )

From cf0d1bf09be23668c6495c9e74c321d1a07177cb Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Mon, 22 Nov 2010 20:05:58 -0600
Subject: [PATCH 80/94] Change output names for web version, make html & text
 output work for CLI version.

---
 fanficdownloader/downloader.py | 12 ++++++++++++
 fanficdownloader/output.py     | 13 +++++++++++--
 main.py                        |  5 +++--
 3 files changed, 26 insertions(+), 4 deletions(-)

diff --git a/fanficdownloader/downloader.py b/fanficdownloader/downloader.py
index cb4ca7d4..17078430 100644
--- a/fanficdownloader/downloader.py
+++ b/fanficdownloader/downloader.py
@@ -62,6 +62,13 @@ class FanficLoader:
 		self.standAlone = sa
 		return self.standAlone
 	
+	def getOverWrite(self):
+		return self.overWrite
+
+	def setOverWrite(self, sa):
+		self.overWrite = sa
+		return self.overWrite
+	
 	def getAdapter():
 		return self.adapter
 	
@@ -153,6 +160,8 @@ if __name__ == '__main__':
 		writerClass = output.EPubFanficWriter
 	elif bookFormat == 'html':
 		writerClass = output.HTMLWriter
+	elif bookFormat == 'text':
+		writerClass = output.TextWriter
 	
 	if adapter.requiresLogin(url):
 		print("Meow, URL %s requires you to haz been logged in! Please can I haz this datas?" % url)
@@ -167,6 +176,9 @@ if __name__ == '__main__':
 	
 	loader = FanficLoader(adapter, writerClass)
 	loader.setStandAlone(True)
+	if bookFormat != 'epub':
+		loader.setOverWrite(True)
+	
 
 	try:
 		loader.download()
diff --git a/fanficdownloader/output.py b/fanficdownloader/output.py
index af6788ce..ff5daa51 100644
--- a/fanficdownloader/output.py
+++ b/fanficdownloader/output.py
@@ -60,6 +60,7 @@ class TextWriter(FanficWriter):
 		return '.txt'
 	
 	def __init__(self, base, adapter, inmemory=False, compress=False):
+		self.inmemory = inmemory
 		self.htmlWriter = HTMLWriter(base, adapter, True, False)
 	
 	def writeChapter(self, index, title, text):
@@ -67,9 +68,17 @@ class TextWriter(FanficWriter):
 	
 	def finalise(self):
 		self.htmlWriter.finalise()
-		self.output = StringIO.StringIO()
+		self.name=self.htmlWriter.name
+		self.fileName = self.htmlWriter.fileName.replace(".html",".txt")
+		if self.inmemory:
+			self.output = StringIO.StringIO()
+		else:
+			self.output = open(self.fileName, 'w')
+		
 		self.output.write(html2text.html2text(self.htmlWriter.output.getvalue().decode('utf-8')).encode('utf-8'))
-		self.name = self.htmlWriter.name
+		
+		if not self.inmemory:
+			self.output.close()
 		
 
 class HTMLWriter(FanficWriter):
diff --git a/main.py b/main.py
index 1ae0ac99..9a9cbf31 100644
--- a/main.py
+++ b/main.py
@@ -230,7 +230,8 @@ class FanfictionDownloader(webapp.RequestHandler):
 				ext = '.html'
 				if format == 'text':
 					ext = '.txt'
-				files = {makeAcceptableFilename(str(adapter.getStoryName())) + ext : StringIO.StringIO(data.decode('utf-8')) }
+				logging.debug(data)
+				files = {makeAcceptableFilename(str(adapter.getOutputName())) + ext : StringIO.StringIO(data.decode('utf-8')) }
 				d = inMemoryZip(files)
 				data = d.getvalue()
 			
@@ -265,7 +266,7 @@ class FanfictionDownloader(webapp.RequestHandler):
 			fic.user = user
 			fic.url = url
 			fic.format = format
-			fic.name = self._printableVersion(adapter.getStoryName())
+			fic.name = self._printableVersion(adapter.getOutputName())
 			fic.author = self._printableVersion(adapter.getAuthorName())
 			fic.blob = data
 			

From ebcce7e42d6b98581f69152caebfdcb176af2743 Mon Sep 17 00:00:00 2001
From: sigizmund <sigizmund@gmail.com>
Date: Tue, 23 Nov 2010 07:15:18 +0000
Subject: [PATCH 81/94] Adding Mobi format and making final configuration
 changes before uploading a beta version.

---
 app.yaml                       |   8 +-
 fanficdownloader/downloader.py |   2 +
 fanficdownloader/html.py       | 121 ++++++++++++
 fanficdownloader/mobi.py       | 344 +++++++++++++++++++++++++++++++++
 fanficdownloader/output.py     |  67 ++++++-
 5 files changed, 533 insertions(+), 9 deletions(-)
 create mode 100644 fanficdownloader/html.py
 create mode 100644 fanficdownloader/mobi.py

diff --git a/app.yaml b/app.yaml
index 6f1ccdc8..8709ef3a 100644
--- a/app.yaml
+++ b/app.yaml
@@ -1,13 +1,9 @@
 application: fanfictionloader
-version: 2-5-5
+version: 2-6-beta
 runtime: python
 api_version: 1
 
 handlers:
-- url: /generate_mock_data
-  script: mocks/generate_mock_data.py
-  login: admin
-
 - url: /r3m0v3r
   script: utils/remover.py
   login: admin
@@ -25,7 +21,5 @@ handlers:
 - url: /static
   static_dir: static
 
-
 - url: /.*
   script: main.py
- 
diff --git a/fanficdownloader/downloader.py b/fanficdownloader/downloader.py
index 17078430..c31f1a4b 100644
--- a/fanficdownloader/downloader.py
+++ b/fanficdownloader/downloader.py
@@ -160,6 +160,8 @@ if __name__ == '__main__':
 		writerClass = output.EPubFanficWriter
 	elif bookFormat == 'html':
 		writerClass = output.HTMLWriter
+	elif bookFormat == 'mobi':
+		writerClass = output.MobiWriter
 	elif bookFormat == 'text':
 		writerClass = output.TextWriter
 	
diff --git a/fanficdownloader/html.py b/fanficdownloader/html.py
new file mode 100644
index 00000000..2c14a58d
--- /dev/null
+++ b/fanficdownloader/html.py
@@ -0,0 +1,121 @@
+#!/usr/bin/python
+# Copyright(c) 2009 Andrew Chatham and Vijay Pandurangan
+
+import re
+import sys
+import StringIO
+import urllib
+
+from BeautifulSoup import BeautifulSoup
+
+class HtmlProcessor:
+  WHITESPACE_RE = re.compile(r'\s')
+  # Look for </blockquote  <p>
+  BAD_TAG_RE = re.compile(r'<[^>]+<', re.MULTILINE)
+
+  def __init__(self, html, unfill=0):
+    self.unfill = unfill
+    html = self._ProcessRawHtml(html)
+    self._soup = BeautifulSoup(html)
+    if self._soup.title:
+      self.title = self._soup.title.contents[0]
+    else:
+      self.title = None
+
+  def _ProcessRawHtml(self, html):
+    new_html, count = HtmlProcessor.BAD_TAG_RE.subn('<', html)
+    if count:
+      print >>sys.stderr, 'Replaced %d bad tags' % count
+    return new_html
+
+  def _StubInternalAnchors(self):
+    '''Replace each internal anchor with a fixed-size filepos anchor.
+
+    Looks for every anchor with <a href="#myanchor"> and replaces that
+    with <a filepos="00000000050">. Stores anchors in self._anchor_references'''
+    self._anchor_references = []
+    anchor_num = 0
+    for anchor in self._soup.findAll('a', href=re.compile('^#')):
+      self._anchor_references.append((anchor_num, anchor['href']))
+      del anchor['href']
+      anchor['filepos'] = '%.10d' % anchor_num
+      anchor_num += 1
+
+  def _ReplaceAnchorStubs(self):
+    # TODO: Browsers allow extra whitespace in the href names.
+    assembled_text = self._soup.prettify()
+    del self._soup # shouldn't touch this anymore
+    for anchor_num, original_ref in self._anchor_references:
+      ref = urllib.unquote(original_ref[1:]) # remove leading '#'
+      # Find the position of ref in the utf-8 document.
+      # TODO(chatham): Using regexes and looking for name= would be better.
+      newpos = assembled_text.rfind(ref.encode('utf-8'))
+      if newpos == -1:
+        print >>sys.stderr, 'Could not find anchor "%s"' % original_ref
+        continue
+      newpos += len(ref) + 2  # don't point into the middle of the <a name> tag
+      old_filepos = 'filepos="%.10d"' % anchor_num
+      new_filepos = 'filepos="%.10d"' % newpos
+      assert assembled_text.find(old_filepos) != -1
+      assembled_text = assembled_text.replace(old_filepos, new_filepos, 1)
+    return assembled_text
+
+  def _FixPreTags(self):
+    '''Replace <pre> tags with HTML-ified text.'''
+    pres = self._soup.findAll('pre')
+    for pre in pres:
+      pre.replaceWith(self._FixPreContents(str(pre.contents[0])))
+
+  def _FixPreContents(self, text):
+    if self.unfill:
+      line_splitter = '\n\n'
+      line_joiner = '<p>'
+    else:
+      line_splitter = '\n'
+      line_joiner = '<br>'
+    lines = []
+    for line in text.split(line_splitter):
+      lines.append(self.WHITESPACE_RE.subn('&nbsp;', line)[0])
+    return line_joiner.join(lines)
+
+  def _RemoveUnsupported(self):
+    '''Remove any tags which the kindle cannot handle.'''
+    # TODO(chatham): <link> tags to script?
+    unsupported_tags = ('script', 'style')
+    for tag_type in unsupported_tags:
+      for element in self._soup.findAll(tag_type):
+        element.extract()
+
+  def RenameAnchors(self, prefix):
+    '''Rename every internal anchor to have the given prefix, then
+    return the contents of the body tag.'''
+    for anchor in self._soup.findAll('a', href=re.compile('^#')):
+      anchor['href'] = '#' + prefix + anchor['href'][1:]
+    for a in self._soup.findAll('a'):
+      if a.get('name'):
+        a['name'] = prefix + a['name']
+
+    # TODO(chatham): figure out how to fix this. sometimes body comes out
+    # as NoneType.
+    content = []
+    if self._soup.body is not None:
+      content = [unicode(c) for c in self._soup.body.contents]
+    return '\n'.join(content)
+
+  def CleanHtml(self):
+    # TODO(chatham): fix_html_br, fix_html
+    self._RemoveUnsupported()
+    self._StubInternalAnchors()
+    self._FixPreTags()
+    return self._ReplaceAnchorStubs()
+
+
+if __name__ == '__main__':
+  FILE ='/tmp/documentation.html'
+  #FILE = '/tmp/multipre.html'
+  FILE = '/tmp/view.html'
+  import codecs
+  d = open(FILE).read()
+  h = HtmlProcessor(d)
+  s = h.CleanHtml()
+  #print s
diff --git a/fanficdownloader/mobi.py b/fanficdownloader/mobi.py
new file mode 100644
index 00000000..4facb556
--- /dev/null
+++ b/fanficdownloader/mobi.py
@@ -0,0 +1,344 @@
+#!/usr/bin/python
+# Copyright(c) 2009 Andrew Chatham and Vijay Pandurangan
+
+    
+import StringIO
+import struct
+import time
+import random
+import logging
+
+from html import HtmlProcessor
+
+# http://wiki.mobileread.com/wiki/MOBI
+# http://membres.lycos.fr/microfirst/palm/pdb.html
+
+encoding = {
+  'UTF-8' : 65001,
+  'latin-1' : 1252,
+}
+
+languages = {"en-us" : 0x0409,
+             "sv"    : 0x041d,
+             "fi"    : 0x000b,
+             "en"    : 0x0009,
+             "en-gb" : 0x0809}
+
+def ToHex(s):
+  v = ['%.2x' % ord(c) for c in s]
+  return ' '.join(v)
+
+class _SubEntry:
+  def __init__(self, pos, html_data):
+    self.pos = pos
+    self.html = HtmlProcessor(html_data)
+    self.title = self.html.title
+    self._name = 'mobi_article_%d' % pos
+    if not self.title:
+      self.title = 'Article %d' % self.pos
+
+  def TocLink(self):
+    return '<a href="#%s_MOBI_START">%.80s</a>' % (self._name, self.title)
+  
+  def Anchor(self):
+    return '<a name="%s_MOBI_START">' % self._name
+
+  def Body(self):
+    return self.html.RenameAnchors(self._name + '_')
+
+class Converter:
+  def __init__(self, refresh_url=''):
+    self._header = Header()
+    self._refresh_url = refresh_url
+
+  def ConvertString(self, s):
+    out = StringIO.StringIO()
+    self._ConvertStringToFile(s, out)
+    return out.getvalue()
+
+  def ConvertStrings(self, html_strs):
+    out = StringIO.StringIO()
+    self._ConvertStringsToFile(html_strs, out)
+    return out.getvalue()
+
+  def ConvertFile(self, html_file, out_file):
+    self._ConvertStringToFile(open(html_file).read(),
+                              open(out_file, 'w'))
+
+  def ConvertFiles(self, html_files, out_file):
+    html_strs = [open(f).read() for f in html_files]
+    self._ConvertStringsToFile(html_strs, open(out_file, 'w'))
+
+  def MakeOneHTML(self, html_strs):
+    """This takes a list of HTML strings and returns a big HTML file with
+    all contents consolidated.  It constructs a table of contents and adds
+    anchors within the text
+    """
+    toc_html = []
+    if self._refresh_url:
+      toc_html.append('<a href="%s">Update Reading List</a><br>' %
+                      self._refresh_url)
+    body_html = []
+    titles = []
+
+    PAGE_BREAK = '<mdb;pagebreak>'
+    for pos, html in enumerate(html_strs):
+      entry = _SubEntry(pos+1, html)
+      titles.append(entry.title[:10])
+      toc_html.append('%s<br>' % entry.TocLink())
+
+      # give some space between bodies of work.
+      body_html.append(PAGE_BREAK)
+      body_html.append(entry.Anchor())
+      
+      body_html.append('<h1>%s</h1>' % entry.title)
+      body_html.append(entry.Body())
+      
+    # TODO: this title can get way too long with RSS feeds. Not sure how to fix
+    header = '<html><title>Bibliorize %s GMT</title><body>' % time.ctime(
+      time.time())
+
+    footer = '</body></html>'
+    all_html = header + '\n'.join(toc_html + body_html) + footer
+    return all_html
+
+  def _ConvertStringsToFile(self, html_strs, out_file):
+    try:
+      tmp = self.MakeOneHTML(html_strs)
+      self._ConvertStringToFile(tmp, out_file)
+    except Exception, e:
+      logging.error('Error %s', e)
+      logging.debug('Details: %s' % html_strs)
+
+  def _ConvertStringToFile(self, html_data, out):
+    html = HtmlProcessor(html_data)
+    data = html.CleanHtml()
+    records = []
+    title = html.title
+    if title:
+      self._header.SetTitle(title)
+    record_id = 1
+    for start_pos in range(0, len(data), Record.MAX_SIZE):
+      end = min(len(data), start_pos + Record.MAX_SIZE)
+      record_data = data[start_pos:end]
+      records.append(self._header.AddRecord(record_data, record_id))
+      record_id += 1
+    self._header.SetImageRecordIndex(record_id)
+    records[0:0] = [self._header.MobiHeader()]
+
+    header, rec_offset = self._header.PDBHeader(len(records))
+    out.write(header)
+    for record in records:
+      record.WriteHeader(out, rec_offset)
+      rec_offset += len(record.data)
+
+    # Write to nuls for some reason
+    out.write('\0\0')
+    for record in records:
+      record.WriteData(out)
+
+class Record:
+  MAX_SIZE = 4096
+  INDEX_LEN = 8
+  _unique_id_seed = 28  # should be arbitrary, but taken from MobiHeader
+
+  # TODO(chatham): Record compression doesn't look that hard.
+
+  def __init__(self, data, record_id):
+    assert len(data) <= self.MAX_SIZE
+    self.data = data
+    if record_id != 0:
+      self._id = record_id
+    else:
+      Record._unique_id_seed += 1
+      self._id = 0
+
+  def __repr__(self):
+    return 'Record: id=%d len=%d' % (self._id, len(self.data))
+
+  def _SetUniqueId(self):
+    Record._unique_id_seed += 1
+    # TODO(chatham): Wraparound crap
+    self._id = Record._unique_id_seed
+
+  def WriteData(self, out):
+    out.write(self.data)
+
+  def WriteHeader(self, out, rec_offset):
+    attributes =  64 # dirty?
+    header = struct.pack('>IbbH',
+                         rec_offset,
+                         attributes,
+                         0, self._id)
+    assert len(header) == Record.INDEX_LEN
+    out.write(header)
+
+EXTH_HEADER_FIELDS = {
+  'author' : 100,
+  'publisher' : 101,
+}
+
+class Header:
+  EPOCH_1904 = 2082844800
+
+  def __init__(self):
+    self._length = 0
+    self._record_count = 0
+    self._title = '2008_2_34'
+    self._author = 'Unknown author'
+    self._publisher = 'Unknown publisher'
+    self._first_image_index = 0
+
+  def SetAuthor(self, author):
+    self._author = author
+
+  def SetTitle(self, title):
+    # TODO(chatham): Reevaluate whether this needs to be ASCII.
+    # maybe just do sys.setdefaultencoding('utf-8')? Problems
+    # appending self._title with other things.
+    self._title = title.encode('ascii')
+
+  def SetPublisher(self, publisher):
+    self._publisher = publisher
+
+  def AddRecord(self, data, record_id):
+    self.max_record_size = max(Record.MAX_SIZE, len(data))
+    self._record_count += 1
+    self._length += len(data)
+    return Record(data, record_id)
+
+  def _ReplaceWord(self, data, pos, word):
+    return data[:pos] + struct.pack('>I', word) + data[pos+4:]
+
+  def PalmDocHeader(self):
+    compression = 1  # no compression
+    unused = 0
+    encryption_type = 0  # no ecryption
+    records = self._record_count + 1  # the header record itself
+    palmdoc_header = struct.pack('>HHIHHHH',
+                                 compression,
+                                 unused,
+                                 self._length,
+                                 records,
+                                 Record.MAX_SIZE,
+                                 encryption_type,
+                                 unused)
+    assert len(palmdoc_header) == 16
+    return palmdoc_header
+
+  def PDBHeader(self, num_records):
+    HEADER_LEN = 32+2+2+9*4
+    RECORD_INDEX_HEADER_LEN = 6
+    RESOURCE_INDEX_LEN = 10
+
+    index_len = RECORD_INDEX_HEADER_LEN + num_records * Record.INDEX_LEN
+    rec_offset = HEADER_LEN + index_len + 2
+
+    short_title = self._title[0:31]
+    attributes = 0
+    version = 0
+    ctime = self.EPOCH_1904 + int(time.time())
+    mtime = self.EPOCH_1904 + int(time.time())
+    backup_time = self.EPOCH_1904 + int(time.time())
+    modnum = 0
+    appinfo_offset = 0
+    sort_offset = 0
+    type = 'BOOK'
+    creator = 'MOBI'
+    id_seed = 36
+    header = struct.pack('>32sHHII',
+                         short_title, attributes, version,
+                         ctime, mtime)
+    header += struct.pack('>IIII', backup_time, modnum,
+                         appinfo_offset, sort_offset)
+    header += struct.pack('>4s4sI',
+                         type, creator, id_seed)
+    next_record = 0  # not used?
+    header += struct.pack('>IH', next_record, num_records)
+    return header, rec_offset
+
+  def _GetExthHeader(self):
+    # They set author, publisher, coveroffset, thumboffset
+    data = {'author' : self._author,
+            'publisher' : self._publisher,
+            }
+    # Turn string type names into EXTH typeids.
+    r = []
+    for key, value in data.items():
+      typeid = EXTH_HEADER_FIELDS[key]
+      length_encoding_len = 8
+      r.append(struct.pack('>LL', typeid, len(value) + length_encoding_len,) + value)
+    content = ''.join(r)
+
+    # Pad to word boundary
+    while len(content) % 4:
+      content += '\0'
+    TODO_mysterious = 12
+    exth = 'EXTH' + struct.pack('>LL', len(content) + TODO_mysterious, len(data)) + content
+    return exth
+
+  def SetImageRecordIndex(self, idx):
+    self._first_image_index = idx
+
+  def MobiHeader(self):
+    exth_header = self._GetExthHeader();
+    palmdoc_header = self.PalmDocHeader()
+
+    fs = 0xffffffff
+
+    # Record 0
+    header_len = 0xE4 # TODO
+    mobi_type = 2 # BOOK
+    text_encoding = encoding['UTF-8']
+    unique_id = random.randint(1, 1<<32)
+    creator_version = 4
+    reserved = '%c' % 0xff * 40
+    nonbook_index = fs
+    full_name_offset = header_len + len(palmdoc_header) + len(exth_header) # put full name after header
+    language = languages['en-us']
+    unused = 0
+    mobi_header = struct.pack('>4sIIIII40sIIIIII',
+                              'MOBI',
+                              header_len,
+                              mobi_type,
+                              text_encoding,
+                              unique_id,
+                              creator_version,
+                              reserved,
+                              nonbook_index,
+                              full_name_offset,
+                              len(self._title),
+                              language,
+                              fs, fs)
+    assert len(mobi_header) == 104 - 16
+
+    unknown_fields = chr(0) * 32
+    drm_offset = 0
+    drm_count = 0
+    drm_size = 0
+    drm_flags = 0
+    exth_flags = 0x50
+    header_end = chr(0) * 64
+    mobi_header += struct.pack('>IIIIIII',
+                               creator_version,
+                               self._first_image_index,
+                               fs,
+                               unused,
+                               fs,
+                               unused,
+                               exth_flags)
+    mobi_header += '\0' * 112 # TODO: Why this much padding?
+    # Set some magic offsets to be 0xFFFFFFF.
+    for pos in (0x94, 0x98, 0xb0, 0xb8, 0xc0, 0xc8, 0xd0, 0xd8, 0xdc):
+      mobi_header = self._ReplaceWord(mobi_header, pos, fs)
+
+    # 16 bytes?
+    padding = '\0' * 48 * 4 # why?
+    total_header = palmdoc_header + mobi_header + exth_header + self._title + padding
+
+    return self.AddRecord(total_header, 0)
+
+if __name__ == '__main__':
+  import sys
+  m = Converter()
+  m.ConvertFiles(sys.argv[1:], '/tmp/test.mobi')
\ No newline at end of file
diff --git a/fanficdownloader/output.py b/fanficdownloader/output.py
index ff5daa51..10fb6198 100644
--- a/fanficdownloader/output.py
+++ b/fanficdownloader/output.py
@@ -21,6 +21,7 @@ import urlparse as up
 import BeautifulSoup as bs
 import htmlentitydefs as hdefs
 
+import mobi
 import zipdir
 import html_constants
 from constants import *
@@ -81,6 +82,68 @@ class TextWriter(FanficWriter):
 			self.output.close()
 		
 
+class MobiWriter(FanficWriter):
+	"""Writer that collects chapters as XHTML and emits them as one .mobi file."""
+	body = ''  # XHTML accumulated by writeChapter()
+
+	@staticmethod
+	def getFormatName():
+		return 'mobi'
+
+	@staticmethod
+	def getFormatExt():
+		return '.mobi'
+
+	def __init__(self, base, adapter, inmemory=False, compress=False):
+		"""Open the output: a StringIO when inmemory, else base/<name>.mobi."""
+		self.basePath = base
+		self.storyTitle = removeEntities(adapter.getStoryName())
+		self.name = makeAcceptableFilename(adapter.getOutputName())
+		self.fileName = self.basePath + '/' + self.name + self.getFormatExt()
+		self.authorName = removeEntities(adapter.getAuthorName())
+		self.adapter = adapter
+		self.mobi = mobi
+		self.inmemory = inmemory
+
+		if self.inmemory:
+			self.output = StringIO.StringIO()
+		else:
+			if os.path.exists(self.fileName):
+				os.remove(self.fileName)
+			# Binary mode: text mode would corrupt the MOBI bytes on Windows.
+			self.output = open(self.fileName, 'wb')
+
+		self.xhtmlTemplate = string.Template(html_constants.XHTML_START)
+		self.chapterStartTemplate = string.Template(html_constants.XHTML_CHAPTER_START)
+
+	def _printableVersion(self, text):
+		"""Return text decoded from UTF-8, or text unchanged if decoding fails."""
+		try:
+			return text.decode('utf-8')
+		except Exception:  # best effort, but no longer swallows KeyboardInterrupt/SystemExit
+			return text
+
+	def writeChapter(self, index, title, text):
+		"""Append a chapter heading and its text to the pending body (index is unused)."""
+		title = self._printableVersion(title)
+		text = self._printableVersion(text)
+		self.body = self.body + '\n' + self.chapterStartTemplate.substitute({'chapter' : title})
+		self.body = self.body + '\n' + text
+
+	def finalise(self):
+		"""Render the collected body, convert it to MOBI and write it to the output."""
+		html = self.xhtmlTemplate.substitute({'title' : self.storyTitle, 'author' : self.authorName, 'body' : self.body})
+		soup = bs.BeautifulSoup(html)
+		result = soup.__str__('utf8')
+		try:
+			mobidata = mobi.Converter().ConvertString(result)
+			self.output.write(mobidata)
+		finally:
+			# Close the file even when conversion fails; in-memory output stays open.
+			if not self.inmemory:
+				self.output.close()
+
+
 class HTMLWriter(FanficWriter):
 	body = ''
 	
@@ -92,14 +155,14 @@ class HTMLWriter(FanficWriter):
 	def getFormatExt():
 		return '.html'
 	
-	def __init__(self, base, adapter, inmemory=False, compress=False):
+	def __init__(self, base, adapter, inmemory=False, compress=False, mobi = False):
 		self.basePath = base
 		self.storyTitle = removeEntities(adapter.getStoryName())
 		self.name = makeAcceptableFilename(adapter.getOutputName())
 		self.fileName = self.basePath + '/' + self.name + self.getFormatExt()
 		self.authorName = removeEntities(adapter.getAuthorName())
 		self.adapter = adapter
-		
+		self.mobi = mobi
 		self.inmemory = inmemory
 
 		if not self.inmemory and os.path.exists(self.fileName):

From f3571959df98fdb237e192863d1b256bca00d0b6 Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Tue, 23 Nov 2010 12:42:33 -0600
Subject: [PATCH 82/94] Change a couple of the example story URLs.

---
 app.yaml                                      |   31 +
 cron.yaml                                     |    4 +
 css/index.css                                 |   71 +
 delete_fic.py                                 |   59 +
 fanficdownloader/BeautifulSoup.py             | 2014 ++++++++
 fanficdownloader/__init__.py                  |    1 +
 fanficdownloader/adapter.py                   |  229 +
 fanficdownloader/books/place holder.txt       |    0
 fanficdownloader/constants.py                 |  542 ++
 fanficdownloader/downloader.py                |  205 +
 fanficdownloader/ffnet.py                     |  358 ++
 fanficdownloader/fictionalley.py              |  301 ++
 fanficdownloader/ficwad.py                    |  267 +
 fanficdownloader/fpcom.py                     |  344 ++
 fanficdownloader/hpfiction.py                 |  280 ++
 fanficdownloader/html2text.py                 |  452 ++
 fanficdownloader/html_constants.py            |   19 +
 fanficdownloader/mediaminer.py                |  406 ++
 fanficdownloader/output.py                    |  424 ++
 fanficdownloader/potionsNsnitches.py          |  367 ++
 fanficdownloader/readme.txt                   |   10 +
 fanficdownloader/twilighted.py                |  316 ++
 fanficdownloader/twipassword.py               |    4 +
 fanficdownloader/zipdir.py                    |  177 +
 ffstorage.py                                  |   21 +
 index-ajax.html                               |  109 +
 index.html                                    |  204 +
 index.yaml                                    |   22 +
 js/fdownloader.js                             |  116 +
 js/jquery-1.3.2.js                            | 4376 +++++++++++++++++
 main.py                                       |  316 ++
 queue.yaml                                    |    5 +
 recent.html                                   |   69 +
 simplejson/__init__.py                        |  318 ++
 simplejson/__init__.pyc                       |  Bin 0 -> 12071 bytes
 simplejson/_speedups.c                        | 2329 +++++++++
 simplejson/decoder.py                         |  354 ++
 simplejson/decoder.pyc                        |  Bin 0 -> 11292 bytes
 simplejson/encoder.py                         |  440 ++
 simplejson/encoder.pyc                        |  Bin 0 -> 13938 bytes
 simplejson/scanner.py                         |   65 +
 simplejson/scanner.pyc                        |  Bin 0 -> 2340 bytes
 simplejson/tests/__init__.py                  |   23 +
 simplejson/tests/test_check_circular.py       |   30 +
 simplejson/tests/test_decode.py               |   22 +
 simplejson/tests/test_default.py              |    9 +
 simplejson/tests/test_dump.py                 |   21 +
 .../tests/test_encode_basestring_ascii.py     |   38 +
 simplejson/tests/test_fail.py                 |   76 +
 simplejson/tests/test_float.py                |   15 +
 simplejson/tests/test_indent.py               |   41 +
 simplejson/tests/test_pass1.py                |   76 +
 simplejson/tests/test_pass2.py                |   14 +
 simplejson/tests/test_pass3.py                |   20 +
 simplejson/tests/test_recursion.py            |   67 +
 simplejson/tests/test_scanstring.py           |  111 +
 simplejson/tests/test_separators.py           |   42 +
 simplejson/tests/test_unicode.py              |   64 +
 simplejson/tool.py                            |   37 +
 static/ajax-loader.gif                        |  Bin 0 -> 10819 bytes
 static/favicon.ico                            |  Bin 0 -> 21792 bytes
 utils/remover.py                              |   53 +
 62 files changed, 16384 insertions(+)
 create mode 100644 app.yaml
 create mode 100644 cron.yaml
 create mode 100644 css/index.css
 create mode 100644 delete_fic.py
 create mode 100644 fanficdownloader/BeautifulSoup.py
 create mode 100644 fanficdownloader/__init__.py
 create mode 100644 fanficdownloader/adapter.py
 create mode 100644 fanficdownloader/books/place holder.txt
 create mode 100644 fanficdownloader/constants.py
 create mode 100644 fanficdownloader/downloader.py
 create mode 100644 fanficdownloader/ffnet.py
 create mode 100644 fanficdownloader/fictionalley.py
 create mode 100644 fanficdownloader/ficwad.py
 create mode 100644 fanficdownloader/fpcom.py
 create mode 100644 fanficdownloader/hpfiction.py
 create mode 100644 fanficdownloader/html2text.py
 create mode 100644 fanficdownloader/html_constants.py
 create mode 100644 fanficdownloader/mediaminer.py
 create mode 100644 fanficdownloader/output.py
 create mode 100644 fanficdownloader/potionsNsnitches.py
 create mode 100644 fanficdownloader/readme.txt
 create mode 100644 fanficdownloader/twilighted.py
 create mode 100644 fanficdownloader/twipassword.py
 create mode 100644 fanficdownloader/zipdir.py
 create mode 100644 ffstorage.py
 create mode 100644 index-ajax.html
 create mode 100644 index.html
 create mode 100644 index.yaml
 create mode 100644 js/fdownloader.js
 create mode 100644 js/jquery-1.3.2.js
 create mode 100644 main.py
 create mode 100644 queue.yaml
 create mode 100644 recent.html
 create mode 100644 simplejson/__init__.py
 create mode 100644 simplejson/__init__.pyc
 create mode 100644 simplejson/_speedups.c
 create mode 100644 simplejson/decoder.py
 create mode 100644 simplejson/decoder.pyc
 create mode 100644 simplejson/encoder.py
 create mode 100644 simplejson/encoder.pyc
 create mode 100644 simplejson/scanner.py
 create mode 100644 simplejson/scanner.pyc
 create mode 100644 simplejson/tests/__init__.py
 create mode 100644 simplejson/tests/test_check_circular.py
 create mode 100644 simplejson/tests/test_decode.py
 create mode 100644 simplejson/tests/test_default.py
 create mode 100644 simplejson/tests/test_dump.py
 create mode 100644 simplejson/tests/test_encode_basestring_ascii.py
 create mode 100644 simplejson/tests/test_fail.py
 create mode 100644 simplejson/tests/test_float.py
 create mode 100644 simplejson/tests/test_indent.py
 create mode 100644 simplejson/tests/test_pass1.py
 create mode 100644 simplejson/tests/test_pass2.py
 create mode 100644 simplejson/tests/test_pass3.py
 create mode 100644 simplejson/tests/test_recursion.py
 create mode 100644 simplejson/tests/test_scanstring.py
 create mode 100644 simplejson/tests/test_separators.py
 create mode 100644 simplejson/tests/test_unicode.py
 create mode 100644 simplejson/tool.py
 create mode 100644 static/ajax-loader.gif
 create mode 100644 static/favicon.ico
 create mode 100644 utils/remover.py

diff --git a/app.yaml b/app.yaml
new file mode 100644
index 00000000..6f1ccdc8
--- /dev/null
+++ b/app.yaml
@@ -0,0 +1,31 @@
+application: fanfictionloader
+version: 2-5-5
+runtime: python
+api_version: 1
+
+handlers:
+- url: /generate_mock_data
+  script: mocks/generate_mock_data.py
+  login: admin
+
+- url: /r3m0v3r
+  script: utils/remover.py
+  login: admin
+
+- url: /r3m0v3r  # NOTE(review): same pattern as the utils/remover.py handler above; presumably never reached -- confirm the intended URL
+  script: main.py
+  login: admin
+  
+- url: /css
+  static_dir: css
+
+- url: /js
+  static_dir: js
+
+- url: /static
+  static_dir: static
+
+
+- url: /.*
+  script: main.py
+ 
diff --git a/cron.yaml b/cron.yaml
new file mode 100644
index 00000000..1d9c70a0
--- /dev/null
+++ b/cron.yaml
@@ -0,0 +1,4 @@
+cron:
+- description: cleanup job
+  url: /r3m0v3r
+  schedule: every 3 hours
\ No newline at end of file
diff --git a/css/index.css b/css/index.css
new file mode 100644
index 00000000..f4aec452
--- /dev/null
+++ b/css/index.css
@@ -0,0 +1,71 @@
+body
+{
+	font: 0.9em "Helvetica Neue", Arial, Helvetica, Geneva, sans-serif;
+}
+
+#main
+{
+	width: 43%;
+	margin-left: 23%;
+	background-color: #dae6ff;
+	padding: 2em;
+}
+
+#greeting
+{
+	margin-bottom: 1em;
+	border-color: #efefef;
+}
+
+
+
+#logpassword:hover, #logpasswordtable:hover, #urlbox:hover, #typebox:hover, #helpbox:hover, #yourfile:hover
+{
+	border: thin solid #fffeff;	
+}
+
+h1
+{
+	text-decoration: none;
+}
+
+#logpasswordtable
+{
+	padding: 1em;
+}
+
+#logpassword, #logpasswordtable {
+  display: none;
+}
+
+#urlbox, #typebox, #logpasswordtable, #logpassword, #helpbox, #yourfile
+{
+	margin: 1em;
+	padding: 1em;
+	border: thin dotted #fffeff;	
+}
+
+div.field
+{
+	margin-bottom: 0.5em;
+}
+
+#submitbtn
+{
+	padding: 1em;
+}
+
+#typelabel
+{
+}
+
+#typeoptions
+{
+	margin-top: 0.5em;
+}
+
+#error
+{
+	font-size: small;
+	color: #f00;
+}
\ No newline at end of file
diff --git a/delete_fic.py b/delete_fic.py
new file mode 100644
index 00000000..73722724
--- /dev/null
+++ b/delete_fic.py
@@ -0,0 +1,59 @@
+import os
+import cgi
+import sys
+import logging
+import traceback
+import StringIO
+
+from google.appengine.api import users
+from google.appengine.ext import db
+from google.appengine.ext import webapp
+from google.appengine.ext.webapp import template
+from google.appengine.ext.webapp import util
+
+# Project modules; the star imports stay in their original relative order.
+from fanficdownloader.downloader import *
+from fanficdownloader.ffnet import *
+from fanficdownloader.output import *
+from fanficdownloader.zipdir import *
+
+from ffstorage import *
+
+def create_mac(user, fic_id, fic_url):  # token: |hash(user)+hash(fic_id)| followed by |hash(fic_url)|, both in decimal
+  return '%s%s' % (abs(hash(user) + hash(fic_id)), abs(hash(fic_url)))
+  
+def check_mac(user, fic_id, fic_url, mac):  # True when mac equals the token create_mac() builds from the same values
+  return mac == create_mac(user, fic_id, fic_url)
+
+def create_mac_for_fic(user, fic_id):
+  """Return the MAC of the stored fic whose key string is fic_id, or None if it is missing or not owned by user."""
+  key = db.Key(fic_id)
+  fanfic = db.get(key)
+  if fanfic is None or fanfic.user != user:
+    return None
+  return create_mac(user, key, fanfic.url)
+
+class DeleteFicHandler(webapp.RequestHandler):
+	"""Deletes one of the signed-in user's stored fics on request."""
+	def get(self):
+		"""Delete the fic named by ``fic_id`` when ``key_id`` matches its MAC."""
+		# NOTE(review): a state-changing GET is CSRF-prone; consider POST.
+		user = users.get_current_user()
+		if not user:
+			self.redirect('/login')
+			return  # the old code fell through and carried on with user=None
+		fic_id = self.request.get('fic_id')
+		fic_mac = self.request.get('key_id')
+		# None (never equal to a request string) unless `user` owns the fic.
+		actual_mac = create_mac_for_fic(user, fic_id)
+		if actual_mac == fic_mac:
+			db.get(db.Key(fic_id)).delete()
+			self.redirect('/recent')
+			return  # nothing left to render once we have redirected
+		self.response.out.write("Ooops")
+		# On a MAC mismatch still list the user's stored fics, as before.
+		fics = db.GqlQuery("Select * From DownloadedFanfic WHERE user = :1", user)
+		template_values = dict(fics = fics, nickname = user.nickname())
+		path = os.path.join(os.path.dirname(__file__), 'recent.html')
+		self.response.out.write(template.render(path, template_values))
+	
\ No newline at end of file
diff --git a/fanficdownloader/BeautifulSoup.py b/fanficdownloader/BeautifulSoup.py
new file mode 100644
index 00000000..31ff0e5f
--- /dev/null
+++ b/fanficdownloader/BeautifulSoup.py
@@ -0,0 +1,2014 @@
+# -*- coding: utf-8 -*-
+
+"""Beautiful Soup
+Elixir and Tonic
+"The Screen-Scraper's Friend"
+http://www.crummy.com/software/BeautifulSoup/
+
+Beautiful Soup parses a (possibly invalid) XML or HTML document into a
+tree representation. It provides methods and Pythonic idioms that make
+it easy to navigate, search, and modify the tree.
+
+A well-formed XML/HTML document yields a well-formed data
+structure. An ill-formed XML/HTML document yields a correspondingly
+ill-formed data structure. If your document is only locally
+well-formed, you can use this library to find and process the
+well-formed part of it.
+
+Beautiful Soup works with Python 2.2 and up. It has no external
+dependencies, but you'll have more success at converting data to UTF-8
+if you also install these three packages:
+
+* chardet, for auto-detecting character encodings
+  http://chardet.feedparser.org/
+* cjkcodecs and iconv_codec, which add more encodings to the ones supported
+  by stock Python.
+  http://cjkpython.i18n.org/
+
+Beautiful Soup defines classes for two main parsing strategies:
+
+ * BeautifulStoneSoup, for parsing XML, SGML, or your domain-specific
+   language that kind of looks like XML.
+
+ * BeautifulSoup, for parsing run-of-the-mill HTML code, be it valid
+   or invalid. This class has web browser-like heuristics for
+   obtaining a sensible parse tree in the face of common HTML errors.
+
+Beautiful Soup also defines a class (UnicodeDammit) for autodetecting
+the encoding of an HTML or XML document, and converting it to
+Unicode. Much of this code is taken from Mark Pilgrim's Universal Feed Parser.
+
+For more than you ever wanted to know about Beautiful Soup, see the
+documentation:
+http://www.crummy.com/software/BeautifulSoup/documentation.html
+
+Here, have some legalese:
+
+Copyright (c) 2004-2010, Leonard Richardson
+
+All rights reserved.
+
+Redistribution and use in source and binary forms, with or without
+modification, are permitted provided that the following conditions are
+met:
+
+  * Redistributions of source code must retain the above copyright
+    notice, this list of conditions and the following disclaimer.
+
+  * Redistributions in binary form must reproduce the above
+    copyright notice, this list of conditions and the following
+    disclaimer in the documentation and/or other materials provided
+    with the distribution.
+
+  * Neither the name of the the Beautiful Soup Consortium and All
+    Night Kosher Bakery nor the names of its contributors may be
+    used to endorse or promote products derived from this software
+    without specific prior written permission.
+
+THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS
+"AS IS" AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT
+LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR
+A PARTICULAR PURPOSE ARE DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT OWNER OR
+CONTRIBUTORS BE LIABLE FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL,
+EXEMPLARY, OR CONSEQUENTIAL DAMAGES (INCLUDING, BUT NOT LIMITED TO,
+PROCUREMENT OF SUBSTITUTE GOODS OR SERVICES; LOSS OF USE, DATA, OR
+PROFITS; OR BUSINESS INTERRUPTION) HOWEVER CAUSED AND ON ANY THEORY OF
+LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY, OR TORT (INCLUDING
+NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE OF THIS
+SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE, DAMMIT.
+
+"""
+from __future__ import generators
+
+__author__ = "Leonard Richardson (leonardr@segfault.org)"
+__version__ = "3.0.8.1"
+__copyright__ = "Copyright (c) 2004-2010 Leonard Richardson"
+__license__ = "New-style BSD"
+
+from sgmllib import SGMLParser, SGMLParseError
+import codecs
+import markupbase
+import types
+import re
+import sgmllib
+try:
+  from htmlentitydefs import name2codepoint
+except ImportError:
+  name2codepoint = {}
+try:
+    set
+except NameError:
+    from sets import Set as set
+
+#These hacks make Beautiful Soup able to parse XML with namespaces
+sgmllib.tagfind = re.compile('[a-zA-Z][-_.:a-zA-Z0-9]*')
+markupbase._declname_match = re.compile(r'[a-zA-Z][-_.:a-zA-Z0-9]*\s*').match
+
+DEFAULT_OUTPUT_ENCODING = "utf-8"
+
+def _match_css_class(str):
+    """Build a RE to match the given CSS class."""
+    return re.compile(r"(^|.*\s)%s($|\s)" % str)
+
+# First, the classes that represent markup elements.
+
+class PageElement(object):
+    """Contains the navigational information for some part of the page
+    (either a tag or a piece of text)"""
+
+    def setup(self, parent=None, previous=None):
+        """Sets up the initial relations between this element and
+        other elements."""
+        self.parent = parent
+        self.previous = previous
+        self.next = None
+        self.previousSibling = None
+        self.nextSibling = None
+        if self.parent and self.parent.contents:
+            self.previousSibling = self.parent.contents[-1]
+            self.previousSibling.nextSibling = self
+
+    def replaceWith(self, replaceWith):
+        """Puts replaceWith (an element or a string) where this element is."""
+        oldParent = self.parent
+        myIndex = self.parent.index(self)
+        if hasattr(replaceWith, "parent")\
+                  and replaceWith.parent is self.parent:
+            # We're replacing this element with one of its siblings.
+            index = replaceWith.parent.index(replaceWith)
+            if index < myIndex:
+                # It comes before this element (index 0 included), so
+                # insert() extracting it shifts our slot down by one.
+                myIndex = myIndex - 1
+        self.extract()
+        oldParent.insert(myIndex, replaceWith)
+
+    def replaceWithChildren(self):
+        myParent = self.parent
+        myIndex = self.parent.index(self)
+        self.extract()
+        reversedChildren = list(self.contents)
+        reversedChildren.reverse()
+        for child in reversedChildren:
+            myParent.insert(myIndex, child)
+
+    def extract(self):
+        """Destructively rips this element out of the tree."""
+        if self.parent:
+            try:
+                del self.parent.contents[self.parent.index(self)]
+            except ValueError:
+                pass
+
+        #Find the two elements that would be next to each other if
+        #this element (and any children) hadn't been parsed. Connect
+        #the two.
+        lastChild = self._lastRecursiveChild()
+        nextElement = lastChild.next
+
+        if self.previous:
+            self.previous.next = nextElement
+        if nextElement:
+            nextElement.previous = self.previous
+        self.previous = None
+        lastChild.next = None
+
+        self.parent = None
+        if self.previousSibling:
+            self.previousSibling.nextSibling = self.nextSibling
+        if self.nextSibling:
+            self.nextSibling.previousSibling = self.previousSibling
+        self.previousSibling = self.nextSibling = None
+        return self
+
+    def _lastRecursiveChild(self):
+        "Finds the last element beneath this object to be parsed."
+        lastChild = self
+        while hasattr(lastChild, 'contents') and lastChild.contents:
+            lastChild = lastChild.contents[-1]
+        return lastChild
+
+    def insert(self, position, newChild):
+        """Inserts newChild (an element or a plain string) into this
+        object's contents and relinks the surrounding elements. An
+        element that already has a parent is extracted first;
+        position then counts slots in the contents that remain."""
+        if isinstance(newChild, basestring) \
+            and not isinstance(newChild, NavigableString):
+            newChild = NavigableString(newChild)
+
+        if hasattr(newChild, 'parent') and newChild.parent is not None:
+            # Detach it first. The old code lowered position by one when
+            # a child was moved to an earlier slot, which misplaced it
+            # (or produced -1).
+            newChild.extract()
+        # Clamp only now: extracting one of our own children has just
+        # shortened self.contents, so an earlier clamp could leave
+        # position one past the end and break contents[position-1].
+        position =  min(position, len(self.contents))
+
+        newChild.parent = self
+        previousChild = None
+        if position == 0:
+            newChild.previousSibling = None
+            newChild.previous = self
+        else:
+            previousChild = self.contents[position-1]
+            newChild.previousSibling = previousChild
+            newChild.previousSibling.nextSibling = newChild
+            newChild.previous = previousChild._lastRecursiveChild()
+        if newChild.previous:
+            newChild.previous.next = newChild
+
+        newChildsLastElement = newChild._lastRecursiveChild()
+
+        if position >= len(self.contents):
+            newChild.nextSibling = None
+
+            parent = self
+            parentsNextSibling = None
+            while not parentsNextSibling:
+                parentsNextSibling = parent.nextSibling
+                parent = parent.parent
+                if not parent: # This is the last element in the document.
+                    break
+            if parentsNextSibling:
+                newChildsLastElement.next = parentsNextSibling
+            else:
+                newChildsLastElement.next = None
+        else:
+            nextChild = self.contents[position]
+            newChild.nextSibling = nextChild
+            if newChild.nextSibling:
+                newChild.nextSibling.previousSibling = newChild
+            newChildsLastElement.next = nextChild
+
+        if newChildsLastElement.next:
+            newChildsLastElement.next.previous = newChildsLastElement
+        self.contents.insert(position, newChild)
+
+    def append(self, tag):
+        """Appends the given tag to the contents of this tag."""
+        self.insert(len(self.contents), tag)
+
+    def findNext(self, name=None, attrs={}, text=None, **kwargs):
+        """Returns the first item that matches the given criteria and
+        appears after this Tag in the document."""
+        return self._findOne(self.findAllNext, name, attrs, text, **kwargs)
+
+    def findAllNext(self, name=None, attrs={}, text=None, limit=None,
+                    **kwargs):
+        """Returns all items that match the given criteria and appear
+        after this Tag in the document."""
+        return self._findAll(name, attrs, text, limit, self.nextGenerator,
+                             **kwargs)
+
+    def findNextSibling(self, name=None, attrs={}, text=None, **kwargs):
+        """Returns the closest sibling to this Tag that matches the
+        given criteria and appears after this Tag in the document."""
+        return self._findOne(self.findNextSiblings, name, attrs, text,
+                             **kwargs)
+
+    def findNextSiblings(self, name=None, attrs={}, text=None, limit=None,
+                         **kwargs):
+        """Returns the siblings of this Tag that match the given
+        criteria and appear after this Tag in the document."""
+        return self._findAll(name, attrs, text, limit,
+                             self.nextSiblingGenerator, **kwargs)
+    fetchNextSiblings = findNextSiblings # Compatibility with pre-3.x
+
+    def findPrevious(self, name=None, attrs={}, text=None, **kwargs):
+        """Returns the first item that matches the given criteria and
+        appears before this Tag in the document."""
+        return self._findOne(self.findAllPrevious, name, attrs, text, **kwargs)
+
+    def findAllPrevious(self, name=None, attrs={}, text=None, limit=None,
+                        **kwargs):
+        """Returns all items that match the given criteria and appear
+        before this Tag in the document."""
+        return self._findAll(name, attrs, text, limit, self.previousGenerator,
+                           **kwargs)
+    fetchPrevious = findAllPrevious # Compatibility with pre-3.x
+
+    def findPreviousSibling(self, name=None, attrs={}, text=None, **kwargs):
+        """Returns the closest sibling to this Tag that matches the
+        given criteria and appears before this Tag in the document."""
+        return self._findOne(self.findPreviousSiblings, name, attrs, text,
+                             **kwargs)
+
+    def findPreviousSiblings(self, name=None, attrs={}, text=None,
+                             limit=None, **kwargs):
+        """Returns the siblings of this Tag that match the given
+        criteria and appear before this Tag in the document."""
+        return self._findAll(name, attrs, text, limit,
+                             self.previousSiblingGenerator, **kwargs)
+    fetchPreviousSiblings = findPreviousSiblings # Compatibility with pre-3.x
+
+    def findParent(self, name=None, attrs={}, **kwargs):
+        """Returns the closest parent of this Tag that matches the given
+        criteria. Keyword criteria are forwarded to findParents."""
+        # NOTE: We can't use _findOne because findParents takes a different
+        # set of arguments.
+        r = None
+        l = self.findParents(name, attrs, 1, **kwargs)
+        if l:
+            r = l[0]
+        return r
+
+    def findParents(self, name=None, attrs={}, limit=None, **kwargs):
+        """Returns the parents of this Tag that match the given
+        criteria."""
+
+        return self._findAll(name, attrs, None, limit, self.parentGenerator,
+                             **kwargs)
+    fetchParents = findParents # Compatibility with pre-3.x
+
+    #These methods do the real heavy lifting.
+
+    def _findOne(self, method, name, attrs, text, **kwargs):
+        r = None
+        l = method(name, attrs, text, 1, **kwargs)
+        if l:
+            r = l[0]
+        return r
+
+    def _findAll(self, name, attrs, text, limit, generator, **kwargs):
+        "Iterates over a generator looking for things that match."
+
+        if isinstance(name, SoupStrainer):
+            strainer = name
+        # (Possibly) special case some findAll*(...) searches
+        elif text is None and not limit and not attrs and not kwargs:
+            # findAll*(True)
+            if name is True:
+                return [element for element in generator()
+                        if isinstance(element, Tag)]
+            # findAll*('tag-name')
+            elif isinstance(name, basestring):
+                return [element for element in generator()
+                        if isinstance(element, Tag) and
+                        element.name == name]
+            else:
+                strainer = SoupStrainer(name, attrs, text, **kwargs)
+        # Build a SoupStrainer
+        else:
+            strainer = SoupStrainer(name, attrs, text, **kwargs)
+        results = ResultSet(strainer)
+        g = generator()
+        while True:
+            try:
+                i = g.next()
+            except StopIteration:
+                break
+            if i:
+                found = strainer.search(i)
+                if found:
+                    results.append(found)
+                    if limit and len(results) >= limit:
+                        break
+        return results
+
+    #These Generators can be used to navigate starting from both
+    #NavigableStrings and Tags.
+    def nextGenerator(self):
+        i = self
+        while i is not None:
+            i = i.next
+            yield i
+
+    def nextSiblingGenerator(self):
+        i = self
+        while i is not None:
+            i = i.nextSibling
+            yield i
+
+    def previousGenerator(self):
+        i = self
+        while i is not None:
+            i = i.previous
+            yield i
+
+    def previousSiblingGenerator(self):
+        i = self
+        while i is not None:
+            i = i.previousSibling
+            yield i
+
+    def parentGenerator(self):
+        i = self
+        while i is not None:
+            i = i.parent
+            yield i
+
+    # Utility methods
+    def substituteEncoding(self, str, encoding=None):
+        encoding = encoding or "utf-8"
+        return str.replace("%SOUP-ENCODING%", encoding)
+
+    def toEncoding(self, s, encoding=None):
+        """Encodes an object to a string in some encoding, or to Unicode.
+        ."""
+        if isinstance(s, unicode):
+            if encoding:
+                s = s.encode(encoding)
+        elif isinstance(s, str):
+            if encoding:
+                s = s.encode(encoding)
+            else:
+                s = unicode(s)
+        else:
+            if encoding:
+                s  = self.toEncoding(str(s), encoding)
+            else:
+                s = unicode(s)
+        return s
+
+class NavigableString(unicode, PageElement):
+
+    def __new__(cls, value):
+        """Create a new NavigableString.
+
+        When unpickling a NavigableString, this method is called with
+        the string in DEFAULT_OUTPUT_ENCODING. That encoding needs to be
+        passed in to the superclass's __new__ or the superclass won't know
+        how to handle non-ASCII characters.
+        """
+        if isinstance(value, unicode):
+            return unicode.__new__(cls, value)
+        return unicode.__new__(cls, value, DEFAULT_OUTPUT_ENCODING)
+
+    def __getnewargs__(self):
+        return (NavigableString.__str__(self),)
+
+    def __getattr__(self, attr):
+        """text.string gives you text. This is for backwards
+        compatibility for Navigable*String, but for CData* it lets you
+        get the string without the CData wrapper."""
+        if attr == 'string':
+            return self
+        else:
+            raise AttributeError, "'%s' object has no attribute '%s'" % (self.__class__.__name__, attr)
+
+    def __unicode__(self):
+        return str(self).decode(DEFAULT_OUTPUT_ENCODING)
+
+    def __str__(self, encoding=DEFAULT_OUTPUT_ENCODING):
+        if encoding:
+            return self.encode(encoding)
+        else:
+            return self
+
+class CData(NavigableString):
+
+    def __str__(self, encoding=DEFAULT_OUTPUT_ENCODING):
+        return "<![CDATA[%s]]>" % NavigableString.__str__(self, encoding)
+
+class ProcessingInstruction(NavigableString):
+    def __str__(self, encoding=DEFAULT_OUTPUT_ENCODING):
+        output = self
+        if "%SOUP-ENCODING%" in output:
+            output = self.substituteEncoding(output, encoding)
+        return "<?%s?>" % self.toEncoding(output, encoding)
+
+class Comment(NavigableString):
+    def __str__(self, encoding=DEFAULT_OUTPUT_ENCODING):
+        return "<!--%s-->" % NavigableString.__str__(self, encoding)
+
+class Declaration(NavigableString):
+    def __str__(self, encoding=DEFAULT_OUTPUT_ENCODING):
+        return "<!%s>" % NavigableString.__str__(self, encoding)
+
+class Tag(PageElement):
+
+    """Represents a found HTML tag with its attributes and contents."""
+
+    def _invert(h):
+        "Cheap function to invert a hash."
+        i = {}
+        for k,v in h.items():
+            i[v] = k
+        return i
+
+    XML_ENTITIES_TO_SPECIAL_CHARS = { "apos" : "'",
+                                      "quot" : '"',
+                                      "amp" : "&",
+                                      "lt" : "<",
+                                      "gt" : ">" }
+
+    XML_SPECIAL_CHARS_TO_ENTITIES = _invert(XML_ENTITIES_TO_SPECIAL_CHARS)
+
+    def _convertEntities(self, match):
+        """Used in a call to re.sub to replace HTML, XML, and numeric
+        entities with the appropriate Unicode characters. If HTML
+        entities are being converted, any unrecognized entities are
+        escaped."""
+        x = match.group(1)
+        if self.convertHTMLEntities and x in name2codepoint:
+            return unichr(name2codepoint[x])
+        elif x in self.XML_ENTITIES_TO_SPECIAL_CHARS:
+            if self.convertXMLEntities:
+                return self.XML_ENTITIES_TO_SPECIAL_CHARS[x]
+            else:
+                return u'&%s;' % x
+        elif len(x) > 0 and x[0] == '#':
+            # Handle numeric entities
+            if len(x) > 1 and x[1] == 'x':
+                return unichr(int(x[2:], 16))
+            else:
+                return unichr(int(x[1:]))
+
+        elif self.escapeUnrecognizedEntities:
+            return u'&amp;%s;' % x
+        else:
+            return u'&%s;' % x
+
+    def __init__(self, parser, name, attrs=None, parent=None,
+                 previous=None):
+        "Basic constructor."
+
+        # We don't actually store the parser object: that lets extracted
+        # chunks be garbage-collected
+        self.parserClass = parser.__class__
+        self.isSelfClosing = parser.isSelfClosingTag(name)
+        self.name = name
+        if attrs is None:
+            attrs = []
+        self.attrs = attrs
+        self.contents = []
+        self.setup(parent, previous)
+        self.hidden = False
+        self.containsSubstitutions = False
+        self.convertHTMLEntities = parser.convertHTMLEntities
+        self.convertXMLEntities = parser.convertXMLEntities
+        self.escapeUnrecognizedEntities = parser.escapeUnrecognizedEntities
+
+        # Convert any HTML, XML, or numeric entities in the attribute values.
+        convert = lambda(k, val): (k,
+                                   re.sub("&(#\d+|#x[0-9a-fA-F]+|\w+);",
+                                          self._convertEntities,
+                                          val))
+        self.attrs = map(convert, self.attrs)
+
+    def getString(self):
+        if (len(self.contents) == 1
+            and isinstance(self.contents[0], NavigableString)):
+            return self.contents[0]
+
+    def setString(self, string):
+        """Replace the contents of the tag with a string"""
+        self.clear()
+        self.append(string)
+
+    string = property(getString, setString)
+
+    def getText(self, separator=u""):
+        if not len(self.contents):
+            return u""
+        stopNode = self._lastRecursiveChild().next
+        strings = []
+        current = self.contents[0]
+        while current is not stopNode:
+            if isinstance(current, NavigableString):
+                strings.append(current.strip())
+            current = current.next
+        return separator.join(strings)
+
+    text = property(getText)
+
+    def get(self, key, default=None):
+        """Returns the value of the 'key' attribute for the tag, or
+        the value given for 'default' if it doesn't have that
+        attribute."""
+        return self._getAttrMap().get(key, default)
+
+    def clear(self):
+        """Extract all children."""
+        for child in self.contents[:]:
+            child.extract()
+
+    def index(self, element):
+        for i, child in enumerate(self.contents):
+            if child is element:
+                return i
+        raise ValueError("Tag.index: element not in tag")
+
+    def has_key(self, key):
+        return self._getAttrMap().has_key(key)
+
+    def __getitem__(self, key):
+        """tag[key] returns the value of the 'key' attribute for the tag,
+        and throws an exception if it's not there."""
+        return self._getAttrMap()[key]
+
+    def __iter__(self):
+        "Iterating over a tag iterates over its contents."
+        return iter(self.contents)
+
+    def __len__(self):
+        "The length of a tag is the length of its list of contents."
+        return len(self.contents)
+
+    def __contains__(self, x):
+        return x in self.contents
+
+    def __nonzero__(self):
+        "A tag is non-None even if it has no contents."
+        return True
+
+    def __setitem__(self, key, value):
+        """Setting tag[key] sets the value of the 'key' attribute for the
+        tag."""
+        self._getAttrMap()
+        self.attrMap[key] = value
+        found = False
+        for i in range(0, len(self.attrs)):
+            if self.attrs[i][0] == key:
+                self.attrs[i] = (key, value)
+                found = True
+        if not found:
+            self.attrs.append((key, value))
+        self._getAttrMap()[key] = value
+
+    def __delitem__(self, key):
+        "Deleting tag[key] deletes all 'key' attributes for the tag."
+        #Loop over a copy so removals don't skip items. We don't break
+        #because bad HTML can define the same attribute multiple times.
+        for item in self.attrs[:]:
+            if item[0] == key:
+                self.attrs.remove(item)
+        self._getAttrMap()
+        if self.attrMap.has_key(key):
+            del self.attrMap[key]
+
+    def __call__(self, *args, **kwargs):
+        """Calling a tag like a function is the same as calling its
+        findAll() method. Eg. tag('a') returns a list of all the A tags
+        found within this tag."""
+        return self.findAll(*args, **kwargs)
+
+    def __getattr__(self, tag):
+        #tag.fooTag and tag.foo both find the first 'foo' tag; '__' names raise.
+        if len(tag) > 3 and tag.rfind('Tag') == len(tag)-3:
+            return self.find(tag[:-3])
+        elif tag.find('__') != 0:
+            return self.find(tag)
+        raise AttributeError, "'%s' object has no attribute '%s'" % (self.__class__.__name__, tag)
+
+    def __eq__(self, other):
+        """Returns true iff this tag has the same name, the same attributes,
+        and the same contents (recursively) as the given tag.
+
+        NOTE: right now this will return false if two tags have the
+        same attributes in a different order. Should this be fixed?"""
+        if other is self:
+            return True
+        if not hasattr(other, 'name') or not hasattr(other, 'attrs') or not hasattr(other, 'contents') or self.name != other.name or self.attrs != other.attrs or len(self) != len(other):
+            return False
+        for i in range(0, len(self.contents)):
+            if self.contents[i] != other.contents[i]:
+                return False
+        return True
+
+    def __ne__(self, other):
+        """Returns true iff this tag is not identical to the other tag,
+        as defined in __eq__."""
+        return not self == other
+
+    def __repr__(self, encoding=DEFAULT_OUTPUT_ENCODING):
+        """Renders this tag as a string."""
+        return self.__str__(encoding)
+
+    def __unicode__(self):
+        return self.__str__(None)
+
+    BARE_AMPERSAND_OR_BRACKET = re.compile("([<>]|"
+                                           + "&(?!#\d+;|#x[0-9a-fA-F]+;|\w+;)"
+                                           + ")")
+
+    def _sub_entity(self, x):
+        """Used with a regular expression to substitute the
+        appropriate XML entity for an XML special character."""
+        return "&" + self.XML_SPECIAL_CHARS_TO_ENTITIES[x.group(0)[0]] + ";"
+
+    def __str__(self, encoding=DEFAULT_OUTPUT_ENCODING,
+                prettyPrint=False, indentLevel=0):
+        """Returns a string or Unicode representation of this tag and
+        its contents. To get Unicode, pass None for encoding.
+
+        NOTE: since Python's HTML parser consumes whitespace, this
+        method is not certain to reproduce the whitespace present in
+        the original string."""
+
+        encodedName = self.toEncoding(self.name, encoding)
+
+        attrs = []
+        if self.attrs:
+            for key, val in self.attrs:
+                fmt = '%s="%s"'
+                if isinstance(val, basestring):
+                    if self.containsSubstitutions and '%SOUP-ENCODING%' in val:
+                        val = self.substituteEncoding(val, encoding)
+
+                    # The attribute value either:
+                    #
+                    # * Contains no embedded double quotes or single quotes.
+                    #   No problem: we enclose it in double quotes.
+                    # * Contains embedded single quotes. No problem:
+                    #   double quotes work here too.
+                    # * Contains embedded double quotes. No problem:
+                    #   we enclose it in single quotes.
+                    # * Embeds both single _and_ double quotes. This
+                    #   can't happen naturally, but it can happen if
+                    #   you modify an attribute value after parsing
+                    #   the document. Now we have a bit of a
+                    #   problem. We solve it by enclosing the
+                    #   attribute in single quotes, and escaping any
+                    #   embedded single quotes to XML entities.
+                    if '"' in val:
+                        fmt = "%s='%s'"
+                        if "'" in val:
+                            # "&squot;" is not a defined entity; "&#39;"
+                            # is valid in both HTML and XML.
+                            val = val.replace("'", "&#39;")
+
+                    # Now we're okay w/r/t quotes. But the attribute
+                    # value might also contain angle brackets, or
+                    # ampersands that aren't part of entities. We need
+                    # to escape those to XML entities too.
+                    val = self.BARE_AMPERSAND_OR_BRACKET.sub(self._sub_entity, val)
+
+                attrs.append(fmt % (self.toEncoding(key, encoding),
+                                    self.toEncoding(val, encoding)))
+        close = ''
+        closeTag = ''
+        if self.isSelfClosing:
+            close = ' /'
+        else:
+            closeTag = '</%s>' % encodedName
+
+        indentTag, indentContents = 0, 0
+        if prettyPrint:
+            indentTag = indentLevel
+            space = (' ' * (indentTag-1))
+            indentContents = indentTag + 1
+        contents = self.renderContents(encoding, prettyPrint, indentContents)
+        if self.hidden:
+            s = contents
+        else:
+            s = []
+            attributeString = ''
+            if attrs:
+                attributeString = ' ' + ' '.join(attrs)
+            if prettyPrint:
+                s.append(space)
+            s.append('<%s%s%s>' % (encodedName, attributeString, close))
+            if prettyPrint:
+                s.append("\n")
+            s.append(contents)
+            if prettyPrint and contents and contents[-1] != "\n":
+                s.append("\n")
+            if prettyPrint and closeTag:
+                s.append(space)
+            s.append(closeTag)
+            if prettyPrint and closeTag and self.nextSibling:
+                s.append("\n")
+            s = ''.join(s)
+        return s
+
+    def decompose(self):
+        """Recursively destroys the contents of this tree."""
+        self.extract()
+        if len(self.contents) == 0:
+            return
+        current = self.contents[0]
+        while current is not None:
+            next = current.next
+            if isinstance(current, Tag):
+                del current.contents[:]
+            current.parent = None
+            current.previous = None
+            current.previousSibling = None
+            current.next = None
+            current.nextSibling = None
+            current = next
+
+    def prettify(self, encoding=DEFAULT_OUTPUT_ENCODING):
+        return self.__str__(encoding, True)
+
+    def renderContents(self, encoding=DEFAULT_OUTPUT_ENCODING,
+                       prettyPrint=False, indentLevel=0):
+        """Renders the contents of this tag as a string in the given
+        encoding. If encoding is None, returns a Unicode string."""
+        s=[]
+        for c in self:
+            text = None
+            if isinstance(c, NavigableString):
+                text = c.__str__(encoding)
+            elif isinstance(c, Tag):
+                s.append(c.__str__(encoding, prettyPrint, indentLevel))
+            if text and prettyPrint:
+                text = text.strip()
+            if text:
+                if prettyPrint:
+                    s.append(" " * (indentLevel-1))
+                s.append(text)
+                if prettyPrint:
+                    s.append("\n")
+        return ''.join(s)
+
+    #Soup methods
+
+    def find(self, name=None, attrs={}, recursive=True, text=None,
+             **kwargs):
+        """Return only the first child of this Tag matching the given
+        criteria."""
+        r = None
+        l = self.findAll(name, attrs, recursive, text, 1, **kwargs)
+        if l:
+            r = l[0]
+        return r
+    findChild = find
+
+    def findAll(self, name=None, attrs={}, recursive=True, text=None,
+                limit=None, **kwargs):
+        """Extracts a list of Tag objects that match the given
+        criteria.  You can specify the name of the Tag and any
+        attributes you want the Tag to have.
+
+        The value of a key-value pair in the 'attrs' map can be a
+        string, a list of strings, a regular expression object, or a
+        callable that takes a string and returns whether or not the
+        string matches for some custom definition of 'matches'. The
+        same is true of the tag name."""
+        generator = self.recursiveChildGenerator
+        if not recursive:
+            generator = self.childGenerator
+        return self._findAll(name, attrs, text, limit, generator, **kwargs)
+    findChildren = findAll
+
+    # Pre-3.x compatibility methods
+    first = find
+    fetch = findAll
+
+    def fetchText(self, text=None, recursive=True, limit=None):
+        return self.findAll(text=text, recursive=recursive, limit=limit)
+
+    def firstText(self, text=None, recursive=True):
+        return self.find(text=text, recursive=recursive)
+
+    #Private methods
+
+    def _getAttrMap(self):
+        """Initializes a map representation of this tag's attributes,
+        if not already initialized."""
+        # Look in __dict__ directly: getattr() on a missing attribute falls
+        # through to Tag.__getattr__, which searches the tree for a child tag.
+        if not self.__dict__.get('attrMap'):
+            self.attrMap = dict(self.attrs)
+        return self.attrMap
+
+    #Generator methods
+    def childGenerator(self):
+        # Just use the iterator from the contents
+        return iter(self.contents)
+
+    def recursiveChildGenerator(self):
+        if not len(self.contents):
+            raise StopIteration
+        stopNode = self._lastRecursiveChild().next
+        current = self.contents[0]
+        while current is not stopNode:
+            yield current
+            current = current.next
+
+
+# Next, a couple classes to represent queries and their results.
+class SoupStrainer:
+    """Encapsulates a number of ways of matching a markup element (tag or
+    text)."""
+
+    def __init__(self, name=None, attrs={}, text=None, **kwargs):
+        self.name = name
+        if isinstance(attrs, basestring):
+            kwargs['class'] = _match_css_class(attrs)
+            attrs = None
+        if kwargs:
+            if attrs:
+                attrs = attrs.copy()
+                attrs.update(kwargs)
+            else:
+                attrs = kwargs
+        self.attrs = attrs
+        self.text = text
+
+    def __str__(self):
+        if self.text:
+            return self.text
+        else:
+            return "%s|%s" % (self.name, self.attrs)
+
+    def searchTag(self, markupName=None, markupAttrs={}):
+        found = None
+        markup = None
+        if isinstance(markupName, Tag):
+            markup = markupName
+            markupAttrs = markup
+        callFunctionWithTagData = callable(self.name) \
+                                and not isinstance(markupName, Tag)
+
+        if (not self.name) \
+               or callFunctionWithTagData \
+               or (markup and self._matches(markup, self.name)) \
+               or (not markup and self._matches(markupName, self.name)):
+            if callFunctionWithTagData:
+                match = self.name(markupName, markupAttrs)
+            else:
+                match = True
+                markupAttrMap = None
+                for attr, matchAgainst in self.attrs.items():
+                    if not markupAttrMap:
+                         if hasattr(markupAttrs, 'get'):
+                            markupAttrMap = markupAttrs
+                         else:
+                            markupAttrMap = {}
+                            for k,v in markupAttrs:
+                                markupAttrMap[k] = v
+                    attrValue = markupAttrMap.get(attr)
+                    if not self._matches(attrValue, matchAgainst):
+                        match = False
+                        break
+            if match:
+                if markup:
+                    found = markup
+                else:
+                    found = markupName
+        return found
+
+    def search(self, markup):
+        #print 'looking for %s in %s' % (self, markup)
+        found = None
+        # If given a list of items, scan it for a text element that
+        # matches.
+        if hasattr(markup, "__iter__") \
+                and not isinstance(markup, Tag):
+            for element in markup:
+                if isinstance(element, NavigableString) \
+                       and self.search(element):
+                    found = element
+                    break
+        # If it's a Tag, make sure its name or attributes match.
+        # Don't bother with Tags if we're searching for text.
+        elif isinstance(markup, Tag):
+            if not self.text:
+                found = self.searchTag(markup)
+        # If it's text, make sure the text matches.
+        elif isinstance(markup, NavigableString) or \
+                 isinstance(markup, basestring):
+            if self._matches(markup, self.text):
+                found = markup
+        else:
+            raise Exception, "I don't know how to match against a %s" \
+                  % markup.__class__
+        return found
+
+    def _matches(self, markup, matchAgainst):
+        #print "Matching %s against %s" % (markup, matchAgainst)
+        result = False
+        if matchAgainst is True:
+            result = markup is not None
+        elif callable(matchAgainst):
+            result = matchAgainst(markup)
+        else:
+            #Custom match methods take the tag as an argument, but all
+            #other ways of matching match the tag name as a string.
+            if isinstance(markup, Tag):
+                markup = markup.name
+            if markup and not isinstance(markup, basestring):
+                markup = unicode(markup)
+            #Now we know that chunk is either a string, or None.
+            if hasattr(matchAgainst, 'match'):
+                # It's a regexp object.
+                result = markup and matchAgainst.search(markup)
+            elif hasattr(matchAgainst, '__iter__'): # list-like
+                result = markup in matchAgainst
+            elif hasattr(matchAgainst, 'items'):
+                result = markup.has_key(matchAgainst)
+            elif matchAgainst and isinstance(markup, basestring):
+                if isinstance(markup, unicode):
+                    matchAgainst = unicode(matchAgainst)
+                else:
+                    matchAgainst = str(matchAgainst)
+
+            if not result:
+                result = matchAgainst == markup
+        return result
+
+class ResultSet(list):
+    """A ResultSet is just a list that keeps track of the SoupStrainer
+    that created it."""
+    def __init__(self, source):
+        list.__init__(self)
+        self.source = source
+
+# Now, some helper functions.
+
+def buildTagMap(default, *args):
+    """Turns a list of maps, lists, or scalars into a single map.
+    Used to build the SELF_CLOSING_TAGS, NESTABLE_TAGS, and
+    NESTING_RESET_TAGS maps out of lists and partial maps."""
+    built = {}
+    for portion in args:
+        if hasattr(portion, 'items'):
+            #It's a map. Merge it.
+            for k,v in portion.items():
+                built[k] = v
+        elif hasattr(portion, '__iter__'): # is a list
+            #It's a list. Map each item to the default.
+            for k in portion:
+                built[k] = default
+        else:
+            #It's a scalar. Map it to the default.
+            built[portion] = default
+    return built
+
+# Now, the parser classes.
+
+class BeautifulStoneSoup(Tag, SGMLParser):
+
+    """This class contains the basic parser and search code. It defines
+    a parser that knows nothing about tag behavior except for the
+    following:
+
+      You can't close a tag without closing all the tags it encloses.
+      That is, "<foo><bar></foo>" actually means
+      "<foo><bar></bar></foo>".
+
+    [Another possible explanation is "<foo><bar /></foo>", but since
+    this class defines no SELF_CLOSING_TAGS, it will never use that
+    explanation.]
+
+    This class is useful for parsing XML or made-up markup languages,
+    or when BeautifulSoup makes an assumption counter to what you were
+    expecting."""
+
+    SELF_CLOSING_TAGS = {}
+    NESTABLE_TAGS = {}
+    RESET_NESTING_TAGS = {}
+    QUOTE_TAGS = {}
+    PRESERVE_WHITESPACE_TAGS = []
+
+    MARKUP_MASSAGE = [(re.compile('(<[^<>]*)/>'),
+                       lambda x: x.group(1) + ' />'),
+                      (re.compile('<!\s+([^<>]*)>'),
+                       lambda x: '<!' + x.group(1) + '>')
+                      ]
+
+    ROOT_TAG_NAME = u'[document]'
+
+    HTML_ENTITIES = "html"
+    XML_ENTITIES = "xml"
+    XHTML_ENTITIES = "xhtml"
+    # TODO: This only exists for backwards-compatibility
+    ALL_ENTITIES = XHTML_ENTITIES
+
+    # Used when determining whether a text node is all whitespace and
+    # can be replaced with a single space. A text node that contains
+    # fancy Unicode spaces (usually non-breaking) should be left
+    # alone.
+    STRIP_ASCII_SPACES = { 9: None, 10: None, 12: None, 13: None, 32: None, }
+
+    def __init__(self, markup="", parseOnlyThese=None, fromEncoding=None,
+                 markupMassage=True, smartQuotesTo=XML_ENTITIES,
+                 convertEntities=None, selfClosingTags=None, isHTML=False):
+        """The Soup object is initialized as the 'root tag', and the
+        provided markup (which can be a string or a file-like object)
+        is fed into the underlying parser.
+
+        sgmllib will process most bad HTML, and the BeautifulSoup
+        class has some tricks for dealing with some HTML that kills
+        sgmllib, but Beautiful Soup can nonetheless choke or lose data
+        if your data uses self-closing tags or declarations
+        incorrectly.
+
+        By default, Beautiful Soup uses regexes to sanitize input,
+        avoiding the vast majority of these problems. If the problems
+        don't apply to you, pass in False for markupMassage, and
+        you'll get better performance.
+
+        The default parser massage techniques fix the two most common
+        instances of invalid HTML that choke sgmllib:
+
+         <br/> (No space between name of closing tag and tag close)
+         <! --Comment--> (Extraneous whitespace in declaration)
+
+        You can pass in a custom list of (RE object, replace method)
+        tuples to get Beautiful Soup to scrub your input the way you
+        want."""
+
+        self.parseOnlyThese = parseOnlyThese
+        self.fromEncoding = fromEncoding
+        self.smartQuotesTo = smartQuotesTo
+        self.convertEntities = convertEntities
+        # Set the rules for how we'll deal with the entities we
+        # encounter
+        if self.convertEntities:
+            # It doesn't make sense to convert encoded characters to
+            # entities even while you're converting entities to Unicode.
+            # Just convert it all to Unicode.
+            self.smartQuotesTo = None
+            if convertEntities == self.HTML_ENTITIES:
+                self.convertXMLEntities = False
+                self.convertHTMLEntities = True
+                self.escapeUnrecognizedEntities = True
+            elif convertEntities == self.XHTML_ENTITIES:
+                self.convertXMLEntities = True
+                self.convertHTMLEntities = True
+                self.escapeUnrecognizedEntities = False
+            elif convertEntities == self.XML_ENTITIES:
+                self.convertXMLEntities = True
+                self.convertHTMLEntities = False
+                self.escapeUnrecognizedEntities = False
+        else:
+            self.convertXMLEntities = False
+            self.convertHTMLEntities = False
+            self.escapeUnrecognizedEntities = False
+
+        self.instanceSelfClosingTags = buildTagMap(None, selfClosingTags)
+        SGMLParser.__init__(self)
+
+        if hasattr(markup, 'read'):        # It's a file-type object.
+            markup = markup.read()
+        self.markup = markup
+        self.markupMassage = markupMassage
+        try:
+            self._feed(isHTML=isHTML)
+        except StopParsing:
+            pass
+        self.markup = None                 # The markup can now be GCed
+
+    def convert_charref(self, name):
+        """This method fixes a bug in Python's SGMLParser."""
+        try:
+            n = int(name)
+        except ValueError:
+            return
+        if not 0 <= n <= 127 : # ASCII ends at 127, not 255
+            return
+        return self.convert_codepoint(n)
+
+    def _feed(self, inDocumentEncoding=None, isHTML=False):
+        # Convert the document to Unicode.
+        markup = self.markup
+        if isinstance(markup, unicode):
+            if not hasattr(self, 'originalEncoding'):
+                self.originalEncoding = None
+        else:
+            dammit = UnicodeDammit\
+                     (markup, [self.fromEncoding, inDocumentEncoding],
+                      smartQuotesTo=self.smartQuotesTo, isHTML=isHTML)
+            markup = dammit.unicode
+            self.originalEncoding = dammit.originalEncoding
+            self.declaredHTMLEncoding = dammit.declaredHTMLEncoding
+        if markup:
+            if self.markupMassage:
+                if not hasattr(self.markupMassage, "__iter__"):
+                    self.markupMassage = self.MARKUP_MASSAGE
+                for fix, m in self.markupMassage:
+                    markup = fix.sub(m, markup)
+                # TODO: We get rid of markupMassage so that the
+                # soup object can be deepcopied later on. Some
+                # Python installations can't copy regexes. If anyone
+                # was relying on the existence of markupMassage, this
+                # might cause problems.
+                del(self.markupMassage)
+        self.reset()
+
+        SGMLParser.feed(self, markup)
+        # Close out any unfinished strings and close all the open tags.
+        self.endData()
+        while self.currentTag.name != self.ROOT_TAG_NAME:
+            self.popTag()
+
+    def __getattr__(self, methodName):
+        """This method routes method call requests to either the SGMLParser
+        superclass or the Tag superclass, depending on the method name."""
+        #print "__getattr__ called on %s.%s" % (self.__class__, methodName)
+
+        if methodName.startswith('start_') or methodName.startswith('end_') \
+               or methodName.startswith('do_'):
+            return SGMLParser.__getattr__(self, methodName)
+        elif not methodName.startswith('__'):
+            return Tag.__getattr__(self, methodName)
+        else:
+            raise AttributeError
+
+    def isSelfClosingTag(self, name):
+        """Returns true iff the given string is the name of a
+        self-closing tag according to this parser."""
+        return self.SELF_CLOSING_TAGS.has_key(name) \
+               or self.instanceSelfClosingTags.has_key(name)
+
+    def reset(self):
+        Tag.__init__(self, self, self.ROOT_TAG_NAME)
+        self.hidden = 1
+        SGMLParser.reset(self)
+        self.currentData = []
+        self.currentTag = None
+        self.tagStack = []
+        self.quoteStack = []
+        self.pushTag(self)
+
+    def popTag(self):
+        tag = self.tagStack.pop()
+
+        #print "Pop", tag.name
+        if self.tagStack:
+            self.currentTag = self.tagStack[-1]
+        return self.currentTag
+
+    def pushTag(self, tag):
+        #print "Push", tag.name
+        if self.currentTag:
+            self.currentTag.contents.append(tag)
+        self.tagStack.append(tag)
+        self.currentTag = self.tagStack[-1]
+
+    def endData(self, containerClass=NavigableString):
+        if self.currentData:
+            currentData = u''.join(self.currentData)
+            if (currentData.translate(self.STRIP_ASCII_SPACES) == '' and
+                not set([tag.name for tag in self.tagStack]).intersection(
+                    self.PRESERVE_WHITESPACE_TAGS)):
+                if '\n' in currentData:
+                    currentData = '\n'
+                else:
+                    currentData = ' '
+            self.currentData = []
+            if self.parseOnlyThese and len(self.tagStack) <= 1 and \
+                   (not self.parseOnlyThese.text or \
+                    not self.parseOnlyThese.search(currentData)):
+                return
+            o = containerClass(currentData)
+            o.setup(self.currentTag, self.previous)
+            if self.previous:
+                self.previous.next = o
+            self.previous = o
+            self.currentTag.contents.append(o)
+
+
+    def _popToTag(self, name, inclusivePop=True):
+        """Pops the tag stack up to and including the most recent
+        instance of the given tag. If inclusivePop is false, pops the tag
+        stack up to but *not* including the most recent instance of
+        the given tag."""
+        #print "Popping to %s" % name
+        if name == self.ROOT_TAG_NAME:
+            return
+
+        numPops = 0
+        mostRecentTag = None
+        for i in range(len(self.tagStack)-1, 0, -1):
+            if name == self.tagStack[i].name:
+                numPops = len(self.tagStack)-i
+                break
+        if not inclusivePop:
+            numPops = numPops - 1
+
+        for i in range(0, numPops):
+            mostRecentTag = self.popTag()
+        return mostRecentTag
+
+    def _smartPop(self, name):
+
+        """We need to pop up to the previous tag of this type, unless
+        one of this tag's nesting reset triggers comes between this
+        tag and the previous tag of this type, OR unless this tag is a
+        generic nesting trigger and another generic nesting trigger
+        comes between this tag and the previous tag of this type.
+
+        Examples:
+         <p>Foo<b>Bar *<p>* should pop to 'p', not 'b'.
+         <p>Foo<table>Bar *<p>* should pop to 'table', not 'p'.
+         <p>Foo<table><tr>Bar *<p>* should pop to 'tr', not 'p'.
+
+         <li><ul><li> *<li>* should pop to 'ul', not the first 'li'.
+         <tr><table><tr> *<tr>* should pop to 'table', not the first 'tr'
+         <td><tr><td> *<td>* should pop to 'tr', not the first 'td'
+        """
+
+        nestingResetTriggers = self.NESTABLE_TAGS.get(name)
+        isNestable = nestingResetTriggers is not None
+        isResetNesting = name in self.RESET_NESTING_TAGS
+        popTo = None
+        inclusive = True
+        #Scan open tags from the innermost outwards (index 0 is skipped).
+        for i in range(len(self.tagStack)-1, 0, -1):
+            p = self.tagStack[i]
+            if (not p or p.name == name) and not isNestable:
+                #Non-nestable tags get popped to the top or to their
+                #last occurrence.
+                popTo = name
+                break
+            if (nestingResetTriggers is not None
+                and p.name in nestingResetTriggers) \
+                or (nestingResetTriggers is None and isResetNesting
+                    and p.name in self.RESET_NESTING_TAGS):
+
+                #If we encounter one of the nesting reset triggers
+                #peculiar to this tag, or we encounter another tag
+                #that causes nesting to reset, pop up to but not
+                #including that tag.
+                popTo = p.name
+                inclusive = False
+                break
+        if popTo:
+            self._popToTag(popTo, inclusive)
+
+    def unknown_starttag(self, name, attrs, selfClosing=0):
+        "Handle a start tag; returns the new Tag, or None if none was made."
+        if self.quoteStack:
+            #This is not a real tag: a quote tag is open, so the
+            #markup is re-serialized and handed to handle_data as text.
+            attrs = ''.join([' %s="%s"' % (x, y) for x, y in attrs])
+            self.handle_data('<%s%s>' % (name, attrs))
+            return
+        self.endData()
+
+        if not self.isSelfClosingTag(name) and not selfClosing:
+            self._smartPop(name)
+
+        if self.parseOnlyThese and len(self.tagStack) <= 1 \
+               and (self.parseOnlyThese.text or not self.parseOnlyThese.searchTag(name, attrs)):
+            return
+
+        tag = Tag(self, name, attrs, self.currentTag, self.previous)
+        if self.previous:
+            self.previous.next = tag
+        self.previous = tag
+        self.pushTag(tag)
+        if selfClosing or self.isSelfClosingTag(name):
+            self.popTag()
+        if name in self.QUOTE_TAGS:
+            #Entering a quote tag: record it and switch on literal mode.
+            self.quoteStack.append(name)
+            self.literal = 1
+        return tag
+
+    def unknown_endtag(self, name):
+        "Handle an end tag by popping the tag stack back to its start tag."
+        if self.quoteStack and self.quoteStack[-1] != name:
+            #This is not a real end tag: a different quote tag is
+            #still open, so the markup is passed through as text.
+            self.handle_data('</%s>' % name)
+            return
+        self.endData()
+        self._popToTag(name)
+        if self.quoteStack and self.quoteStack[-1] == name:
+            self.quoteStack.pop()
+            self.literal = (len(self.quoteStack) > 0)
+
+    def handle_data(self, data):
+        self.currentData.append(data)
+
+    def _toStringSubclass(self, text, subclass):
+        """Adds a certain piece of text to the tree as a NavigableString
+        subclass."""
+        self.endData()
+        self.handle_data(text)
+        self.endData(subclass)
+
+    def handle_pi(self, text):
+        """Handle a processing instruction as a ProcessingInstruction
+        object, possibly one with a %SOUP-ENCODING% slot into which an
+        encoding will be plugged later."""
+        if text[:3] == "xml":
+            text = u"xml version='1.0' encoding='%SOUP-ENCODING%'"
+        self._toStringSubclass(text, ProcessingInstruction)
+
+    def handle_comment(self, text):
+        "Handle comments as Comment objects."
+        self._toStringSubclass(text, Comment)
+
+    def handle_charref(self, ref):
+        "Handle character references as data."
+        if self.convertEntities:
+            data = unichr(int(ref))
+        else:
+            data = '&#%s;' % ref
+        self.handle_data(data)
+
+    def handle_entityref(self, ref):
+        """Handle entity references as data, possibly converting known
+        HTML and/or XML entity references to the corresponding Unicode
+        characters."""
+        data = None
+        if self.convertHTMLEntities:
+            try:
+                data = unichr(name2codepoint[ref])
+            except KeyError:
+                pass
+
+        if not data and self.convertXMLEntities:
+                data = self.XML_ENTITIES_TO_SPECIAL_CHARS.get(ref)
+
+        if not data and self.convertHTMLEntities and \
+            not self.XML_ENTITIES_TO_SPECIAL_CHARS.get(ref):
+                # TODO: We've got a problem here. We're told this is
+                # an entity reference, but it's not an XML entity
+                # reference or an HTML entity reference. Nonetheless,
+                # the logical thing to do is to pass it through as an
+                # unrecognized entity reference.
+                #
+                # Except: when the input is "&carol;" this function
+                # will be called with input "carol". When the input is
+                # "AT&T", this function will be called with input
+                # "T". We have no way of knowing whether a semicolon
+                # was present originally, so we don't know whether
+                # this is an unknown entity or just a misplaced
+                # ampersand.
+                #
+                # The more common case is a misplaced ampersand, so I
+                # escape the ampersand and omit the trailing semicolon.
+                data = "&amp;%s" % ref
+        if not data:
+            # This case is different from the one above, because we
+            # haven't already gone through a supposedly comprehensive
+            # mapping of entities to Unicode characters. We might not
+            # have gone through any mapping at all. So the chances are
+            # very high that this is a real entity, and not a
+            # misplaced ampersand.
+            data = "&%s;" % ref
+        self.handle_data(data)
+
+    def handle_decl(self, data):
+        "Handle DOCTYPEs and the like as Declaration objects."
+        self._toStringSubclass(data, Declaration)
+
+    def parse_declaration(self, i):
+        """Treat a bogus SGML declaration as raw data. Treat a CDATA
+        declaration as a CData object."""
+        j = None
+        if self.rawdata[i:i+9] == '<![CDATA[':
+             k = self.rawdata.find(']]>', i)
+             if k == -1:
+                 k = len(self.rawdata)
+             data = self.rawdata[i+9:k]
+             j = k+3
+             self._toStringSubclass(data, CData)
+        else:
+            try:
+                j = SGMLParser.parse_declaration(self, i)
+            except SGMLParseError:
+                toHandle = self.rawdata[i:]
+                self.handle_data(toHandle)
+                j = i + len(toHandle)
+        return j
+
+class BeautifulSoup(BeautifulStoneSoup):
+
+    """This parser knows the following facts about HTML:
+
+    * Some tags have no closing tag and should be interpreted as being
+      closed as soon as they are encountered.
+
+    * The text inside some tags (ie. 'script') may contain tags which
+      are not really part of the document and which should be parsed
+      as text, not tags. If you want to parse the text as tags, you can
+      always fetch it and parse it explicitly.
+
+    * Tag nesting rules:
+
+      Most tags can't be nested at all. For instance, the occurance of
+      a <p> tag should implicitly close the previous <p> tag.
+
+       <p>Para1<p>Para2
+        should be transformed into:
+       <p>Para1</p><p>Para2
+
+      Some tags can be nested arbitrarily. For instance, the occurance
+      of a <blockquote> tag should _not_ implicitly close the previous
+      <blockquote> tag.
+
+       Alice said: <blockquote>Bob said: <blockquote>Blah
+        should NOT be transformed into:
+       Alice said: <blockquote>Bob said: </blockquote><blockquote>Blah
+
+      Some tags can be nested, but the nesting is reset by the
+      interposition of other tags. For instance, a <tr> tag should
+      implicitly close the previous <tr> tag within the same <table>,
+      but not close a <tr> tag in another table.
+
+       <table><tr>Blah<tr>Blah
+        should be transformed into:
+       <table><tr>Blah</tr><tr>Blah
+        but,
+       <tr>Blah<table><tr>Blah
+        should NOT be transformed into
+       <tr>Blah<table></tr><tr>Blah
+
+    Differing assumptions about tag nesting rules are a major source
+    of problems with the BeautifulSoup class. If BeautifulSoup is not
+    treating as nestable a tag your page author treats as nestable,
+    try ICantBelieveItsBeautifulSoup, MinimalSoup, or
+    BeautifulStoneSoup before writing your own subclass."""
+
+    def __init__(self, *args, **kwargs):
+        if not kwargs.has_key('smartQuotesTo'):
+            kwargs['smartQuotesTo'] = self.HTML_ENTITIES
+        kwargs['isHTML'] = True
+        BeautifulStoneSoup.__init__(self, *args, **kwargs)
+
+    SELF_CLOSING_TAGS = buildTagMap(None,
+                                    ('br' , 'hr', 'input', 'img', 'meta',
+                                    'spacer', 'link', 'frame', 'base', 'col'))
+
+    PRESERVE_WHITESPACE_TAGS = set(['pre', 'textarea'])
+
+    QUOTE_TAGS = {'script' : None, 'textarea' : None}
+
+    #According to the HTML standard, each of these inline tags can
+    #contain another tag of the same type. Furthermore, it's common
+    #to actually use these tags this way.
+    NESTABLE_INLINE_TAGS = ('span', 'font', 'q', 'object', 'bdo', 'sub', 'sup',
+                            'center')
+
+    #According to the HTML standard, these block tags can contain
+    #another tag of the same type. Furthermore, it's common
+    #to actually use these tags this way.
+    NESTABLE_BLOCK_TAGS = ('blockquote', 'div', 'fieldset', 'ins', 'del')
+
+    #Lists can contain other lists, but there are restrictions.
+    NESTABLE_LIST_TAGS = { 'ol' : [],
+                           'ul' : [],
+                           'li' : ['ul', 'ol'],
+                           'dl' : [],
+                           'dd' : ['dl'],
+                           'dt' : ['dl'] }
+
+    #Tables can contain other tables, but there are restrictions.
+    NESTABLE_TABLE_TAGS = {'table' : [],
+                           'tr' : ['table', 'tbody', 'tfoot', 'thead'],
+                           'td' : ['tr'],
+                           'th' : ['tr'],
+                           'thead' : ['table'],
+                           'tbody' : ['table'],
+                           'tfoot' : ['table'],
+                           }
+
+    NON_NESTABLE_BLOCK_TAGS = ('address', 'form', 'p', 'pre')
+
+    #If one of these tags is encountered, all tags up to the next tag of
+    #this type are popped.
+    RESET_NESTING_TAGS = buildTagMap(None, NESTABLE_BLOCK_TAGS, 'noscript',
+                                     NON_NESTABLE_BLOCK_TAGS,
+                                     NESTABLE_LIST_TAGS,
+                                     NESTABLE_TABLE_TAGS)
+
+    NESTABLE_TAGS = buildTagMap([], NESTABLE_INLINE_TAGS, NESTABLE_BLOCK_TAGS,
+                                NESTABLE_LIST_TAGS, NESTABLE_TABLE_TAGS)
+
+    # Used to detect the charset in a META tag; see start_meta
+    CHARSET_RE = re.compile("((^|;)\s*charset=)([^;]*)", re.M)
+
+    def start_meta(self, attrs):
+        """Beautiful Soup can detect a charset included in a META tag,
+        try to convert the document to that charset, and re-parse the
+        document from the beginning."""
+        httpEquiv = None
+        contentType = None
+        contentTypeIndex = None
+        tagNeedsEncodingSubstitution = False
+
+        for i in range(0, len(attrs)):
+            key, value = attrs[i]
+            key = key.lower()
+            if key == 'http-equiv':
+                httpEquiv = value
+            elif key == 'content':
+                contentType = value
+                contentTypeIndex = i
+
+        if httpEquiv and contentType: # It's an interesting meta tag.
+            match = self.CHARSET_RE.search(contentType)
+            if match:
+                if (self.declaredHTMLEncoding is not None or
+                    self.originalEncoding == self.fromEncoding):
+                    # An HTML encoding was sniffed while converting
+                    # the document to Unicode, or an HTML encoding was
+                    # sniffed during a previous pass through the
+                    # document, or an encoding was specified
+                    # explicitly and it worked. Rewrite the meta tag.
+                    def rewrite(match):
+                        return match.group(1) + "%SOUP-ENCODING%"
+                    newAttr = self.CHARSET_RE.sub(rewrite, contentType)
+                    attrs[contentTypeIndex] = (attrs[contentTypeIndex][0],
+                                               newAttr)
+                    tagNeedsEncodingSubstitution = True
+                else:
+                    # This is our first pass through the document.
+                    # Go through it again with the encoding information.
+                    newCharset = match.group(3)
+                    if newCharset and newCharset != self.originalEncoding:
+                        self.declaredHTMLEncoding = newCharset
+                        self._feed(self.declaredHTMLEncoding)
+                        raise StopParsing
+                    pass
+        tag = self.unknown_starttag("meta", attrs)
+        if tag and tagNeedsEncodingSubstitution:
+            tag.containsSubstitutions = True
+
+class StopParsing(Exception):
+    pass
+
+class ICantBelieveItsBeautifulSoup(BeautifulSoup):
+
+    """The BeautifulSoup class is oriented towards skipping over
+    common HTML errors like unclosed tags. However, sometimes it makes
+    errors of its own. For instance, consider this fragment:
+
+     <b>Foo<b>Bar</b></b>
+
+    This is perfectly valid (if bizarre) HTML. However, the
+    BeautifulSoup class will implicitly close the first b tag when it
+    encounters the second 'b'. It will think the author wrote
+    "<b>Foo<b>Bar", and didn't close the first 'b' tag, because
+    there's no real-world reason to bold something that's already
+    bold. When it encounters '</b></b>' it will close two more 'b'
+    tags, for a grand total of three tags closed instead of two. This
+    can throw off the rest of your document structure. The same is
+    true of a number of other tags, listed below.
+
+    It's much more common for someone to forget to close a 'b' tag
+    than to actually use nested 'b' tags, and the BeautifulSoup class
+    handles the common case. This class handles the not-so-common
+    case: where you can't believe someone wrote what they did, but
+    it's valid HTML and BeautifulSoup screwed up by assuming it
+    wouldn't be."""
+
+    I_CANT_BELIEVE_THEYRE_NESTABLE_INLINE_TAGS = \
+     ('em', 'big', 'i', 'small', 'tt', 'abbr', 'acronym', 'strong',
+      'cite', 'code', 'dfn', 'kbd', 'samp', 'strong', 'var', 'b',
+      'big')
+
+    I_CANT_BELIEVE_THEYRE_NESTABLE_BLOCK_TAGS = ('noscript',)
+
+    NESTABLE_TAGS = buildTagMap([], BeautifulSoup.NESTABLE_TAGS,
+                                I_CANT_BELIEVE_THEYRE_NESTABLE_BLOCK_TAGS,
+                                I_CANT_BELIEVE_THEYRE_NESTABLE_INLINE_TAGS)
+
+class MinimalSoup(BeautifulSoup):
+    """The MinimalSoup class is for parsing HTML that contains
+    pathologically bad markup. It makes no assumptions about tag
+    nesting, but it does know which tags are self-closing, that
+    <script> tags contain Javascript and should not be parsed, that
+    META tags may contain encoding information, and so on.
+
+    This also makes it better for subclassing than BeautifulStoneSoup
+    or BeautifulSoup."""
+
+    RESET_NESTING_TAGS = buildTagMap('noscript')
+    NESTABLE_TAGS = {}
+
+class BeautifulSOAP(BeautifulStoneSoup):
+    """This class will push a tag with only a single string child into
+    the tag's parent as an attribute. The attribute's name is the tag
+    name, and the value is the string child. An example should give
+    the flavor of the change:
+
+    <foo><bar>baz</bar></foo>
+     =>
+    <foo bar="baz"><bar>baz</bar></foo>
+
+    You can then access fooTag['bar'] instead of fooTag.barTag.string.
+
+    This is, of course, useful for scraping structures that tend to
+    use subelements instead of attributes, such as SOAP messages. Note
+    that it modifies its input, so don't print the modified version
+    out.
+
+    I'm not sure how many people really want to use this class; let me
+    know if you do. Mainly I like the name."""
+
+    def popTag(self):
+        "Promote a lone string child to a parent attribute, then pop."
+        if len(self.tagStack) > 1:
+            parent, tag = self.tagStack[-2:]
+            parent._getAttrMap()
+            if (isinstance(tag, Tag) and len(tag.contents) == 1 and
+                isinstance(tag.contents[0], NavigableString) and
+                not parent.attrMap.has_key(tag.name)):
+                parent[tag.name] = tag.contents[0]
+        return BeautifulStoneSoup.popTag(self)
+
+#Enterprise class names! It has come to our attention that some people
+#think the names of the Beautiful Soup parser classes are too silly
+#and "unprofessional" for use in enterprise screen-scraping. We feel
+#your pain! For such-minded folk, the Beautiful Soup Consortium And
+#All-Night Kosher Bakery recommends renaming this file to
+#"RobustParser.py" (or, in cases of extreme enterprisiness,
+#"RobustParserBeanInterface.class") and using the following
+#enterprise-friendly class aliases:
+class RobustXMLParser(BeautifulStoneSoup):
+    pass
+class RobustHTMLParser(BeautifulSoup):
+    pass
+class RobustWackAssHTMLParser(ICantBelieveItsBeautifulSoup):
+    pass
+class RobustInsanelyWackAssHTMLParser(MinimalSoup):
+    pass
+class SimplifyingSOAPParser(BeautifulSOAP):
+    pass
+
+######################################################
+#
+# Bonus library: Unicode, Dammit
+#
+# This class forces XML data into a standard format (usually to UTF-8
+# or Unicode).  It is heavily based on code from Mark Pilgrim's
+# Universal Feed Parser. It does not rewrite the XML or HTML to
+# reflect a new encoding: that happens in BeautifulStoneSoup.handle_pi
+# (XML) and BeautifulSoup.start_meta (HTML).
+
+# Autodetects character encodings.
+# Download from http://chardet.feedparser.org/
+try:
+    import chardet
+#    import chardet.constants
+#    chardet.constants._debug = 1
+except ImportError:
+    chardet = None
+
+# cjkcodecs and iconv_codec make Python know about more character encodings.
+# Both are available from http://cjkpython.i18n.org/
+# They're built in if you use Python 2.4.
+try:
+    import cjkcodecs.aliases
+except ImportError:
+    pass
+try:
+    import iconv_codec
+except ImportError:
+    pass
+
+class UnicodeDammit:
+    """A class for detecting the encoding of a *ML document and
+    converting it to a Unicode string. If the source encoding is
+    windows-1252, can replace MS smart quotes with their HTML or XML
+    equivalents."""
+
+    # This dictionary maps commonly seen values for "charset" in HTML
+    # meta tags to the corresponding Python codec names. It only covers
+    # values that aren't in Python's aliases and can't be determined
+    # by the heuristics in find_codec.
+    CHARSET_ALIASES = { "macintosh" : "mac-roman",
+                        "x-sjis" : "shift-jis" }
+
+    def __init__(self, markup, overrideEncodings=[],
+                 smartQuotesTo='xml', isHTML=False):
+        self.declaredHTMLEncoding = None
+        self.markup, documentEncoding, sniffedEncoding = \
+                     self._detectEncoding(markup, isHTML)
+        self.smartQuotesTo = smartQuotesTo
+        self.triedEncodings = []
+        if markup == '' or isinstance(markup, unicode):
+            self.originalEncoding = None
+            self.unicode = unicode(markup)
+            return
+
+        u = None
+        for proposedEncoding in overrideEncodings:
+            u = self._convertFrom(proposedEncoding)
+            if u: break
+        if not u:
+            for proposedEncoding in (documentEncoding, sniffedEncoding):
+                u = self._convertFrom(proposedEncoding)
+                if u: break
+
+        # If no luck and we have auto-detection library, try that:
+        if not u and chardet and not isinstance(self.markup, unicode):
+            u = self._convertFrom(chardet.detect(self.markup)['encoding'])
+
+        # As a last resort, try utf-8 and windows-1252:
+        if not u:
+            for proposed_encoding in ("utf-8", "windows-1252"):
+                u = self._convertFrom(proposed_encoding)
+                if u: break
+
+        self.unicode = u
+        if not u: self.originalEncoding = None
+
+    def _subMSChar(self, orig):
+        """Changes a MS smart quote character to an XML or HTML
+        entity."""
+        sub = self.MS_CHARS.get(orig)
+        if isinstance(sub, tuple):
+            if self.smartQuotesTo == 'xml':
+                sub = '&#x%s;' % sub[1]
+            else:
+                sub = '&%s;' % sub[0]
+        return sub
+
+    def _convertFrom(self, proposed):
+        proposed = self.find_codec(proposed)
+        if not proposed or proposed in self.triedEncodings:
+            return None
+        self.triedEncodings.append(proposed)
+        markup = self.markup
+
+        # Convert smart quotes to HTML if coming from an encoding
+        # that might have them.
+        if self.smartQuotesTo and proposed.lower() in("windows-1252",
+                                                      "iso-8859-1",
+                                                      "iso-8859-2"):
+            markup = re.compile("([\x80-\x9f])").sub \
+                     (lambda(x): self._subMSChar(x.group(1)),
+                      markup)
+
+        try:
+            # print "Trying to convert document to %s" % proposed
+            u = self._toUnicode(markup, proposed)
+            self.markup = u
+            self.originalEncoding = proposed
+        except Exception, e:
+            # print "That didn't work!"
+            # print e
+            return None
+        #print "Correct encoding: %s" % proposed
+        return self.markup
+
+    def _toUnicode(self, data, encoding):
+        '''Given a string and its encoding, decodes the string into Unicode.
+        %encoding is a string recognized by encodings.aliases'''
+
+        # strip Byte Order Mark (if present)
+        if (len(data) >= 4) and (data[:2] == '\xfe\xff') \
+               and (data[2:4] != '\x00\x00'):
+            encoding = 'utf-16be'
+            data = data[2:]
+        elif (len(data) >= 4) and (data[:2] == '\xff\xfe') \
+                 and (data[2:4] != '\x00\x00'):
+            encoding = 'utf-16le'
+            data = data[2:]
+        elif data[:3] == '\xef\xbb\xbf':
+            encoding = 'utf-8'
+            data = data[3:]
+        elif data[:4] == '\x00\x00\xfe\xff':
+            encoding = 'utf-32be'
+            data = data[4:]
+        elif data[:4] == '\xff\xfe\x00\x00':
+            encoding = 'utf-32le'
+            data = data[4:]
+        newdata = unicode(data, encoding)
+        return newdata
+
+    def _detectEncoding(self, xml_data, isHTML=False):
+        """Given a document, tries to detect its XML encoding."""
+        xml_encoding = sniffed_xml_encoding = None
+        try:
+            if xml_data[:4] == '\x4c\x6f\xa7\x94':
+                # EBCDIC
+                xml_data = self._ebcdic_to_ascii(xml_data)
+            elif xml_data[:4] == '\x00\x3c\x00\x3f':
+                # UTF-16BE
+                sniffed_xml_encoding = 'utf-16be'
+                xml_data = unicode(xml_data, 'utf-16be').encode('utf-8')
+            elif (len(xml_data) >= 4) and (xml_data[:2] == '\xfe\xff') \
+                     and (xml_data[2:4] != '\x00\x00'):
+                # UTF-16BE with BOM
+                sniffed_xml_encoding = 'utf-16be'
+                xml_data = unicode(xml_data[2:], 'utf-16be').encode('utf-8')
+            elif xml_data[:4] == '\x3c\x00\x3f\x00':
+                # UTF-16LE
+                sniffed_xml_encoding = 'utf-16le'
+                xml_data = unicode(xml_data, 'utf-16le').encode('utf-8')
+            elif (len(xml_data) >= 4) and (xml_data[:2] == '\xff\xfe') and \
+                     (xml_data[2:4] != '\x00\x00'):
+                # UTF-16LE with BOM
+                sniffed_xml_encoding = 'utf-16le'
+                xml_data = unicode(xml_data[2:], 'utf-16le').encode('utf-8')
+            elif xml_data[:4] == '\x00\x00\x00\x3c':
+                # UTF-32BE
+                sniffed_xml_encoding = 'utf-32be'
+                xml_data = unicode(xml_data, 'utf-32be').encode('utf-8')
+            elif xml_data[:4] == '\x3c\x00\x00\x00':
+                # UTF-32LE
+                sniffed_xml_encoding = 'utf-32le'
+                xml_data = unicode(xml_data, 'utf-32le').encode('utf-8')
+            elif xml_data[:4] == '\x00\x00\xfe\xff':
+                # UTF-32BE with BOM
+                sniffed_xml_encoding = 'utf-32be'
+                xml_data = unicode(xml_data[4:], 'utf-32be').encode('utf-8')
+            elif xml_data[:4] == '\xff\xfe\x00\x00':
+                # UTF-32LE with BOM
+                sniffed_xml_encoding = 'utf-32le'
+                xml_data = unicode(xml_data[4:], 'utf-32le').encode('utf-8')
+            elif xml_data[:3] == '\xef\xbb\xbf':
+                # UTF-8 with BOM
+                sniffed_xml_encoding = 'utf-8'
+                xml_data = unicode(xml_data[3:], 'utf-8').encode('utf-8')
+            else:
+                sniffed_xml_encoding = 'ascii'
+                pass
+        except:
+            xml_encoding_match = None
+        xml_encoding_match = re.compile(
+            '^<\?.*encoding=[\'"](.*?)[\'"].*\?>').match(xml_data)
+        if not xml_encoding_match and isHTML:
+            regexp = re.compile('<\s*meta[^>]+charset=([^>]*?)[;\'">]', re.I)
+            xml_encoding_match = regexp.search(xml_data)
+        if xml_encoding_match is not None:
+            xml_encoding = xml_encoding_match.groups()[0].lower()
+            if isHTML:
+                self.declaredHTMLEncoding = xml_encoding
+            if sniffed_xml_encoding and \
+               (xml_encoding in ('iso-10646-ucs-2', 'ucs-2', 'csunicode',
+                                 'iso-10646-ucs-4', 'ucs-4', 'csucs4',
+                                 'utf-16', 'utf-32', 'utf_16', 'utf_32',
+                                 'utf16', 'u16')):
+                xml_encoding = sniffed_xml_encoding
+        return xml_data, xml_encoding, sniffed_xml_encoding
+
+
+    def find_codec(self, charset):
+        return self._codec(self.CHARSET_ALIASES.get(charset, charset)) \
+               or (charset and self._codec(charset.replace("-", ""))) \
+               or (charset and self._codec(charset.replace("-", "_"))) \
+               or charset
+
+    def _codec(self, charset):
+        if not charset: return charset
+        codec = None
+        try:
+            codecs.lookup(charset)
+            codec = charset
+        except (LookupError, ValueError):
+            pass
+        return codec
+
+    EBCDIC_TO_ASCII_MAP = None
+    def _ebcdic_to_ascii(self, s):
+        c = self.__class__
+        if not c.EBCDIC_TO_ASCII_MAP:
+            emap = (0,1,2,3,156,9,134,127,151,141,142,11,12,13,14,15,
+                    16,17,18,19,157,133,8,135,24,25,146,143,28,29,30,31,
+                    128,129,130,131,132,10,23,27,136,137,138,139,140,5,6,7,
+                    144,145,22,147,148,149,150,4,152,153,154,155,20,21,158,26,
+                    32,160,161,162,163,164,165,166,167,168,91,46,60,40,43,33,
+                    38,169,170,171,172,173,174,175,176,177,93,36,42,41,59,94,
+                    45,47,178,179,180,181,182,183,184,185,124,44,37,95,62,63,
+                    186,187,188,189,190,191,192,193,194,96,58,35,64,39,61,34,
+                    195,97,98,99,100,101,102,103,104,105,196,197,198,199,200,
+                    201,202,106,107,108,109,110,111,112,113,114,203,204,205,
+                    206,207,208,209,126,115,116,117,118,119,120,121,122,210,
+                    211,212,213,214,215,216,217,218,219,220,221,222,223,224,
+                    225,226,227,228,229,230,231,123,65,66,67,68,69,70,71,72,
+                    73,232,233,234,235,236,237,125,74,75,76,77,78,79,80,81,
+                    82,238,239,240,241,242,243,92,159,83,84,85,86,87,88,89,
+                    90,244,245,246,247,248,249,48,49,50,51,52,53,54,55,56,57,
+                    250,251,252,253,254,255)
+            import string
+            c.EBCDIC_TO_ASCII_MAP = string.maketrans( \
+            ''.join(map(chr, range(256))), ''.join(map(chr, emap)))
+        return s.translate(c.EBCDIC_TO_ASCII_MAP)
+
+    MS_CHARS = { '\x80' : ('euro', '20AC'),  # (HTML entity name, hex code point)
+                 '\x81' : ' ',
+                 '\x82' : ('sbquo', '201A'),
+                 '\x83' : ('fnof', '192'),
+                 '\x84' : ('bdquo', '201E'),
+                 '\x85' : ('hellip', '2026'),
+                 '\x86' : ('dagger', '2020'),
+                 '\x87' : ('Dagger', '2021'),
+                 '\x88' : ('circ', '2C6'),
+                 '\x89' : ('permil', '2030'),
+                 '\x8A' : ('Scaron', '160'),
+                 '\x8B' : ('lsaquo', '2039'),
+                 '\x8C' : ('OElig', '152'),
+                 '\x8D' : '?',
+                 '\x8E' : ('#x17D', '17D'),
+                 '\x8F' : '?',
+                 '\x90' : '?',
+                 '\x91' : ('lsquo', '2018'),
+                 '\x92' : ('rsquo', '2019'),
+                 '\x93' : ('ldquo', '201C'),
+                 '\x94' : ('rdquo', '201D'),
+                 '\x95' : ('bull', '2022'),
+                 '\x96' : ('ndash', '2013'),
+                 '\x97' : ('mdash', '2014'),
+                 '\x98' : ('tilde', '2DC'),
+                 '\x99' : ('trade', '2122'),
+                 '\x9a' : ('scaron', '161'),
+                 '\x9b' : ('rsaquo', '203A'),
+                 '\x9c' : ('oelig', '153'),
+                 '\x9d' : '?',
+                 '\x9e' : ('#x17E', '17E'),
+                 '\x9f' : ('Yuml', '178'),}  # U+0178; an empty code would yield "&#x;"
+
+#######################################################################
+
+
+#By default, act as an HTML pretty-printer.
+if __name__ == '__main__':
+    import sys
+    soup = BeautifulSoup(sys.stdin)
+    print soup.prettify()
diff --git a/fanficdownloader/__init__.py b/fanficdownloader/__init__.py
new file mode 100644
index 00000000..40a96afc
--- /dev/null
+++ b/fanficdownloader/__init__.py
@@ -0,0 +1 @@
+# -*- coding: utf-8 -*-
diff --git a/fanficdownloader/adapter.py b/fanficdownloader/adapter.py
new file mode 100644
index 00000000..f4dd116a
--- /dev/null
+++ b/fanficdownloader/adapter.py
@@ -0,0 +1,229 @@
+# -*- coding: utf-8 -*-
+
+import logging
+import datetime
+from output import makeAcceptableFilename
+
+try:
+	from google.appengine.api.urlfetch import fetch as googlefetch
+	appEngineGlob = True
+except ImportError:	# App Engine SDK not importable; only this case should select the fallback
+	appEngineGlob = False
+
+class LoginRequiredException(Exception):
+	def __init__(self, url):
+		self.url = url
+	
+	def __str__(self):
+		return repr(self.url + ' requires user to be logged in')
+	
+class StoryArchivedAlready(Exception):
+	pass
+
+class StoryDoesNotExist(Exception):
+	pass
+
+class FailedToDownload(Exception):
+	pass
+
+class InvalidStoryURL(Exception):
+	pass
+
+class FanfictionSiteAdapter:
+	appEngine = appEngineGlob
+	login = ''
+	password = ''
+	url = ''
+	host = ''
+	path = ''
+	uuid = ''
+	storyName = ''
+	storyId = ''
+	authorName = ''
+	authorId = ''
+	authorURL = ''
+	outputStorySep = '-Ukn_'
+	outputName = ''
+	outputFileName = ''
+	storyDescription = ''
+	storyCharacters = []
+	storySeries = ''
+	storyPublished = datetime.date(1970, 01, 31)
+	storyCreated = datetime.datetime.now()
+	storyUpdated = datetime.date(1970, 01, 31)
+	languageId = 'en-UK'
+	language = 'English'
+	subjects = []
+	publisher = ''
+	numChapters = '0'
+	numWords = '0'
+	genre = ''
+	category = ''
+	storyStatus = 'In-Progress'
+	storyRating = ''
+	storyUserRating = '0'
+	def __init__(self, url):
+		import urlparse as up	# basic plain url parsing; imported here because this module has no file-level urlparse import
+		self.url = url
+		parsedUrl = up.urlparse(url)
+		self.host = parsedUrl.netloc
+		self.path = parsedUrl.path
+			
+	def hasAppEngine(self):
+		return self.appEngine
+	
+	def fetchUrl(self, url):
+		if not self.appEngine:
+			return self.opener.open(url).read().decode('utf-8')
+		else:
+			return googlefetch(url).content
+	
+	def requiresLogin(self, url = None):
+		return False
+	
+	def performLogin(self, url = None):
+		return True
+	
+	def extractIndividualUrls(self):
+		pass
+		
+	def getText(self, url):
+		pass
+
+	def setLogin(self, login):
+		self.login = login
+
+	def setPassword(self, password):
+		self.password = password
+
+	def getHost(self):
+		logging.debug('self.host=%s' % self.host)
+		return self.host
+	
+	def getUUID(self):
+		self.uuid = 'urn:uuid:' + self.host + '-u.' + self.authorId + '-s.' + self.storyId
+		logging.debug('self.uuid=%s' % self.uuid)
+		return self.uuid
+
+	def getOutputName(self):
+		self.outputName = makeAcceptableFilename(self.storyName.replace(" ", "_") + self.outputStorySep + self.storyId)
+		logging.debug('self.outputName=%s' % self.outputName)
+		return self.outputName
+
+	def getOutputFileName(self, booksDirectory, bookExt):
+		self.getOutputName()	# make sure self.outputName is populated
+		self.outputFileName = booksDirectory + "/" + self.outputName + bookExt
+		logging.debug('self.outputFileName=%s' % self.outputFileName)
+		return self.outputFileName
+
+	def getAuthorURL(self):
+		logging.debug('self.authorURL=%s' % self.authorURL)
+		return self.authorURL
+
+	def getAuthorId(self):
+		logging.debug('self.authorId=%s' % self.authorId)
+		return self.authorId
+
+	def getAuthorName(self):
+		logging.debug('self.authorName=%s' % self.authorName)
+		return self.authorName
+
+	def getStoryURL(self):
+		logging.debug('self.url=%s' % self.url)
+		return self.url
+
+	def getStoryId(self):
+		logging.debug('self.storyId=%s' % self.storyId)
+		return self.storyId
+
+	def getStoryName(self):
+		logging.debug('self.storyName=%s' % self.storyName)
+		return self.storyName
+
+	def getStoryDescription(self):
+		logging.debug('self.storyDescription=%s' % self.storyDescription)
+		return self.storyDescription
+
+	def getStoryCreated(self):
+		self.storyCreated = datetime.datetime.now()
+		logging.debug('self.storyCreated=%s' % self.storyCreated)
+		return self.storyCreated
+
+	def addCharacter(self, character):
+		'''Add character unless already present (case-insensitive); return True if added, False if duplicate.'''
+		chara = character.upper()
+		if any(c.upper() == chara for c in self.storyCharacters):
+			return False
+		self.storyCharacters = self.storyCharacters + [character]	# rebind, don't append: the default list lives on the class and would be shared
+		return True
+
+	def getStoryCharacters(self):
+		logging.debug('self.storyCharacters=%s' % self.storyCharacters)
+		return self.storyCharacters
+	
+	def getStoryPublished(self):
+		logging.debug('self.storyPublished=%s' % self.storyPublished)
+		return self.storyPublished
+
+	def getStoryUpdated(self):
+		logging.debug('self.storyUpdated=%s' % self.storyUpdated)
+		return self.storyUpdated
+
+	def getStorySeries(self):
+		logging.debug('self.storySeries=%s' % self.storySeries)
+		return self.storySeries
+
+	def getLanguage(self):
+		logging.debug('self.language=%s' % self.language)
+		return self.language
+
+	def getLanguageId(self):
+		logging.debug('self.languageId=%s' % self.languageId)
+		return self.languageId
+
+	def addSubject(self, subject):
+		'''Add subject unless already present (case-insensitive); return True if added, False if duplicate.'''
+		subj = subject.upper()
+		if any(s.upper() == subj for s in self.subjects):
+			return False
+		self.subjects = self.subjects + [subject]	# rebind, don't append: the default list lives on the class and would be shared
+		return True
+
+	def getSubjects(self):
+		logging.debug('self.subjects=%s' % self.subjects)
+		return self.subjects
+
+	def getPublisher(self):
+		logging.debug('self.publisher=%s' % self.publisher)
+		return self.publisher
+
+	def getNumChapters(self):
+		logging.debug('self.numChapters=%s' % self.numChapters)
+		return self.numChapters
+
+	def getNumWords(self):
+		logging.debug('self.numWords=%s' % self.numWords)
+		return self.numWords
+
+	def getCategory(self):
+		logging.debug('self.category=%s' % self.category)
+		return self.category
+
+	def getGenre(self):
+		logging.debug('self.genre=%s' % self.genre)
+		return self.genre
+
+	def getStoryStatus(self):
+		logging.debug('self.storyStatus=%s' % self.storyStatus)
+		return self.storyStatus
+
+	def getStoryRating(self):
+		logging.debug('self.storyRating=%s' % self.storyRating)
+		return self.storyRating
+
+	def getStoryUserRating(self):
+		logging.debug('self.storyUserRating=%s' % self.storyUserRating)
+		return self.storyUserRating
+
+	def getPrintableUrl(self, url):
+		return url
diff --git a/fanficdownloader/books/place holder.txt b/fanficdownloader/books/place holder.txt
new file mode 100644
index 00000000..e69de29b
diff --git a/fanficdownloader/constants.py b/fanficdownloader/constants.py
new file mode 100644
index 00000000..bd35546a
--- /dev/null
+++ b/fanficdownloader/constants.py
@@ -0,0 +1,542 @@
+# -*- coding: utf-8 -*-
+
+CSS = '''body { margin-left: 2%; margin-right: 2%; margin-top: 2%; margin-bottom: 2%; text-align: justify; }
+pre { font-size: x-small; }
+sml { font-size: small; }
+h1 { text-align: center; }
+h2 { text-align: center; }
+h3 { text-align: center; }
+h4 { text-align: center; }
+h5 { text-align: center; }
+h6 { text-align: center; }
+h7 { text-align: left; font-size: large; font-weight: bold; }
+.CI {
+    text-align:center;
+    margin-top:0px;
+    margin-bottom:0px;
+    padding:0px;
+    }
+.center   {text-align: center;}
+.cover    {text-align: center;}
+.full     {width: 100%; }
+.quarter  {width: 25%; }
+.smcap    {font-variant: small-caps;}
+.u        {text-decoration: underline;}
+.bold     {font-weight: bold;}
+'''
+
+MIMETYPE = '''application/epub+zip'''
+
+TITLE_HEADER = '''<?xml version="1.0" encoding="utf-8"?><html xmlns="http://www.w3.org/1999/xhtml" xmlns:xlink="http://www.w3.org/1999/xlink"><head><meta http-equiv="Content-Type" content="text/html; charset=utf-8"/>
+<title>%s - %s</title><link href="stylesheet.css" type="text/css" charset="UTF-8" rel="stylesheet"/></head><body>
+<p><h7 id="lnks"><b><a id="StoryLink" href="%s">%s</a></b> by <b><a id="AuthorLink" href="%s">%s</a></b></h7></p>
+<table class="full">
+'''
+
+TITLE_ENTRY = '''<tr><td><b>%s</b></td><td>%s</td></tr>
+'''
+
+TITLE_FOOTER = '''</table>
+<p><b>Summary:</b><br />%s</p>
+</body></html>
+'''
+
+CONTAINER = '''<?xml version="1.0" encoding="utf-8"?>
+<container version="1.0" xmlns="urn:oasis:names:tc:opendocument:xmlns:container">
+  <rootfiles>
+    <rootfile full-path="OEBPS/content.opf" media-type="application/oebps-package+xml"/>
+  </rootfiles>
+</container>
+'''
+
+CONTENT_START = '''<?xml version="1.0" encoding="utf-8"?>
+<package version="2.0" xmlns="http://www.idpf.org/2007/opf"
+         unique-identifier="fanficdownloader-uuid">
+ <metadata xmlns:xsi="http://www.w3.org/2001/XMLSchema-instance"
+           xmlns:dc="http://purl.org/dc/elements/1.1/"
+           xmlns:dcterms="http://purl.org/dc/terms/"
+           xmlns:opf="http://www.idpf.org/2007/opf"
+           xmlns:calibre="http://calibre.kovidgoyal.net/2009/metadata">
+   <dc:identifier id="fanficdownloader-uuid">BookID-Epub-%s</dc:identifier>
+   <dc:title>%s</dc:title> 
+   <dc:creator opf:role="aut">%s</dc:creator>
+   <dc:contributor opf:role="bkp">fanficdownloader [http://fanficdownloader.googlecode.com]</dc:contributor>
+   <dc:language>%s</dc:language> 
+   <dc:rights></dc:rights>
+   <dc:date opf:event="publication">%s</dc:date>
+   <dc:date opf:event="creation">%s</dc:date>
+   <dc:date opf:event="modification">%s</dc:date>
+   <meta name="calibre:timestamp" content="%s"/>
+   <dc:description>%s</dc:description>
+'''
+
+CONTENT_END_METADATA = '''   <dc:publisher>%s</dc:publisher> 
+   <dc:identifier id="BookId">%s</dc:identifier>
+   <dc:identifier opf:scheme="URL">%s</dc:identifier>
+   <dc:source>%s</dc:source>
+   <dc:type>FanFiction</dc:type>
+   <meta name="calibre:rating" content="%s"/>
+ </metadata>
+ <manifest>
+  <item id="ncx" href="toc.ncx" media-type="application/x-dtbncx+xml"/>
+  <item id="style" href="stylesheet.css" media-type="text/css" />
+'''
+
+CONTENT_SUBJECT = '''   <dc:subject>%s</dc:subject> 
+'''
+
+CONTENT_ITEM = '''  <item id="%s" href="%s" media-type="application/xhtml+xml" />
+'''
+
+CONTENT_END_MANIFEST = ''' </manifest>
+ <spine toc="ncx">
+'''
+
+CONTENT_ITEMREF = '''  <itemref idref="%s" />
+'''
+
+CONTENT_END = ''' </spine>
+</package>
+'''
+
+TOC_START = '''<?xml version="1.0" encoding="UTF-8"?>
+<ncx xmlns="http://www.daisy.org/z3986/2005/ncx/" version="2005-1">
+  <head>
+    <meta name="dtb:uid" content="%s"/>
+    <meta name="dtb:depth" content="1"/>
+    <meta name="dtb:totalPageCount" content="0"/>
+    <meta name="dtb:maxPageNumber" content="0"/>
+  </head>
+  <docTitle>
+    <text>%s</text>
+  </docTitle>
+  <navMap>
+'''
+
+TOC_ITEM = '''<navPoint id="%s" playOrder="%d">
+  <navLabel>
+    <text>%s</text>
+  </navLabel>
+  <content src="%s"/>
+</navPoint>
+'''
+
+TOC_END = '''</navMap>
+</ncx>
+'''
+
+XHTML_START = '''<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.1//EN" "http://www.w3.org/TR/xhtml11/DTD/xhtml11.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml">
+<head>
+<title>%s</title>
+<link href="stylesheet.css" type="text/css" rel="stylesheet" />
+</head>
+<body>
+<div>
+<h3>%s</h3>
+'''
+
+XHTML_END = '''</div>
+</body>
+</html>
+'''
+
+acceptable_elements = ['a', 'abbr', 'acronym', 'address', 'area', 'b', 'big',
+      'blockquote', 'br', 'center', 'cite', 'code', 'col',
+      'colgroup', 'dd', 'del', 'dfn', 'dir', 'dl', 'dt', 'em',
+      'font', 'h1', 'h2', 'h3', 'h4', 'h5', 'h6', 'i', 
+      'ins', 'kbd', 'label', 'li', 'ol', 
+      'p', 'pre', 'q', 's', 'samp', 'small', 'span', 'strike',
+      'strong', 'sub', 'sup', 'u', 'ul']
+
+acceptable_attributes = ['href']
+
+# entity list from http://code.google.com/p/doctype/wiki/CharacterEntitiesConsistent
+entities = { '&aacute;' : 'á',
+             '&Aacute;' : 'Á',
+             '&Aacute' : 'Á',
+             '&aacute' : 'á',
+             '&acirc;' : 'â',
+             '&Acirc;' : 'Â',
+             '&Acirc' : 'Â',
+             '&acirc' : 'â',
+             '&acute;' : '´',
+             '&acute' : '´',
+             '&AElig;' : 'Æ',
+             '&aelig;' : 'æ',
+             '&AElig' : 'Æ',
+             '&aelig' : 'æ',
+             '&agrave;' : 'à',
+             '&Agrave;' : 'À',
+             '&Agrave' : 'À',
+             '&agrave' : 'à',
+             '&alefsym;' : 'ℵ',
+             '&alpha;' : 'α',
+             '&Alpha;' : 'Α',
+             '&amp;' : '&',
+             '&AMP;' : '&',
+             '&AMP' : '&',
+             '&amp' : '&',
+             '&and;' : '∧',
+             '&ang;' : '∠',
+             '&aring;' : 'å',
+             '&Aring;' : 'Å',
+             '&Aring' : 'Å',
+             '&aring' : 'å',
+             '&asymp;' : '≈',
+             '&atilde;' : 'ã',
+             '&Atilde;' : 'Ã',
+             '&Atilde' : 'Ã',
+             '&atilde' : 'ã',
+             '&auml;' : 'ä',
+             '&Auml;' : 'Ä',
+             '&Auml' : 'Ä',
+             '&auml' : 'ä',
+             '&bdquo;' : '„',
+             '&beta;' : 'β',
+             '&Beta;' : 'Β',
+             '&brvbar;' : '¦',
+             '&brvbar' : '¦',
+             '&bull;' : '•',
+             '&cap;' : '∩',
+             '&ccedil;' : 'ç',
+             '&Ccedil;' : 'Ç',
+             '&Ccedil' : 'Ç',
+             '&ccedil' : 'ç',
+             '&cedil;' : '¸',
+             '&cedil' : '¸',
+             '&cent;' : '¢',
+             '&cent' : '¢',
+             '&chi;' : 'χ',
+             '&Chi;' : 'Χ',
+             '&circ;' : 'ˆ',
+             '&clubs;' : '♣',
+             '&cong;' : '≅',
+             '&copy;' : '©',
+             '&COPY;' : '©',
+             '&COPY' : '©',
+             '&copy' : '©',
+             '&crarr;' : '↵',
+             '&cup;' : '∪',
+             '&curren;' : '¤',
+             '&curren' : '¤',
+             '&dagger;' : '†',
+             '&Dagger;' : '‡',
+             '&darr;' : '↓',
+             '&dArr;' : '⇓',
+             '&deg;' : '°',
+             '&deg' : '°',
+             '&delta;' : 'δ',
+             '&Delta;' : 'Δ',
+             '&diams;' : '♦',
+             '&divide;' : '÷',
+             '&divide' : '÷',
+             '&eacute;' : 'é',
+             '&Eacute;' : 'É',
+             '&Eacute' : 'É',
+             '&eacute' : 'é',
+             '&ecirc;' : 'ê',
+             '&Ecirc;' : 'Ê',
+             '&Ecirc' : 'Ê',
+             '&ecirc' : 'ê',
+             '&egrave;' : 'è',
+             '&Egrave;' : 'È',
+             '&Egrave' : 'È',
+             '&egrave' : 'è',
+             '&empty;' : '∅',
+             '&emsp;' : ' ',
+             '&ensp;' : ' ',
+             '&epsilon;' : 'ε',
+             '&Epsilon;' : 'Ε',
+             '&equiv;' : '≡',
+             '&eta;' : 'η',
+             '&Eta;' : 'Η',
+             '&eth;' : 'ð',
+             '&ETH;' : 'Ð',
+             '&ETH' : 'Ð',
+             '&eth' : 'ð',
+             '&euml;' : 'ë',
+             '&Euml;' : 'Ë',
+             '&Euml' : 'Ë',
+             '&euml' : 'ë',
+             '&euro;' : '€',
+             '&exist;' : '∃',
+             '&fnof;' : 'ƒ',
+             '&forall;' : '∀',
+             '&frac12;' : '½',
+             '&frac12' : '½',
+             '&frac14;' : '¼',
+             '&frac14' : '¼',
+             '&frac34;' : '¾',
+             '&frac34' : '¾',
+             '&frasl;' : '⁄',
+             '&gamma;' : 'γ',
+             '&Gamma;' : 'Γ',
+             '&ge;' : '≥',
+             '&gt;' : '>',
+             '&GT;' : '>',
+             '&GT' : '>',
+             '&gt' : '>',
+             '&harr;' : '↔',
+             '&hArr;' : '⇔',
+             '&hearts;' : '♥',
+             '&hellip;' : '…',
+             '&iacute;' : 'í',
+             '&Iacute;' : 'Í',
+             '&Iacute' : 'Í',
+             '&iacute' : 'í',
+             '&icirc;' : 'î',
+             '&Icirc;' : 'Î',
+             '&Icirc' : 'Î',
+             '&icirc' : 'î',
+             '&iexcl;' : '¡',
+             '&iexcl' : '¡',
+             '&igrave;' : 'ì',
+             '&Igrave;' : 'Ì',
+             '&Igrave' : 'Ì',
+             '&igrave' : 'ì',
+             '&image;' : 'ℑ',
+             '&infin;' : '∞',
+             '&int;' : '∫',
+             '&iota;' : 'ι',
+             '&Iota;' : 'Ι',
+             '&iquest;' : '¿',
+             '&iquest' : '¿',
+             '&isin;' : '∈',
+             '&iuml;' : 'ï',
+             '&Iuml;' : 'Ï',
+             '&Iuml' : 'Ï',
+             '&iuml' : 'ï',
+             '&kappa;' : 'κ',
+             '&Kappa;' : 'Κ',
+             '&lambda;' : 'λ',
+             '&Lambda;' : 'Λ',
+             '&laquo;' : '«',
+             '&laquo' : '«',
+             '&larr;' : '←',
+             '&lArr;' : '⇐',
+             '&lceil;' : '⌈',
+             '&ldquo;' : '“',
+             '&le;' : '≤',
+             '&lfloor;' : '⌊',
+             '&lowast;' : '∗',
+             '&loz;' : '◊',
+             '&lrm;' : '‎',
+             '&lsaquo;' : '‹',
+             '&lsquo;' : '‘',
+             '&lt;' : '<',
+             '&LT;' : '<',
+             '&LT' : '<',
+             '&lt' : '<',
+             '&macr;' : '¯',
+             '&macr' : '¯',
+             '&mdash;' : '—',
+             '&micro;' : 'µ',
+             '&micro' : 'µ',
+             '&middot;' : '·',
+             '&middot' : '·',
+             '&minus;' : '−',
+             '&mu;' : 'μ',
+             '&Mu;' : 'Μ',
+             '&nabla;' : '∇',
+             '&nbsp;' : ' ',
+             '&nbsp' : ' ',
+             '&ndash;' : '–',
+             '&ne;' : '≠',
+             '&ni;' : '∋',
+             '&not;' : '¬',
+             '&not' : '¬',
+             '&notin;' : '∉',
+             '&nsub;' : '⊄',
+             '&ntilde;' : 'ñ',
+             '&Ntilde;' : 'Ñ',
+             '&Ntilde' : 'Ñ',
+             '&ntilde' : 'ñ',
+             '&nu;' : 'ν',
+             '&Nu;' : 'Ν',
+             '&oacute;' : 'ó',
+             '&Oacute;' : 'Ó',
+             '&Oacute' : 'Ó',
+             '&oacute' : 'ó',
+             '&ocirc;' : 'ô',
+             '&Ocirc;' : 'Ô',
+             '&Ocirc' : 'Ô',
+             '&ocirc' : 'ô',
+             '&OElig;' : 'Œ',
+             '&oelig;' : 'œ',
+             '&ograve;' : 'ò',
+             '&Ograve;' : 'Ò',
+             '&Ograve' : 'Ò',
+             '&ograve' : 'ò',
+             '&oline;' : '‾',
+             '&omega;' : 'ω',
+             '&Omega;' : 'Ω',
+             '&omicron;' : 'ο',
+             '&Omicron;' : 'Ο',
+             '&oplus;' : '⊕',
+             '&or;' : '∨',
+             '&ordf;' : 'ª',
+             '&ordf' : 'ª',
+             '&ordm;' : 'º',
+             '&ordm' : 'º',
+             '&oslash;' : 'ø',
+             '&Oslash;' : 'Ø',
+             '&Oslash' : 'Ø',
+             '&oslash' : 'ø',
+             '&otilde;' : 'õ',
+             '&Otilde;' : 'Õ',
+             '&Otilde' : 'Õ',
+             '&otilde' : 'õ',
+             '&otimes;' : '⊗',
+             '&ouml;' : 'ö',
+             '&Ouml;' : 'Ö',
+             '&Ouml' : 'Ö',
+             '&ouml' : 'ö',
+             '&para;' : '¶',
+             '&para' : '¶',
+             '&part;' : '∂',
+             '&permil;' : '‰',
+             '&perp;' : '⊥',
+             '&phi;' : 'φ',
+             '&Phi;' : 'Φ',
+             '&pi;' : 'π',
+             '&Pi;' : 'Π',
+             '&piv;' : 'ϖ',
+             '&plusmn;' : '±',
+             '&plusmn' : '±',
+             '&pound;' : '£',
+             '&pound' : '£',
+             '&prime;' : '′',
+             '&Prime;' : '″',
+             '&prod;' : '∏',
+             '&prop;' : '∝',
+             '&psi;' : 'ψ',
+             '&Psi;' : 'Ψ',
+             '&quot;' : '"',
+             '&QUOT;' : '"',
+             '&QUOT' : '"',
+             '&quot' : '"',
+             '&radic;' : '√',
+             '&raquo;' : '»',
+             '&raquo' : '»',
+             '&rarr;' : '→',
+             '&rArr;' : '⇒',
+             '&rceil;' : '⌉',
+             '&rdquo;' : '”',
+             '&real;' : 'ℜ',
+             '&reg;' : '®',
+             '&REG;' : '®',
+             '&REG' : '®',
+             '&reg' : '®',
+             '&rfloor;' : '⌋',
+             '&rho;' : 'ρ',
+             '&Rho;' : 'Ρ',
+             '&rlm;' : '‏',
+             '&rsaquo;' : '›',
+             '&rsquo;' : '’',
+             '&sbquo;' : '‚',
+             '&scaron;' : 'š',
+             '&Scaron;' : 'Š',
+             '&sdot;' : '⋅',
+             '&sect;' : '§',
+             '&sect' : '§',
+             '&shy;' : '­', # strange optional hyphenation control character, not just a dash
+             '&shy' : '­',
+             '&sigma;' : 'σ',
+             '&Sigma;' : 'Σ',
+             '&sigmaf;' : 'ς',
+             '&sim;' : '∼',
+             '&spades;' : '♠',
+             '&sub;' : '⊂',
+             '&sube;' : '⊆',
+             '&sum;' : '∑',
+             '&sup1;' : '¹',
+             '&sup1' : '¹',
+             '&sup2;' : '²',
+             '&sup2' : '²',
+             '&sup3;' : '³',
+             '&sup3' : '³',
+             '&sup;' : '⊃',
+             '&supe;' : '⊇',
+             '&szlig;' : 'ß',
+             '&szlig' : 'ß',
+             '&tau;' : 'τ',
+             '&Tau;' : 'Τ',
+             '&there4;' : '∴',
+             '&theta;' : 'θ',
+             '&Theta;' : 'Θ',
+             '&thetasym;' : 'ϑ',
+             '&thinsp;' : ' ',
+             '&thorn;' : 'þ',
+             '&THORN;' : 'Þ',
+             '&THORN' : 'Þ',
+             '&thorn' : 'þ',
+             '&tilde;' : '˜',
+             '&times;' : '×',
+             '&times' : '×',
+             '&trade;' : '™',
+             '&uacute;' : 'ú',
+             '&Uacute;' : 'Ú',
+             '&Uacute' : 'Ú',
+             '&uacute' : 'ú',
+             '&uarr;' : '↑',
+             '&uArr;' : '⇑',
+             '&ucirc;' : 'û',
+             '&Ucirc;' : 'Û',
+             '&Ucirc' : 'Û',
+             '&ucirc' : 'û',
+             '&ugrave;' : 'ù',
+             '&Ugrave;' : 'Ù',
+             '&Ugrave' : 'Ù',
+             '&ugrave' : 'ù',
+             '&uml;' : '¨',
+             '&uml' : '¨',
+             '&upsih;' : 'ϒ',
+             '&upsilon;' : 'υ',
+             '&Upsilon;' : 'Υ',
+             '&uuml;' : 'ü',
+             '&Uuml;' : 'Ü',
+             '&Uuml' : 'Ü',
+             '&uuml' : 'ü',
+             '&weierp;' : '℘',
+             '&xi;' : 'ξ',
+             '&Xi;' : 'Ξ',
+             '&yacute;' : 'ý',
+             '&Yacute;' : 'Ý',
+             '&Yacute' : 'Ý',
+             '&yacute' : 'ý',
+             '&yen;' : '¥',
+             '&yen' : '¥',
+             '&yuml;' : 'ÿ',
+             '&Yuml;' : 'Ÿ',
+             '&yuml' : 'ÿ',
+             '&zeta;' : 'ζ',
+             '&Zeta;' : 'Ζ',
+             '&zwj;' : '‍',  # strange spacing control character, not just a space
+             '&zwnj;' : '‌',  # strange spacing control character, not just a space
+             }
+
+FB2_PROLOGUE = '<FictionBook>'
+FB2_DESCRIPTION = '''<description>
+<title-info>
+  <genre>fanfiction</genre>
+  <author>
+  <first-name></first-name>
+  <middle-name></middle-name>
+  <last-name>%s</last-name>
+  </author>
+  <book-title>%s</book-title>
+  <lang>eng</lang>
+</title-info>
+<document-info>
+  <author>
+  <nickname>sgzmd</nickname>
+  </author>
+<date value="%s">%s</date>
+<id>sgzmd_%s</id>
+<version>2.0</version>
+</document-info>
+</description>'''
+
+HTML_ESC_Definitions = 'HTML_Escape.def'
diff --git a/fanficdownloader/downloader.py b/fanficdownloader/downloader.py
new file mode 100644
index 00000000..17078430
--- /dev/null
+++ b/fanficdownloader/downloader.py
@@ -0,0 +1,205 @@
+# -*- coding: utf-8 -*-
+
+import os
+import re
+import sys
+import shutil
+import os.path
+import getpass
+import logging
+import urllib as u
+import pprint as pp
+import urllib2 as u2
+import urlparse as up
+import BeautifulSoup as bs
+import htmlentitydefs as hdefs
+
+import zipdir
+
+import output
+import adapter
+from adapter import StoryArchivedAlready
+from adapter import StoryDoesNotExist
+from adapter import FailedToDownload
+from adapter import InvalidStoryURL
+from adapter import LoginRequiredException
+import ffnet
+import fpcom
+import ficwad
+import fictionalley
+import hpfiction
+import twilighted
+import potionsNsnitches
+import mediaminer
+
+import time
+
+class FanficLoader:
+	'''A controller class which handles the interaction between various specific downloaders and writers'''
+	booksDirectory = "books"
+	standAlone = False
+	
+	def __init__(self, adapter, writerClass, quiet = False, inmemory = False, compress=True, overwrite=False):
+		self.adapter = adapter
+		self.writerClass = writerClass
+		self.quiet = quiet
+		self.inmemory = inmemory
+		self.compress = compress
+		self.badLogin = False
+		self.overWrite = overwrite
+			
+	def getBooksDirectory(self):
+		return self.booksDirectory
+
+	def setBooksDirectory(self, bd):
+		self.booksDirectory = bd
+		return self.booksDirectory
+	
+	def getStandAlone(self):
+		return self.standAlone
+
+	def setStandAlone(self, sa):
+		self.standAlone = sa
+		return self.standAlone
+	
+	def getOverWrite(self):
+		return self.overWrite
+
+	def setOverWrite(self, sa):
+		self.overWrite = sa
+		return self.overWrite
+	
+	def getAdapter(self):
+		return self.adapter	# the site adapter handed to __init__
+	
+	def download(self):
+		'''Log in if needed, fetch every chapter into a new writer and finalise it; returns the book contents when inmemory is set, otherwise None. Raises LoginRequiredException or StoryArchivedAlready.'''
+		logging.debug("Trying to download the story")
+		if self.adapter.requiresLogin():
+			logging.debug("Story requires login")
+			if not self.adapter.performLogin():
+				logging.debug("Login/password problem")
+				self.badLogin = True
+				# Use the directly imported name: the script section of this file rebinds the global 'adapter' to an adapter instance.
+				raise LoginRequiredException(self.adapter.url)
+		
+		urls = self.adapter.extractIndividualUrls()
+
+		logging.debug("self.writerClass=%s" % self.writerClass)
+		if self.standAlone and not self.inmemory:
+			s = self.adapter.getOutputFileName(self.booksDirectory, self.writerClass.getFormatExt())
+			logging.debug("Always overwrite? %s" % self.overWrite)
+			if not self.overWrite:
+				logging.debug("Checking if current archive of the story exists.  Filename=%s" % s)
+				if not zipdir.checkNewer ( s, self.adapter.getStoryUpdated() ):
+					raise StoryArchivedAlready("A Current archive file \"" + s + "\" already exists!  Skipping!")
+		else:
+			logging.debug("Do not check for existance of archive file.")
+
+		self.writer = self.writerClass(self.booksDirectory, self.adapter, inmemory=self.inmemory, compress=self.compress)
+		
+		i = 1
+		for u,n in urls:
+			if not self.quiet:
+				print('Downloading chapter %d/%d' % (i, len(urls)))
+			text = self.adapter.getText(u)
+			self.writer.writeChapter(i, n, text)
+			i = i+1
+			
+		self.writer.finalise()
+		if self.inmemory:
+			self.name = self.writer.name
+			return self.writer.output.getvalue()
+	
+
+if __name__ == '__main__':
+	logging.basicConfig(level=logging.DEBUG)
+	argvlen = len(sys.argv)
+	url = None
+	bookFormat = 'epub'
+	if argvlen > 1:
+		url = sys.argv[1]
+	if argvlen > 2:
+		bookFormat = sys.argv[2]
+	
+	if url is None: 
+		print >> sys.stderr, "Usage: downloader.py URL Type"
+		sys.exit(-1)
+		
+	if type(url) is unicode:
+		print('URL is unicode')
+		url = url.encode('latin1')
+	url = url.strip()
+	adapter = None
+	writerClass = None
+	
+	if url.find('fanficauthors') != -1:
+		print >> sys.stderr, "fanficauthors.net already provides ebooks"
+		sys.exit(0)
+	elif url.find('fictionalley') != -1:
+		adapter = fictionalley.FictionAlley(url)
+	elif url.find('ficwad') != -1:
+		adapter = ficwad.FicWad(url)
+	elif url.find('fanfiction.net') != -1:
+		adapter = ffnet.FFNet(url)
+	elif url.find('fictionpress.com') != -1:
+		adapter = fpcom.FPCom(url)
+	elif url.find('harrypotterfanfiction.com') != -1:
+		adapter = hpfiction.HPFiction(url)
+	elif url.find('twilighted.net') != -1:
+		adapter = twilighted.Twilighted(url)
+	elif url.find('potionsandsnitches.net') != -1:
+		adapter = potionsNsnitches.PotionsNSnitches(url)
+	elif url.find('mediaminer.org') != -1:
+		adapter = mediaminer.MediaMiner(url)
+	else:
+		print >> sys.stderr, "Oi! I can haz not appropriate adapter for URL %s!" % url
+		sys.exit(1)
+
+	if bookFormat == 'epub':
+		writerClass = output.EPubFanficWriter
+	elif bookFormat == 'html':
+		writerClass = output.HTMLWriter
+	elif bookFormat == 'text':
+		writerClass = output.TextWriter
+	
+	if adapter.requiresLogin(url):
+		print("Meow, URL %s requires you to haz been logged in! Please can I haz this datas?" % url)
+		sys.stdout.write("Can I haz ur login? ")
+		login = sys.stdin.readline().strip()
+		password = getpass.getpass(prompt='Can I haz ur password? ')
+		print("Login: `%s`" % login)	# never echo the password that getpass just read without echo
+		
+		adapter.setLogin(login)
+		adapter.setPassword(password)
+		
+	
+	loader = FanficLoader(adapter, writerClass)
+	loader.setStandAlone(True)
+	if bookFormat != 'epub':
+		loader.setOverWrite(True)
+	
+
+	try:
+		loader.download()
+	except FailedToDownload, ftd:
+		print >> sys.stderr, str(ftd)
+		sys.exit(2)		# Error Downloading
+	except InvalidStoryURL, isu:
+		print >> sys.stderr, str(isu)
+		sys.exit(3)		# Invalid story URL
+	except StoryArchivedAlready, se:
+		print >> sys.stderr, str(se)
+		sys.exit(10)	# Skipped
+	except StoryDoesNotExist, sdne:
+		print >> sys.stderr, str(sdne)
+		sys.exit(20) 	# Missing
+	except LoginRequiredException, lre:
+		print >> sys.stderr, str(lre)
+		sys.exit(30) 	# Login required
+	except Exception, e:
+		print >> sys.stderr, str(e)
+		sys.exit(99)		# Unknown Error
+	
+	sys.exit(0)
+	
diff --git a/fanficdownloader/ffnet.py b/fanficdownloader/ffnet.py
new file mode 100644
index 00000000..4caa13fa
--- /dev/null
+++ b/fanficdownloader/ffnet.py
@@ -0,0 +1,358 @@
+# -*- coding: utf-8 -*-
+
+import os
+import re
+import sys
+import cgi
+import uuid
+import shutil
+import os.path
+import logging
+import unittest
+import urllib as u
+import pprint as pp
+import urllib2 as u2
+import urlparse as up
+import BeautifulSoup as bs
+import htmlentitydefs as hdefs
+import time
+import datetime
+
+from constants import *
+from adapter import *
+
+try:
+	import login_password
+except:
+	# tough luck
+	pass
+
+class FFNet(FanfictionSiteAdapter):
+	def __init__(self, url):
+		"""Parse a fanfiction.net story URL and set default story metadata.
+
+		Raises InvalidStoryURL when the first path component is not 's'.
+		"""
+		self.url = url
+		parsedUrl = up.urlparse(url)
+		self.host = parsedUrl.netloc
+		self.path = parsedUrl.path
+
+		self.storyName = 'FF.Net story'
+		self.authorName = 'FF.Net author'
+		self.storyDescription = 'Fanfiction Story'
+		self.storyCharacters = []
+		self.storySeries = ''
+		self.authorId = '0'
+		self.authorURL = self.path
+		self.storyId = '0'
+		self.storyPublished = datetime.date(1970, 1, 31)
+		self.storyCreated = datetime.datetime.now()
+		self.storyUpdated = datetime.date(1970, 1, 31)
+		self.languageId = 'en-UK'
+		self.language = 'English'
+		self.subjects = []
+		self.subjects.append ('FanFiction')
+		logging.debug('self.subjects=%s' % self.subjects)
+		self.publisher = self.host
+		self.numChapters = 0
+		self.numWords = 0
+		self.genre = 'FanFiction'
+		self.category = 'FF.Net Category'
+		self.storyStatus = 'In-Progress'
+		self.storyRating = 'K'
+		self.storyUserRating = '0'
+		self.outputName = ''
+		self.outputStorySep = '-ffnet_'
+
+		logging.debug('self.path=%s' % self.path)
+
+		if self.path.startswith('/'):
+			self.path = self.path[1:]
+
+		spl = self.path.split('/')
+		logging.debug('spl=%s' % spl)
+		# str.split never returns None or an empty list, so index 0 is always safe.
+		if spl[0] != 's':
+			raise InvalidStoryURL("Error URL \"%s\" is not a story." % self.url)
+		if len(spl) > 1:
+			self.storyId = spl[1]
+		if len(spl) == 5:
+			self.path = "/".join(spl[1:-1])  # NOTE(review): this drops the leading 's' -- confirm intended
+
+		if self.path.endswith('/'):
+			self.path = self.path[:-1]
+
+		logging.debug('self.path=%s' % self.path)
+
+		# Mobile-site URLs are rewritten to the desktop host.
+		if self.host == "m.fanfiction.net":
+			self.host = "www.fanfiction.net"
+			logging.debug('self.host=%s' % self.host)
+			self.url = "http://" + self.host + "/" + self.path
+			logging.debug('self.url=%s' % self.url)
+		logging.debug('self.storyId=%s' % self.storyId)
+		if not self.appEngine:
+			self.opener = u2.build_opener(u2.HTTPCookieProcessor())
+		else:
+			self.opener = None
+
+		logging.debug("Created FF.Net: url=%s" % (self.url))
+	
+	def _getLoginScript(self):  # the login script is this adapter's stored URL path
+		return (self.path)
+
+	def _getVarValue(self, varstr):
+		"""Return the right-hand side of a 'var name = value;' line ('' if no '=').
+
+		Only the first '=' splits, so any '=' inside the value is preserved.
+		"""
+		retstr = varstr.partition('=')[2]
+		if retstr.startswith(' '):
+			retstr = retstr[1:]
+		if retstr.endswith(';'):
+			retstr = retstr[:-1]
+		return retstr
+	
+	def _splitCrossover(self, subject):
+		"""Add a category to the subjects, splitting 'A and B Crossover' titles.
+
+		Each name joined by ' and ' becomes its own subject. Always returns True.
+		"""
+		if "Crossover" in subject:
+			self.addSubject ("Crossover")
+			logging.debug('Crossover=%s' % subject)
+		if "Crossover" in subject and ' and ' in subject:
+			words = subject.split(' ')
+			logging.debug('words=%s' % words)
+			subj = ''
+			for s in words:
+				if s in ('', 'and', 'Crossover'):  # whole words only; a substring test also matched 'a', 'over', ...
+					if len(subj) > 0:
+						self.addSubject(subj)
+					subj = ''
+				else:
+					subj = (subj + ' ' + s) if len(subj) > 0 else s
+			if len(subj) > 0:
+				self.addSubject(subj)
+		else:
+			self.addSubject(subject)
+		return True
+
+	def _splitGenre(self, subject):
+		"""Add every non-empty '/'-separated part of subject as a subject; returns True."""
+		if len(subject) > 0:
+			words = subject.split('/')
+			logging.debug('words=%s' % words)
+			for subj in filter(None, words):  # skip empty parts such as in 'a//b'
+				self.addSubject(subj)
+		return True
+
+	def extractIndividualUrls(self):
+		"""Fetch the story page, fill in story metadata and return [(chapterUrl, title)]."""
+		try:
+			data = self.fetchUrl(self.url)
+		except Exception, e:
+			data = ''
+			logging.error("Caught an exception reading URL " + self.url + ".  Exception " + unicode(e) + ".")
+		if not data:  # '' after a failed fetch; testing only for None let that slip through
+			raise StoryDoesNotExist("Problem reading story URL " + self.url + "!")
+
+		d2 = re.sub('&\#[0-9]+;', ' ', data)
+		soup = None
+		try:
+			soup = bs.BeautifulStoneSoup(d2)
+		except Exception:
+			logging.error("Failed to decode: <%s>" % d2)
+			raise FailedToDownload("Error downloading Story: %s!  Problem decoding page!" % self.url)
+		# First pass: any link whose href contains '/u/' supplies the author name and id.
+		allA = soup.findAll('a')
+		for a in allA:
+			if 'href' in a._getAttrMap() and a['href'].find('/u/') != -1:
+				self.authorName = a.string
+				(_p0, _p1, self.authorId, _p3) = a['href'].split('/')
+				logging.debug('self.authorId=%s self.authorName=%s' % (self.authorId, self.authorName))
+		# Second pass: scan the raw page line by line for the remaining metadata.
+		urls = []
+		lines = data.split('\n')
+		for l in lines:
+			if l.find("&#187;") != -1 and l.find('<b>') != -1:
+				s2 = bs.BeautifulStoneSoup(l)
+				self.storyName = unicode(s2.find('b').string)
+				logging.debug('self.storyId=%s, self.storyName=%s' % (self.storyId, self.storyName))
+			elif l.find("<a href='/u/") != -1:
+				s2 = bs.BeautifulStoneSoup(l)
+				self.authorName = unicode(s2.a.string)
+				(_p0, _p1, self.authorId, _p3) = s2.a['href'].split('/')
+				logging.debug('self.authorId=%s, self.authorName=%s' % (self.authorId, self.authorName))
+			elif l.find("Rated: <a href=") != -1:
+				s2 = bs.BeautifulStoneSoup(l)
+				self.storyRating = unicode(s2.a.string).strip()
+				logging.debug('self.storyRating=%s' % self.storyRating)
+				logging.debug('s2.a=%s' % s2.a)
+				s3 = l.split('-')
+				logging.debug('s3=%s' % s3)
+				if len(s3) > 1:  # s3[1] is only there when the line has a '-'
+					if s3[1].find("Reviews: <a href=") != -1:
+						continue
+					self.language = s3[1].strip()
+					logging.debug('self.language=%s' % self.language)
+					if len(s3) > 2:  # likewise s3[2] needs a second '-'
+						if s3[2].find("Reviews: <a href=") != -1:
+							continue
+						self.genre = s3[2].strip()
+						if "&" in self.genre:
+							self.genre = ''
+							continue
+						logging.debug('self.genre=%s' % self.genre)
+						self._splitGenre(self.genre)
+						logging.debug('self.subjects=%s' % self.subjects)
+				if "Complete" in l:
+					self.storyStatus = 'Completed'
+				else:
+					self.storyStatus = 'In-Progress'
+			elif l.find("<SELECT title='chapter navigation'") != -1:
+				if len(urls) > 0:
+					continue
+				try:
+					selectHtml = l.decode('utf-8')
+				except UnicodeEncodeError, e:
+					selectHtml = l
+				except Exception:
+					selectHtml = l.encode('ascii', 'xmlcharrefreplace')
+				selectHtml = re.sub('&\#[0-9]+;', ' ', selectHtml)
+				s2 = bs.BeautifulSoup(selectHtml)
+				options = s2.findAll('option')
+				for o in options:
+					url = 'http://' + self.host + '/s/' + self.storyId + '/' + o['value']
+					title = o.string
+					logging.debug('URL = `%s`, Title = `%s`' % (url, title))
+					urls.append((url,title))
+			elif l.find("var chapters") != -1:
+				self.numChapters = self._getVarValue (l)
+				logging.debug('self.numChapters=%s' % self.numChapters)
+			elif l.find("var words") != -1:
+				self.numWords = self._getVarValue (l)
+				logging.debug('self.numWords=%s' % self.numWords)
+			elif l.find("var categoryid") != -1:
+				categoryid = self._getVarValue (l)
+				logging.debug('categoryid=%s' % categoryid)
+			elif l.find("var cat_title") != -1:
+				self.category = self._getVarValue (l).strip("'")
+				logging.debug('self.category=%s' % self.category)
+				self._splitCrossover(self.category)
+				logging.debug('self.subjects=%s' % self.subjects)
+			elif l.find("var summary") != -1:
+				self.storyDescription = self._getVarValue (l).strip("'")
+				if '&' in self.storyDescription:
+					s = self.storyDescription.split('&')
+					logging.debug('s=%s' % s)
+					self.storyDescription = ''
+					for ss in s:
+						if len(self.storyDescription) > 0:
+							if ss.startswith('amp;'):  # already '&amp;': keep it, do not escape twice
+								self.storyDescription = self.storyDescription + '&' + ss
+							else:
+								self.storyDescription = self.storyDescription + '&amp;' + ss
+						else:
+							self.storyDescription = ss
+				logging.debug('self.storyDescription=%s' % self.storyDescription)
+			elif l.find("var datep") != -1:
+				dateps = self._getVarValue (l)
+				self.storyPublished = datetime.datetime(*time.strptime ( dateps, "'%m-%d-%y'" )[0:5])
+				logging.debug('self.storyPublished=%s' % self.storyPublished.strftime("%Y-%m-%dT%I:%M:%S"))
+			elif l.find("var dateu") != -1:
+				dateus = self._getVarValue (l)
+				self.storyUpdated = datetime.datetime(*time.strptime ( dateus, "'%m-%d-%y'" )[0:5])
+				logging.debug('self.storyUpdated=%s' % self.storyUpdated.strftime("%Y-%m-%dT%I:%M:%S"))
+
+		if len(urls) <= 0:
+			# no chapters found, try url by itself.
+			urls.append((self.url,self.storyName))
+
+		self.authorURL = 'http://' + self.host + '/u/' + self.authorId
+
+		#logging.debug('urls=%s' % urls)
+		return urls
+	
+	def getText(self, url):
+		"""Fetch a chapter page and return its 'storytext' div as UTF-8 HTML.
+
+		Raises FailedToDownload when the page cannot be fetched or parsed, or
+		when it has no element with id 'storytext'.
+		"""
+		try:
+			logging.debug("Fetching URL: %s" % url)
+			data = self.fetchUrl(url)
+		except Exception, e:
+			data = ''
+			logging.error("Caught an exception reading URL " + url + ".  Exception " + unicode(e) + ".")
+		# A failed fetch leaves data as ''; treat that the same as None.
+		if not data:
+			raise FailedToDownload("Error downloading Chapter: %s!  Problem getting page!" % url)
+
+		# Try to hand the parser decoded text; keep the raw bytes if decoding fails.
+		olddata = data
+		try:
+			data = data.decode('utf8')
+		except Exception:
+			data = olddata
+
+		soup = None
+		try:
+			soup = bs.BeautifulStoneSoup(data)
+		except Exception:
+			logging.debug(data)
+			raise FailedToDownload("Error downloading Chapter: %s!  Problem decoding page!" % url)
+
+		div = soup.find('div', {'id' : 'storytext'})
+		if div is None:
+			logging.debug(data)
+			raise FailedToDownload("Error downloading Chapter: %s!  Missing required element!" % url)
+
+		return div.__str__('utf8')
+					
+		
+class FFA_UnitTests(unittest.TestCase):
+	def setUp(self):
+		# Configure root logging at DEBUG level before each test.
+		logging.basicConfig(level=logging.DEBUG)
+
+	def testChaptersAuthStory(self):
+		adapter = FFNet('http://www.fanfiction.net/s/5257563/1')
+		adapter.extractIndividualUrls()
+		# Author and title are read back after the story page has been scraped.
+		self.assertEquals('Beka0502', adapter.getAuthorName())
+		self.assertEquals("Draco's Redemption", adapter.getStoryName())
+
+	def testChaptersCountNames(self):
+		adapter = FFNet('http://www.fanfiction.net/s/5257563/1')
+		chapterUrls = adapter.extractIndividualUrls()
+
+		self.assertEquals(10, len(chapterUrls))
+
+	def testGetText(self):
+		url = 'http://www.fanfiction.net/s/5257563/1'
+		adapter = FFNet(url)
+		chapterHtml = adapter.getText(url)
+		self.assertTrue('He was just about to look at some photos when he heard a crack' in chapterHtml)
+
+	def testBrokenWands(self):
+		# No assertions: this passes as long as neither call raises.
+		url = 'http://www.fanfiction.net/s/1527263/30/Harry_Potter_and_Broken_Wands'
+		adapter = FFNet(url)
+		adapter.getText(url)
+		adapter.extractIndividualUrls()
+
+	def testFictionPress(self):
+		url = 'http://www.fictionpress.com/s/2725180/1/Behind_This_Facade'
+		adapter = FFNet(url)
+		adapter.extractIndividualUrls()
+
+		self.assertEquals('Behind This Facade', adapter.getStoryName())
+		self.assertEquals('IntoxicatingMelody', adapter.getAuthorName())
+
+		chapterHtml = adapter.getText(url)
+		self.assertTrue('Kale Resgerald at your service" He answered, "So, can we go now? Or do you want to' in chapterHtml)
+if __name__ == "__main__":  # executed as a script: run the unittest cases in this module
+	unittest.main()
diff --git a/fanficdownloader/fictionalley.py b/fanficdownloader/fictionalley.py
new file mode 100644
index 00000000..68cd36e4
--- /dev/null
+++ b/fanficdownloader/fictionalley.py
@@ -0,0 +1,301 @@
+# -*- coding: utf-8 -*-
+
+import os
+import re
+import sys
+import shutil
+import logging
+import os.path
+import urllib as u
+import pprint as pp
+import urllib2 as u2
+import cookielib as cl
+import urlparse as up
+import BeautifulSoup as bs
+import htmlentitydefs as hdefs
+import time as time
+import datetime
+from adapter import *
+
+
+class FictionAlley(FanfictionSiteAdapter):
+	def __init__(self, url):
+		"""Set up the adapter for a fictionalley.org URL: opener, ids and defaults."""
+		self.url = url
+		parsedUrl = up.urlparse(url)
+		self.host = parsedUrl.netloc
+		self.path = parsedUrl.path
+
+		logging.debug('self.host=%s' % self.host)
+		logging.debug('self.path=%s' % self.path)
+
+		# FictionAlley wants a cookie to prove you're old enough to read R+ rated stuff.
+		cookieHandler = u2.HTTPCookieProcessor()
+		cookieHandler.cookiejar.set_cookie(cl.Cookie(
+			version=0, name='fauser', value='wizard',
+			port=None, port_specified=False,
+			domain='www.fictionalley.org', domain_specified=False, domain_initial_dot=False,
+			path='/authors', path_specified=True,
+			secure=False,
+			expires=time.time()+10000,
+			discard=False,
+			comment=None,
+			comment_url=None,
+			rest={'HttpOnly': None},
+			rfc2109=False))
+		self.opener = u2.build_opener(cookieHandler)
+
+		# Defaults first; the ids are then refined from the URL path when it matches.
+		self.storyDescription = 'Fanfiction Story'
+		self.authorId = ''
+		self.authorURL = ''
+		self.storyId = ''
+		# The path is read as /authors/<authorId>/<storyId>.html
+		pathParts = self.path.split('/')
+		if len(pathParts) > 2 and pathParts[1] == 'authors':
+			self.authorId = pathParts[2]
+			self.authorURL = 'http://' + self.host + '/authors/' + self.authorId
+			if len(pathParts) > 3:
+				self.storyId = pathParts[3].replace('.html', '')
+
+		self.storyPublished = datetime.date(1970, 1, 31)
+		self.storyCreated = datetime.datetime.now()
+		self.storyUpdated = datetime.date(1970, 1, 31)
+		self.languageId = 'en-UK'
+		self.language = 'English'
+		self.subjects = ['fanfiction', 'Harry Potter']
+		self.publisher = self.host
+		self.numChapters = 0
+		self.numWords = 0
+		self.genre = ''
+		self.category = 'Harry Potter'
+		self.storyStatus = 'In-Progress'
+		self.storyRating = 'K'
+		self.storyUserRating = '0'
+		self.storyCharacters = []
+		self.storySeries = ''
+		self.storyName = ''
+		self.outputName = ''
+		self.outputStorySep = '-fa_'
+		
+	def getPasswordLine(self):  # always the same fixed marker string
+		return "opaopapassword"
+
+	def getLoginScript(self):  # always the same fixed marker string
+		return "opaopaloginscript"
+
+	def getLoginPasswordOthers(self):
+		# Returns a 2-tuple of dicts: (login/password mapping, other fixed values).
+		loginFields = {'login': 'name', 'password': 'pass'}
+		return (loginFields, {'submit': 'Log In', 'remember': 'yes'})
+
+	def _processChapterHeaders(self, div):
+		"""Copy header fields from a chapter page into this adapter.
+
+		Looks at every <br> found in div; when one has more than two children,
+		child 1 is taken as the label and child 2 as the value.
+		"""
+		for br in div.findAll('br'):
+			if len(br.contents) <= 2:
+				continue
+			keystr = br.contents[1]
+			if keystr is not None:
+				# Drop any markup around the label, keeping only its text.
+				keystr = ''.join(re.split("<[^>]+>", unicode(keystr)))
+			valstr = br.contents[2].strip(' ')
+
+			# Only the four labels below are recognised; anything else is ignored.
+			if keystr == 'Rating:':
+				self.storyRating = valstr
+				logging.debug('self.storyRating=%s' % self.storyRating)
+			elif keystr == 'Genre:':
+				self.genre = valstr
+				logging.debug('self.genre=%s' % self.genre)
+				for genreName in valstr.split(', '):
+					self.addSubject(genreName)
+				logging.debug('self.subjects=%s' % self.subjects)
+			elif keystr == 'Main Character(s):':
+				for characterName in valstr.split(', '):
+					self.addCharacter(characterName)
+				logging.debug('self.storyCharacters=%s' % self.storyCharacters)
+			elif keystr == 'Summary:':
+				self.storyDescription = valstr
+				logging.debug('self.storyDescription=%s' % self.storyDescription)
+	
+		
+	def extractIndividualUrls(self):
+		"""Fetch the story page, fill in story metadata and return [(chapterUrl, title)]."""
+		try:
+			data = self.opener.open(self.url).read()
+		except Exception, e:
+			data = ''
+			logging.error("Caught an exception reading URL " + self.url + ".  Exception " + unicode(e) + ".")
+		if not data:  # '' after a failed fetch; testing only for None let that slip through
+			raise StoryDoesNotExist("Problem reading story URL " + self.url + "!")
+
+		# There is some useful information in the headers of the first chapter page..
+		data = data.replace('<!-- headerstart -->','<crazytagstringnobodywouldstumbleonaccidently id="storyheaders">').replace('<!-- headerend -->','</crazytagstringnobodywouldstumbleonaccidently>')
+		soup = None
+		try:
+			soup = bs.BeautifulStoneSoup(data)
+		except Exception:
+			raise FailedToDownload("Error downloading Story: %s!  Problem decoding page!" % self.url)
+
+		breadcrumbs = soup.find('div', {'class': 'breadcrumbs'})
+		if breadcrumbs is not None:
+			# Be aware that this means that the user has entered the {STORY}01.html 
+			# We will not have valid Published and Updated dates.  User should enter 
+			# the {STORY}.html instead.  We should force that instead of this.
+			#logging.debug('breadcrumbs=%s' % breadcrumbs )
+			bcas = breadcrumbs.findAll('a')
+			#logging.debug('bcas=%s' % bcas )
+			if bcas is not None and len(bcas) > 1:
+				bca = bcas[1]
+				#logging.debug('bca=%s' % bca )
+				if 'href' in bca._getAttrMap():
+					#logging.debug('bca.href=%s' % bca['href'] )
+					url = unicode(bca['href'])
+					if url is not None and len(url) > 0:
+						self.url = url
+						logging.debug('self.url=%s' % self.url )
+						ss = self.url.split('/')
+						self.storyId = ss[-1].replace('.html','')
+						self.storyName = bca.string
+						logging.debug('self.storyId=%s, self.storyName=%s' % (self.storyId, self.storyName))
+
+						data = self.opener.open(self.url).read()
+
+						# There is some useful information in the headers of the first chapter page..
+						data = data.replace('<!-- headerstart -->','<crazytagstringnobodywouldstumbleonaccidently id="storyheaders">').replace('<!-- headerend -->','</crazytagstringnobodywouldstumbleonaccidently>')
+						soup = bs.BeautifulStoneSoup(data)
+
+		# If it is decided that we really do care about number of words..  It's only available on the author's page..
+		#d0 = self.opener.open(self.authorURL).read()
+		#soupA = bs.BeautifulStoneSoup(d0)
+		#dls = soupA.findAll('dl')
+		#logging.debug('dls=%s' % dls)
+
+		# Get title from <title>, remove before '-'.
+		if len(self.storyName) == 0:
+			title = soup.find('title').string
+			self.storyName = "-".join(title.split('-')[1:]).strip().replace(" (Story Text)","")
+
+		links = soup.findAll('li')
+
+		self.numChapters = 0
+		result = []
+		if len(links) == 0:
+			# Be aware that this means that the user has entered the {STORY}01.html 
+			# We will not have valid Published and Updated dates.  User should enter 
+			# the {STORY}.html instead.  We should force that instead of this.
+			breadcrumbs = soup.find('div', {'class': 'breadcrumbs'})
+			self.authorName = breadcrumbs.a.string.replace("'s Fics","")
+			result.append((self.url,self.storyName))
+			#logging.debug('chapter[%s]=%s, %s' % (self.numChapters+1,self.url,self.storyName))
+			self.numChapters = self.numChapters + 1
+			div = soup.find('crazytagstringnobodywouldstumbleonaccidently', {'id' : 'storyheaders'})
+			if div is not None:
+				self._processChapterHeaders(div)
+		else:
+			author = soup.find('h1', {'class' : 'title'})
+			self.authorName = author.a.string
+
+			summary = soup.find('div', {'class' : 'summary'})
+			ss = summary.contents
+			if len(ss) > 1:
+				ss1 = ss[0].split(': ')
+				if len(ss1) > 1 and ss1[0] == 'Rating':
+					self.storyRating = ss1[1]
+					logging.debug('self.storyRating=%s' % self.storyRating)
+				self.storyDescription = unicode(ss[1]).replace("<br>","").replace("</br>","").replace('\n','')
+				logging.debug('self.storyDescription=%s' % self.storyDescription)
+
+			for li in links:
+				a = li.find('a', {'class' : 'chapterlink'})
+				s = li.contents
+				if a is not None:
+					url = a['href']
+					title = a.string
+					result.append((url,title))
+					#logging.debug('chapter[%s]=%s, %s' % (self.numChapters+1,url,title))
+					if self.numChapters == 0:
+						# fictionalley uses full URLs in chapter list.
+						d1 = self.opener.open(url).read()
+
+						# find <!-- headerstart --> & <!-- headerend --> and
+						# replaced with matching div pair for easier parsing.
+						# Yes, it's an evil kludge, but what can ya do?  Using
+						# something other than div prevents soup from pairing
+						# our div with poor html inside the story text.
+						d1 = d1.replace('<!-- headerstart -->','<crazytagstringnobodywouldstumbleonaccidently id="storyheaders">').replace('<!-- headerend -->','</crazytagstringnobodywouldstumbleonaccidently>')
+						sop = bs.BeautifulStoneSoup(d1)
+
+						div = sop.find('crazytagstringnobodywouldstumbleonaccidently', {'id' : 'storyheaders'})
+						if div is not None:
+							self._processChapterHeaders(div)
+
+					self.numChapters = self.numChapters + 1
+					if len(s) > 1:
+						datestr=''
+						ss2 = s[1].replace('\n','').replace('(','').split(' ')
+						if len(ss2) > 2 and ss2[0] == 'Posted:':
+							datestr = ss2[1] + ' ' + ss2[2]
+							tmpdate = datetime.datetime.fromtimestamp(time.mktime(time.strptime(datestr.strip(' '), "%Y-%m-%d %H:%M:%S")))
+							if self.numChapters == 1:
+								self.storyPublished = tmpdate
+							self.storyUpdated = tmpdate
+						logging.debug('self.storyPublished=%s, self.storyUpdated=%s' % (self.storyPublished, self.storyUpdated))
+				else:
+					logging.debug('li chapterlink not found!  li=%s' % li)
+
+
+		logging.debug('Story "%s" by %s' % (self.storyName, self.authorName))
+
+		return result
+	
+	def getText(self, url):
+		"""Fetch a chapter page and return the story text as UTF-8 HTML; raises FailedToDownload."""
+		# fictionalley uses full URLs in chapter list.
+		try:
+			data = self.opener.open(url).read()
+		except Exception, e:
+			data = ''
+			logging.error("Caught an exception reading URL " + url + ".  Exception " + unicode(e) + ".")
+		if not data:  # '' after a failed fetch; testing only for None let that slip through
+			raise FailedToDownload("Error downloading Chapter: %s!  Problem getting page!" % url)
+
+
+		# find <!-- headerend --> & <!-- footerstart --> and
+		# replaced with matching div pair for easier parsing.
+		# Yes, it's an evil kludge, but what can ya do?  Using
+		# something other than div prevents soup from pairing
+		# our div with poor html inside the story text.
+		data = data.replace('<!-- headerend -->','<crazytagstringnobodywouldstumbleonaccidently id="storytext">').replace('<!-- footerstart -->','</crazytagstringnobodywouldstumbleonaccidently>')
+
+		soup = None
+		try:
+			soup = bs.BeautifulStoneSoup(data)
+		except Exception:
+			logging.info("Failed to decode: <%s>" % data)
+			raise FailedToDownload("Error downloading Chapter: %s!  Problem decoding page!" % url)
+
+		div = soup.find('crazytagstringnobodywouldstumbleonaccidently', {'id' : 'storytext'})
+		if div is None:
+			raise FailedToDownload("Error downloading Chapter: %s!  Missing required element!" % url)
+		# When the page holds a second <html> element, that one is returned instead of the div.
+		html = soup.findAll('html')
+		if len(html) > 1:
+			return html[1].__str__('utf8')
+		else:
+			return div.__str__('utf8').replace('crazytagstringnobodywouldstumbleonaccidently','div')
+	
+	
+		
+if __name__ == '__main__':
+	# Manual smoke test: list a sample story's chapters, then print the first one.
+	url = 'http://www.fictionalley.org/authors/drt/DA.html'
+	fw = FictionAlley(url)
+	urls = fw.extractIndividualUrls()
+	pp.pprint(urls)
+	for chapterUrl, chapterTitle in urls[:1]:
+		print(fw.getText(chapterUrl))
diff --git a/fanficdownloader/ficwad.py b/fanficdownloader/ficwad.py
new file mode 100644
index 00000000..058528bc
--- /dev/null
+++ b/fanficdownloader/ficwad.py
@@ -0,0 +1,267 @@
+# -*- coding: utf-8 -*-
+
+import os
+import re
+import sys
+import shutil
+import os.path
+import urllib as u
+import pprint as pp
+import urllib2 as u2
+import urlparse as up
+import BeautifulSoup as bs
+import htmlentitydefs as hdefs
+import logging
+import time
+import datetime
+
+from adapter import *
+
+class FicWad(FanfictionSiteAdapter):
+	def __init__(self, url):
+		"""Remember the story URL and host, and set every story field to its default."""
+		self.url = url
+		self.host = up.urlparse(url).netloc
+		self.publisher = self.host
+		self.authorId = '0'
+		self.storyId = '0'
+		self.storyDescription = 'Fanfiction Story'
+		self.storyCharacters = []
+		self.storySeries = ''
+		self.subjects = ['fanfiction']
+		self.genre = 'FanFiction'
+		self.category = 'Category'
+		self.languageId = 'en-UK'
+		self.language = 'English'
+		self.storyStatus = 'In-Progress'
+		self.storyRating = 'PG'
+		self.storyUserRating = '0'
+		self.numChapters = 0
+		self.numWords = 0
+		self.storyPublished = datetime.date(1970, 1, 31)
+		self.storyCreated = datetime.datetime.now()
+		self.storyUpdated = datetime.date(1970, 1, 31)
+		self.outputName = ''
+		self.outputStorySep = '-fw_'
+
+	def getPasswordLine(self):  # always the same fixed marker string
+		return "opaopapassword"
+
+	def getLoginScript(self):  # always the same fixed marker string
+		return "opaopaloginscript"
+
+	def getLoginPasswordOthers(self):
+		# Returns a 2-tuple of dicts: (login/password mapping, other fixed values).
+		loginFields = {'login': 'name', 'password': 'pass'}
+		return (loginFields, {'submit': 'Log In', 'remember': 'yes'})
+
+	def extractIndividualUrls(self):
+		"""Scrape the story's title page for metadata and return [(chapterUrl, title)]."""
+		oldurl = ''
+		cururl = self.url
+		try:
+			data = u2.urlopen(self.url).read()
+		except Exception, e:
+			data = ''
+			logging.error("Caught an exception reading URL " + self.url + ".  Exception " + unicode(e) + ".")
+		if not data:  # '' after a failed fetch; testing only for None let that slip through
+			raise StoryDoesNotExist("Problem reading story URL " + self.url + "!")
+
+		soup = None
+		try:
+			soup = bs.BeautifulStoneSoup(data)
+		except Exception:
+			raise FailedToDownload("Error downloading Story: %s!  Problem decoding page!" % self.url)
+
+		story = soup.find('div', {'id' : 'story'})
+		crumbtrail = story.find('h3') # the only h3 ficwad uses.
+		allAhrefs = crumbtrail.findAll('a')
+		# last of crumbtrail
+		storyinfo = allAhrefs[-1]
+		(u0, u1, storyid) = storyinfo['href'].split('/')
+		if u1 == "story":
+			# This page does not have the correct information on it..  Need to get the Story Title Page
+			logging.debug('URL %s is a chapter URL.  Getting Title Page http://%s/%s/%s.' % (self.url, self.host, u1, storyid))
+			oldurl = self.url
+			self.url = 'http://' + self.host + '/' + u1 + '/' + storyid
+			data = u2.urlopen(self.url).read()
+			soup = bs.BeautifulStoneSoup(data)
+
+			story = soup.find('div', {'id' : 'story'})
+			crumbtrail = story.find('h3') # the only h3 ficwad uses.
+			allAhrefs = crumbtrail.findAll('a')
+
+		# save chapter name from header in case of one-shot.
+		storyinfo = story.find('h4').find('a')
+		(u0, u1, self.storyId) = storyinfo['href'].split('/')
+		self.storyName = storyinfo.string.strip()
+
+		logging.debug('self.storyName=%s, self.storyId=%s' % (self.storyName, self.storyId))
+
+		author = soup.find('span', {'class' : 'author'})
+		self.authorName = unicode(author.a.string)
+		(u0, u1,self.authorId) = author.a['href'].split('/')
+		self.authorURL = 'http://' + self.host + author.a['href']
+		logging.debug('self.authorName=%s self.authorId=%s' % (self.authorName, self.authorId))
+
+		description = soup.find('blockquote', {'class' : 'summary'})
+		if description is not None:
+			self.storyDescription = unicode(description.p.string)
+		logging.debug('self.storyDescription=%s' % self.storyDescription)
+
+		meta = soup.find('p', {'class' : 'meta'})
+		if meta is not None:
+			s = unicode(meta).replace('\n',' ').replace('\t','').split(' - ')
+			#logging.debug('meta.s=%s' % s)
+			for ss in s:
+				s1 = ss.replace('&nbsp;','').split(':')
+				#logging.debug('meta.s.s1=%s' % s1)
+				if len(s1) > 1:
+					s2 = re.split ('<[^>]+>', s1[0])
+					#logging.debug('meta.s.s1.s2=%s' % s2)
+					if len(s2) > 1:
+						s1[0] = s2[1]
+					skey = s1[0].strip()
+					#logging.debug('Checking = %s' % skey)
+					if skey == 'Category':
+						soup1 = bs.BeautifulStoneSoup(s1[1])
+						allAs = soup1.findAll('a')
+						for a in allAs:
+							if self.category == 'Category':
+								self.category = unicode(a.string)
+								logging.debug('self.category=%s' % self.category)
+							self.addSubject(self.category)  # NOTE(review): re-adds the first category per link; a.string may have been intended
+						logging.debug('self.subjects=%s' % self.subjects)
+					elif skey == 'Rating':
+						self.storyRating = s1[1]
+						logging.debug('self.storyRating=%s' % self.storyRating)
+					elif skey == 'Genres':
+						self.genre = s1[1]
+						logging.debug('self.genre=%s' % self.genre)
+						s2 = s1[1].split(', ')
+						for ss2 in s2:
+							self.addSubject(ss2)
+						logging.debug('self.subjects=%s' % self.subjects)
+					elif skey == 'Characters':
+						s2 = s1[1].split(', ')
+						for ss2 in s2:
+							self.addCharacter(ss2)
+						logging.debug('self.storyCharacters=%s' % self.storyCharacters)
+					elif skey == 'Chapters':
+						self.numChapters = s1[1]
+						logging.debug('self.numChapters=%s' % self.numChapters)
+					elif skey == 'Warnings':
+						logging.debug('Warnings=%s' % s1[1])
+					elif skey == 'Published':
+						self.storyPublished = datetime.datetime.fromtimestamp(time.mktime(time.strptime(s1[1].strip(' '), "%Y/%m/%d")))
+						logging.debug('self.storyPublished=%s' % self.storyPublished)
+					elif skey == 'Updated':
+						self.storyUpdated = datetime.datetime.fromtimestamp(time.mktime(time.strptime(s1[1].strip(' '), "%Y/%m/%d")))
+						logging.debug('self.storyUpdated=%s' % self.storyUpdated)
+				else:
+					s3 = re.split ('<[^>]+>', s1[0])
+					#logging.debug('meta.s.s1.s3=%s' % s3)
+					if len(s3) > 1:
+						s1[0] = s3[0]
+					s4 = s1[0].split('w')
+					#logging.debug('meta.s.s1.s4=%s' % s4)
+					if len(s4) > 1 and s4[1] == 'ords':
+						self.numWords = s4[0]
+						logging.debug('self.numWords=%s' % self.numWords)
+
+
+		logging.debug('Story "%s" by %s' % (self.storyName, self.authorName))
+
+		result = []
+		ii = 1
+
+		if oldurl is not None and len(oldurl) > 0:
+			logging.debug('Switching back to %s' % oldurl)
+			cururl = oldurl
+			data = u2.urlopen(oldurl).read()
+			soup = bs.BeautifulStoneSoup(data)
+
+		storylist = soup.find('ul', {'id' : 'storylist'})
+		if storylist is not None:
+			allBlocked = storylist.findAll('li', {'class' : 'blocked'})
+			if allBlocked:
+				# findAll gives a list, never None: only a non-empty one means blocked chapters.
+				raise LoginRequiredException(cururl)
+
+			allH4s = storylist.findAll('h4')
+			#logging.debug('allH4s=%s' % allH4s)
+
+			if allH4s is not None:
+				for h4 in allH4s:
+					chapterinfo = h4.find('a')
+					#logging.debug('Chapter1=%s' % chapterinfo)
+					url = 'http://' + self.host + chapterinfo['href']
+					title = chapterinfo.string.strip()
+					#logging.debug('Chapter=%s, %s' % (url, title))
+					# ficwad includes 'Story Index' in the dropdown of chapters, 
+					# but it's not a real chapter.
+					if title != "Story Index":
+						logging.debug('Chapter[%s]=%s, %s' % (ii, url, title))
+						result.append((url,title))
+						ii = ii+1
+					else:
+						logging.debug('Skipping Story Index.  URL %s' % url)
+
+		if ii == 1:
+			select = soup.find('select', { 'name' : 'goto' } )
+
+			if select is None:
+				self.numChapters = '1'
+				logging.debug('self.numChapters=%s' % self.numChapters)
+				result.append((self.url,self.storyName))
+				logging.debug('Chapter[%s]=%s %s' % (ii, self.url, self.storyName))
+			else:
+				allOptions = select.findAll('option')
+				for o in allOptions:
+					url = 'http://' + self.host + o['value']
+					title = o.string
+					# ficwad includes 'Story Index' in the dropdown of chapters, 
+					# but it's not a real chapter.
+					if title != "Story Index":
+						logging.debug('Chapter[%s]=%s, %s' % (ii, url, title))
+						result.append((url,title))
+						ii = ii+1
+					else:
+						logging.debug('Skipping Story Index.  URL %s' % url)
+
+		return result
+	
+	def getText(self, url):
+		"""Fetch a chapter page and return its 'storytext' div as UTF-8 HTML; raises FailedToDownload."""
+		if url.find('http://') == -1:
+			url = 'http://' + self.host + '/' + url
+
+		try:
+			data = u2.urlopen(url).read()
+		except Exception, e:
+			data = ''
+			logging.error("Caught an exception reading URL " + url + ".  Exception " + unicode(e) + ".")
+		if not data:  # '' after a failed fetch; testing only for None let that slip through
+			raise FailedToDownload("Error downloading Chapter: %s!  Problem getting page!" % url)
+
+		try:
+			soup = bs.BeautifulStoneSoup(data)
+		except Exception:
+			logging.info("Failed to decode: <%s>" % data)
+			raise FailedToDownload("Error downloading Chapter: %s!  Problem decoding page!" % url)
+
+		div = soup.find('div', {'id' : 'storytext'})
+		if div is None:
+			raise FailedToDownload("Error downloading Chapter: %s!  Missing required element!" % url)
+
+		return div.__str__('utf8')
+	
+		
+if __name__ == '__main__':
+	# Manual smoke test: list a sample story's chapters, then print the first one.
+	url = 'http://www.ficwad.com/story/14536'
+	fw = FicWad(url)
+	urls = fw.extractIndividualUrls()
+	pp.pprint(urls)
+	for chapterUrl, chapterTitle in urls[:1]:
+		print(fw.getText(chapterUrl))
diff --git a/fanficdownloader/fpcom.py b/fanficdownloader/fpcom.py
new file mode 100644
index 00000000..471c0b85
--- /dev/null
+++ b/fanficdownloader/fpcom.py
@@ -0,0 +1,344 @@
+# -*- coding: utf-8 -*-
+
+import os
+import re
+import sys
+import cgi
+import uuid
+import shutil
+import os.path
+import logging
+import unittest
+import urllib as u
+import pprint as pp
+import urllib2 as u2
+import urlparse as up
+import BeautifulSoup as bs
+import htmlentitydefs as hdefs
+import time
+import datetime
+
+from constants import *
+from adapter import *
+
+try:
+	import login_password
+except:
+	# tough luck
+	pass
+
+class FPCom(FanfictionSiteAdapter):
+	def __init__(self, url):		
+		self.url = url
+		parsedUrl = up.urlparse(url)
+		self.host = parsedUrl.netloc
+		self.path = parsedUrl.path
+		
+		self.storyName = ''
+		self.authorName = ''
+		self.storyDescription = ''
+		self.storyCharacters = []
+		self.storySeries = ''
+		self.authorId = '0'
+		self.authorURL = self.path
+		self.storyId = '0'
+		self.storyPublished = datetime.date(1970, 01, 31)
+		self.storyCreated = datetime.datetime.now()
+		self.storyUpdated = datetime.date(1970, 01, 31)
+		self.languageId = 'en-UK'
+		self.language = 'English'
+		self.subjects = []
+		self.publisher = self.host
+		self.numChapters = 0
+		self.numWords = 0
+		self.genre = ''
+		self.category = ''
+		self.storyStatus = 'In-Progress'
+		self.storyRating = 'K'
+		self.storyUserRating = '0'
+		self.outputName = ''
+		self.outputStorySep = '-fpcom_'
+		
+		if self.path.startswith('/'):
+			self.path = self.path[1:]
+		
+		spl = self.path.split('/')
+		if spl is not None:
+			if len(spl) > 0 and spl[0] != 's':
+				raise InvalidStoryURL("Error URL \"%s\" is not a story." % self.url)
+			if len(spl) > 1:
+				self.storyId = spl[1]
+			if len(spl) > 2:
+				chapter = spl[1]
+			else:
+				chapter = '1'
+			if len(spl) == 5:
+				self.path = "/".join(spl[1:-1])
+		
+		if self.path.endswith('/'):
+			self.path = self.path[:-1]
+		
+		logging.debug('self.path=%s' % self.path)
+		
+		if not self.appEngine:
+			self.opener = u2.build_opener(u2.HTTPCookieProcessor())
+		else:
+			self.opener = None
+	
+		logging.debug("Created FP.Com: url=%s" % (self.url))
+	
+	def _getLoginScript(self):  # Return self.path (the URL path as normalized by __init__).
+		return self.path
+
+	def _getVarValue(self, varstr):
+		#logging.debug('_getVarValue varstr=%s' % varstr)
+		vals = varstr.split('=')
+		#logging.debug('vals=%s' % vals)
+		retstr="".join(vals[+1:])
+		#logging.debug('retstr=%s' % retstr)
+		if retstr.startswith(' '):
+			retstr = retstr[1:]
+		if retstr.endswith(';'):
+			retstr = retstr[:-1]
+		return retstr
+	
+	def _splitCrossover(self, subject):
+		if "Crossover" in subject:
+			self.addSubject ("Crossover")
+			logging.debug('Crossover=%s' % subject)
+			if subject.find(' and ') != -1:
+				words = subject.split(' ')
+				logging.debug('words=%s' % words)
+				subj = ''
+				for s in words:
+					if s in "and Crossover":
+						if len(subj) > 0:
+							self.addSubject(subj)
+						subj = ''
+					else:
+						if len(subj) > 0:
+							subj = subj + ' '
+						subj = subj + s
+				if len(subj) > 0:
+					self.addSubject(subj)
+			else:
+				self.addSubject(subject)
+		else:
+			self.addSubject(subject)
+		return True
+
+	def _splitGenre(self, subject):
+		if len(subject) > 0:
+			words = subject.split('/')
+			logging.debug('words=%s' % words)
+			for subj in words:
+			    if len(subj) > 0:
+				self.addSubject(subj)
+		return True
+	
+	def extractIndividualUrls(self):
+		data = ''
+		try:
+			data = self.fetchUrl(self.url)
+		except Exception, e:
+			data = ''
+			logging.error("Caught an exception reading URL " + self.url + ".  Exception " + unicode(e) + ".")
+		if data is None:
+			raise StoryDoesNotExist("Problem reading story URL " + self.url + "!")
+		
+		d2 = re.sub('&\#[0-9]+;', ' ', data)
+		soup = None
+		try:
+			soup = bs.BeautifulStoneSoup(d2)
+		except:
+			logging.error("Failed to decode: <%s>" % d2)
+			raise FailedToDownload("Error downloading Story: %s!  Problem decoding page!" % self.url)
+
+		allA = soup.findAll('a')
+		for a in allA:
+			if 'href' in a._getAttrMap() and a['href'].find('/u/') != -1:
+				self.authorName = a.string
+				(u1, u2, self.authorId, u3) = a['href'].split('/')
+				logging.debug('self.authorId=%s self.authorName=%s' % (self.authorId, self.authorName))
+
+		urls = []
+		
+		metas = soup.findAll ('meta', {'name' : 'description'})
+		if metas is not None:
+			for meta in metas:
+				if 'content' in meta._getAttrMap():
+					self.storyDescription = unicode(meta['content'])
+					logging.debug('self.storyDescription=%s' % self.storyDescription)
+					
+					title=meta.find('title')
+					logging.debug('title=%s' % title.string)
+					tt = title.string.split(',')
+					if tt is not None:
+						if len(tt) > 0:
+							self.storyName = tt[0]
+							logging.debug('self.storyId=%s, self.storyName=%s' % (self.storyId, self.storyName))
+						if len(tt) > 1:
+							tt1 = tt[1].split(' - ')
+							if tt1 is not None and len(tt1) > 0:
+								self.category = tt1[0].strip()
+								logging.debug('self.category=%s' % self.category)
+								cc = self.category.split(' ')
+								for cc1 in cc:
+									if cc1 is not None and cc1 != 'a':
+										if cc1 == 'fanfic':
+											self.addSubject('FanFiction')
+										else:
+											self.addSubject(cc1)
+								logging.debug('self.subjects=%s' % self.subjects)
+								
+
+		numchapters = 0
+		urlstory = ''
+
+		fidochap = soup.find('form', {'name':'fidochap'})
+		sl = fidochap.find('select', {'title':'chapter navigation'})
+		if sl is not None:
+			logging.debug('sl=%s' % sl )
+			if 'onchange' in sl._getAttrMap():
+				ocs = sl['onchange'].split('\'')
+				logging.debug('ocs=%s' % ocs)
+				if ocs is not None and len(ocs) > 3:
+					urlstory = ocs[3]
+					logging.debug('urlstory=%s' % urlstory)
+				
+			opts = sl.findAll('option')
+			for o in opts:
+				if 'value' in o._getAttrMap():
+					url = 'http://' + self.host + '/s/' + self.storyId  + '/' + o['value'] + urlstory
+					logging.debug('URL=%s, Title=%s' % (url, o.string))
+					urls.append((url, o.string))
+					numchapters = numchapters + 1
+		
+		if numchapters == 0:
+			numchapters = 1
+			url = 'http://' + self.host + '/s/' + self.storyId  + '/1' +  urlstory
+			logging.debug('URL=%s, Title=%s' % (url, self.storyName))
+			urls.append((url, self.storyName))
+			
+		self.numChapters = unicode(numchapters)
+		logging.debug('self.numChapters=%s' % self.numChapters)
+		logging.debug('urls=%s' % urls)
+		
+		self.genre = ''
+		tds = fidochap.findAll('td')
+		for td in tds:
+			tdb = td.find('b')
+			if tdb is not None and tdb.string == self.storyName:
+				tdas = td.findAll('a')
+				for tda in tdas:
+					ss = tda.string
+					if ss is not None:
+						if len(self.genre) > 0:
+							self.genre = self.genre + ', '
+						self.genre = self.genre + ss
+						self.addSubject(ss)
+				logging.debug('self.genre=%s' % self.genre)
+				logging.debug('self.subjects=%s' % self.subjects)
+			tda = td.find ('a')
+			if tda is not None and tda.string.find('Rated:') != -1:
+				tdas = re.split ("<[^>]+>", unicode(td).replace('\n','').replace('&nbsp;',' '))
+				if tdas is not None:
+					ll = len(tdas)
+					if ll > 2:
+						ss = tdas[2].split(': ')
+						if ss is not None and len(ss) > 1:
+							self.storyRating = ss[1]
+							logging.debug('self.storyRating=%s' % self.storyRating)
+					if ll > 3:
+						ss = tdas[3].split(' - ')
+						if ss is not None:
+							lls = len(ss)
+							if lls > 1:
+								language = ss[1]
+								logging.debug('language=%s' % language)
+							if lls > 2:
+								self.category = ss[2]
+								logging.debug('self.category=%s' % self.category)
+								sgs = self.category.split('/')
+								for sg in sgs:
+									self.addSubject(sg)
+								logging.debug('self.subjects=%s' % self.subjects)
+							if lls > 3 and ss[3].strip() == 'Reviews:' and ll > 4:
+								reviews = tdas[4] 
+								logging.debug('reviews=%s' % reviews)
+					if ll > 5:
+						ss = tdas[5].split(' - ')
+						if ss is not None:
+							lls = len(ss)
+							if lls > 1:
+								sds = ss[1].split(': ')
+								if sds is not None and len(sds) > 1 and sds[0] == 'Published':
+									self.storyPublished = datetime.datetime.fromtimestamp(time.mktime(time.strptime(sds[1].strip(' '), "%m-%d-%y")))
+									logging.debug('self.storyPublished=%s' % self.storyPublished)
+							lls = len(ss)
+							if lls > 2:
+								sds = ss[2].split(': ')
+								if sds is not None and len(sds) > 1 and sds[0] == 'Updated':
+									self.storyUpdated = datetime.datetime.fromtimestamp(time.mktime(time.strptime(sds[1].strip(' '), "%m-%d-%y")))
+									logging.debug('self.storyUpdated=%s' % self.storyUpdated)
+									
+
+
+		self.authorURL = 'http://' + self.host + '/u/' + self.authorId
+
+		return urls
+	
+	def getText(self, url):
+		time.sleep( 2.0 )
+		data = ''
+		try:
+			data = self.fetchUrl(url)
+		except Exception, e:
+			data = ''
+			logging.error("Caught an exception reading URL " + url + ".  Exception " + unicode(e) + ".")
+		if data is None:
+			raise FailedToDownload("Error downloading Chapter: %s!  Problem getting page!" % url)
+		
+		lines = data.split('\n')
+		
+		textbuf = ''
+		emit = False
+		
+		olddata = data
+		try:
+			data = data.decode('utf8')
+		except:
+			data = olddata
+		
+		soup = None
+		try:
+			soup = bs.BeautifulStoneSoup(data)
+		except:
+			logging.info("Failed to decode: <%s>" % data)
+			raise FailedToDownload("Error downloading Chapter: %s!  Problem decoding page!" % url)
+
+		div = soup.find('div', {'id' : 'storytext'})
+		if None == div:
+			raise FailedToDownload("Error downloading Chapter: %s!  Missing required element!" % url)
+			
+		return div.__str__('utf8')
+					
+		
+class FPC_UnitTests(unittest.TestCase):
+	def setUp(self):
+		logging.basicConfig(level=logging.DEBUG)
+		pass
+	
+	def testFictionPress(self):
+		url = 'http://www.fictionpress.com/s/2725180/1/Behind_This_Facade'
+		f = FPCom(url)
+		urls = f.extractIndividualUrls()
+		
+		self.assertEquals('Behind This Facade', f.getStoryName())
+		self.assertEquals('IntoxicatingMelody', f.getAuthorName())
+	
+		text = f.getText(url)
+		self.assertTrue(text.find('Kale Resgerald at your service" He answered, "So, can we go now? Or do you want to') != -1)
+
+if __name__ == '__main__':  # run this module's unit tests when executed as a script
+	unittest.main()
diff --git a/fanficdownloader/hpfiction.py b/fanficdownloader/hpfiction.py
new file mode 100644
index 00000000..aeda7d36
--- /dev/null
+++ b/fanficdownloader/hpfiction.py
@@ -0,0 +1,280 @@
+# -*- coding: utf-8 -*-
+
+import os
+import re
+import sys
+import cgi
+import uuid
+import shutil
+import os.path
+import logging
+import unittest
+import urllib as u
+import pprint as pp
+import urllib2 as u2
+import urlparse as up
+import BeautifulSoup as bs
+import htmlentitydefs as hdefs
+import time
+import datetime
+
+from constants import *
+from adapter import *
+
+try:
+	import login_password
+except:
+	# tough luck
+	pass
+
+class HPFiction(FanfictionSiteAdapter):
+	def __init__(self, url):
+		self.url = url
+		parsedUrl = up.urlparse(url)
+		self.host = parsedUrl.netloc
+		self.path = parsedUrl.path
+		
+		logging.debug('self.url=%s' % self.url)
+		logging.debug('self.host=%s' % self.host)
+		logging.debug('self.path=%s' % self.path)
+	
+		self.opener = u2.build_opener(u2.HTTPCookieProcessor())
+
+		self.chapurl = False
+		self.storyId = '0'
+		
+		sss = self.url.split('?')
+		logging.debug('sss=%s' % sss)
+		if sss is not None and len(sss) > 1:
+			sc = sss[1].split('=')
+			logging.debug('sc=%s' % sc)
+			if sc is not None and len(sc) > 1:
+				if sc[0] == 'chapterid':
+					self.chapurl = True
+				elif sc[0] == 'psid' or sc[0] == 'sid':
+					self.storyId = sc[1]
+
+		self.storyDescription = 'Fanfiction Story'
+		self.authorId = '0'
+		self.authorURL = ''
+		self.storyPublished = datetime.date(1970, 01, 31)
+		self.storyCreated = datetime.datetime.now()
+		self.storyUpdated = datetime.date(1970, 01, 31)
+		self.languageId = 'en-UK'
+		self.language = 'English'
+		self.subjects = []
+		self.subjects.append ('fanfiction')
+		self.subjects.append ('Harry Potter')
+		self.publisher = self.host
+		self.numChapters = 0
+		self.numWords = 0
+		self.genre = 'FanFiction'
+		self.category = 'Category'
+		self.storyStatus = 'In-Progress'
+		self.storyRating = 'K'
+		self.storyUserRating = '0'
+		self.storyCharacters = []
+		self.storySeries = ''
+		self.outputName = ''
+		self.outputStorySep = '-hp_'
+		
+		logging.debug("Created HPFiction: url=%s" % (self.url))
+	
+	def _getLoginScript(self):  # Return self.path, the path component of the URL given to __init__.
+		return self.path
+	
+	def extractIndividualUrls(self):
+		data = ''
+		try:
+			data = self.opener.open(self.url).read()
+		except Exception, e:
+			data = ''
+			logging.error("Caught an exception reading URL " + self.url + ".  Exception " + unicode(e) + ".")
+		if data is None:
+			raise StoryDoesNotExist("Problem reading story URL " + self.url + "!")
+		
+		soup = None
+		try:
+			soup = bs.BeautifulSoup(data)
+		except:
+			raise FailedToDownload("Error downloading Story: %s!  Problem decoding page!" % self.url)
+				
+		links = soup.findAll('a')
+		def_chapurl = ''
+		def_chaptitle = ''
+		
+		if self.chapurl:
+			foundid = False
+			for a in links:
+				if a['href'].find('psid') != -1:
+					sp = a['href'].split('?')
+					if sp is not None and len(sp) > 1:
+						for sp1 in sp:
+							if sp1.find('psid') != -1:
+								ps = sp1.split('=')
+								if ps is not None and len(ps) > 1:
+									self.storyId = ps[1].replace('\'','')
+									foundid = True
+					self.storyName = a.string
+					logging.debug('self.storyId=%s, self.storyName=%s' % (self.storyId, self.storyName))
+					break
+			if foundid:
+				self.url = "http://" + self.host + "/viewstory.php?psid=" + self.storyId
+				logging.debug('Title Page URL=%s' % self.url)
+				data1 = self.opener.open(self.url).read()
+				hdrsoup = bs.BeautifulSoup(data1)
+			else:
+				hdrsoup = soup
+		else:
+			hdrsoup = soup
+			
+		for a in links:
+			if not self.chapurl and a['href'].find('psid') != -1:
+				sp = a['href'].split('?')
+				if sp is not None and len(sp) > 1:
+					for sp1 in sp:
+						if sp1.find('psid') != -1:
+							ps = sp1.split('=')
+							if ps is not None and len(ps) > 1:
+								self.storyId = ps[1].replace('\'','')
+				self.storyName = a.string
+				logging.debug('self.storyId=%s, self.storyName=%s' % (self.storyId, self.storyName))
+			elif a['href'].find('viewuser.php') != -1:
+				self.authorName = a.string
+				self.authorURL = 'http://' + self.host + '/' + a['href']
+				(u1, self.authorId) = a['href'].split('=')
+				logging.debug('self.authorName=%s, self.authorId=%s' % (self.authorName, self.authorId))
+			elif a['href'].find('chapterid=') != -1 and len(def_chapurl) == 0:
+				def_chapurl = 'http://' + self.host + '/viewstory.php' + unicode(a['href'])
+				def_chaptitle = a.string
+				logging.debug('def_chapurl=%s, def_chaptitle=%s' % (def_chapurl, def_chaptitle))
+		
+		centers = hdrsoup.findAll('center')
+		for center in centers:
+			tds = center.findAll ('td')
+			if tds is not None and len(tds) > 0:
+				for td in tds:
+					s = re.split ("<[^>]+>", unicode(td).replace('\n','').replace('&nbsp;',' '))
+					ii = 0
+					ll = len(s)
+					sss = ''
+					while ii < ll - 1:
+						if s[ii] is not None and len(s[ii]) > 0:
+							if s[ii] == 'Rating:':
+								self.storyRating = s[ii+1]
+								logging.debug('self.storyRating=%s' % self.storyRating)
+								ii = ii + 2
+							elif s[ii] == 'Chapters:':
+								self.numChapters = s[ii+1]
+								logging.debug('self.numChapters=%s' % self.numChapters)
+								ii = ii + 2
+							elif s[ii] == 'Characters:':
+								s2 = s[ii+1].split(', ')
+								for ss2 in s2:
+									self.addCharacter(ss2)
+								logging.debug('self.storyCharacters=%s' % self.storyCharacters)
+								ii = ii + 2
+							elif s[ii] == 'Genre(s):':
+								self.genre = s[ii+1]
+								logging.debug('self.genre=%s' % self.genre)
+								s2 = s[ii+1].split(', ')
+								for ss2 in s2:
+									self.addSubject(ss2)
+								logging.debug('self.subjects=%s' % self.subjects)
+								ii = ii + 2
+							elif s[ii] == 'Status:':
+								if s[ii+1].strip(' ') == "Work In Progress":
+									self.storyStatus = 'In-Progress'
+								else:
+									self.storyStatus = 'Completed'
+								ii = ii + 2
+							elif s[ii] == 'First Published:':
+								self.storyPublished = datetime.datetime.fromtimestamp(time.mktime(time.strptime(s[ii+1].strip(' '), "%Y.%m.%d")))
+								logging.debug('self.storyPublished=%s' % self.storyPublished)
+								ii = ii + 2
+							elif s[ii] == 'Last Updated:':
+								self.storyUpdated = datetime.datetime.fromtimestamp(time.mktime(time.strptime(s[ii+1].strip(' '), "%Y.%m.%d")))
+								logging.debug('self.storyUpdated=%s' % self.storyUpdated)
+								ii = ii + 2
+							elif s[ii] == 'Last Published Chapter:':
+								ii = ii + 2
+							elif s[ii] == 'Pairings:':
+								ii = ii + 2
+							elif s[ii] == 'Warnings:':
+								ii = ii + 2
+							else:
+								sss = sss + ' ' + s[ii]
+								ii = ii + 1
+						else:
+							ii = ii + 1
+					self.storyDescription = sss
+					logging.debug('self.storyDescription=%s' % self.storyDescription)
+		
+		urls = []
+
+		select = soup.find('select', {'name' : 'chapterid'})
+		if select is None:
+			# no chapters found, try url by itself.
+			if len(def_chapurl) > 0:
+				urls.append((def_chapurl, def_chaptitle))
+			else:
+				urls.append((self.url,self.storyName))
+		else:
+			for o in select.findAll('option'):
+				if 'value' in o._getAttrMap():
+					url = 'http://' + self.host + self.path + o['value']
+					title = o.string
+					if title != "Story Index":
+						urls.append((url,title))
+
+		return urls
+
+	def getText(self, url):
+		logging.debug('Downloading from URL: %s' % url)
+		data = ''
+		try:
+			data = self.opener.open(url).read()
+		except Exception, e:
+			data = ''
+			logging.error("Caught an exception reading URL " + url + ".  Exception " + unicode(e) + ".")
+		if data is None:
+			raise FailedToDownload("Error downloading Chapter: %s!  Problem getting page!" % url)
+		
+		soup = None
+		try:
+			soup = bs.BeautifulSoup(data)
+		except:
+			logging.info("Failed to decode: <%s>" % data)
+			raise FailedToDownload("Error downloading Chapter: %s!  Problem decoding page!" % url)
+		
+		divtext = soup.find('div', {'id' : 'fluidtext'})
+		if None == divtext:
+			raise FailedToDownload("Error downloading Chapter: %s!  Missing required element!" % url)
+
+		return divtext.__str__('utf8')
+
+
+class FF_UnitTests(unittest.TestCase):
+	def setUp(self):
+		logging.basicConfig(level=logging.DEBUG)
+		pass
+
+	def testChaptersAuthStory(self):
+		f = HPFiction('http://www.harrypotterfanfiction.com/viewstory.php?chapterid=80123')
+		urls = f.extractIndividualUrls()
+		
+		self.assertEquals(49, len(urls))
+		self.assertEquals('Elisha', f.getAuthorName())
+		self.assertEquals('A Secret Thought', f.getStoryName())
+	
+	def testGetText(self):
+		url = 'http://www.harrypotterfanfiction.com/viewstory.php?chapterid=80123'
+		f = HPFiction(url)
+		#urls = f.extractIndividualUrls()
+		text = f.getText(url)
+		self.assertTrue(text.find('She pulled out of his arms and felt the subtle regret') != -1)
+
+if __name__ == '__main__':  # run this module's unit tests when executed as a script
+	unittest.main()
+
+	
diff --git a/fanficdownloader/html2text.py b/fanficdownloader/html2text.py
new file mode 100644
index 00000000..ce6e1d3d
--- /dev/null
+++ b/fanficdownloader/html2text.py
@@ -0,0 +1,452 @@
+#!/usr/bin/env python
+# -*- coding: utf-8 -*-
+
+"""html2text: Turn HTML into equivalent Markdown-structured text."""
+__version__ = "2.37"
+__author__ = "Aaron Swartz (me@aaronsw.com)"
+__copyright__ = "(C) 2004-2008 Aaron Swartz. GNU GPL 3."
+__contributors__ = ["Martin 'Joey' Schulze", "Ricardo Reyes", "Kevin Jay North"]
+
+# TODO:
+#   Support decoded entities with unifiable.
+
+if not hasattr(__builtins__, 'True'): True, False = 1, 0
+import re, sys, urllib, htmlentitydefs, codecs, StringIO, types
+import sgmllib
+import urlparse
+sgmllib.charref = re.compile('&#([xX]?[0-9a-fA-F]+)[^0-9a-fA-F]')  # overrides sgmllib's character-reference pattern: optional x/X prefix, then hex digits
+
+try: from textwrap import wrap  # used by optwrap(); if the import fails the name is simply left undefined
+except: pass
+
+# Use Unicode characters instead of their ASCII pseudo-replacements
+UNICODE_SNOB = 0
+
+# Put the links after each paragraph instead of at the end.
+LINKS_EACH_PARAGRAPH = 0
+
+# Wrap long lines at position. 0 for no wrapping. (Requires Python 2.3.)
+BODY_WIDTH = 78
+
+# Don't show internal links (href="#local-anchor") -- corresponding link targets
+# won't be visible in the plain text file anyway.
+SKIP_INTERNAL_LINKS = False
+
+### Entity Nonsense ###
+
+def name2cp(k):
+    if k == 'apos': return ord("'")
+    if hasattr(htmlentitydefs, "name2codepoint"): # requires Python 2.3
+        return htmlentitydefs.name2codepoint[k]
+    else:
+        k = htmlentitydefs.entitydefs[k]
+        if k.startswith("&#") and k.endswith(";"): return int(k[2:-1]) # not in latin-1
+        return ord(codecs.latin_1_decode(k)[0])
+
+unifiable = {'rsquo':"'", 'lsquo':"'", 'rdquo':'"', 'ldquo':'"', # entity name -> ASCII stand-in, used while UNICODE_SNOB is off
+'copy':'(C)', 'mdash':'--', 'nbsp':' ', 'rarr':'->', 'larr':'<-', 'middot':'*',
+'ndash':'-', 'oelig':'oe', 'aelig':'ae',
+'agrave':'a', 'aacute':'a', 'acirc':'a', 'atilde':'a', 'auml':'a', 'aring':'a', 
+'egrave':'e', 'eacute':'e', 'ecirc':'e', 'euml':'e', 
+'igrave':'i', 'iacute':'i', 'icirc':'i', 'iuml':'i',
+'ograve':'o', 'oacute':'o', 'ocirc':'o', 'otilde':'o', 'ouml':'o', 
+'ugrave':'u', 'uacute':'u', 'ucirc':'u', 'uuml':'u'}
+# The same stand-ins keyed by code point, for numeric character references.
+unifiable_n = {}
+
+for k in unifiable.keys():
+    unifiable_n[name2cp(k)] = unifiable[k]
+
+def charref(name):
+    if name[0] in ['x','X']:
+        c = int(name[1:], 16)
+    else:
+        c = int(name)
+    
+    if not UNICODE_SNOB and c in unifiable_n.keys():
+        return unifiable_n[c]
+    else:
+        return unichr(c)
+
+def entityref(c):
+    if not UNICODE_SNOB and c in unifiable.keys():
+        return unifiable[c]
+    else:
+        try: name2cp(c)
+        except KeyError: return "&" + c
+        else: return unichr(name2cp(c))
+
+def replaceEntities(s):
+    s = s.group(1)
+    if s[0] == "#": 
+        return charref(s[1:])
+    else: return entityref(s)
+
+r_unescape = re.compile(r"&(#?[xX]?(?:[0-9a-fA-F]+|\w{1,8}));")  # group 1 is the text between '&' and ';'
+def unescape(s):  # Return s with every r_unescape match replaced by replaceEntities().
+    return r_unescape.sub(replaceEntities, s)
+    
+def fixattrs(attrs):
+    # Fix bug in sgmllib.py
+    if not attrs: return attrs
+    newattrs = []
+    for attr in attrs:
+        newattrs.append((attr[0], unescape(attr[1])))
+    return newattrs
+
+### End Entity Nonsense ###
+
+def onlywhite(line):
+    """Return true if the line does only consist of whitespace characters."""
+    for c in line:
+        if c is not ' ' and c is not '  ':
+            return c is ' '
+    return line
+
+def optwrap(text):
+    """Wrap all paragraphs in the provided text."""
+    if not BODY_WIDTH:
+        return text
+    
+    assert wrap, "Requires Python 2.3."
+    result = ''
+    newlines = 0
+    for para in text.split("\n"):
+        if len(para) > 0:
+            if para[0] is not ' ' and para[0] is not '-' and para[0] is not '*':
+                for line in wrap(para, BODY_WIDTH):
+                    result += line + "\n"
+                result += "\n"
+                newlines = 2
+            else:
+                if not onlywhite(para):
+                    result += para + "\n"
+                    newlines = 1
+        else:
+            if newlines < 2:
+                result += "\n"
+                newlines += 1
+    return result
+
+def hn(tag):
+    if tag[0] == 'h' and len(tag) == 2:
+        try:
+            n = int(tag[1])
+            if n in range(1, 10): return n
+        except ValueError: return 0
+
+class _html2text(sgmllib.SGMLParser):  # SGML parser that emits Markdown-style text for the HTML fed to it
+    def __init__(self, out=None, baseurl=''):  # out: callable receiving output text; baseurl: base for link URLs
+        sgmllib.SGMLParser.__init__(self)
+        # With no sink given, output is accumulated in self.outtext.
+        if out is None: self.out = self.outtextf
+        else: self.out = out
+        self.outtext = u''
+        self.quiet = 0  # while non-zero, o() writes nothing (head/style/script)
+        self.p_p = 0  # number of newlines owed before the next output
+        self.outcount = 0  # number of pieces of data written by o()
+        self.start = 1  # set at points where pending space/newlines are discarded
+        self.space = 0  # a single space is owed before the next output
+        self.a = []  # link/image attribute dicts still to be listed as references
+        self.astack = []  # attribute dicts (or None) of the currently open <a> tags
+        self.acount = 0  # last reference number handed out
+        self.list = []  # stack of open lists: {'name': 'ol'|'ul', 'num': counter}
+        self.blockquote = 0  # blockquote nesting depth
+        self.pre = 0  # set while inside <pre>
+        self.startpre = 0
+        self.lastWasNL = 0  # whether the last data written ended with a newline
+        self.abbr_title = None # current abbreviation definition
+        self.abbr_data = None # last inner HTML (for abbr being defined)
+        self.abbr_list = {} # stack of abbreviations to write later
+        self.baseurl = baseurl
+    
+    def outtextf(self, s):  # default sink: append s to self.outtext
+        self.outtext += s
+    
+    def close(self):  # finish parsing, flush the final output and return self.outtext
+        sgmllib.SGMLParser.close(self)
+        
+        self.pbr()
+        self.o('', 0, 'end')
+        
+        return self.outtext
+        
+    def handle_charref(self, c):  # numeric character reference -> text via charref()
+        self.o(charref(c))
+
+    def handle_entityref(self, c):  # named entity -> text via entityref()
+        self.o(entityref(c))
+            
+    def unknown_starttag(self, tag, attrs):  # every start tag is routed to handle_tag(start=1)
+        self.handle_tag(tag, attrs, 1)
+    
+    def unknown_endtag(self, tag):  # every end tag is routed to handle_tag(start=0)
+        self.handle_tag(tag, None, 0)
+        
+    def previousIndex(self, attrs):
+        """ returns the index of certain set of attributes (of a link) in the
+            self.a list
+ 
+            If the set of attributes is not found, returns None
+        """
+        if not attrs.has_key('href'): return None
+        
+        i = -1
+        for a in self.a:
+            i += 1
+            match = 0
+            # Same href; when either side has a title, both must have the same one.
+            if a.has_key('href') and a['href'] == attrs['href']:
+                if a.has_key('title') or attrs.has_key('title'):
+                        if (a.has_key('title') and attrs.has_key('title') and
+                            a['title'] == attrs['title']):
+                            match = True
+                else:
+                    match = True
+
+            if match: return i
+
+    def handle_tag(self, tag, attrs, start):  # emit the Markdown for one start (start=1) or end (start=0) tag
+        attrs = fixattrs(attrs)
+    
+        if hn(tag):
+            self.p()
+            if start: self.o(hn(tag)*"#" + ' ')
+
+        if tag in ['p', 'div']: self.p()
+        
+        if tag == "br" and start: self.o("  \n")
+
+        if tag == "hr" and start:
+            self.p()
+            self.o("* * *")
+            self.p()
+
+        if tag in ["head", "style", 'script']: 
+            if start: self.quiet += 1
+            else: self.quiet -= 1
+
+        if tag in ["body"]:
+            self.quiet = 0 # sites like 9rules.com never close <head>
+        
+        if tag == "blockquote":
+            if start: 
+                self.p(); self.o('> ', 0, 1); self.start = 1
+                self.blockquote += 1
+            else:
+                self.blockquote -= 1
+                self.p()
+        
+        if tag in ['em', 'i', 'u']: self.o("_")
+        if tag in ['strong', 'b']: self.o("**")
+        if tag == "code" and not self.pre: self.o('`') #TODO: `` `this` ``
+        if tag == "abbr":
+            if start:
+                attrsD = {}
+                for (x, y) in attrs: attrsD[x] = y
+                attrs = attrsD
+                
+                self.abbr_title = None
+                self.abbr_data = ''
+                if attrs.has_key('title'):
+                    self.abbr_title = attrs['title']
+            else:
+                if self.abbr_title != None:
+                    self.abbr_list[self.abbr_data] = self.abbr_title
+                    self.abbr_title = None
+                self.abbr_data = ''
+        
+        if tag == "a":
+            if start:
+                attrsD = {}
+                for (x, y) in attrs: attrsD[x] = y
+                attrs = attrsD
+                if attrs.has_key('href') and not (SKIP_INTERNAL_LINKS and attrs['href'].startswith('#')): 
+                    self.astack.append(attrs)
+                    self.o("[")
+                else:
+                    self.astack.append(None)
+            else:
+                if self.astack:
+                    a = self.astack.pop()
+                    if a:
+                        i = self.previousIndex(a)
+                        if i is not None:
+                            a = self.a[i]
+                        else:
+                            self.acount += 1
+                            a['count'] = self.acount
+                            a['outcount'] = self.outcount
+                            self.a.append(a)
+                        self.o("][" + `a['count']` + "]")
+        
+        if tag == "img" and start:
+            attrsD = {}
+            for (x, y) in attrs: attrsD[x] = y
+            attrs = attrsD
+            if attrs.has_key('src'):
+                attrs['href'] = attrs['src']
+                alt = attrs.get('alt', '')
+                i = self.previousIndex(attrs)
+                if i is not None:
+                    attrs = self.a[i]
+                else:
+                    self.acount += 1
+                    attrs['count'] = self.acount
+                    attrs['outcount'] = self.outcount
+                    self.a.append(attrs)
+                self.o("![")
+                self.o(alt)
+                self.o("]["+`attrs['count']`+"]")
+        
+        if tag == 'dl' and start: self.p()
+        if tag == 'dt' and not start: self.pbr()
+        if tag == 'dd' and start: self.o('    ')
+        if tag == 'dd' and not start: self.pbr()
+        
+        if tag in ["ol", "ul"]:
+            if start:
+                self.list.append({'name':tag, 'num':0})
+            else:
+                if self.list: self.list.pop()
+            
+            self.p()
+        
+        if tag == 'li':
+            if start:
+                self.pbr()
+                if self.list: li = self.list[-1]
+                else: li = {'name':'ul', 'num':0}
+                self.o("  "*len(self.list)) #TODO: line up <ol><li>s > 9 correctly.
+                if li['name'] == "ul": self.o("* ")
+                elif li['name'] == "ol":
+                    li['num'] += 1
+                    self.o(`li['num']`+". ")
+                self.start = 1
+            else:
+                self.pbr()
+        
+        if tag in ["table", "tr"] and start: self.p()
+        if tag == 'td': self.pbr()
+        
+        if tag == "pre":
+            if start:
+                self.startpre = 1
+                self.pre = 1
+            else:
+                self.pre = 0
+            self.p()
+            
+    def pbr(self):  # request a line break unless a break is already pending
+        if self.p_p == 0: self.p_p = 1
+
+    def p(self): self.p_p = 2  # request a paragraph break (two newlines)
+    
+    def o(self, data, puredata=0, force=0):  # write data, first flushing pending breaks/space; force='end' also dumps references
+        if self.abbr_data is not None: self.abbr_data += data
+        
+        if not self.quiet: 
+            if puredata and not self.pre:
+                data = re.sub('\s+', ' ', data)
+                if data and data[0] == ' ':
+                    self.space = 1
+                    data = data[1:]
+            if not data and not force: return
+            
+            if self.startpre:
+                #self.out(" :") #TODO: not output when already one there
+                self.startpre = 0
+            # bq is the prefix written after each pending newline: one '>' per blockquote level.
+            bq = (">" * self.blockquote)
+            if not (force and data and data[0] == ">") and self.blockquote: bq += " "
+            
+            if self.pre:
+                bq += "    "
+                data = data.replace("\n", "\n"+bq)
+            
+            if self.start:
+                self.space = 0
+                self.p_p = 0
+                self.start = 0
+
+            if force == 'end':
+                # It's the end.
+                self.p_p = 0
+                self.out("\n")
+                self.space = 0
+
+
+            if self.p_p:
+                self.out(('\n'+bq)*self.p_p)
+                self.space = 0
+                
+            if self.space:
+                if not self.lastWasNL: self.out(' ')
+                self.space = 0
+            # Write out the collected link references: after a paragraph when LINKS_EACH_PARAGRAPH is set, or at the end.
+            if self.a and ((self.p_p == 2 and LINKS_EACH_PARAGRAPH) or force == "end"):
+                if force == "end": self.out("\n")
+
+                newa = []
+                for link in self.a:
+                    if self.outcount > link['outcount']:
+                        self.out("   ["+`link['count']`+"]: " + urlparse.urljoin(self.baseurl, link['href'])) 
+                        if link.has_key('title'): self.out(" ("+link['title']+")")
+                        self.out("\n")
+                    else:
+                        newa.append(link)
+
+                if self.a != newa: self.out("\n") # Don't need an extra line when nothing was done.
+
+                self.a = newa
+            
+            if self.abbr_list and force == "end":
+                for abbr, definition in self.abbr_list.items():
+                    self.out("  *[" + abbr + "]: " + definition + "\n")
+
+            self.p_p = 0
+            self.out(data)
+            self.lastWasNL = data and data[-1] == '\n'
+            self.outcount += 1
+
+    def handle_data(self, data):  # text between tags goes to o() as collapsible ("pure") data
+        if r'\/script>' in data: self.quiet -= 1  # data containing the literal text \/script> lowers quiet by one
+        self.o(data, 1)
+    
+    def unknown_decl(self, data): pass  # unknown declarations are ignored
+
+def wrapwrite(text): sys.stdout.write(text.encode('utf8'))  # write text to stdout encoded as UTF-8
+
+def html2text_file(html, out=wrapwrite, baseurl=''):  # convert html, sending output to out; returns the parser's close() value
+    h = _html2text(out, baseurl)
+    h.feed(html)
+    h.feed("")
+    return h.close()  # the accumulated text when out is None, otherwise the untouched u''
+
+def html2text(html, baseurl=''):  # convert html to text in memory and wrap the result with optwrap()
+    return optwrap(html2text_file(html, None, baseurl))
+
+if __name__ == "__main__":  # command line: html2text [http-url | file [encoding]]; with no argument, read stdin as UTF-8
+    baseurl = ''
+    if sys.argv[1:]:
+        arg = sys.argv[1]
+        if arg.startswith('http://'):
+            baseurl = arg
+            j = urllib.urlopen(baseurl)
+            try:
+                from feedparser import _getCharacterEncoding as enc  # optional: encoding detection from headers and body
+            except ImportError:
+                   enc = lambda x, y: ('utf-8', 1)  # fallback: always report utf-8
+            text = j.read()
+            encoding = enc(j.headers, text)[0]
+            if encoding == 'us-ascii': encoding = 'utf-8'
+            data = text.decode(encoding)
+
+        else:
+            encoding = 'utf8'
+            if len(sys.argv) > 2:
+                encoding = sys.argv[2]  # an optional second argument names the file's encoding
+            data = open(arg, 'r').read().decode(encoding)
+    else:
+        data = sys.stdin.read().decode('utf8')
+    wrapwrite(html2text(data, baseurl))
diff --git a/fanficdownloader/html_constants.py b/fanficdownloader/html_constants.py
new file mode 100644
index 00000000..f160a8a1
--- /dev/null
+++ b/fanficdownloader/html_constants.py
@@ -0,0 +1,19 @@
+# -*- coding: utf-8 -*-
+
+XHTML_START = '''<?xml version="1.0" encoding="UTF-8"?>
+<!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.1//EN" "http://www.w3.org/TR/xhtml11/DTD/xhtml11.dtd">
+<html xmlns="http://www.w3.org/1999/xhtml">
+<head>
+<title>${title} by ${author}</title>
+<link href="stylesheet.css" type="text/css" rel="stylesheet" />
+</head>
+<body>
+<div>
+<h1>${title} by ${author}</h1>
+${body}
+</body></html>
+'''
+
+XHTML_CHAPTER_START = '''<h2>${chapter}</h2>'''
+
+XHTML_END = ''''''
diff --git a/fanficdownloader/mediaminer.py b/fanficdownloader/mediaminer.py
new file mode 100644
index 00000000..6a4c03a7
--- /dev/null
+++ b/fanficdownloader/mediaminer.py
@@ -0,0 +1,406 @@
+# -*- coding: utf-8 -*-
+
+import os
+import re
+import sys
+import cgi
+import uuid
+import shutil
+import os.path
+import logging
+import unittest
+import urllib as u
+import pprint as pp
+import urllib2 as u2
+import urlparse as up
+import BeautifulSoup as bs
+import htmlentitydefs as hdefs
+import time
+import datetime
+
+from constants import *
+from adapter import *
+
+try:
+	import login_password
+except:
+	# tough luck
+	pass
+
+class MediaMiner(FanfictionSiteAdapter):
+	def __init__(self, url):		
+		self.url = url
+		parsedUrl = up.urlparse(url)
+		self.host = parsedUrl.netloc
+		self.path = parsedUrl.path
+		
+		self.storyName = ''
+		self.authorName = ''
+		self.storyDescription = ''
+		self.storyCharacters = []
+		self.storySeries = ''
+		self.authorId = '0'
+		self.authorURL = self.path
+		self.storyId = '0'
+		self.storyPublished = datetime.date(1970, 01, 31)
+		self.storyCreated = datetime.datetime.now()
+		self.storyUpdated = datetime.date(1970, 01, 31)
+		self.languageId = 'en-UK'
+		self.language = 'English'
+		self.subjects = []
+		self.publisher = self.host
+		self.numChapters = 0
+		self.numWords = 0
+		self.genre = ''
+		self.category = ''
+		self.storyStatus = 'In-Progress'
+		self.storyRating = 'K'
+		self.storyUserRating = '0'
+		self.outputName = ''
+		self.outputStorySep = '-mm_'
+				
+		logging.debug('self.url=%s' % self.url)
+		
+		if self.url.find('view_st.php') != -1:
+			ss = self.url.split('view_st.php')
+			logging.debug('ss=%s' % ss)
+			if ss is not None and len(ss) > 1:
+				self.storyId = ss[1].replace('/','').strip()
+		elif self.url.find('view_ch.php?') != -1:
+			ss = self.url.split('=')
+			logging.debug('ss=%s' % ss)
+			if ss is not None and len(ss) > 1:
+				self.storyId = ss[-1].replace('/','').strip()
+				self.path = '/fanfic/view_st.php/' + self.storyId
+				self.url = 'http://' + self.host + self.path
+				logging.debug('self.url=%s' % self.url)
+		elif self.url.find('view_ch.php/') != -1:
+			ss = self.url.split('/')
+			logging.debug('ss=%s' % ss)
+			if ss is not None and len(ss) > 2:
+				self.storyId = ss[-2].strip()
+				self.path = '/fanfic/view_st.php/' + self.storyId
+				self.url = 'http://' + self.host + self.path
+				logging.debug('self.url=%s' % self.url)
+		else:			
+			raise InvalidStoryURL("Error URL \"%s\" is not a story." % self.url)
+			
+		logging.debug('self.storyId=%s' % self.storyId)
+		
+		logging.debug('self.path=%s' % self.path)
+		
+		if not self.appEngine:
+			self.opener = u2.build_opener(u2.HTTPCookieProcessor())
+		else:
+			self.opener = None
+	
+		logging.debug("Created MediaMiner: url=%s" % (self.url))
+	
+	def _getLoginScript(self):
+		return self.path
+
+	def _getVarValue(self, varstr):
+		#logging.debug('_getVarValue varstr=%s' % varstr)
+		vals = varstr.split('=')
+		#logging.debug('vals=%s' % vals)
+		retstr="".join(vals[+1:])
+		#logging.debug('retstr=%s' % retstr)
+		if retstr.startswith(' '):
+			retstr = retstr[1:]
+		if retstr.endswith(';'):
+			retstr = retstr[:-1]
+		return retstr
+	
+	def _splitCrossover(self, subject):
+		if "Crossover" in subject:
+			self.addSubject ("Crossover")
+			logging.debug('Crossover=%s' % subject)
+			if subject.find(' and ') != -1:
+				words = subject.split(' ')
+				logging.debug('words=%s' % words)
+				subj = ''
+				for s in words:
+					if s in "and Crossover":
+						if len(subj) > 0:
+							self.addSubject(subj)
+						subj = ''
+					else:
+						if len(subj) > 0:
+							subj = subj + ' '
+						subj = subj + s
+				if len(subj) > 0:
+					self.addSubject(subj)
+			else:
+				self.addSubject(subject)
+		else:
+			self.addSubject(subject)
+		return True
+
+	def _splitGenre(self, subject):
+		if len(subject) > 0:
+			words = subject.split('/')
+			logging.debug('words=%s' % words)
+			for subj in words:
+			    if len(subj) > 0:
+				self.addSubject(subj)
+		return True
+
+	def extractIndividualUrls(self):
+		data = None
+		try:
+			data = self.fetchUrl(self.url)
+		except Exception, e:
+			data = None
+			logging.error("Caught an exception reading URL " + self.url + ".  Exception " + unicode(e) + ".")
+		if data is None:
+			raise StoryDoesNotExist("Problem reading story URL " + self.url + "!")
+		
+		#data.replace('<br />',' ').replace('<br>',' ').replace('</br>',' ')
+		soup = None
+		try:
+			soup = bs.BeautifulSoup(data)
+		except:
+			logging.error("Failed to decode: <%s>" % data)
+			raise FailedToDownload("Error downloading Story: %s!  Problem decoding page!" % self.url)
+
+		#logging.debug('soap=%s' % soup)
+		urls = []
+		
+		td_ffh = soup.find('td', {'class' : 'ffh'})
+		#logging.debug('td_ffh=%s' % td_ffh)
+		if td_ffh is not None:
+			#logging.debug('td_ffh.text=%s' % td_ffh.find(text=True))
+			self.storyName = unicode(td_ffh.find(text=True)).strip()
+			logging.debug('self.storyId=%s, self.storyName=%s' % (self.storyId, self.storyName))
+			fft = td_ffh.find('font', {'class' : 'smtxt'})
+			#logging.debug('fft=%s' % fft)
+			if fft is not None:
+				ffts = fft.string.split(' ')
+				if ffts is not None:
+					if len(ffts) > 1:
+						self.storyRating = ffts[1]
+						logging.debug('self.storyRating=%s' % self.storyRating)
+		self.genre = ''
+		td_smtxt = soup.findAll('td')
+		if td_smtxt is None:
+			#logging.debug('td_smtxt is NONE!')
+			pass
+		else:
+			ll = len(td_smtxt)
+			#logging.debug('td_smtxt=%s, len=%s' % (td_smtxt, ll))
+			for ii in range(ll):
+				td = td_smtxt[ii]
+				if 'class' in td._getAttrMap() and td['class'] != 'smtxt':
+					#logging.debug('td has class attribute but is not smtxt')
+					continue
+				ss = unicode(td).replace('\n','').replace('\r','').replace('&nbsp;', ' ')
+				#logging.debug('ss=%s' % ss)
+				if len(ss) > 1 and (ss.find('Genre(s):') != -1 or ss.find('Type:') != -1):
+					#logging.debug('ss=%s' % ss)
+					ssbs = td.findAll('b')
+					#logging.debug('ssbs=%s' % ssbs)
+					bb = 0
+					while bb < len(ssbs):
+						nvs = bs.NavigableString('')
+						sst=''
+						ssb = ssbs[bb]
+						ssbt = unicode(ssb.text).strip()
+						#logging.debug('ssb=%s' % ssb)
+						#logging.debug('ssbt=%s' % ssbt)
+						ssbn = ssb.nextSibling
+						while ssbn is not None:
+							#logging.debug('ssbn=%s' % ssbn)
+							#logging.debug('ssbn.class=%s' % ssbn.__class__)
+							if nvs.__class__ == ssbn.__class__:
+								st = unicode(ssbn)
+								if st.strip() != '|':
+									sst = sst + st
+							else:
+								#logging.debug('ssbn.name=%s' % ssbn.name)
+								if ssbn.name == 'b':
+									break								
+								ssbnts = ssbn.findAll(text=True)
+								for ssbnt in ssbnts:
+									sst = sst + ssbnt
+							ssbn = ssbn.nextSibling
+						sst = sst.replace('&nbsp;',' ').strip()
+						#logging.debug('sst=%s' % sst)
+						if bb == 0:
+							ssbt = ssbt.replace(':','')
+							self.addSubject(ssbt)
+							self.addSubject(sst)
+							logging.debug('self.subjects=%s' % self.subjects)
+						else:
+							if ssbt == 'Genre(s):':
+								self.genre = sst
+								logging.debug('self.genre=%s' % self.genre)
+								sts = sst.split(' / ')
+								for st in sts:
+									self.addSubject(st.strip())
+								logging.debug('self.subjects=%s' % self.subjects)
+							elif ssbt == 'Type:':
+								self.category = sst
+								logging.debug('self.category=%s' % self.category)
+								self.addSubject(sst)
+								logging.debug('self.subjects=%s' % self.subjects)
+							elif ssbt == 'Author:':
+								pass
+							elif ssbt == 'Visits:':
+								pass
+							elif ssbt == 'Size:':
+								pass
+							elif ssbt == 'Pages:':
+								pass
+							elif ssbt == 'Status:':
+								if sst == "Completed":
+									self.storyStatus = 'Completed'
+								else:
+									self.storyStatus = 'In-Progress'
+							elif ssbt == 'Words:':
+								self.numWords = sst.replace('|','').strip()
+								logging.debug('self.numWords=%s' % self.numWords)
+								pass
+							elif ssbt == 'Summary:':
+								self.storyDescription = sst.strip()
+								logging.debug('self.storyDescription=%s' % self.storyDescription)
+							elif ssbt == 'Latest Revision:' or ssbt == 'Uploaded On:':
+								#logging.debug('sst=%s' % sst)
+								ssts = sst.split(' ')
+								if ssts is not None and len(ssts) > 3:
+									sst = ssts[0] + ' ' + ssts[1] + ' ' + ssts[2]
+								#logging.debug('sst=%s' % sst)
+								self.storyUpdated = datetime.datetime.fromtimestamp(time.mktime(time.strptime(sst.strip(' '), "%B %d, %Y")))
+								logging.debug('self.storyUpdated=%s' % self.storyUpdated)
+							else:
+								pass
+						bb = bb+1
+						
+					smtxt_as = td_smtxt[ii].findAll('a')
+					#logging.debug('smtxt_as=%s' % smtxt_as)
+					for smtxt_a in smtxt_as:
+						if 'href' in smtxt_a._getAttrMap() and smtxt_a['href'].find('/u/'):
+							sta = smtxt_a['href']
+							#logging.debug('sta=%s' % sta)
+							stas = sta.split('/u/')
+							#logging.debug('stas=%s' % stas)
+							if stas is not None and len(stas) > 1:
+								self.authorId = stas[1]
+								self.authorURL = 'http://' + self.host + sta
+								self.authorName = smtxt_a.string
+								logging.debug('self.authorName=%s, self.authorId=%s' % (self.authorName, self.authorId))
+				
+		urlstory=''
+		numchapters = 0
+		td_tbbrdr = soup.find('td', {'class' : 'tbbrdr'})
+		if td_tbbrdr is not None:
+			#logging.debug('td_tbbrdr=%s' % td_tbbrdr )
+
+			sl = td_tbbrdr.find('select', {'name':'cid'})
+			if sl is not None:
+				#logging.debug('sl=%s' % sl )
+				opts = sl.findAll('option')
+				for o in opts:
+					#logging.debug('o=%s' % o)				
+					if 'value' in o._getAttrMap():
+						url = 'http://' + self.host + '/fanfic/view_ch.php/' + self.storyId  + '/' + o['value']
+						logging.debug('URL=%s, Title=%s' % (url, o.string))
+						if numchapters == 0:
+							ss = o.string.split('[')
+							if ss is not None and len(ss) > 1:
+								ssd = ss[-1].replace(']','') 
+								#logging.debug('ssd=%s' % ssd)
+								self.storyPublished = datetime.datetime.fromtimestamp(time.mktime(time.strptime(ssd.strip(' '), "%b %d, %Y")))
+								logging.debug('self.storyPublished=%s' % self.storyPublished)
+						urls.append((url, o.string))
+						numchapters = numchapters + 1
+		
+		if numchapters == 0:
+			numchapters = 1
+			url = 'http://' + self.host + '/fanfic/view_st.php/' + self.storyId
+			self.storyPublished = self.storyUpdated
+			logging.debug('self.storyPublished=%s' % self.storyPublished)
+			ssd = self.storyName + ' [' + self.storyPublished.strftime("%b %d, %Y") + ']'
+			logging.debug('URL=%s, Title=%s' % (url, ssd))
+			urls.append((url, ssd))
+			
+		self.numChapters = unicode(numchapters)
+		logging.debug('self.numChapters=%s' % self.numChapters)
+		#logging.debug('urls=%s' % urls)
+		
+		return urls
+	
+	def getText(self, url):
+		time.sleep( 2.0 )
+		logging.debug('url=%s' % url)
+		data = ''
+		try:
+			data = self.fetchUrl(url)
+		except Exception, e:
+			data = ''
+			logging.error("Caught an exception reading URL " + url + ".  Exception " + unicode(e) + ".")
+		if data is None:
+			raise FailedToDownload("Error downloading Chapter: %s!  Problem getting page!" % url)
+		
+		soup = None
+		try:
+			soup = bs.BeautifulSoup(data)
+		except:
+			raise FailedToDownload("Error downloading Chapter: %s!  Problem decoding page!" % url)
+		
+		nvs = bs.NavigableString('')
+		sst=''
+		allAs = soup.findAll ('a', { 'name' : 'fic_c' })
+		#logging.debug('allAs=%s' % allAs)
+		for a in allAs:
+			#logging.debug('a=%s' % a)
+			foundfirst = False
+			done = False
+			nxta = a.nextSibling
+			while nxta is not None and not done:
+				#logging.debug('nxta=%s' % nxta)
+				#logging.debug('nxta.class=%s' % nxta.__class__)
+				st = unicode(nxta)
+				if nvs.__class__ != nxta.__class__:
+					#logging.debug('nxta.name=%s' % nxta.name)
+					if nxta.name == 'table':
+						st = ''
+						if foundfirst:
+							done = True
+					if nxta.name == 'div' and 'class' in nxta._getAttrMap() and nxta['class'] == 'acl' and foundfirst:
+						st = ''
+						done = True
+				
+					if nxta.name == 'br':
+						if not foundfirst:
+							st = ''
+					else:
+						foundfirst = True
+				else:
+					foundfirst = True
+					
+				sst = sst + st
+				nxta = nxta.nextSibling
+
+		if sst is None:	
+			raise FailedToDownload("Error downloading Chapter: %s!  Missing required element!" % url)
+		
+		return sst
+			
+class FPC_UnitTests(unittest.TestCase):  # NOTE(review): name, URL and assertions target fictionpress.com rather than MediaMiner -- confirm
+	def setUp(self):
+		logging.basicConfig(level=logging.DEBUG)
+		pass
+	
+	def testFictionPress(self):
+		url = 'http://www.fictionpress.com/s/2725180/1/Behind_This_Facade'
+		f = FPCom(url)  # NOTE(review): FPCom is not defined in this module; unless a star-import supplies it this raises NameError
+		urls = f.extractIndividualUrls()
+		
+		self.assertEquals('Behind This Facade', f.getStoryName())
+		self.assertEquals('IntoxicatingMelody', f.getAuthorName())
+	
+		text = f.getText(url)
+		self.assertTrue(text.find('Kale Resgerald at your service" He answered, "So, can we go now? Or do you want to') != -1)
+
+if __name__ == '__main__':
+	unittest.main()
diff --git a/fanficdownloader/output.py b/fanficdownloader/output.py
new file mode 100644
index 00000000..ff5daa51
--- /dev/null
+++ b/fanficdownloader/output.py
@@ -0,0 +1,424 @@
+# -*- coding: utf-8 -*-
+
+import os
+import re
+import sys
+import cgi
+import uuid
+import unicodedata
+import codecs
+import shutil
+import string
+import os.path
+import zipfile
+import StringIO
+import logging
+import hashlib
+import urllib as u
+import pprint as pp
+import urllib2 as u2
+import urlparse as up
+import BeautifulSoup as bs
+import htmlentitydefs as hdefs
+
+import zipdir
+import html_constants
+from constants import *
+
+
+import html2text
+import datetime
+
+
+class FanficWriter:
+	def __init__(self):
+		pass
+		
+	def writeChapter(self, index, title, text):
+		pass
+	
+	def finalise(self):
+		pass
+
+	@staticmethod
+	def getFormatName():
+		return 'base'
+	
+	@staticmethod	
+	def getFormatExt():
+		return '.bse'
+	
+class TextWriter(FanficWriter):
+	htmlWriter = None
+	
+	@staticmethod
+	def getFormatName():
+		return 'text'
+	
+	@staticmethod	
+	def getFormatExt():
+		return '.txt'
+	
+	def __init__(self, base, adapter, inmemory=False, compress=False):
+		self.inmemory = inmemory
+		self.htmlWriter = HTMLWriter(base, adapter, True, False)
+	
+	def writeChapter(self, index, title, text):
+		self.htmlWriter.writeChapter(index, title, text)
+	
+	def finalise(self):
+		self.htmlWriter.finalise()
+		self.name=self.htmlWriter.name
+		self.fileName = self.htmlWriter.fileName.replace(".html",".txt")
+		if self.inmemory:
+			self.output = StringIO.StringIO()
+		else:
+			self.output = open(self.fileName, 'w')
+		
+		self.output.write(html2text.html2text(self.htmlWriter.output.getvalue().decode('utf-8')).encode('utf-8'))
+		
+		if not self.inmemory:
+			self.output.close()
+		
+
+class HTMLWriter(FanficWriter):
+	body = ''
+	
+	@staticmethod
+	def getFormatName():
+		return 'html'
+	
+	@staticmethod	
+	def getFormatExt():
+		return '.html'
+	
+	def __init__(self, base, adapter, inmemory=False, compress=False):
+		self.basePath = base
+		self.storyTitle = removeEntities(adapter.getStoryName())
+		self.name = makeAcceptableFilename(adapter.getOutputName())
+		self.fileName = self.basePath + '/' + self.name + self.getFormatExt()
+		self.authorName = removeEntities(adapter.getAuthorName())
+		self.adapter = adapter
+		
+		self.inmemory = inmemory
+
+		if not self.inmemory and os.path.exists(self.fileName):
+			os.remove(self.fileName)
+		
+		if self.inmemory:
+			self.output = StringIO.StringIO()
+		else:
+			self.output = open(self.fileName, 'w')
+		
+		self.xhtmlTemplate = string.Template(html_constants.XHTML_START)
+		self.chapterStartTemplate = string.Template(html_constants.XHTML_CHAPTER_START)
+	
+	def _printableVersion(self, text):
+		try:
+			d = text.decode('utf-8')
+			return d
+		except:
+			return text
+	
+	def writeChapter(self, index, title, text):
+		title = self._printableVersion(title) #title.decode('utf-8')
+		text = self._printableVersion(text) #text.decode('utf-8')
+		self.body = self.body + '\n' + self.chapterStartTemplate.substitute({'chapter' : title})
+		self.body = self.body + '\n' + text
+	
+	def finalise(self):
+		html = self.xhtmlTemplate.substitute({'title' : self.storyTitle, 'author' : self.authorName, 'body' : self.body})
+		soup = bs.BeautifulSoup(html)
+		result = soup.__str__('utf8')
+		
+#		f = open(self.fileName, 'w')
+#		f.write(result)
+#		f.close()
+
+		self.output.write(result)
+		if not self.inmemory:
+			self.output.close()
+
+class EPubFanficWriter(FanficWriter):
+	chapters = []
+	
+	files = {}
+	
+	@staticmethod
+	def getFormatName():
+		return 'epub'
+	
+	@staticmethod	
+	def getFormatExt():
+		return '.epub'
+	
+	def __init__(self, base, adapter, inmemory=False, compress=True):  # compress is not used in this method
+		self.basePath = base
+		self.storyTitle = removeEntities(adapter.getStoryName())
+		self.name = makeAcceptableFilename(adapter.getOutputName())
+		self.directory = self.basePath + '/' + self.name
+		self.authorName = removeEntities(adapter.getAuthorName())
+		self.inmemory = inmemory
+		self.adapter = adapter
+		# per-instance containers, replacing the class-level 'files' and 'chapters' objects
+		self.files = {}
+		self.chapters = []
+		# The archive is always assembled in memory; writeToFile records whether finalise() also saves it to disk.
+		if not self.inmemory:
+			self.inmemory = True
+			self.writeToFile = True
+		else:
+			self.writeToFile = False
+		# NOTE: self.inmemory is always True at this point, so the directory setup below never runs.
+		if not self.inmemory:
+			if os.path.exists(self.directory):
+				shutil.rmtree(self.directory)
+		
+			os.mkdir(self.directory)
+		
+			os.mkdir(self.directory + '/META-INF')
+			os.mkdir(self.directory + '/OEBPS')
+		
+		self._writeFile('mimetype', MIMETYPE)
+		self._writeFile('META-INF/container.xml', CONTAINER)
+		self._writeFile('OEBPS/stylesheet.css', CSS)
+
+	def _writeFile(self, fileName, data):
+		#logging.debug('_writeFile(`%s`, data)' % fileName)
+		if fileName in self.files:
+			try:
+				d = data.decode('utf-8')
+			except UnicodeEncodeError, e:
+				d = data
+			
+			self.files[fileName].write(d)
+		else:
+			if self.inmemory:
+				self.files[fileName] = StringIO.StringIO()
+			else:
+				self.files[fileName] = open(self.directory + '/' + fileName, encoding='utf-8', mode='w')
+			
+			self._writeFile(fileName, data)
+		
+		
+	def _closeFiles(self):
+		if not self.inmemory:
+			for f in self.files:
+				self.files[f].close()
+	
+	def writeChapter(self, index, title, text):
+		title = removeEntities(title)
+		logging.debug("Writing chapter: %s" % title)
+		fileName="chapter%04d.xhtml" % index
+
+		filePath = self.directory + "/OEBPS/" + fileName
+		
+		fn = 'OEBPS/' + fileName
+		
+#		f = open(filePath, 'w')
+		
+		text = removeEntities(text)
+		
+		# BeautifulStoneSoup doesn't have any selfClosingTags by default.  
+		# hr & br needs to be if they're going to work.
+		# Some stories do use multiple br tags as their section breaks...
+		self.soup = bs.BeautifulStoneSoup(text, selfClosingTags=('br','hr'))
+
+		allTags = self.soup.findAll(recursive=True)
+		for t in allTags:
+			for attr in t._getAttrMap().keys():
+				if attr not in acceptable_attributes:
+					del t[attr]
+			# these are not acceptable strict XHTML.  But we do already have 
+			# CSS classes of the same names defined in constants.py
+			if t.name in ('u'):
+				t['class']=t.name
+				t.name='span'
+			if t.name in ('center'):
+				t['class']=t.name
+				t.name='div'
+			# removes paired, but empty tags.
+			if t.string != None and len(t.string.strip()) == 0 :
+				t.extract()
+
+		text = self.soup.__str__('utf8')
+		
+		# ffnet(& maybe others) gives the whole chapter text
+		# as one line.  This causes problems for nook(at
+		# least) when the chapter size starts getting big
+		# (200k+) Using Soup's prettify() messes up italics
+		# and such.  Done after soup extract so <p> and <br>
+		# tags are normalized.  Doing it here seems less evil
+		# than hacking BeautifulSoup, but it's debatable.
+		text = text.replace('</p>','</p>\n').replace('<br />','<br />\n')
+		
+		self._writeFile(fn, XHTML_START % (title, title))
+		self._writeFile(fn, text)
+		self._writeFile(fn, XHTML_END)
+#		print >> f, XHTML_START % (title, title)
+#		f.write(text)
+#		print >> f, XHTML_END
+		
+		self.chapters.append((title, fileName))
+	
+	def finalise(self):
+		logging.debug("Finalising...")
+		### writing table of contents -- ncx file
+		
+		tocFilePath = "OEBPS/toc.ncx"
+#		toc = open(tocFilePath, 'w')
+#		print >> toc, TOC_START % self.storyTitle
+		self._writeFile(tocFilePath, TOC_START % (self.adapter.getUUID(), self.storyTitle))
+
+		published = self.adapter.getStoryPublished().strftime("%Y-%m-%d")
+		createda = self.adapter.getStoryCreated().strftime("%Y-%m-%d %H:%M:%S")
+		created = self.adapter.getStoryCreated().strftime("%Y-%m-%d")
+		updated = self.adapter.getStoryUpdated().strftime("%Y-%m-%d")
+		calibre = self.adapter.getStoryUpdated().strftime("%Y-%m-%dT%H:%M:%S")
+		
+		description = self.adapter.getStoryDescription()
+		if hasattr(description, "text"):
+			description = unicode(description.text)
+		else:
+			description = unicode(description)
+		if description is not None and len(description) > 0:
+			description = description.replace ('\\\'', '\'').replace('\\\"', '\"')
+			description =  removeEntities(description)
+		else:
+			description = ' '
+
+		### writing content -- title page
+		titleFilePath = "OEBPS/title_page.xhtml"
+		self._writeFile(titleFilePath, TITLE_HEADER % (self.authorName, self.storyTitle, self.adapter.getStoryURL(), self.storyTitle, self.adapter.getAuthorURL(), self.authorName))
+		self._writeFile(titleFilePath, TITLE_ENTRY % ('Category:', self.adapter.getCategory()))		 
+		self._writeFile(titleFilePath, TITLE_ENTRY % ('Genre:', self.adapter.getGenre())) 
+		self._writeFile(titleFilePath, TITLE_ENTRY % ('Status:', self.adapter.getStoryStatus()))		 
+		self._writeFile(titleFilePath, TITLE_ENTRY % ('Published:', published))		 
+		self._writeFile(titleFilePath, TITLE_ENTRY % ('Updated:', updated))		 
+		self._writeFile(titleFilePath, TITLE_ENTRY % ('Packaged:', createda))
+		tmpstr = self.adapter.getStoryRating() + " / " + self.adapter.getStoryUserRating()		 
+		self._writeFile(titleFilePath, TITLE_ENTRY % ('Rating Age/User:', tmpstr))
+		tmpstr = unicode(self.adapter.getNumChapters()) + " / " + unicode(self.adapter.getNumWords())
+		self._writeFile(titleFilePath, TITLE_ENTRY % ('Chapters/Words:', tmpstr))
+		self._writeFile(titleFilePath, TITLE_ENTRY % ('Publisher:', self.adapter.getHost()))
+		self._writeFile(titleFilePath, TITLE_ENTRY % ('Story ID:', self.adapter.getStoryId()))
+		self._writeFile(titleFilePath, TITLE_ENTRY % ('Author ID:', self.adapter.getAuthorId()))
+
+		self._writeFile(titleFilePath, TITLE_FOOTER % description )
+
+		### writing content -- opf file
+		opfFilePath = "OEBPS/content.opf"
+
+#		opf = open(opfFilePath, 'w')
+		self._writeFile(opfFilePath, CONTENT_START % (uuid.uuid4().urn, self.storyTitle, self.authorName, self.adapter.getLanguageId(), published, created, updated, calibre, description))
+
+		i = 0
+		subjs = []
+		subjs = self.adapter.getSubjects()
+		for subj in subjs:
+			self._writeFile(opfFilePath, CONTENT_SUBJECT % subj)
+			i = i + 1
+		if (i <= 0):
+			self._writeFile(opfFilePath, CONTENT_SUBJECT % "FanFiction")
+
+		self._writeFile(opfFilePath, CONTENT_END_METADATA % (self.adapter.getPublisher(), self.adapter.getUUID(), self.adapter.getStoryURL(), self.adapter.getStoryURL(), self.adapter.getStoryUserRating()))
+#		print >> opf, CONTENT_START % (uuid.uuid4().urn, self.storyTitle, self.authorName)
+
+		ids = []
+		
+		i = 0
+
+		t = "Title Page"
+		f = "title_page.xhtml"
+		chapterId = "Title Page"		
+		self._writeFile(tocFilePath, TOC_ITEM % (chapterId, i, t, f))
+		self._writeFile(opfFilePath, CONTENT_ITEM % (chapterId, f))
+		
+		ids.append(chapterId)
+		
+		i = i + 1
+		
+		for t,f in self.chapters:
+			chapterId = "chapter%04d" % i
+			
+			self._writeFile(tocFilePath, TOC_ITEM % (chapterId, i, t, f))
+			self._writeFile(opfFilePath, CONTENT_ITEM % (chapterId, f))
+			
+			ids.append(chapterId)
+			
+			i = i + 1
+			
+#		logging.d('Toc and refs printed, proceesing to ref-ids....')
+		
+		self._writeFile(tocFilePath, TOC_END)
+		self._writeFile(opfFilePath, CONTENT_END_MANIFEST)
+		
+		for chapterId in ids:
+			self._writeFile(opfFilePath, CONTENT_ITEMREF % chapterId)
+		
+		self._writeFile(opfFilePath, CONTENT_END)
+		
+		self._closeFiles()
+		
+		filename = self.directory + self.getFormatExt()
+		
+		zipdata = zipdir.inMemoryZip(self.files)
+		
+		if self.writeToFile:
+			f = open(filename, 'wb')
+			f.write(zipdata.getvalue())
+			f.close()
+		else:
+			self.output = zipdata
+			
+#		zipdir.toZip(filename, self.directory)
+
+def unirepl(match):
+	"Return the unicode string for a decimal number"
+	if match.group(1)=='x':
+		radix=16
+	else:
+		radix=10
+	value = int(match.group(2), radix )
+	return unichr(value)
+
+def replaceNumberEntities(data):
+	p = re.compile(r'&#(x?)(\d+);')
+	return p.sub(unirepl, data)
+
+def removeEntities(text):
+	# replace numeric versions of [&<>] with named versions.
+	
+	try:
+		t = text.decode('utf-8')
+	except UnicodeEncodeError, e:
+		try:
+			t = text.encode ('ascii', 'xmlcharrefreplace') 
+		except UnicodeEncodeError, e:
+			t = text
+	text = t 
+	text = re.sub(r'&#0*38;','&amp;',text)
+	text = re.sub(r'&#0*60;','&lt;',text)
+	text = re.sub(r'&#0*62;','&gt;',text)
+	
+	# replace remaining &#000; entities with unicode value, such as &#039; -> '
+	text = replaceNumberEntities(text)
+
+	# replace several named entities with character, such as &mdash; -> -
+	# see constants.py for the list.
+	# reverse sort will put entities with ; before the same one without, when valid.
+	for e in reversed(sorted(entities.keys())):
+		v = entities[e]
+		try:
+			text = text.replace(e, v)
+		except UnicodeDecodeError, ex:
+			# for the pound symbol in constants.py
+			text = text.replace(e, v.decode('utf-8'))
+	
+	# &lt; &lt; and &amp; are the only html entities allowed in xhtml, put those back.
+	text = text.replace('&', '&amp;').replace('&amp;lt;', '&lt;').replace('&amp;gt;', '&gt;')
+		
+	return text
+	
+def makeAcceptableFilename(text):
+	return re.sub('[^a-zA-Z0-9_-]+','',removeEntities(text).replace(" ", "_").replace(":","_"))	
diff --git a/fanficdownloader/potionsNsnitches.py b/fanficdownloader/potionsNsnitches.py
new file mode 100644
index 00000000..43dc47a7
--- /dev/null
+++ b/fanficdownloader/potionsNsnitches.py
@@ -0,0 +1,367 @@
+# -*- coding: utf-8 -*-
+
+# Copied from the twilighted.py because site is almost the same..
+# of course, now that we're trying to scrape more detail about the
+# story, there were differences in how headers are displayed
+
+import os
+import re
+import sys
+import shutil
+import os.path
+import urllib as u
+import logging
+import pprint as pp
+import unittest
+import urllib2 as u2
+import urlparse as up
+import BeautifulSoup as bs
+import htmlentitydefs as hdefs
+import time
+import datetime
+
+from adapter import *
+
+class PotionsNSnitches(FanfictionSiteAdapter):
+    def __init__(self, url):
+        "Store defaults for the story metadata and reduce url to its canonical '?sid=<id>' form."
+        self.url = url
+        parsedUrl = up.urlparse(url)
+        self.host = parsedUrl.netloc
+        self.path = parsedUrl.path
+        self.opener = u2.build_opener(u2.HTTPCookieProcessor())
+        # NOTE(review): the account name is hard-coded and the password is empty here.
+        self.password = ''
+        self.login='sigizmund'
+        # Placeholder metadata; extractIndividualUrls() replaces most of it with scraped values.
+        self.storyDescription = 'Fanfiction Story'
+        self.authorId = '0'
+        self.authorURL = ''
+        self.storyId = '0'
+        self.storyPublished = datetime.date(1970, 1, 31)
+        self.storyCreated = datetime.datetime.now()
+        self.storyUpdated = datetime.date(1970, 1, 31)
+        self.languageId = 'en-UK'
+        self.language = 'English'
+        self.subjects = ['fanfiction', 'Harry Potter']
+        self.publisher = self.host
+        self.numChapters = 0
+        self.numWords = 0
+        self.genre = 'FanFiction'
+        self.category = 'Category'
+        self.storyStatus = 'In-Progress'
+        self.storyRating = 'PG'
+        self.storyUserRating = '0'
+        self.storyCharacters = []
+        self.storySeries = ''
+        self.outputName = ''
+        self.outputStorySep = '-pns_'
+
+        # Scan every query parameter, so 'sid' and 'chapter' are found in any
+        # order (previously only the first and second positions were checked).
+        self.chapurl = False
+        query = self.url.partition('?')[2].replace('&amp;', '&')
+        for param in query.split('&'):
+            key, sep, value = param.partition('=')
+            if sep and key == 'sid':
+                self.storyId = value
+            elif sep and key == 'chapter':
+                self.chapurl = True
+
+        # Canonical story URL; chapter and index pages are requested by appending parameters to it.
+        self.url = 'http://' + self.host + self.path + '?sid=' + self.storyId
+        logging.debug('self.url=%s' % self.url)
+
+        logging.debug("Created PotionsNSnitches: url=%s" % (self.url))
+
+
+    def _getLoginScript(self):
+        "Return the site-relative path of the login script."
+        return '/user.php?action=login'
+
+    def reqLoginData(self, data):
+        "Return True if the page text in data contains a login-required or unknown-account notice."
+        notices = ('Registered Users Only. Please click OK to login or register.', 'There is no such account on our website')
+        return any(notice in data for notice in notices)
+
+    def _fillCharacters(self, strlist, idx, maxlen):
+        """Pass each character name in strlist[idx:maxlen] to addCharacter(), skipping comma fragments.
+        Stops at the first fragment containing ':' (the next label) and returns the index just
+        before it; otherwise returns the index at which scanning ended."""
+        for pos in range(idx, maxlen):
+            name = strlist[pos].strip()
+            if ':' in name:
+                return pos - 1
+            if name and ',' not in name:
+                self.addCharacter(name)
+        return max(idx, maxlen)
+
+    def _buildGenre(self, strlist, idx, maxlen):
+        "Join the genre fragments of strlist[idx:maxlen] into self.genre, passing each name to addSubject(); returns the index before the next ':' label, or where scanning ended."
+        self.genre = ''
+        for pos in range(idx, maxlen):
+            piece = strlist[pos].strip()
+            if not piece:
+                continue
+            if ':' in piece:
+                return pos - 1
+            if ',' in piece:
+                piece = ', '
+            else:
+                self.addSubject(piece)
+            self.genre += piece
+        return max(idx, maxlen)
+
+    def _buildCategory(self, strlist, idx, maxlen):
+        "Join the category fragments of strlist[idx:maxlen] into self.category, passing each name to addSubject(); returns the index before the next ':' label, or where scanning ended."
+        self.category = ''
+        for pos in range(idx, maxlen):
+            piece = strlist[pos].strip()
+            if not piece:
+                continue
+            if ':' in piece:
+                return pos - 1
+            if ',' in piece:
+                piece = ', '
+            else:
+                self.addSubject(piece)
+            self.category += piece
+        return max(idx, maxlen)
+
+    def extractIndividualUrls(self):
+        "Scrape the story's first chapter and index pages: fill in the metadata attributes and return a list of (chapter url, chapter title) tuples."
+        url = self.url + '&chapter=1'
+        try:
+            data = self.opener.open(url).read()
+        except Exception, e:
+            data = ''
+            logging.error("Caught an exception reading URL " + url + ".  Exception " + unicode(e) + ".")
+        if not data:
+            raise StoryDoesNotExist("Problem reading story URL " + url + "!")
+
+        if self.reqLoginData(data):
+            self.performLogin()
+
+            # Fetch the same page again now that a login has been attempted.
+            try:
+                data = self.opener.open(url).read()
+            except Exception, e:
+                data = ''
+                logging.error("Caught an exception reading URL " + url + ".  Exception " + unicode(e) + ".")
+            if not data:
+                raise StoryDoesNotExist("Problem reading story URL " + url + "!")
+
+            if self.reqLoginData(data):
+                raise FailedToDownload("Error downloading Story: %s!  Login Failed!" % url)
+
+        soup = None
+        try:
+            soup = bs.BeautifulStoneSoup(data)
+        except Exception:
+            raise FailedToDownload("Error downloading Story: %s!  Problem decoding page!" % url)
+
+        self.storyName = ''
+        self.authorName = ''
+        self.storyId = '0'
+        title = soup.find('title').string
+        if title is not None and len(title) > 0:
+            logging.debug('Title: %s' % title)
+            ss = title.split(' by ')
+            if ss is not None and len(ss) > 1:
+                self.storyName = ss[0].strip()
+                self.authorName = ss[1].strip()
+
+        logging.debug('self.storyId=%s, self.storyName=%s' % (self.storyId, self.storyName))
+        logging.debug('self.authorId=%s, self.authorName=%s' % (self.authorId, self.authorName))
+
+        select = soup.find('select', { 'name' : 'chapter' } )
+
+        result = []
+        if select is None:
+            # no chapters found, try url by itself.
+            chaptitle = soup.find('div', { 'id' : 'chaptertitle' } )
+            if chaptitle is not None and chaptitle.string is not None and len(chaptitle.string) > 0:
+                result.append((url,chaptitle.string))
+            else:
+                result.append((url,self.storyName))
+        else:
+            allOptions = select.findAll('option')
+            for o in allOptions:
+                url = self.url + "&chapter=%s" % o['value']
+                title = o.string
+                result.append((url,title))
+
+        url = self.url + "&index=1"
+        data = self.opener.open(url).read()
+        # The index page supplies the story/author links, summary and detail fields parsed below.
+        soup = bs.BeautifulStoneSoup(data)
+        pgt = soup.find('div', {'id' : 'pagetitle'})
+        # The page title div links to the story (viewstory.php) and to its author (viewuser.php).
+        pgtAs = pgt.findAll('a')
+        # NOTE: the tuple unpacking below assumes each href contains exactly one '='.
+        for a in pgtAs:
+            if a['href'].find('viewstory.php') != -1:
+                (u1, self.storyId) = a['href'].split('=')
+                self.storyName = a.string
+                logging.debug('self.storyId=%s, self.storyName=%s' % (self.storyId, self.storyName))
+            elif a['href'].find('viewuser.php') != -1:
+                self.authorName = a.string
+                self.authorURL = 'http://' + self.host + '/' + a['href']
+                (u1, self.authorId) = a['href'].split('=')
+                logging.debug('self.authorName=%s, self.authorId=%s' % (self.authorName, self.authorId))
+
+        output = soup.find('div', {'id' : 'output'})
+        # The summary is the text fragment that follows the 'Summary:' label in the output div.
+        if output is not None and len(unicode(output)) > 1:
+            s2 = re.split ('<[^>]+>', unicode(output))
+            # s2 holds the text fragments left after splitting the markup on every tag.
+            ii = 0
+            ll = len(s2)
+            while ii < ll:
+                if s2[ii] == 'Summary:' and ii+1 < ll:
+                    self.storyDescription = s2[ii+1].strip()
+                    logging.debug('self.storyDescription: %s' % self.storyDescription)
+                    break
+                ii = ii+1
+
+        cnt = soup.find('div', {'class' : 'content'})
+        # NOTE: cnt is used without a None check, so a page lacking that div raises AttributeError.
+        cnttd = cnt.findAll('td')
+        # Story details are label/value text fragments inside the table cells of the content div.
+        for td in cnttd:
+            # Flatten the cell to a single line, then split it on tags into text fragments.
+            ss = unicode(td).replace('\n','').replace('\r','').replace('&nbsp;', ' ')
+            if len(ss) > 1:
+                s2 = re.split ('<[^>]+>', ss)
+                # A fragment containing ':' is treated as a label; its handler consumes the value(s).
+                ii = 0
+                ll = len(s2)
+                while ii < ll-1:
+                    if s2[ii] is not None and len(s2[ii]) > 0 and s2[ii].find(':') != -1:
+                        skey = s2[ii].strip()
+                        ii = ii+1
+                        if skey == 'Rated:':
+                            self.storyRating = s2[ii].strip()
+                            logging.debug('self.storyRating=%s' % self.storyRating)
+                            ii = ii + 1
+                        elif skey == 'Chapters:':
+                            self.numChapters = s2[ii].strip()
+                            logging.debug('self.numChapters=%s' % self.numChapters)
+                            ii = ii + 1
+                        elif skey == 'Characters:':
+                            ii = self._fillCharacters(s2, ii, ll)
+                            logging.debug('self.storyCharacters=%s' % self.storyCharacters)
+                            ii = ii + 1
+                        elif skey == 'Genres:':
+                            ii = self._buildGenre(s2, ii, ll)
+                            logging.debug('self.genre=%s' % self.genre)
+                            logging.debug('self.subjects=%s' % self.subjects)
+                        elif skey == 'Categories:':
+                            ii = self._buildCategory(s2, ii, ll)
+                            logging.debug('self.category=%s' % self.category)
+                            logging.debug('self.subjects=%s' % self.subjects)
+                        elif skey == 'Completed:':
+                            if s2[ii].strip(' ') == "No":
+                                self.storyStatus = 'In-Progress'
+                            else:
+                                self.storyStatus = 'Completed'
+                            ii = ii + 1
+                        elif skey == 'Word count:':
+                            self.numWords = s2[ii].strip()
+                            if self.numWords is None or len(self.numWords) == 0:
+                                self.numWords = '0'
+                            logging.debug('self.numWords=%s' % self.numWords)
+                            ii = ii + 1
+                        elif skey == 'Takes Place:':
+                            ii = ii + 1
+                        elif skey == 'Awards:':
+                            ii = ii + 1
+                        elif skey == 'Series:':
+                            ii = ii + 1
+                        elif skey == 'Read:':
+                            ii = ii + 1
+                        elif skey == 'Warnings:':
+                            ii = ii + 1
+                    else:
+                        ii = ii + 1
+
+        tls = soup.findAll('div', {'style' : 'text-align: center;'})
+        for tl in tls:
+            # Only a centered div that mentions 'Published:' is parsed for the dates.
+            ss = unicode(tl).replace('\n','').replace('\r','').replace('&nbsp;', ' ')
+            if ss.find('Published:') != -1:
+                s2 = re.split ('<[^>]+>', ss)
+                # Dates are parsed with the "%b %d %Y" format, e.g. 'Jan 31 2010'.
+                ii = 0
+                ll = len(s2)
+                while ii < ll-1:
+                    if s2[ii] is not None and len(s2[ii]) > 0 and s2[ii].find(':') != -1:
+                        skey = s2[ii].strip()
+                        # Labels other than the two handled below are simply stepped over.
+                        ii = ii+1
+                        if skey == 'Published:':
+                            self.storyPublished = datetime.datetime.fromtimestamp(time.mktime(time.strptime(s2[ii].strip(' '), "%b %d %Y")))
+                            logging.debug('self.storyPublished=%s' % self.storyPublished)
+                            ii = ii + 1
+                        elif skey == 'Updated:':
+                            self.storyUpdated = datetime.datetime.fromtimestamp(time.mktime(time.strptime(s2[ii].strip(' '), "%b %d %Y")))
+                            logging.debug('self.storyUpdated=%s' % self.storyUpdated)
+                            ii = ii + 1
+                    else:
+                        ii = ii + 1
+
+        if not self.storyName and self.storyId == '0':
+            logging.error('self.storyName is empty!!  Exitting!')
+            raise StoryDoesNotExist("Problem reading story URL " + self.url + "!  No story name or id found.")
+
+        return result
+    
+    def getText(self, url):
+        "Download one chapter page and return the markup of its <div id='story'> element as a UTF-8 encoded string."
+        if url.find('http://') == -1:
+            url = 'http://' + self.host + '/' + url
+
+        logging.debug('Getting data from: %s' % url)
+
+        try:
+            data = self.opener.open(url).read()
+        except Exception, e:
+            data = ''
+            logging.error("Caught an exception reading URL " + url + ".  Exception " + unicode(e) + ".")
+        if not data:
+            raise FailedToDownload("Error downloading Chapter: %s!  Problem getting page!" % url)
+
+        # need to do this, because for some reason the <br /> tag in the story causes problems
+        data = data.replace('<br />', ' SOMETHING_BR ')
+
+        soup = None
+        try:
+            soup = bs.BeautifulStoneSoup(data, convertEntities=bs.BeautifulStoneSoup.HTML_ENTITIES)
+        except Exception:
+            logging.info("Failed to decode: <%s>" % data)
+            raise FailedToDownload("Error downloading Chapter: %s!  Problem decoding page!" % url)
+
+        div = soup.find('div', {'id' : 'story'})
+
+        if div is None:
+            raise FailedToDownload("Error downloading Chapter: %s!  Missing required element!" % url)
+
+        # put the <br /> tags back in..
+        text = div.__str__('utf8').replace(' SOMETHING_BR ','<br />')
+        return text
+
+
+class PotionsNSnitches_UnitTests(unittest.TestCase):
+    "Live-site tests for PotionsNSnitches. NOTE(review): the expected count of 32 equals the Twilighted test's - confirm."
+    def setUp(self):
+        logging.basicConfig(level=logging.DEBUG)
+
+    def testLoginWorks(self):
+        pass
+
+    def testGetUrlsWorks(self):
+        url = 'http://potionsandsnitches.net/fanfiction/viewstory.php?sid=2230'
+        self.assertEquals(32, len(PotionsNSnitches(url).extractIndividualUrls()))
+
+if __name__ == '__main__':
+    unittest.main()
diff --git a/fanficdownloader/readme.txt b/fanficdownloader/readme.txt
new file mode 100644
index 00000000..108eff20
--- /dev/null
+++ b/fanficdownloader/readme.txt
@@ -0,0 +1,10 @@
+To use, do:
+
+python downloader.py <url> (epub|html)
+
+Eg:
+
+python downloader.py http://www.fanfiction.net/s/5192986/1/A_Fox_in_Tokyo epub
+
+This tool uses Python 2.5.2, but should work with newer versions.
+
diff --git a/fanficdownloader/twilighted.py b/fanficdownloader/twilighted.py
new file mode 100644
index 00000000..f3b72e3c
--- /dev/null
+++ b/fanficdownloader/twilighted.py
@@ -0,0 +1,316 @@
+# -*- coding: utf-8 -*-
+
+import os
+import re
+import sys
+import shutil
+import os.path
+import urllib as u
+import logging
+import pprint as pp
+import unittest
+import urllib2 as u2
+import urlparse as up
+import BeautifulSoup as bs
+import htmlentitydefs as hdefs
+import time
+import datetime
+
+from adapter import *
+import twipassword
+
+class Twilighted(FanfictionSiteAdapter):
+    def __init__(self, url):
+        """Store defaults for the story metadata and reduce url to its canonical '?sid=<id>' form.
+
+        The password that performLogin() submits is read from the twipassword module."""
+        self.url = url
+        parsedUrl = up.urlparse(url)
+        self.host = parsedUrl.netloc
+        self.path = parsedUrl.path
+        self.opener = u2.build_opener(u2.HTTPCookieProcessor())
+        # NOTE(review): the account name is hard-coded.
+        self.password=twipassword.password
+        self.login='sigizmund'
+        # Placeholder metadata; extractIndividualUrls() replaces most of it with scraped values.
+        self.storyDescription = 'Fanfiction Story'
+        self.authorId = '0'
+        self.authorURL = ''
+        self.storyId = '0'
+        self.storyPublished = datetime.date(1970, 1, 31)
+        self.storyCreated = datetime.datetime.now()
+        self.storyUpdated = datetime.date(1970, 1, 31)
+        self.languageId = 'en-UK'
+        self.language = 'English'
+        self.subjects = ['fanfiction', 'Twilight']
+        self.publisher = self.host
+        self.numChapters = 0
+        self.numWords = 0
+        self.genre = ''
+        self.category = 'Fanfiction'
+        self.storyStatus = 'In-Progress'
+        self.storyRating = 'PG'
+        self.storyUserRating = '0'
+        self.storyCharacters = []
+        self.storySeries = ''
+        self.outputName = ''
+        self.outputStorySep = '-tw_'
+
+        # Scan every query parameter, so 'sid' and 'chapter' are found in any
+        # order (previously only the first and second positions were checked).
+        self.chapurl = False
+        query = self.url.partition('?')[2].replace('&amp;', '&')
+        logging.debug('query=%s' % query)
+        for param in query.split('&'):
+            key, sep, value = param.partition('=')
+            if sep and key == 'sid':
+                self.storyId = value
+            elif sep and key == 'chapter':
+                self.chapurl = True
+
+        # self.path already starts with '/', so no separator is added after the
+        # host (adding one produced 'http://host//viewstory.php').
+        self.url = 'http://' + self.host + self.path + '?sid=' + self.storyId
+        logging.debug('self.url=%s' % self.url)
+
+        logging.debug("Created Twilighted: url=%s" % (self.url))
+
+    def _getLoginScript(self):
+        "Return the site-relative path of the login script that performLogin() posts to."
+        return '/user.php?action=login'
+
+    def reqLoginData(self, data):
+        "Return True if the page text in data contains a login-required or unknown-account notice."
+        return any(notice in data for notice in ('Registered Users Only. Please click OK to login or register.', 'There is no such account on our website'))
+
+    def requiresLogin(self, url = None):
+        "Always return True; the url argument is ignored."
+        return True
+
+    def performLogin(self, url = None):
+        """Post the stored credentials to the site's login script.
+
+        Returns True unless the response page still shows a login-required or
+        unknown-account notice (see reqLoginData). The url argument is not used."""
+        form = {
+            'penname': self.login,
+            'password': self.password,
+            'cookiecheck': '1',
+            'submit': 'Submit',
+        }
+        urlvals = u.urlencode(form)
+        loginUrl = 'http://' + self.host + self._getLoginScript()
+        logging.debug("Will now login to URL %s" % loginUrl)
+
+        response = self.opener.open(loginUrl, urlvals)
+        page = response.read().decode('utf-8')
+
+        # A response that still carries a login notice means the login was rejected.
+        return not self.reqLoginData(page)
+
+    def extractIndividualUrls(self):
+        "Scrape the story's first chapter and index pages: fill in the metadata attributes and return a list of (chapter url, chapter title) tuples."
+        url = self.url + '&chapter=1'
+
+        try:
+            data = self.opener.open(url).read()
+        except Exception, e:
+            data = ''
+            logging.error("Caught an exception reading URL " + url + ".  Exception " + unicode(e) + ".")
+        if not data:
+            raise StoryDoesNotExist("Problem reading story URL " + url + "!")
+
+        if self.reqLoginData(data):
+            self.performLogin()
+
+            # Fetch the same page again now that a login has been attempted.
+            try:
+                data = self.opener.open(url).read()
+            except Exception, e:
+                data = ''
+                logging.error("Caught an exception reading URL " + url + ".  Exception " + unicode(e) + ".")
+            if not data:
+                raise StoryDoesNotExist("Problem reading story URL " + url + "!")
+
+            if self.reqLoginData(data):
+                raise FailedToDownload("Error downloading Story: %s!  Login Failed!" % url)
+
+        soup = None
+        try:
+            soup = bs.BeautifulStoneSoup(data)
+        except Exception:
+            raise FailedToDownload("Error downloading Story: %s!  Problem decoding page!" % url)
+
+        title = soup.find('title').string
+        logging.debug('Title: %s' % title)
+        self.storyName = title.split(' by ')[0].strip()
+        self.authorName = title.split(' by ')[1].strip()
+
+        logging.debug('self.storyId=%s, self.storyName=%s' % (self.storyId, self.storyName))
+        logging.debug('self.authorId=%s, self.authorName=%s' % (self.authorId, self.authorName))
+
+        select = soup.find('select', { 'name' : 'chapter' } )
+
+        result = []
+        if select is None:
+            # no chapters found, try url by itself.
+            result.append((self.url,self.storyName))
+        else:
+            allOptions = select.findAll('option')
+            for o in allOptions:
+                url = self.url + "&chapter=%s" % o['value']
+                title = o.string
+                result.append((url,title))
+
+        url = self.url + "&index=1"
+        data = self.opener.open(url).read()
+        # The index page's description meta tag is the starting point for the metadata below.
+        soup = bs.BeautifulStoneSoup(data)
+        metas = soup.findAll('meta')
+
+        for meta in metas:
+            if 'name' in meta._getAttrMap() and meta['name'].find('description') != -1:
+                # NOTE(review): ps[0] below is a parsed tag object rather than a plain string.
+                if 'content' in meta._getAttrMap():
+                    s1 = bs.BeautifulStoneSoup(meta['content'])
+                    ps = s1.findAll('p')
+                    if len(ps) > 0:
+                        self.storyDescription = ps[0]
+                        logging.debug('self.storyDescription=%s' % (self.storyDescription))
+                    else:
+                        divs = meta.findAll('div')
+                        # No <p> in the description: scan the divs found under the meta tag instead.
+
+                        for div in divs:
+                            # 'pagetitle' carries the story/author links; 'content' carries the label/value details.
+                            if 'id' in div._getAttrMap() and div['id'].find('pagetitle') != -1:
+                                # NOTE: the tuple unpacking below assumes each href contains exactly one '='.
+                                allA = div.findAll('a')
+                                for a in allA:
+                                    if 'href' in a._getAttrMap():
+                                        if a['href'].find('viewstory.php?sid=') != -1:
+                                            # The story id is the part of the href after '='.
+                                            (vs, self.storyId) = a['href'].split('=')
+                                            logging.debug('self.storyId=%s self.storyName=%s' % (self.storyId, self.storyName))
+                                        if a['href'].find('viewuser.php?uid=') != -1:
+                                            # The author id is the part of the href after '='.
+                                            (vs, self.authorId) = a['href'].split('=')
+                                            logging.debug('self.authorId=%s self.authorName=%s' % (self.authorId, self.authorName))
+                                            self.authorURL = 'http://'+self.host+'/viewuser.php?uid='+self.authorId
+                                            logging.debug('self.authorURL=%s' % self.authorURL)
+                            if 'class' in div._getAttrMap() and div['class'].find('content') !=   -1:
+                                # Each <br> element is flattened to text fragments by splitting on tags.
+                                brs = div.findAll('br')
+                                for br in brs:
+                                    buf = unicode(br).encode('utf-8')
+                                    strs = re.split ('<[^>]+>', buf)
+                                    # Scanning starts at fragment 2; fragments are read as a label followed by its value(s).
+                                    ii = 2
+                                    stlen = len(strs)
+                                    while stlen > ii+1:
+                                        if len(strs[ii]) == 0:
+                                            ii = ii+1
+                                            continue
+                                        if strs[ii] == 'Categories:':
+                                            ii = ii+1
+                                            while stlen > ii and len(strs[ii]) != 0 and strs[ii].find(':') == -1:
+                                                if strs[ii] != ' ' and strs[ii] != ', ':
+                                                    cat = strs[ii].strip(' ')
+                                                    if cat not in self.genre.split(', '):
+                                                        self.genre = ', '.join(filter(None, [self.genre, cat]))
+                                                    if len(self.category) == 0:
+                                                        self.category = cat
+                                                    self.addSubject(cat)
+                                                ii = ii+1
+                                            logging.debug('self.subjects=%s' % self.subjects)
+                                        elif strs[ii] == 'Characters: ':
+                                            ii = ii+1
+                                            while stlen > ii and len(strs[ii]) != 0 and strs[ii].find(':') == -1:
+                                                if strs[ii] != ' ' and strs[ii] != ', ':
+                                                    self.addCharacter(strs[ii].strip(' '))
+                                                ii = ii+1
+                                            logging.debug('self.storyCharacters=%s' % self.storyCharacters)
+                                        elif strs[ii] == 'Completed:':
+                                            if strs[ii+1].strip(' ') == "No":
+                                                self.storyStatus = 'In-Progress'
+                                            else:
+                                                self.storyStatus = 'Completed'
+                                            ii = ii+2
+                                            logging.debug('self.storyStatus=%s' % self.storyStatus)
+                                        elif strs[ii] == 'Rated:':
+                                            self.storyRating = strs[ii+1].strip(' ')
+                                            ii = ii+2
+                                            logging.debug('self.storyRating=%s' % self.storyRating)
+                                        elif strs[ii] == 'Series:':
+                                            self.storySeries = strs[ii+1].strip(' ')
+                                            if self.storySeries == 'None':
+                                                self.storySeries = ''
+                                            ii = ii+2
+                                            logging.debug('self.storySeries=%s' % self.storySeries)
+                                        elif strs[ii] == 'Chapters: ':
+                                            self.numChapters = strs[ii+1].strip(' ')
+                                            ii = ii+2
+                                            logging.debug('self.numChapters=%s' % self.numChapters)
+                                        elif strs[ii] == 'Word count:':
+                                            self.numWords = strs[ii+1].strip(' ')
+                                            ii = ii+2
+                                            logging.debug('self.numWords=%s' % self.numWords)
+                                        elif strs[ii] == ' Published: ':
+                                            self.storyPublished = datetime.datetime.fromtimestamp(time.mktime(time.strptime(strs[ii+1].strip(' '), "%B %d, %Y")))
+                                            ii = ii+2
+                                            logging.debug('self.storyPublished=%s' % self.storyPublished)
+                                        elif strs[ii] == 'Updated:':
+                                            self.storyUpdated = datetime.datetime.fromtimestamp(time.mktime(time.strptime(strs[ii+1].strip(' '), "%B %d, %Y")))
+                                            ii = ii+2
+                                            logging.debug('self.storyUpdated=%s' % self.storyUpdated)
+                                        else:
+                                            logging.debug('Skipped Label \"%s\" Value \"%s\"' % (strs[ii], strs[ii+1]))
+                                            ii = ii+2
+
+        return result
+
+    def getText(self, url):
+        "Download one chapter page and return the markup of its <div id='story'> element as a UTF-8 encoded string."
+        if url.find('http://') == -1:
+            url = 'http://' + self.host + '/' + url
+
+        logging.debug('Getting data from: %s' % url)
+
+        try:
+            data = self.opener.open(url).read()
+        except Exception, e:
+            data = ''
+            logging.error("Caught an exception reading URL " + url + ".  Exception " + unicode(e) + ".")
+        if not data:
+            raise FailedToDownload("Error downloading Chapter: %s!  Problem getting page!" % url)
+
+        soup = None
+        try:
+            soup = bs.BeautifulStoneSoup(data, convertEntities=bs.BeautifulStoneSoup.HTML_ENTITIES)
+        except Exception:
+            logging.info("Failed to decode: <%s>" % data)
+            raise FailedToDownload("Error downloading Chapter: %s!  Problem decoding page!" % url)
+
+        div = soup.find('div', {'id' : 'story'})
+
+        if div is None:
+            raise FailedToDownload("Error downloading Chapter: %s!  Missing required element!" % url)
+
+        return div.__str__('utf8')
+
+
+class Twilighted_UnitTests(unittest.TestCase):
+  "Tests that build a Twilighted adapter for a twilighted.net story URL and call its login and chapter-listing methods."
+  def setUp(self):
+    logging.basicConfig(level=logging.DEBUG)
+
+  def testLoginWorks(self):
+    adapter = Twilighted('http://www.twilighted.net/viewstory.php?sid=10004')
+    self.assertTrue(adapter.performLogin())
+
+  def testGetUrlsWorks(self):
+    adapter = Twilighted('http://www.twilighted.net/viewstory.php?sid=10004')
+    self.assertEquals(32, len(adapter.extractIndividualUrls()))
+
+if __name__ == '__main__':
+  unittest.main()
diff --git a/fanficdownloader/twipassword.py b/fanficdownloader/twipassword.py
new file mode 100644
index 00000000..105c09c3
--- /dev/null
+++ b/fanficdownloader/twipassword.py
@@ -0,0 +1,4 @@
+# -*- coding: utf-8 -*-
+
+# This is really for the web version.  downloader.py will ask.
+password='somepass'
diff --git a/fanficdownloader/zipdir.py b/fanficdownloader/zipdir.py
new file mode 100644
index 00000000..eb50c961
--- /dev/null
+++ b/fanficdownloader/zipdir.py
@@ -0,0 +1,177 @@
+# -*- coding: utf-8 -*-
+
+from __future__ import with_statement
+
+import sys
+import os
+import zlib
+import zipfile
+from zipfile import ZipFile, ZIP_STORED, ZIP_DEFLATED
+from contextlib import closing
+import logging
+
+import BeautifulSoup as bs
+import htmlentitydefs as hdefs
+import time
+import datetime
+from datetime import timedelta
+
+import StringIO
+
+class InvalidEPub(Exception):
+    """Error type for a file that is not a valid EPUB."""
+
+def checkNewer(filename, curdte):
+	"""Tell whether the EPUB at `filename` needs to be (re)generated.
+
+	filename -- path of a previously written EPUB; it may not exist.
+	curdte   -- current update date of the story (anything with strftime).
+
+	Returns False only when the date stored in the EPUB is on or after
+	curdte; True when the file is missing, is not an EPUB or holds no date.
+	A stored date that is not YYYY-MM-DD makes time.strptime raise ValueError.
+	"""
+	ret = True
+	if not os.path.isfile(filename):
+		logging.debug('File %s does not already exist.' % filename)
+		return ret
+	lastdate = None
+	# Open by name so that ZipFile owns the handle and closing() releases it.
+	with closing(ZipFile(filename, 'r')) as epub:
+		titleFilePath = "OEBPS/title_page.xhtml"
+		contentFilePath = "OEBPS/content.opf"
+		namelist = set(epub.namelist())
+		if 'mimetype' not in namelist or \
+		   'META-INF/container.xml' not in namelist:
+			logging.debug('File %s is not a valid EPub format file.' % filename)
+			return ret
+		if contentFilePath not in namelist:
+			return ret	# no metadata to compare against, so ask for an update
+		data = epub.read(contentFilePath)
+		soup = bs.BeautifulStoneSoup(data)
+		lstdte = soup.find ('dc:date', {'opf:event' : 'modification'})
+		if lstdte is not None and lstdte.string is not None:
+			lastdate = lstdte.string.strip(' ')
+		elif titleFilePath in namelist:
+			# Fall back to the "Updated:" cell of the title page.
+			data = epub.read(titleFilePath)
+			soup = bs.BeautifulStoneSoup(data)
+			fld = ''
+			allTDs = soup.findAll ('td')
+			for td in allTDs:
+				b = td.find ('b')
+				if b is not None:
+					fld = b.string
+				if td.string is not None and fld == "Updated:":
+					lastdate = td.string
+	
+	if lastdate is not None:	
+		currUpdated = datetime.datetime.fromtimestamp(time.mktime(time.strptime(curdte.strftime('%Y-%m-%d'), "%Y-%m-%d")))
+		storyUpdated = datetime.datetime.fromtimestamp(time.mktime(time.strptime(lastdate, "%Y-%m-%d")))
+		logging.debug('File %s last update date is %s, comparing to %s' % (filename, storyUpdated, currUpdated))
+		if currUpdated <= storyUpdated :	
+			ret = False
+	
+	logging.debug("Does %s need to be updated? %s" % (filename, ret))
+	return ret
+
+
+def toZip(filename, directory):
+	"""Zip the non-hidden contents of `directory` into the archive `filename`.
+
+	'mimetype' is written first and uncompressed, as the EPUB standard
+	requires; the archive is closed even when adding an entry fails.
+	"""
+	zippedHelp = zipfile.ZipFile(filename, "w", compression=zipfile.ZIP_DEFLATED)
+	lst = [e for e in os.listdir(directory) if not e.startswith('.')]
+	lst.sort(key=lambda e: e != 'mimetype')	# stable sort: only moves mimetype to the front
+	try:
+		for entity in lst:
+			each = os.path.join(directory,entity)
+			print(each)
+			if not os.path.isfile(each):
+				addFolderToZip(zippedHelp,entity, each)
+			elif entity == 'mimetype':
+				# epub standard requires mimetype to be uncompressed and first file.
+				zippedHelp.write(each, arcname=entity, compress_type=zipfile.ZIP_STORED)
+			else:
+				zippedHelp.write(each, arcname=entity)
+	finally:
+		zippedHelp.close()
+
+def addFolderToZip(zippedHelp,folder,fpath):
+	"""Recursively add the files under directory `fpath` to an open archive.
+	zippedHelp -- ZipFile opened for writing; folder -- archive-side prefix
+	of the entries; fpath -- directory on disk the entries are read from.
+	"""
+	if folder == '.' or folder == '..':
+		return
+	for f in os.listdir(fpath):
+		src = fpath + '/' + f
+		if os.path.isfile(src):
+			zippedHelp.write(src, folder + '/' + f, zipfile.ZIP_DEFLATED)
+		elif os.path.isdir(src):
+			addFolderToZip(zippedHelp, folder + '/' + f, src)
+
+def inMemoryZip(files):
+	"""Build a ZIP archive in memory and return the StringIO buffer holding it.
+
+	files -- dict mapping an archive path to its content.  Content is either
+	         a string or an object exposing getvalue() (such as a StringIO).
+	         The dict is left unmodified.
+
+	A 'mimetype' entry, when present, is written first and stored
+	uncompressed; every other entry is deflated.  All entries are marked
+	as created on Windows (create_system = 0).  Call getvalue() on the
+	returned buffer to obtain the archive contents.
+	"""
+	io = StringIO.StringIO()
+
+	def writeEntries(paths, compression):
+		# Append the given paths to the buffer using one compression method;
+		# 'a' mode keeps whatever an earlier pass already wrote there.
+		memzip = zipfile.ZipFile(io, 'a', compression=compression)
+		memzip.debug = 3
+
+		for path in paths:
+			data = files[path]
+			if not isinstance(data, basestring):
+				data = data.getvalue()
+
+			logging.debug("Writing ZIP path %s" % path)
+			# NOTE(review): the fallback encodes the data the same way, so it
+			# can only help when the failure came from the path - confirm.
+			try:
+				memzip.writestr(path, data.encode('utf-8'))
+			except UnicodeDecodeError:
+				memzip.writestr(path.encode('utf-8'), data.encode('utf-8'))
+
+		# declares all the files created by Windows.
+		for zf in memzip.filelist:
+			zf.create_system = 0
+
+		memzip.close()
+
+	if 'mimetype' in files:
+		# This fixes the uncompressed mimetype-first issue by opening
+		# the in memory file as STORE, putting in the mimetype, then
+		# closing and re-opening with DEFLATED.  while it is often
+		# true that mimetype is the first file, we can't assume it,
+		# because the dict object is defined as unordered.
+		writeEntries(['mimetype'], zipfile.ZIP_STORED)
+
+	# Skip 'mimetype' here instead of deleting it from the caller's dict.
+	rest = [path for path in files if path != 'mimetype']
+	writeEntries(rest, zipfile.ZIP_DEFLATED)
+
+	return io
+
+
+if __name__ == '__main__':
+	# Smoke test: build a two-entry archive in memory and save it as res.zip.
+	files = {'test.txt' : 'test', 'data/abc.txt' : 'abc'}
+	data = inMemoryZip(files)
+	# inMemoryZip returns a StringIO buffer, so write out its contents;
+	# binary mode keeps the archive bytes intact on Windows.
+	with open('res.zip', 'wb') as f:
+		f.write(data.getvalue())
diff --git a/ffstorage.py b/ffstorage.py
new file mode 100644
index 00000000..78647803
--- /dev/null
+++ b/ffstorage.py
@@ -0,0 +1,21 @@
+from google.appengine.ext import db
+
+class OneDownload(db.Model):	# presumably one entity per download request - TODO confirm against the handlers
+	user = db.UserProperty()
+	url = db.StringProperty()
+	format = db.StringProperty()
+	login = db.StringProperty()
+	password = db.StringProperty()	# NOTE(review): kept as a plain string property - confirm that storing it is intended
+	failure = db.StringProperty()
+	date = db.DateTimeProperty(auto_now_add=True)	# filled in automatically when the entity is first stored
+	
+class DownloadedFanfic(db.Model):	# presumably one entity per stored ebook - TODO confirm against the handlers
+	user = db.UserProperty()
+	url = db.StringProperty()
+	name = db.StringProperty()
+	author = db.StringProperty()
+	format = db.StringProperty()
+	date = db.DateTimeProperty(auto_now_add=True)	# filled in automatically when the entity is first stored
+	blob = db.BlobProperty()	# presumably the generated ebook contents - TODO confirm
+	mac = db.StringProperty()
+	cleared = db.BooleanProperty(default=False)	# index.yaml defines a (cleared, date) index for this kind
\ No newline at end of file
diff --git a/index-ajax.html b/index-ajax.html
new file mode 100644
index 00000000..51dc6318
--- /dev/null
+++ b/index-ajax.html
@@ -0,0 +1,109 @@
+<!DOCTYPE html PUBLIC "-//W3C//DTD HTML 4.01//EN">
+<html>
+	<head>
+		<link href="css/index.css" rel="stylesheet" type="text/css">
+		<link type="text/css" href="http://jqueryui.com/latest/themes/base/ui.all.css" rel="stylesheet" />
+	 
+		<title>Fanfiction Downloader (fanfiction.net, fictionalley, ficwad to epub and HTML)</title>
+		<meta http-equiv="Content-Type" content="text/html; charset=UTF-8">
+		<script src="/js/jquery-1.3.2.js"></script>
+		<script src="/js/fdownloader.js"></script>
+		
+		<script type="text/javascript" src="http://jqueryui.com/latest/ui/ui.core.js"></script>
+	    <script type="text/javascript" src="http://jqueryui.com/latest/ui/ui.progressbar.js"></script>
+	  
+	</head>
+	<body>
+		<div id='main'>
+			<h1>
+				<a href="/" style="text-decoration: none; color: black;">FanFiction Downloader</a>
+			</h1>
+				
+<!--			<form action="/fdown" method="post"> -->
+				<div id='urlbox'>
+					<div id='greeting'>
+						Hi, {{ nickname }}! This is a fan fiction downloader, which makes reading stories from various websites much easier. Please paste a URL of the <em>first chapter</em> in the box to start. Alternatively, see your personal list of <a href="/recent">previously downloaded fanfics</a>.
+					</div>
+					<input type="text" id='url' name="url" size="50" value='{{ url }}'>
+					<div style="margin-top: 0.5em;">
+					Ebook format &nbsp;<select name="format" id="format">
+												<option value='epub'>ePub</option>
+												<option value='html'>HTML</option>
+											</select>
+					</div>
+					
+					<div id='error' style='color: red'>
+
+					</div>
+					
+					
+					
+				</div>
+				
+				<div id='yourfile' style='display:none'>
+				</div>
+				
+				<div id='typebox'>
+				</div>
+				
+				<h3>
+					Login and Password
+				</h3>
+				<div id='logpassword'>
+					If the story requires a login and password to download (e.g. marked as Mature on FFA), you may need to provide your credentials to download it, otherwise just leave it empty
+				</div>
+				<div id='logpasswordtable'>
+					<div class='fieldandlabel'>
+						<div class='label'>Login</div>
+						<div class='field'><input type='text' name='login' id='login' size='50'></div>
+					</div>
+					
+					<div class='fieldandlabel'>
+						<div class='label'>Password</div>
+						<div class='field'><input type='password' id='password' name='password' size='50'></div>
+					</div>
+				</div>
+				<div id='submitbtn'>
+					<span id='submit_button'><button onclick='downloadFanfic();'>Download</button></span>
+					<span id='ajax_loader' style='display:none'><img src="/static/ajax-loader.gif"></span>
+				</div>
+
+				
+				<div id="progressbar">
+					
+				</div>
+				<div id='helpbox'>
+				Few things to know, which will make your life substantially easier:
+				<ol>
+					<li>Small <a href="http://www.sigizmund.com/reading-fanfiction-off-line-in-stanza-and-oth">post written by me</a> &mdash; how to read fiction in Stanza or any other ebook reader.</li>
+					<li>Currently we support fanfiction.net, fictionpress.com, fanficauthors.net and ficwad.com</li>
+					<li>Paste a URL of the first chapter of the fanfic, not the index page</li>
+					<li>Fics with a single chapter are not supported (you can just copy and paste it)</li>
+					<li>Stories which are too long may not be downloaded correctly and the application will report a time-out error &mdash; this is a limitation which is currently imposed by Google AppEngine on long-running activities</li>
+					<li>FicWad support is somewhat flaky &mdash; if you feel it doesn't work for you, send all the details to me</li>
+					<li>You can download fanfics and store them for 'later' by just downloading them and visiting <a href="/recent">recent downloads</a> section, but in future they will be deleted after 5 days to save the space</li>
+					<li>If Downloader simply opens a download file window rather than saves the fanfic and gives you a link, it means it is too large to save in the database and you need to download it straight away</li>
+					<li>If you think that something that should work in fact doesn't, drop me a mail to <a href='mailto:sigizmund@gmail.com'>sigizmund@gmail.com</a></li>
+				</ol>
+				Otherwise, just have fun, and if you want to say thank you &mdash; use the email above.
+				</div>
+				<div style='text-align: center'>
+					<img src="http://code.google.com/appengine/images/appengine-silver-120x30.gif"
+					alt="Powered by Google App Engine" />
+					<br/><br/>
+					FanfictionLoader is a web front-end to <A href="http://code.google.com/p/fanficdownloader/">fanficdownloader</a><br/>
+					Copyright &copy; <a href="http://twitter.com/sigizmund">Roman Kirillov</a>
+				</div>
+<!--			</form> -->
+		</div>
+		<script type="text/javascript">
+		var gaJsHost = (("https:" == document.location.protocol) ? "https://ssl." : "http://www.");
+		document.write(unescape("%3Cscript src='" + gaJsHost + "google-analytics.com/ga.js' type='text/javascript'%3E%3C/script%3E"));
+		</script>
+		<script type="text/javascript">
+		try {
+		var pageTracker = _gat._getTracker("UA-12136939-1");
+		pageTracker._trackPageview();
+		} catch(err) {}</script>
+	</body>
+</html>
diff --git a/index.html b/index.html
new file mode 100644
index 00000000..4ee35c4f
--- /dev/null
+++ b/index.html
@@ -0,0 +1,204 @@
+<!DOCTYPE html PUBLIC "-//W3C//DTD HTML 4.01//EN">
+<html>
+	<head>
+		<link href="css/index.css" rel="stylesheet" type="text/css">
+		<title>Fanfiction Downloader &mdash; twilighted.net, fanfiction.net, fictionpress.com, fictionalley.org, ficwad.com, potionsandsnitches.net, harrypotterfanfiction.com, mediaminer.org to epub and HTML to Stanza, Kindle, Nook, Sony Reader</title>
+		<meta http-equiv="Content-Type" content="text/html; charset=UTF-8">
+		<meta name="google-site-verification" content="kCFc-G4bka_pJN6Rv8CapPBcwmq0hbAUZPkKWqRsAYU" />
+	</head>
+	<body>
+		<div id='main'>
+			<h1>
+				<a href="/" style="text-decoration: none; color: black;">FanFiction Downloader</a>
+			</h1>
+			
+			<div style="text-align: center">
+                <script type="text/javascript"><!--
+                google_ad_client = "pub-2027714004231956";
+                /* FFD */
+                google_ad_slot = "7330682770";
+                google_ad_width = 468;
+                google_ad_height = 60;
+                //-->
+                </script>
+                <script type="text/javascript"
+                src="http://pagead2.googlesyndication.com/pagead/show_ads.js">
+                </script>
+            </div>
+<!--			<div id='yourfile'> -->
+			{{yourfile}}
+<!--			</div> -->
+
+			{% if authorized %}
+			<form action="/fdown" method="post">
+				<div id='urlbox'>
+					<div id='greeting'>
+					  <p>Hi, {{ nickname }}! This is a fan fiction downloader, which makes reading stories from various websites
+					  much easier. </p>
+					  <p>To support new features, such as including story summaries,
+					    the URL you need to use for some sites has changed.  See below for example URLs for each site.  </p>
+					  <p>Or see your personal list of <a href="/recent">previously downloaded fanfics</a>.</p>
+					</div>
+					<div id='error'>
+					{{ error_message }}
+					</div>
+					<input type="text" name="url" size="50" value='{{ url }}'>
+				</div>
+				
+				<div id='typebox'>
+					<div id='typelabel'>Ebook format</div>
+					<div id='typeoptions'>
+						<input type='radio' name='format' value='epub' checked>EPub</input>
+						<input type='radio' name='format' value='html'>HTML</input>
+						<input type='radio' name='format' value='text'>Plain Text</input>
+					</div>
+				</div>
+				
+				<div id='logpasswordtable'>
+				  <h3>Login and Password</h3>
+				  <div id='logpassword'>
+				    
+				    If the story requires a login and password to download (e.g. marked as Mature on FFA), you may need to provide
+				    your credentials to download it, otherwise just leave it empty
+				  </div>
+				  <div class='fieldandlabel'>
+				    <div class='label'>Login</div>
+				    <div class='field'><input type='text' name='login' size='50'></div>
+				  </div>
+				  
+				  <div class='fieldandlabel'>
+				    <div class='label'>Password</div>
+				    <div class='field'><input type='password' name='password' size='50'></div>
+				  </div>
+				</div>
+				
+				<div id='submitbtn'>
+					<input type="submit" value="Download">
+				</div>
+			</form>
+			{% else %}
+			<div id='urlbox'>
+				<div id='greeting'>
+					<p>
+					  This is a fan fiction downloader, which makes reading stories from various websites much easier. Before you
+					  can start downloading fanfics, you need to login, so downloader can remember your fanfics and store them.
+					</p>
+					<p><a href="{{ login_url }}">Login using Google account</a></p>
+				</div>
+			</div>
+			{% endif %}
+			
+				<div id='helpbox'>
+				  <dl>
+				    <dt>fictionalley.org
+				    <dd>Use the URL of the story's chapter list, such as
+				      <br /><a href="http://www.fictionalley.org/authors/drt/DA.html">http://www.fictionalley.org/authors/drt/DA.html</a>.  Or the story text URL for
+				      fictionalley.org one-shots, such as
+				      <br /><a href="http://www.fictionalley.org/authors/drt/JOTP01a.html">http://www.fictionalley.org/authors/drt/JOTP01a.html</a>.
+				    <dt>fanfiction.net
+				    <dd>Use the URL of any story chapter, with or without story title such as
+				      <br /><a href="http://www.fanfiction.net/s/5192986/1/A_Fox_in_Tokyo">http://www.fanfiction.net/s/5192986/1/A_Fox_in_Tokyo</a> or 
+				      <br /><a href="http://www.fanfiction.net/s/5192986/5/">http://www.fanfiction.net/s/5192986/5/</a>.
+				    <dt>fictionpress.com
+				    <dd>Use the URL of any story chapter, such as
+				      <br /><a href="http://www.fictionpress.com/s/2851771/1/Untouchable_Love">http://www.fictionpress.com/s/2851771/1/Untouchable_Love</a> or 
+				      <br /><a href="http://www.fictionpress.com/s/2847338/6/">http://www.fictionpress.com/s/2847338/6/</a>.
+				    <dt>twilighted.net
+				    <dd>Use the URL of the start of the story, such as
+				      <br /><a href="http://twilighted.net/viewstory.php?sid=8422">http://twilighted.net/viewstory.php?sid=8422</a>.
+				    <dt>ficwad.com
+				    <dd>Use the URL of any story chapter, such as
+				      <br /><a href="http://www.ficwad.com/story/75246">http://www.ficwad.com/story/75246</a>.
+				    <dt>harrypotterfanfiction.com
+				    <dd>Use the URL of the story's chapter list, such as
+				      <br /><a href="http://www.harrypotterfanfiction.com/viewstory.php?psid=289208">http://www.harrypotterfanfiction.com/viewstory.php?psid=289208</a>.
+				    <dt>potionsandsnitches.net
+				    <dd>Use the URL of the story's chapter list, such as
+				      <br /><a href="http://potionsandsnitches.net/fanfiction/viewstory.php?sid=2332">http://potionsandsnitches.net/fanfiction/viewstory.php?sid=2332</a>.
+				    <dt>mediaminer.org
+				    <dd>Use the URL of the story's chapter list, such as
+				      <br /><a href="http://www.mediaminer.org/fanfic/view_st.php/166653">http://www.mediaminer.org/fanfic/view_st.php/166653</a>.
+				      Or the story URL for one-shots, such as
+				      <br /><a href="http://www.mediaminer.org/fanfic/view_st.php/167618">http://www.mediaminer.org/fanfic/view_st.php/167618</a>.
+				  </dl>	
+
+				  
+				A few additional things to know, which will make your life substantially easier:
+				<ol>
+				  <li>
+				    First thing to know: I do not use your login and password. In fact, all I know about it is your ID &ndash; password
+				    is being verified by Google and is absolutely, totally unknown to anyone but you.
+				  </li>
+				  <li>
+				    Small <a href="http://www.sigizmund.com/reading-fanfiction-off-line-in-stanza-and-oth">post written by me</a>
+				    &mdash; how to read fiction in Stanza or any other ebook reader.
+				  </li>
+				  <li>
+				    Currently we support fanfiction.net, fictionpress.com, ficwad.com, fictionalley.org, harrypotterfanfiction.com, potionsandsnitches.net, mediaminer.org and twilighted.net.
+				    fanficauthors.net and tthfanfic.org offer native ePub functionality.
+				  </li>
+				  <li>
+				    You can download fanfiction directly from your iPhone, Kindle or (possibly) other ebook reader.
+				  </li>
+				  <li>
+				    One-shots, fics with a single chapter, <em>are</em> now supported.
+				  </li>
+				  <li>
+				    You can download fanfics and store them for 'later' by just downloading them and visiting <a href="/recent">recent
+				    downloads</a> section.
+				  </li>
+				  <li>
+				    Downloaded stories are deleted after some time (which should give you enough of time to download it and will keep
+				    Google happy about the app not going over the storage limit).
+				  </li>
+				  <li>
+				    If Downloader simply opens a download file window rather than saves the fanfic and gives you a link, it means it is
+				    too large to save in the database and you need to download it straight away.
+				  </li>
+				  <li>
+				    If you see some funny characters in downloaded Plain Text file, make sure you choose text file encoding UTF-8 and
+				    not something else.
+				  </li>
+				  <li>
+				    If you think that something that should work in fact doesn't, drop me a mail
+				    to <a href='mailto:sigizmund@gmail.com'>sigizmund@gmail.com</a>, or, even better, write an email to
+				    our <a href="http://groups.google.com/group/fanfic-downloader">Google Group</a>. I also encourage you to join it so
+				    you will find out about latest updates and fixes as soon as possible
+				  </li>
+				</ol>
+				Otherwise, just have fun, and if you want to say thank you &mdash; use the contacts above. 
+				</div>
+				<div style='text-align: center'>
+					<img src="http://code.google.com/appengine/images/appengine-silver-120x30.gif"
+					alt="Powered by Google App Engine" />
+					<br/><br/>
+					FanfictionLoader is a web front-end to <A href="http://code.google.com/p/fanficdownloader/">fanficdownloader</a><br/>
+					Copyright &copy; <a href="http://twitter.com/sigizmund">Roman Kirillov</a>
+				</div>
+
+			<div style="margin-top: 1em; text-align: center">
+                <script type="text/javascript"><!--
+                google_ad_client = "pub-2027714004231956";
+                /* FFD */
+                google_ad_slot = "7330682770";
+                google_ad_width = 468;
+                google_ad_height = 60;
+                //-->
+                </script>
+                <script type="text/javascript"
+                src="http://pagead2.googlesyndication.com/pagead/show_ads.js">
+                </script>
+            </div>
+			
+		</div>
+		<script type="text/javascript">
+		var gaJsHost = (("https:" == document.location.protocol) ? "https://ssl." : "http://www.");
+		document.write(unescape("%3Cscript src='" + gaJsHost + "google-analytics.com/ga.js' type='text/javascript'%3E%3C/script%3E"));
+		</script>
+		<script type="text/javascript">
+		try {
+		var pageTracker = _gat._getTracker("UA-12136939-1");
+		pageTracker._trackPageview();
+		} catch(err) {}</script>
+	</body>
+</html>
diff --git a/index.yaml b/index.yaml
new file mode 100644
index 00000000..bbed2dff
--- /dev/null
+++ b/index.yaml
@@ -0,0 +1,22 @@
+indexes:
+
+# AUTOGENERATED
+
+# This index.yaml is automatically updated whenever the dev_appserver
+# detects that a new type of query is run.  If you want to manage the
+# index.yaml file manually, remove the above marker line (the line
+# saying "# AUTOGENERATED").  If you want to manage some indexes
+# manually, move them above the marker line.  The index.yaml file is
+# automatically uploaded to the admin console when you next deploy
+# your application using appcfg.py.
+
+- kind: DownloadedFanfic
+  properties:
+  - name: cleared
+  - name: date
+
+- kind: DownloadedFanfic
+  properties:
+  - name: user
+  - name: date
+    direction: desc
diff --git a/js/fdownloader.js b/js/fdownloader.js
new file mode 100644
index 00000000..8f6ab0a8
--- /dev/null
+++ b/js/fdownloader.js
@@ -0,0 +1,116 @@
+var g_CurrentKey = null; // response of /submitDownload; sent as 'key' when polling /progress
+var g_Counter = 0; // number of /progress polls issued for the current download
+
+var COUNTER_MAX = 50; // checkResults() stops polling once g_Counter reaches this value
+
+
+function setErrorState(error)
+{
+	// Show the message in #error, followed by a mailto link for reporting it.
+	error = error + "<br/><a href='mailto:sigizmund@gmail.com?subject=Problem with the fanfiction downloader'>" + "Complain about this error</a>";
+	$('#error').html(error);
+}
+
+function clearErrorState() // Empty the #error element.
+{
+	$('#error').html('');
+}
+
+function showFile(data)
+{
+	// data carries key, name and author; attr()/text() keep the story metadata from being parsed as HTML.
+	var link = $('<a/>').attr('href', '/file?id=' + encodeURIComponent(data.key)).text(data.name + " by " + data.author);
+	$('#yourfile').empty().append(link).show();
+}
+
+function hideFile() // Hide the #yourfile element that holds the download link.
+{
+	$('#yourfile').hide();
+}
+
+function checkResults()
+{
+	// Poll /progress once for the current download and, unless the poll
+	// budget (COUNTER_MAX) is used up, schedule the next poll in one second.
+	if ( g_Counter >= COUNTER_MAX )
+		return;
+	
+	g_Counter+=1;
+
+	$.getJSON('/progress', { 'key' : g_CurrentKey }, function(data)
+	{
+		if ( data.result != "Nope")
+		{
+			// Anything but "Nope" is final: "OK" carries the file details,
+			// every other value is shown as an error message.
+			if ( data.result != "OK" )
+			{
+				leaveLoadingState();
+				setErrorState(data.result);
+			}
+			else
+			{
+				showFile(data);
+				leaveLoadingState();
+			}
+			$("#progressbar").progressbar('destroy');
+			// Exhaust the budget so that the already scheduled poll returns at once.
+			g_Counter = COUNTER_MAX;
+		}
+	});
+	
+	if ( g_Counter < COUNTER_MAX ) 
+		setTimeout(checkResults, 1000);
+	else
+	{
+		leaveLoadingState();
+		setErrorState("Operation takes too long - terminating by timeout (story too long?)");
+	}
+}
+
+function enterLoadingState() // Swap the submit button for the loader image.
+{
+	$('#submit_button').hide();
+	$('#ajax_loader').show();
+}
+
+function leaveLoadingState() // Swap the loader image back for the submit button.
+{
+	$('#submit_button').show();
+	$('#ajax_loader').hide();
+}
+
+function downloadFanfic()
+{
+	// Validate the form, submit the download request, then start polling
+	// /progress for the outcome (see checkResults).
+	clearErrorState();
+	hideFile();
+
+	var format = $("#format").val();
+	var url = $('#url').val();
+	var login = $('#login').val();
+	var password = $('#password').val();
+	
+	if ( url == '' )
+	{
+		setErrorState('URL shouldn\'t be empty');
+		return;
+	}
+	
+	// Only these sources are accepted here; adultfanfiction.net is rejected
+	// explicitly because its name also contains "fanfiction.net".
+	if ( (url.indexOf('fanfiction.net') == -1 && url.indexOf('fanficauthors') == -1 && url.indexOf('ficwad') == -1  &&  url.indexOf('fictionpress') == -1) || (url.indexOf('adultfanfiction.net') != -1) )
+	{
+		setErrorState("This source is not yet supported. Ping me if you want it!");
+		return;
+	}
+	
+	$.post('/submitDownload', {'url' : url, 'login' : login, 'password' : password, 'format' : format}, function(data)
+	{
+		// The response is kept as the 'key' parameter for the /progress polls.
+		g_CurrentKey = data;
+		g_Counter = 0;
+		setTimeout(checkResults, 1000);
+		enterLoadingState();
+	})
+}
\ No newline at end of file
diff --git a/js/jquery-1.3.2.js b/js/jquery-1.3.2.js
new file mode 100644
index 00000000..92635743
--- /dev/null
+++ b/js/jquery-1.3.2.js
@@ -0,0 +1,4376 @@
+/*!
+ * jQuery JavaScript Library v1.3.2
+ * http://jquery.com/
+ *
+ * Copyright (c) 2009 John Resig
+ * Dual licensed under the MIT and GPL licenses.
+ * http://docs.jquery.com/License
+ *
+ * Date: 2009-02-19 17:34:21 -0500 (Thu, 19 Feb 2009)
+ * Revision: 6246
+ */
+(function(){
+
+var 
+	// Will speed up references to window, and allows munging its name.
+	window = this,
+	// Will speed up references to undefined, and allows munging its name.
+	undefined,
+	// Map over jQuery in case of overwrite
+	_jQuery = window.jQuery,
+	// Map over the $ in case of overwrite
+	_$ = window.$,
+
+	jQuery = window.jQuery = window.$ = function( selector, context ) {
+		// The jQuery object is actually just the init constructor 'enhanced'
+		return new jQuery.fn.init( selector, context );
+	},
+
+	// A simple way to check for HTML strings or ID strings
+	// (both of which we optimize for)
+	quickExpr = /^[^<]*(<(.|\s)+>)[^>]*$|^#([\w-]+)$/,
+	// Is it a simple selector
+	isSimple = /^.[^:#\[\.,]*$/;
+
+jQuery.fn = jQuery.prototype = {
+	init: function( selector, context ) {
+		// Make sure that a selection was provided
+		selector = selector || document;
+
+		// Handle $(DOMElement)
+		if ( selector.nodeType ) {
+			this[0] = selector;
+			this.length = 1;
+			this.context = selector;
+			return this;
+		}
+		// Handle HTML strings
+		if ( typeof selector === "string" ) {
+			// Are we dealing with HTML string or an ID?
+			var match = quickExpr.exec( selector );
+
+			// Verify a match, and that no context was specified for #id
+			if ( match && (match[1] || !context) ) {
+
+				// HANDLE: $(html) -> $(array)
+				if ( match[1] )
+					selector = jQuery.clean( [ match[1] ], context );
+
+				// HANDLE: $("#id")
+				else {
+					var elem = document.getElementById( match[3] );
+
+					// Handle the case where IE and Opera return items
+					// by name instead of ID
+					if ( elem && elem.id != match[3] )
+						return jQuery().find( selector );
+
+					// Otherwise, we inject the element directly into the jQuery object
+					var ret = jQuery( elem || [] );
+					ret.context = document;
+					ret.selector = selector;
+					return ret;
+				}
+
+			// HANDLE: $(expr, [context])
+			// (which is just equivalent to: $(content).find(expr)
+			} else
+				return jQuery( context ).find( selector );
+
+		// HANDLE: $(function)
+		// Shortcut for document ready
+		} else if ( jQuery.isFunction( selector ) )
+			return jQuery( document ).ready( selector );
+
+		// Make sure that old selector state is passed along
+		if ( selector.selector && selector.context ) {
+			this.selector = selector.selector;
+			this.context = selector.context;
+		}
+
+		return this.setArray(jQuery.isArray( selector ) ?
+			selector :
+			jQuery.makeArray(selector));
+	},
+
+	// Start with an empty selector
+	selector: "",
+
+	// The current version of jQuery being used
+	jquery: "1.3.2",
+
+	// The number of elements contained in the matched element set
+	size: function() {
+		return this.length;
+	},
+
+	// Get the Nth element in the matched element set OR
+	// Get the whole matched element set as a clean array
+	get: function( num ) {
+		return num === undefined ?
+
+			// Return a 'clean' array
+			Array.prototype.slice.call( this ) :
+
+			// Return just the object
+			this[ num ];
+	},
+
+	// Take an array of elements and push it onto the stack
+	// (returning the new matched element set)
+	pushStack: function( elems, name, selector ) {
+		// Build a new jQuery matched element set
+		var ret = jQuery( elems );
+
+		// Add the old object onto the stack (as a reference)
+		ret.prevObject = this;
+
+		ret.context = this.context;
+
+		if ( name === "find" )
+			ret.selector = this.selector + (this.selector ? " " : "") + selector;
+		else if ( name )
+			ret.selector = this.selector + "." + name + "(" + selector + ")";
+
+		// Return the newly-formed element set
+		return ret;
+	},
+
+	// Force the current matched set of elements to become
+	// the specified array of elements (destroying the stack in the process)
+	// You should use pushStack() in order to do this, but maintain the stack
+	setArray: function( elems ) {
+		// Resetting the length to 0, then using the native Array push
+		// is a super-fast way to populate an object with array-like properties
+		this.length = 0;
+		Array.prototype.push.apply( this, elems );
+
+		return this;
+	},
+
+	// Execute a callback for every element in the matched set.
+	// (You can seed the arguments with an array of args, but this is
+	// only used internally.)
+	each: function( callback, args ) {
+		return jQuery.each( this, callback, args );
+	},
+
+	// Determine the position of an element within
+	// the matched set of elements
+	index: function( elem ) {
+		// Locate the position of the desired element
+		return jQuery.inArray(
+			// If it receives a jQuery object, the first element is used
+			elem && elem.jquery ? elem[0] : elem
+		, this );
+	},
+
+	attr: function( name, value, type ) {
+		var options = name;
+
+		// Look for the case where we're accessing a style value
+		if ( typeof name === "string" )
+			if ( value === undefined )
+				return this[0] && jQuery[ type || "attr" ]( this[0], name );
+
+			else {
+				options = {};
+				options[ name ] = value;
+			}
+
+		// Check to see if we're setting style values
+		return this.each(function(i){
+			// Set all the styles
+			for ( name in options )
+				jQuery.attr(
+					type ?
+						this.style :
+						this,
+					name, jQuery.prop( this, options[ name ], type, i, name )
+				);
+		});
+	},
+
+	css: function( key, value ) {
+		// ignore negative width and height values
+		if ( (key == 'width' || key == 'height') && parseFloat(value) < 0 )
+			value = undefined;
+		return this.attr( key, value, "curCSS" );
+	},
+
+	text: function( text ) {
+		if ( typeof text !== "object" && text != null )
+			return this.empty().append( (this[0] && this[0].ownerDocument || document).createTextNode( text ) );
+
+		var ret = "";
+
+		jQuery.each( text || this, function(){
+			jQuery.each( this.childNodes, function(){
+				if ( this.nodeType != 8 )
+					ret += this.nodeType != 1 ?
+						this.nodeValue :
+						jQuery.fn.text( [ this ] );
+			});
+		});
+
+		return ret;
+	},
+
+	wrapAll: function( html ) {
+		if ( this[0] ) {
+			// The elements to wrap the target around
+			var wrap = jQuery( html, this[0].ownerDocument ).clone();
+
+			if ( this[0].parentNode )
+				wrap.insertBefore( this[0] );
+
+			wrap.map(function(){
+				var elem = this;
+
+				while ( elem.firstChild )
+					elem = elem.firstChild;
+
+				return elem;
+			}).append(this);
+		}
+
+		return this;
+	},
+
+	wrapInner: function( html ) {
+		return this.each(function(){
+			jQuery( this ).contents().wrapAll( html );
+		});
+	},
+
+	wrap: function( html ) {
+		return this.each(function(){
+			jQuery( this ).wrapAll( html );
+		});
+	},
+
+	append: function() {
+		return this.domManip(arguments, true, function(elem){
+			if (this.nodeType == 1)
+				this.appendChild( elem );
+		});
+	},
+
+	prepend: function() {
+		return this.domManip(arguments, true, function(elem){
+			if (this.nodeType == 1)
+				this.insertBefore( elem, this.firstChild );
+		});
+	},
+
+	before: function() {
+		return this.domManip(arguments, false, function(elem){
+			this.parentNode.insertBefore( elem, this );
+		});
+	},
+
+	after: function() {
+		return this.domManip(arguments, false, function(elem){
+			this.parentNode.insertBefore( elem, this.nextSibling );
+		});
+	},
+
+	end: function() {
+		return this.prevObject || jQuery( [] );
+	},
+
+	// For internal use only.
+	// These are the native Array.prototype methods borrowed as-is, so they
+	// behave like an Array's method, not like a jQuery method.
+	push: [].push,
+	sort: [].sort,
+	splice: [].splice,
+
+	find: function( selector ) {
+		if ( this.length === 1 ) {
+			var ret = this.pushStack( [], "find", selector );
+			ret.length = 0;
+			jQuery.find( selector, this[0], ret );
+			return ret;
+		} else {
+			return this.pushStack( jQuery.unique(jQuery.map(this, function(elem){
+				return jQuery.find( selector, elem );
+			})), "find", selector );
+		}
+	},
+
+	// Clone every matched element (deep copy). When `events` is exactly true,
+	// the handlers stored under the "events" data key of the originals (and of
+	// their descendants) are re-bound on the corresponding clones.
+	clone: function( events ) {
+		// Do the clone
+		var ret = this.map(function(){
+			if ( !jQuery.support.noCloneEvent && !jQuery.isXMLDoc(this) ) {
+				// IE copies events bound via attachEvent when
+				// using cloneNode. Calling detachEvent on the
+				// clone will also remove the events from the original.
+				// In order to get around this, we use innerHTML.
+				// Unfortunately, this means some modifications to
+				// attributes in IE that are actually only stored
+				// as properties will not be copied (such as the
+				// name attribute on an input).
+				var html = this.outerHTML;
+				if ( !html ) {
+					// No outerHTML: serialize a cloneNode copy through a temporary div
+					var div = this.ownerDocument.createElement("div");
+					div.appendChild( this.cloneNode(true) );
+					html = div.innerHTML;
+				}
+
+				// Strip the serialized jQuery expando attributes and leading whitespace before re-parsing
+				return jQuery.clean([html.replace(/ jQuery\d+="(?:\d+|null)"/g, "").replace(/^\s*/, "")])[0];
+			} else
+				return this.cloneNode(true);
+		});
+
+		// Copy the events from the original to the clone
+		if ( events === true ) {
+			// Originals and clones are walked in parallel; i indexes the originals
+			var orig = this.find("*").andSelf(), i = 0;
+
+			ret.find("*").andSelf().each(function(){
+				// A node name mismatch skips this clone without advancing i
+				if ( this.nodeName !== orig[i].nodeName )
+					return;
+
+				var events = jQuery.data( orig[i], "events" );
+
+				for ( var type in events ) {
+					for ( var handler in events[ type ] ) {
+						jQuery.event.add( this, type, events[ type ][ handler ], events[ type ][ handler ].data );
+					}
+				}
+
+				i++;
+			});
+		}
+
+		// Return the cloned set
+		return ret;
+	},
+
+	filter: function( selector ) {
+		return this.pushStack(
+			jQuery.isFunction( selector ) &&
+			jQuery.grep(this, function(elem, i){
+				return selector.call( elem, i );
+			}) ||
+
+			jQuery.multiFilter( selector, jQuery.grep(this, function(elem){
+				return elem.nodeType === 1;
+			}) ), "filter", selector );
+	},
+
+	closest: function( selector ) {
+		var pos = jQuery.expr.match.POS.test( selector ) ? jQuery(selector) : null,
+			closer = 0;
+
+		return this.map(function(){
+			var cur = this;
+			while ( cur && cur.ownerDocument ) {
+				if ( pos ? pos.index(cur) > -1 : jQuery(cur).is(selector) ) {
+					jQuery.data(cur, "closest", closer);
+					return cur;
+				}
+				cur = cur.parentNode;
+				closer++;
+			}
+		});
+	},
+
+	not: function( selector ) {
+		if ( typeof selector === "string" )
+			// test special case where just one selector is passed in
+			if ( isSimple.test( selector ) )
+				return this.pushStack( jQuery.multiFilter( selector, this, true ), "not", selector );
+			else
+				selector = jQuery.multiFilter( selector, this );
+
+		var isArrayLike = selector.length && selector[selector.length - 1] !== undefined && !selector.nodeType;
+		return this.filter(function() {
+			return isArrayLike ? jQuery.inArray( this, selector ) < 0 : this != selector;
+		});
+	},
+
+	add: function( selector ) {
+		return this.pushStack( jQuery.unique( jQuery.merge(
+			this.get(),
+			typeof selector === "string" ?
+				jQuery( selector ) :
+				jQuery.makeArray( selector )
+		)));
+	},
+
+	is: function( selector ) {
+		return !!selector && jQuery.multiFilter( selector, this ).length > 0;
+	},
+
+	hasClass: function( selector ) {
+		return !!selector && this.is( "." + selector );
+	},
+
+	// Getter (no argument): return the value of the first matched element:
+	//   - <option>: its value attribute when specified, otherwise its text
+	//   - <select>: the selected value, an array of values for multi-selects,
+	//               or null when nothing is selected
+	//   - anything else: elem.value with carriage returns removed
+	//   Returns undefined for an empty set.
+	// Setter: assign the value to every matched element node; an array checks
+	// radios/checkboxes and selects options by value (or name / text).
+	val: function( value ) {
+		if ( value === undefined ) {			
+			var elem = this[0];
+
+			if ( elem ) {
+				if( jQuery.nodeName( elem, 'option' ) )
+					return (elem.attributes.value || {}).specified ? elem.value : elem.text;
+				
+				// We need to handle select boxes special
+				if ( jQuery.nodeName( elem, "select" ) ) {
+					var index = elem.selectedIndex,
+						values = [],
+						options = elem.options,
+						one = elem.type == "select-one";
+
+					// Nothing was selected
+					if ( index < 0 )
+						return null;
+
+					// Loop through all the selected options
+					// (for a single select only the option at selectedIndex is visited)
+					for ( var i = one ? index : 0, max = one ? index + 1 : options.length; i < max; i++ ) {
+						var option = options[ i ];
+
+						if ( option.selected ) {
+							// Get the specific value for the option
+							value = jQuery(option).val();
+
+							// We don't need an array for one selects
+							if ( one )
+								return value;
+
+							// Multi-Selects return an array
+							values.push( value );
+						}
+					}
+
+					return values;				
+				}
+
+				// Everything else, we just grab the value
+				return (elem.value || "").replace(/\r/g, "");
+
+			}
+
+			return undefined;
+		}
+
+		// Numbers are stored as strings
+		if ( typeof value === "number" )
+			value += '';
+
+		return this.each(function(){
+			// Only element nodes can take a value
+			if ( this.nodeType != 1 )
+				return;
+
+			// An array checks the radios/checkboxes whose value or name it contains
+			if ( jQuery.isArray(value) && /radio|checkbox/.test( this.type ) )
+				this.checked = (jQuery.inArray(this.value, value) >= 0 ||
+					jQuery.inArray(this.name, value) >= 0);
+
+			else if ( jQuery.nodeName( this, "select" ) ) {
+				var values = jQuery.makeArray(value);
+
+				// Select exactly the options whose value or text is listed
+				jQuery( "option", this ).each(function(){
+					this.selected = (jQuery.inArray( this.value, values ) >= 0 ||
+						jQuery.inArray( this.text, values ) >= 0);
+				});
+
+				// An empty list clears the selection
+				if ( !values.length )
+					this.selectedIndex = -1;
+
+			} else
+				this.value = value;
+		});
+	},
+
+	html: function( value ) {
+		return value === undefined ?
+			(this[0] ?
+				this[0].innerHTML.replace(/ jQuery\d+="(?:\d+|null)"/g, "") :
+				null) :
+			this.empty().append( value );
+	},
+
+	replaceWith: function( value ) {
+		return this.after( value ).remove();
+	},
+
+	eq: function( i ) {
+		return this.slice( i, +i + 1 );
+	},
+
+	slice: function() {
+		return this.pushStack( Array.prototype.slice.apply( this, arguments ),
+			"slice", Array.prototype.slice.call(arguments).join(",") );
+	},
+
+	map: function( callback ) {
+		return this.pushStack( jQuery.map(this, function(elem, i){
+			return callback.call( elem, i, elem );
+		}));
+	},
+
+	andSelf: function() {
+		return this.add( this.prevObject );
+	},
+
+	// Shared engine behind append/prepend/before/after.
+	//   args     - the content to insert (whatever jQuery.clean accepts)
+	//   table    - when true, a <tr> aimed at a <table> is redirected to its <tbody>
+	//   callback - called with `this` = target node and the fragment to insert
+	// Returns the jQuery object itself.
+	domManip: function( args, table, callback ) {
+		if ( this[0] ) {
+			// Build the content once inside a document fragment; jQuery.clean
+			// returns the <script> elements it pulled out when given a fragment
+			var fragment = (this[0].ownerDocument || this[0]).createDocumentFragment(),
+				scripts = jQuery.clean( args, (this[0].ownerDocument || this[0]), fragment ),
+				first = fragment.firstChild;
+
+			if ( first )
+				for ( var i = 0, l = this.length; i < l; i++ )
+					// The fragment itself is only used for a single-element set; otherwise each target gets a clone
+					callback.call( root(this[i], first), this.length > 1 || i > 0 ?
+							fragment.cloneNode(true) : fragment );
+		
+			// Run the extracted scripts after the content has been inserted
+			if ( scripts )
+				jQuery.each( scripts, evalScript );
+		}
+
+		return this;
+		
+		// Function declaration: hoisted, so it is usable above despite following the return.
+		// Picks the real insertion target: the table's (possibly new) <tbody> for rows.
+		function root( elem, cur ) {
+			return table && jQuery.nodeName(elem, "table") && jQuery.nodeName(cur, "tr") ?
+				(elem.getElementsByTagName("tbody")[0] ||
+				elem.appendChild(elem.ownerDocument.createElement("tbody"))) :
+				elem;
+		}
+	}
+};
+
+// Give the init function the jQuery prototype for later instantiation
+jQuery.fn.init.prototype = jQuery.fn;
+
+function evalScript( i, elem ) {
+	if ( elem.src )
+		jQuery.ajax({
+			url: elem.src,
+			async: false,
+			dataType: "script"
+		});
+
+	else
+		jQuery.globalEval( elem.text || elem.textContent || elem.innerHTML || "" );
+
+	if ( elem.parentNode )
+		elem.parentNode.removeChild( elem );
+}
+
+function now(){
+	return +new Date;
+}
+
+// Merge the properties of one or more objects into a target object.
+//   extend( target, obj1, ... )        shallow merge into target
+//   extend( true, target, obj1, ... )  deep (recursive) merge into target
+//   extend( obj )                      merge obj into `this` (jQuery or jQuery.fn)
+// null/undefined sources are skipped, undefined property values are not copied.
+// Returns the modified target.
+jQuery.extend = jQuery.fn.extend = function() {
+	// copy reference to target object
+	var target = arguments[0] || {}, i = 1, length = arguments.length, deep = false, options;
+
+	// Handle a deep copy situation
+	if ( typeof target === "boolean" ) {
+		deep = target;
+		target = arguments[1] || {};
+		// skip the boolean and the target
+		i = 2;
+	}
+
+	// Handle case when target is a string or something (possible in deep copy)
+	if ( typeof target !== "object" && !jQuery.isFunction(target) )
+		target = {};
+
+	// extend jQuery itself if only one argument is passed
+	// (i is stepped back so that the single argument becomes the source)
+	if ( length == i ) {
+		target = this;
+		--i;
+	}
+
+	for ( ; i < length; i++ )
+		// Only deal with non-null/undefined values
+		if ( (options = arguments[ i ]) != null )
+			// Extend the base object
+			for ( var name in options ) {
+				var src = target[ name ], copy = options[ name ];
+
+				// Prevent never-ending loop
+				if ( target === copy )
+					continue;
+
+				// Recurse if we're merging object values
+				// (DOM nodes are copied by reference, never walked)
+				if ( deep && copy && typeof copy === "object" && !copy.nodeType )
+					target[ name ] = jQuery.extend( deep, 
+						// Never move original objects, clone them
+						// (a `length` property selects an array as the fresh container)
+						src || ( copy.length != null ? [ ] : { } )
+					, copy );
+
+				// Don't bring in undefined values
+				else if ( copy !== undefined )
+					target[ name ] = copy;
+
+			}
+
+	// Return the modified object
+	return target;
+};
+
+// CSS properties whose numeric values must NOT get a "px" suffix appended
+var	exclude = /z-?index|font-?weight|opacity|zoom|line-?height/i,
+	// cache defaultView (an empty object when the document has none)
+	defaultView = document.defaultView || {},
+	// shortcut used by the isFunction / isArray type checks
+	toString = Object.prototype.toString;
+
+jQuery.extend({
+	noConflict: function( deep ) {
+		window.$ = _$;
+
+		if ( deep )
+			window.jQuery = _jQuery;
+
+		return jQuery;
+	},
+
+	// See test/unit/core.js for details concerning isFunction.
+	// Since version 1.3, DOM methods and functions like alert
+	// aren't supported. They return false on IE (#2968).
+	isFunction: function( obj ) {
+		return toString.call(obj) === "[object Function]";
+	},
+
+	isArray: function( obj ) {
+		return toString.call(obj) === "[object Array]";
+	},
+
+	// check if an element is in a (or is an) XML document
+	isXMLDoc: function( elem ) {
+		return elem.nodeType === 9 && elem.documentElement.nodeName !== "HTML" ||
+			!!elem.ownerDocument && jQuery.isXMLDoc( elem.ownerDocument );
+	},
+
+	// Evaluates a script in a global context by injecting a temporary
+	// <script> element. Empty or whitespace-only data is ignored.
+	globalEval: function( data ) {
+		if ( data && /\S/.test(data) ) {
+			// Inspired by code by Andrea Giammarchi
+			// http://webreflection.blogspot.com/2007/08/global-scope-evaluation-and-dom.html
+			var head = document.getElementsByTagName("head")[0] || document.documentElement,
+				script = document.createElement("script");
+
+			script.type = "text/javascript";
+			// Attach the code as a text node where supported, else through the text property
+			if ( jQuery.support.scriptEval )
+				script.appendChild( document.createTextNode( data ) );
+			else
+				script.text = data;
+
+			// Use insertBefore instead of appendChild  to circumvent an IE6 bug.
+			// This arises when a base node is used (#2709).
+			head.insertBefore( script, head.firstChild );
+			// The element is removed again right after insertion
+			head.removeChild( script );
+		}
+	},
+
+	nodeName: function( elem, name ) {
+		return elem.nodeName && elem.nodeName.toUpperCase() == name.toUpperCase();
+	},
+
+	// Iterate over an array-like (has a `length`) or over the keys of an object.
+	// Without `args` the callback is called as callback.call( value, indexOrKey, value );
+	// with `args` it is applied to each value with exactly those arguments.
+	// A callback returning false stops the iteration. Returns `object`.
+	// args is for internal usage only
+	each: function( object, callback, args ) {
+		var name, i = 0, length = object.length;
+
+		if ( args ) {
+			if ( length === undefined ) {
+				for ( name in object )
+					if ( callback.apply( object[ name ], args ) === false )
+						break;
+			} else
+				for ( ; i < length; )
+					if ( callback.apply( object[ i++ ], args ) === false )
+						break;
+
+		// A special, fast, case for the most common use of each
+		} else {
+			if ( length === undefined ) {
+				for ( name in object )
+					if ( callback.call( object[ name ], name, object[ name ] ) === false )
+						break;
+			} else
+				// The loop condition performs the call; the body is intentionally empty
+				for ( var value = object[0];
+					i < length && callback.call( value, i, value ) !== false; value = object[++i] ){}
+		}
+
+		return object;
+	},
+
+	prop: function( elem, value, type, i, name ) {
+		// Handle executable functions
+		if ( jQuery.isFunction( value ) )
+			value = value.call( elem, i );
+
+		// Handle passing in a number to a CSS property
+		return typeof value === "number" && type == "curCSS" && !exclude.test( name ) ?
+			value + "px" :
+			value;
+	},
+
+	// Low-level class name helpers operating on a single element.
+	className: {
+		// internal only, use addClass("class")
+		// Appends every whitespace-separated name the element does not have yet
+		add: function( elem, classNames ) {
+			jQuery.each((classNames || "").split(/\s+/), function(i, className){
+				if ( elem.nodeType == 1 && !jQuery.className.has( elem.className, className ) )
+					elem.className += (elem.className ? " " : "") + className;
+			});
+		},
+
+		// internal only, use removeClass("class")
+		// Removes the listed names; with classNames undefined, clears all classes
+		remove: function( elem, classNames ) {
+			if (elem.nodeType == 1)
+				elem.className = classNames !== undefined ?
+					jQuery.grep(elem.className.split(/\s+/), function(className){
+						return !jQuery.className.has( classNames, className );
+					}).join(" ") :
+					"";
+		},
+
+		// internal only, use hasClass("class")
+		// `elem` may be an element or a class string; it is split on whitespace
+		has: function( elem, className ) {
+			return elem && jQuery.inArray( className, (elem.className || elem).toString().split(/\s+/) ) > -1;
+		}
+	},
+
+	// A method for quickly swapping in/out CSS properties to get correct calculations
+	swap: function( elem, options, callback ) {
+		var old = {};
+		// Remember the old values, and insert the new ones
+		for ( var name in options ) {
+			old[ name ] = elem.style[ name ];
+			elem.style[ name ] = options[ name ];
+		}
+
+		callback.call( elem );
+
+		// Revert the old values
+		for ( var name in options )
+			elem.style[ name ] = old[ name ];
+	},
+
+	// Read a style value of an element. "width" and "height" are measured from
+	// offsetWidth/offsetHeight and returned as a non-negative rounded number;
+	// every other name is delegated to jQuery.curCSS.
+	//   extra: undefined  -> padding and border are subtracted
+	//          "border"   -> the raw offset size is used
+	//          "margin"   -> the margin is added
+	//          otherwise  -> only the border is subtracted
+	css: function( elem, name, force, extra ) {
+		if ( name == "width" || name == "height" ) {
+			var val, props = { position: "absolute", visibility: "hidden", display:"block" }, which = name == "width" ? [ "Left", "Right" ] : [ "Top", "Bottom" ];
+
+			// Computes `val` (closure variable) from the offset size and the box edges
+			function getWH() {
+				val = name == "width" ? elem.offsetWidth : elem.offsetHeight;
+
+				if ( extra === "border" )
+					return;
+
+				jQuery.each( which, function() {
+					if ( !extra )
+						val -= parseFloat(jQuery.curCSS( elem, "padding" + this, true)) || 0;
+					if ( extra === "margin" )
+						val += parseFloat(jQuery.curCSS( elem, "margin" + this, true)) || 0;
+					else
+						val -= parseFloat(jQuery.curCSS( elem, "border" + this + "Width", true)) || 0;
+				});
+			}
+
+			// An element with zero offsetWidth is measured with the `props` styles swapped in
+			if ( elem.offsetWidth !== 0 )
+				getWH();
+			else
+				jQuery.swap( elem, props, getWH );
+
+			return Math.max(0, Math.round(val));
+		}
+
+		return jQuery.curCSS( elem, name, force );
+	},
+
+	// Return the current value of a style property of an element.
+	// The inline style wins unless `force` is set; otherwise the value comes
+	// from getComputedStyle, or from currentStyle where that is unavailable.
+	curCSS: function( elem, name, force ) {
+		var ret, style = elem.style;
+
+		// We need to handle opacity special in IE
+		if ( name == "opacity" && !jQuery.support.opacity ) {
+			ret = jQuery.attr( style, "opacity" );
+
+			return ret == "" ?
+				"1" :
+				ret;
+		}
+
+		// Make sure we're using the right name for getting the float value
+		if ( name.match( /float/i ) )
+			name = styleFloat;
+
+		if ( !force && style && style[ name ] )
+			ret = style[ name ];
+
+		else if ( defaultView.getComputedStyle ) {
+
+			// Only "float" is needed here
+			if ( name.match( /float/i ) )
+				name = "float";
+
+			// camelCase -> hyphenated lower case, as expected by getPropertyValue
+			name = name.replace( /([A-Z])/g, "-$1" ).toLowerCase();
+
+			var computedStyle = defaultView.getComputedStyle( elem, null );
+
+			if ( computedStyle )
+				ret = computedStyle.getPropertyValue( name );
+
+			// We should always get a number back from opacity
+			if ( name == "opacity" && ret == "" )
+				ret = "1";
+
+		} else if ( elem.currentStyle ) {
+			// hyphenated -> camelCase; both spellings are tried below
+			var camelCase = name.replace(/\-(\w)/g, function(all, letter){
+				return letter.toUpperCase();
+			});
+
+			ret = elem.currentStyle[ name ] || elem.currentStyle[ camelCase ];
+
+			// From the awesome hack by Dean Edwards
+			// http://erik.eae.net/archives/2007/07/27/18.54.15/#comment-102291
+
+			// If we're not dealing with a regular pixel number
+			// but a number that has a weird ending, we need to convert it to pixels
+			if ( !/^\d+(px)?$/i.test( ret ) && /^\d/.test( ret ) ) {
+				// Remember the original values
+				var left = style.left, rsLeft = elem.runtimeStyle.left;
+
+				// Put in the new values to get a computed value out
+				elem.runtimeStyle.left = elem.currentStyle.left;
+				style.left = ret || 0;
+				ret = style.pixelLeft + "px";
+
+				// Revert the changed values
+				style.left = left;
+				elem.runtimeStyle.left = rsLeft;
+			}
+		}
+
+		return ret;
+	},
+
+	// Convert a list of HTML strings, numbers, nodes and node collections into DOM nodes.
+	//   elems    - array-like of items to convert; falsy items are skipped
+	//   context  - document (or node / collection giving access to one) used to create nodes
+	//   fragment - optional document fragment
+	// Without `fragment` the array of nodes is returned. With `fragment` the
+	// nodes are appended to it, JavaScript <script> elements are pulled out,
+	// and the array of those scripts is returned instead.
+	clean: function( elems, context, fragment ) {
+		context = context || document;
+
+		// !context.createElement fails in IE with an error but returns typeof 'object'
+		if ( typeof context.createElement === "undefined" )
+			context = context.ownerDocument || context[0] && context[0].ownerDocument || document;
+
+		// If a single string is passed in and it's a single tag
+		// just do a createElement and skip the rest
+		if ( !fragment && elems.length === 1 && typeof elems[0] === "string" ) {
+			var match = /^<(\w+)\s*\/?>$/.exec(elems[0]);
+			if ( match )
+				return [ context.createElement( match[1] ) ];
+		}
+
+		var ret = [], scripts = [], div = context.createElement("div");
+
+		jQuery.each(elems, function(i, elem){
+			if ( typeof elem === "number" )
+				elem += '';
+
+			if ( !elem )
+				return;
+
+			// Convert html string into DOM nodes
+			if ( typeof elem === "string" ) {
+				// Fix "XHTML"-style tags in all browsers
+				// (self-closed tags outside the listed ones are expanded to an open/close pair)
+				elem = elem.replace(/(<(\w+)[^>]*?)\/>/g, function(all, front, tag){
+					return tag.match(/^(abbr|br|col|img|input|link|meta|param|hr|area|embed)$/i) ?
+						all :
+						front + "></" + tag + ">";
+				});
+
+				// Trim whitespace, otherwise indexOf won't work as expected
+				var tags = elem.replace(/^\s+/, "").substring(0, 10).toLowerCase();
+
+				// wrap = [ nesting depth, opening markup, closing markup ];
+				// !tags.indexOf(x) is true when the string starts with x
+				var wrap =
+					// option or optgroup
+					!tags.indexOf("<opt") &&
+					[ 1, "<select multiple='multiple'>", "</select>" ] ||
+
+					!tags.indexOf("<leg") &&
+					[ 1, "<fieldset>", "</fieldset>" ] ||
+
+					tags.match(/^<(thead|tbody|tfoot|colg|cap)/) &&
+					[ 1, "<table>", "</table>" ] ||
+
+					!tags.indexOf("<tr") &&
+					[ 2, "<table><tbody>", "</tbody></table>" ] ||
+
+				 	// <thead> matched above
+					(!tags.indexOf("<td") || !tags.indexOf("<th")) &&
+					[ 3, "<table><tbody><tr>", "</tr></tbody></table>" ] ||
+
+					!tags.indexOf("<col") &&
+					[ 2, "<table><tbody></tbody><colgroup>", "</colgroup></table>" ] ||
+
+					// IE can't serialize <link> and <script> tags normally
+					!jQuery.support.htmlSerialize &&
+					[ 1, "div<div>", "</div>" ] ||
+
+					[ 0, "", "" ];
+
+				// Go to html and back, then peel off extra wrappers
+				div.innerHTML = wrap[1] + elem + wrap[2];
+
+				// Move to the right depth
+				while ( wrap[0]-- )
+					div = div.lastChild;
+
+				// Remove IE's autoinserted <tbody> from table fragments
+				if ( !jQuery.support.tbody ) {
+
+					// String was a <table>, *may* have spurious <tbody>
+					var hasBody = /<tbody/i.test(elem),
+						tbody = !tags.indexOf("<table") && !hasBody ?
+							div.firstChild && div.firstChild.childNodes :
+
+						// String was a bare <thead> or <tfoot>
+						wrap[1] == "<table>" && !hasBody ?
+							div.childNodes :
+							[];
+
+					// Only empty <tbody> elements are removed
+					for ( var j = tbody.length - 1; j >= 0 ; --j )
+						if ( jQuery.nodeName( tbody[ j ], "tbody" ) && !tbody[ j ].childNodes.length )
+							tbody[ j ].parentNode.removeChild( tbody[ j ] );
+
+					}
+
+				// IE completely kills leading whitespace when innerHTML is used
+				if ( !jQuery.support.leadingWhitespace && /^\s/.test( elem ) )
+					div.insertBefore( context.createTextNode( elem.match(/^\s*/)[0] ), div.firstChild );
+				
+				elem = jQuery.makeArray( div.childNodes );
+			}
+
+			// A single node is pushed, a collection is merged in
+			if ( elem.nodeType )
+				ret.push( elem );
+			else
+				ret = jQuery.merge( ret, elem );
+
+		});
+
+		if ( fragment ) {
+			for ( var i = 0; ret[i]; i++ ) {
+				// Untyped or text/javascript scripts are detached and collected
+				if ( jQuery.nodeName( ret[i], "script" ) && (!ret[i].type || ret[i].type.toLowerCase() === "text/javascript") ) {
+					scripts.push( ret[i].parentNode ? ret[i].parentNode.removeChild( ret[i] ) : ret[i] );
+				} else {
+					// Queue nested <script> descendants right after the current node so the loop visits them
+					if ( ret[i].nodeType === 1 )
+						ret.splice.apply( ret, [i + 1, 0].concat(jQuery.makeArray(ret[i].getElementsByTagName("script"))) );
+					fragment.appendChild( ret[i] );
+				}
+			}
+			
+			return scripts;
+		}
+
+		return ret;
+	},
+
+	// Get or set an attribute/property on an element, or a property on a
+	// style object (when `elem` has no tagName it is treated as elem.style).
+	//   value undefined -> getter, otherwise setter (the current value is returned either way)
+	// Returns undefined for missing elements, text nodes and comment nodes.
+	attr: function( elem, name, value ) {
+		// don't set attributes on text and comment nodes
+		if (!elem || elem.nodeType == 3 || elem.nodeType == 8)
+			return undefined;
+
+		var notxml = !jQuery.isXMLDoc( elem ),
+			// Whether we are setting (or getting)
+			set = value !== undefined;
+
+		// Try to normalize/fix the name
+		name = notxml && jQuery.props[ name ] || name;
+
+		// Only do all the following if this is a node (faster for style)
+		// IE elem.getAttribute passes even for style
+		if ( elem.tagName ) {
+
+			// These attributes require special treatment
+			var special = /href|src|style/.test( name );
+
+			// Safari mis-reports the default selected property of a hidden option
+			// Accessing the parent's selectedIndex property fixes it
+			if ( name == "selected" && elem.parentNode )
+				elem.parentNode.selectedIndex;
+
+			// If applicable, access the attribute via the DOM 0 way
+			if ( name in elem && notxml && !special ) {
+				if ( set ){
+					// We can't allow the type property to be changed (since it causes problems in IE)
+					if ( name == "type" && jQuery.nodeName( elem, "input" ) && elem.parentNode )
+						throw "type property can't be changed";
+
+					elem[ name ] = value;
+				}
+
+				// browsers index elements by id/name on forms, give priority to attributes.
+				if( jQuery.nodeName( elem, "form" ) && elem.getAttributeNode(name) )
+					return elem.getAttributeNode( name ).nodeValue;
+
+				// elem.tabIndex doesn't always return the correct value when it hasn't been explicitly set
+				// http://fluidproject.org/blog/2008/01/09/getting-setting-and-removing-tabindex-values-with-javascript/
+				// Explicit value if specified; else 0 for form controls/objects and for
+				// links with an href; else undefined
+				if ( name == "tabIndex" ) {
+					var attributeNode = elem.getAttributeNode( "tabIndex" );
+					return attributeNode && attributeNode.specified
+						? attributeNode.value
+						: elem.nodeName.match(/(button|input|object|select|textarea)/i)
+							? 0
+							: elem.nodeName.match(/^(a|area)$/i) && elem.href
+								? 0
+								: undefined;
+				}
+
+				return elem[ name ];
+			}
+
+			// Where the style attribute is unsupported, go through style.cssText
+			if ( !jQuery.support.style && notxml &&  name == "style" )
+				return jQuery.attr( elem.style, "cssText", value );
+
+			if ( set )
+				// convert the value to a string (all browsers do this but IE) see #1070
+				elem.setAttribute( name, "" + value );
+
+			var attr = !jQuery.support.hrefNormalized && notxml && special
+					// Some attributes require a special call on IE
+					? elem.getAttribute( name, 2 )
+					: elem.getAttribute( name );
+
+			// Non-existent attributes return null, we normalize to undefined
+			return attr === null ? undefined : attr;
+		}
+
+		// elem is actually elem.style ... set the style
+
+		// IE uses filters for opacity
+		if ( !jQuery.support.opacity && name == "opacity" ) {
+			if ( set ) {
+				// IE has trouble with opacity if it does not have layout
+				// Force it by setting the zoom level
+				elem.zoom = 1;
+
+				// Set the alpha filter to set the opacity
+				// (any previous alpha(...) entry is dropped; a non-numeric value adds none)
+				elem.filter = (elem.filter || "").replace( /alpha\([^)]*\)/, "" ) +
+					(parseInt( value ) + '' == "NaN" ? "" : "alpha(opacity=" + value * 100 + ")");
+			}
+
+			// Read the opacity back from the filter as a 0..1 string, "" when there is none
+			return elem.filter && elem.filter.indexOf("opacity=") >= 0 ?
+				(parseFloat( elem.filter.match(/opacity=([^)]*)/)[1] ) / 100) + '':
+				"";
+		}
+
+		// hyphenated -> camelCase style property name
+		name = name.replace(/-([a-z])/ig, function(all, letter){
+			return letter.toUpperCase();
+		});
+
+		if ( set )
+			elem[ name ] = value;
+
+		return elem[ name ];
+	},
+
+	trim: function( text ) {
+		return (text || "").replace( /^\s+|\s+$/g, "" );
+	},
+
+	makeArray: function( array ) {
+		var ret = [];
+
+		if( array != null ){
+			var i = array.length;
+			// The window, strings (and functions) also have 'length'
+			if( i == null || typeof array === "string" || jQuery.isFunction(array) || array.setInterval )
+				ret[0] = array;
+			else
+				while( i )
+					ret[--i] = array[i];
+		}
+
+		return ret;
+	},
+
+	inArray: function( elem, array ) {
+		for ( var i = 0, length = array.length; i < length; i++ )
+		// Use === because on IE, window == document
+			if ( array[ i ] === elem )
+				return i;
+
+		return -1;
+	},
+
+	merge: function( first, second ) {
+		// We have to loop this way because IE & Opera overwrite the length
+		// expando of getElementsByTagName
+		var i = 0, elem, pos = first.length;
+		// Also, we need to make sure that the correct elements are being returned
+		// (IE returns comment nodes in a '*' query)
+		if ( !jQuery.support.getAll ) {
+			while ( (elem = second[ i++ ]) != null )
+				if ( elem.nodeType != 8 )
+					first[ pos++ ] = elem;
+
+		} else
+			while ( (elem = second[ i++ ]) != null )
+				first[ pos++ ] = elem;
+
+		return first;
+	},
+
+	unique: function( array ) {
+		var ret = [], done = {};
+
+		try {
+
+			for ( var i = 0, length = array.length; i < length; i++ ) {
+				var id = jQuery.data( array[ i ] );
+
+				if ( !done[ id ] ) {
+					done[ id ] = true;
+					ret.push( array[ i ] );
+				}
+			}
+
+		} catch( e ) {
+			ret = array;
+		}
+
+		return ret;
+	},
+
+	grep: function( elems, callback, inv ) {
+		var ret = [];
+
+		// Go through the array, only saving the items
+		// that pass the validator function
+		for ( var i = 0, length = elems.length; i < length; i++ )
+			if ( !inv != !callback( elems[ i ], i ) )
+				ret.push( elems[ i ] );
+
+		return ret;
+	},
+
+	map: function( elems, callback ) {
+		var ret = [];
+
+		// Go through the array, translating each of the items to their
+		// new value (or values).
+		for ( var i = 0, length = elems.length; i < length; i++ ) {
+			var value = callback( elems[ i ], i );
+
+			if ( value != null )
+				ret[ ret.length ] = value;
+		}
+
+		return ret.concat.apply( [], ret );
+	}
+});
+
+// Use of jQuery.browser is deprecated.
+// It's included for backwards compatibility and plugins,
+// although they should work to migrate away.
+
+// Lower-cased once so the tests below can use lower-case patterns
+var userAgent = navigator.userAgent.toLowerCase();
+
+// Figure out what browser is being used
+jQuery.browser = {
+	// Version number following "rv", "it", "ra" or "ie" in the user agent; '0' when none is found
+	version: (userAgent.match( /.+(?:rv|it|ra|ie)[\/: ]([\d.]+)/ ) || [0,'0'])[1],
+	safari: /webkit/.test( userAgent ),
+	opera: /opera/.test( userAgent ),
+	// Opera user agents containing "msie" are not reported as msie
+	msie: /msie/.test( userAgent ) && !/opera/.test( userAgent ),
+	// "mozilla" appears in other agents too; those with "compatible" or "webkit" are excluded
+	mozilla: /mozilla/.test( userAgent ) && !/(compatible|webkit)/.test( userAgent )
+};
+
+// Generate the traversal methods on jQuery.fn. Each entry maps a method name
+// to a function that receives one element and returns the related node(s).
+jQuery.each({
+	parent: function(elem){return elem.parentNode;},
+	parents: function(elem){return jQuery.dir(elem,"parentNode");},
+	next: function(elem){return jQuery.nth(elem,2,"nextSibling");},
+	prev: function(elem){return jQuery.nth(elem,2,"previousSibling");},
+	nextAll: function(elem){return jQuery.dir(elem,"nextSibling");},
+	prevAll: function(elem){return jQuery.dir(elem,"previousSibling");},
+	siblings: function(elem){return jQuery.sibling(elem.parentNode.firstChild,elem);},
+	children: function(elem){return jQuery.sibling(elem.firstChild);},
+	// For an iframe the inner document is returned instead of the child nodes
+	contents: function(elem){return jQuery.nodeName(elem,"iframe")?elem.contentDocument||elem.contentWindow.document:jQuery.makeArray(elem.childNodes);}
+}, function(name, fn){
+	// The generated method maps the set through fn, optionally filters the
+	// result by a string selector, de-duplicates it and pushes it on the stack
+	jQuery.fn[ name ] = function( selector ) {
+		var ret = jQuery.map( this, fn );
+
+		if ( selector && typeof selector == "string" )
+			ret = jQuery.multiFilter( selector, ret );
+
+		return this.pushStack( jQuery.unique( ret ), name, selector );
+	};
+});
+
+// Generate the "reversed" insertion methods: a.appendTo( b ) performs
+// b.append( a ), and likewise for the other pairs listed here.
+jQuery.each({
+	appendTo: "append",
+	prependTo: "prepend",
+	insertBefore: "before",
+	insertAfter: "after",
+	replaceAll: "replaceWith"
+}, function(name, original){
+	jQuery.fn[ name ] = function( selector ) {
+		var ret = [], insert = jQuery( selector );
+
+		for ( var i = 0, l = insert.length; i < l; i++ ) {
+			// The first target receives the original elements, later targets
+			// receive clones (made with events copied)
+			var elems = (i > 0 ? this.clone(true) : this).get();
+			jQuery.fn[ original ].apply( jQuery(insert[i]), elems );
+			ret = ret.concat( elems );
+		}
+
+		// The new set contains every inserted element, clones included
+		return this.pushStack( ret, name, selector );
+	};
+});
+
+// Generate jQuery.fn methods that run a per-element function on every
+// matched element. Inside each function `this` is the current element and
+// the arguments are those passed to the jQuery method.
+jQuery.each({
+	// Blank the attribute through jQuery.attr, then remove it from element nodes
+	removeAttr: function( name ) {
+		jQuery.attr( this, name, "" );
+		if (this.nodeType == 1)
+			this.removeAttribute( name );
+	},
+
+	addClass: function( classNames ) {
+		jQuery.className.add( this, classNames );
+	},
+
+	removeClass: function( classNames ) {
+		jQuery.className.remove( this, classNames );
+	},
+
+	// Without a boolean `state`, the class is added when missing and removed when present
+	toggleClass: function( classNames, state ) {
+		if( typeof state !== "boolean" )
+			state = !jQuery.className.has( this, classNames );
+		jQuery.className[ state ? "add" : "remove" ]( this, classNames );
+	},
+
+	// Remove the element from the DOM (only if it matches `selector`, when one is given)
+	remove: function( selector ) {
+		if ( !selector || jQuery.filter( selector, [ this ] ).length ) {
+			// Prevent memory leaks
+			// (events and data are dropped for the element and all its descendants)
+			jQuery( "*", this ).add([this]).each(function(){
+				jQuery.event.remove(this);
+				jQuery.removeData(this);
+			});
+			if (this.parentNode)
+				this.parentNode.removeChild( this );
+		}
+	},
+
+	empty: function() {
+		// Remove element nodes and prevent memory leaks
+		jQuery(this).children().remove();
+
+		// Remove any remaining nodes
+		while ( this.firstChild )
+			this.removeChild( this.firstChild );
+	}
+}, function(name, fn){
+	jQuery.fn[ name ] = function(){
+		// The args form of each applies fn to every element with these arguments
+		return this.each( fn, arguments );
+	};
+});
+
+// Helper function used by the dimensions and offset modules
+function num(elem, prop) {
+	return elem[0] && parseInt( jQuery.curCSS(elem[0], prop, true), 10 ) || 0;
+}
+// expando: per-page-load property name under which an element's data id is stored;
+// uuid: counter for those ids; windowData: stand-in object used instead of `window`
+var expando = "jQuery" + now(), uuid = 0, windowData = {};
+
+jQuery.extend({
+	cache: {},
+
+	// Read or write a named piece of data associated with an element.
+	//   data( elem )               -> the element's unique id (assigned on first use)
+	//   data( elem, name )         -> the stored value, or undefined
+	//   data( elem, name, value )  -> stores the value and returns it
+	data: function( elem, name, data ) {
+		// Data for the window is kept on a stand-in object
+		elem = elem == window ?
+			windowData :
+			elem;
+
+		var id = elem[ expando ];
+
+		// Compute a unique ID for the element
+		if ( !id )
+			id = elem[ expando ] = ++uuid;
+
+		// Only generate the data cache if we're
+		// trying to access or manipulate it
+		if ( name && !jQuery.cache[ id ] )
+			jQuery.cache[ id ] = {};
+
+		// Prevent overriding the named cache with undefined values
+		if ( data !== undefined )
+			jQuery.cache[ id ][ name ] = data;
+
+		// Return the named cache data, or the ID for the element
+		return name ?
+			jQuery.cache[ id ][ name ] :
+			id;
+	},
+
+	// Remove one named piece of data from an element, or, without `name`,
+	// all of its data together with the expando property holding its id.
+	removeData: function( elem, name ) {
+		// Data for the window is kept on a stand-in object
+		elem = elem == window ?
+			windowData :
+			elem;
+
+		var id = elem[ expando ];
+
+		// If we want to remove a specific section of the element's data
+		if ( name ) {
+			if ( jQuery.cache[ id ] ) {
+				// Remove the section of cache data
+				delete jQuery.cache[ id ][ name ];
+
+				// If we've removed all the data, remove the element's cache
+				// (`name` is reused as a probe: it stays "" only if the cache has no keys left)
+				name = "";
+
+				for ( name in jQuery.cache[ id ] )
+					break;
+
+				if ( !name )
+					jQuery.removeData( elem );
+			}
+
+		// Otherwise, we want to remove all of the element's data
+		} else {
+			// Clean up the element expando
+			try {
+				delete elem[ expando ];
+			} catch(e){
+				// IE has trouble directly removing the expando
+				// but it's ok with using removeAttribute
+				if ( elem.removeAttribute )
+					elem.removeAttribute( expando );
+			}
+
+			// Completely remove the data cache
+			delete jQuery.cache[ id ];
+		}
+	},
+	queue: function( elem, type, data ) {
+		if ( elem ){
+	
+			type = (type || "fx") + "queue";
+	
+			var q = jQuery.data( elem, type );
+	
+			if ( !q || jQuery.isArray(data) )
+				q = jQuery.data( elem, type, jQuery.makeArray(data) );
+			else if( data )
+				q.push( data );
+	
+		}
+		return q;
+	},
+
+	dequeue: function( elem, type ){
+		var queue = jQuery.queue( elem, type ),
+			fn = queue.shift();
+		
+		if( !type || type === "fx" )
+			fn = queue[0];
+			
+		if( fn !== undefined )
+			fn.call(elem);
+	}
+});
+
+jQuery.fn.extend({
+	data: function( key, value ){
+		var parts = key.split(".");
+		parts[1] = parts[1] ? "." + parts[1] : "";
+
+		if ( value === undefined ) {
+			var data = this.triggerHandler("getData" + parts[1] + "!", [parts[0]]);
+
+			if ( data === undefined && this.length )
+				data = jQuery.data( this[0], key );
+
+			return data === undefined && parts[1] ?
+				this.data( parts[0] ) :
+				data;
+		} else
+			return this.trigger("setData" + parts[1] + "!", [parts[0], value]).each(function(){
+				jQuery.data( this, key, value );
+			});
+	},
+
+	removeData: function( key ){
+		return this.each(function(){
+			jQuery.removeData( this, key );
+		});
+	},
+	queue: function(type, data){
+		if ( typeof type !== "string" ) {
+			data = type;
+			type = "fx";
+		}
+
+		if ( data === undefined )
+			return jQuery.queue( this[0], type );
+
+		return this.each(function(){
+			var queue = jQuery.queue( this, type, data );
+			
+			 if( type == "fx" && queue.length == 1 )
+				queue[0].call(this);
+		});
+	},
+	dequeue: function(type){
+		return this.each(function(){
+			jQuery.dequeue( this, type );
+		});
+	}
+});/*!
+ * Sizzle CSS Selector Engine - v0.9.3
+ *  Copyright 2009, The Dojo Foundation
+ *  Released under the MIT, BSD, and GPL Licenses.
+ *  More information: http://sizzlejs.com/
+ */
+(function(){
+
+var chunker = /((?:\((?:\([^()]+\)|[^()]+)+\)|\[(?:\[[^[\]]*\]|['"][^'"]*['"]|[^[\]'"]+)+\]|\\.|[^ >+~,(\[\\]+)+|[>+~])(\s*,\s*)?/g, // splits a selector into parts; group 2 captures a trailing comma
+	done = 0, // counter that hands out the doneName / cache ids used below
+	toString = Object.prototype.toString; // cached for the "[object Array]" checks
+
+var Sizzle = function(selector, context, results, seed) {
+	results = results || []; // matches are appended here and this array is returned
+	context = context || document; // search root
+	// Only element (1) and document (9) nodes are accepted as context
+	if ( context.nodeType !== 1 && context.nodeType !== 9 )
+		return [];
+	
+	if ( !selector || typeof selector !== "string" ) {
+		return results;
+	}
+
+	var parts = [], m, set, checkSet, check, mode, extra, prune = true;
+	
+	// Reset the position of the chunker regexp (start from head)
+	chunker.lastIndex = 0;
+	// Split into parts; whatever follows the first comma is kept in extra
+	while ( (m = chunker.exec(selector)) !== null ) {
+		parts.push( m[1] );
+		
+		if ( m[2] ) {
+			extra = RegExp.rightContext;
+			break;
+		}
+	}
+	// Multi-part selectors containing a positional pseudo go through posProcess
+	if ( parts.length > 1 && origPOS.exec( selector ) ) {
+		if ( parts.length === 2 && Expr.relative[ parts[0] ] ) {
+			set = posProcess( parts[0] + parts[1], context );
+		} else {
+			set = Expr.relative[ parts[0] ] ?
+				[ context ] :
+				Sizzle( parts.shift(), context );
+
+			while ( parts.length ) {
+				selector = parts.shift();
+
+				if ( Expr.relative[ selector ] )
+					selector += parts.shift();
+
+				set = posProcess( selector, set );
+			}
+		}
+	} else {
+		var ret = seed ?
+			{ expr: parts.pop(), set: makeArray(seed) } :
+			Sizzle.find( parts.pop(), parts.length === 1 && context.parentNode ? context.parentNode : context, isXML(context) );
+		set = Sizzle.filter( ret.expr, ret.set );
+		// With parts left to check, work on a copy of set; otherwise skip pruning
+		if ( parts.length > 0 ) {
+			checkSet = makeArray(set);
+		} else {
+			prune = false;
+		}
+		// Consume the remaining parts from the right via the Expr.relative handlers
+		while ( parts.length ) {
+			var cur = parts.pop(), pop = cur;
+
+			if ( !Expr.relative[ cur ] ) {
+				cur = "";
+			} else {
+				pop = parts.pop();
+			}
+
+			if ( pop == null ) {
+				pop = context;
+			}
+
+			Expr.relative[ cur ]( checkSet, pop, isXML(context) );
+		}
+	}
+
+	if ( !checkSet ) {
+		checkSet = set;
+	}
+
+	if ( !checkSet ) {
+		throw "Syntax error, unrecognized expression: " + (cur || selector);
+	}
+	// When pruning, keep set[i] only where checkSet[i] survived the checks
+	if ( toString.call(checkSet) === "[object Array]" ) {
+		if ( !prune ) {
+			results.push.apply( results, checkSet );
+		} else if ( context.nodeType === 1 ) {
+			for ( var i = 0; checkSet[i] != null; i++ ) {
+				if ( checkSet[i] && (checkSet[i] === true || checkSet[i].nodeType === 1 && contains(context, checkSet[i])) ) {
+					results.push( set[i] );
+				}
+			}
+		} else {
+			for ( var i = 0; checkSet[i] != null; i++ ) {
+				if ( checkSet[i] && checkSet[i].nodeType === 1 ) {
+					results.push( set[i] );
+				}
+			}
+		}
+	} else {
+		makeArray( checkSet, results );
+	}
+	// Run the selector text after the comma too, then sort and drop duplicates
+	if ( extra ) {
+		Sizzle( extra, context, results, seed );
+
+		if ( sortOrder ) {
+			hasDuplicate = false;
+			results.sort(sortOrder);
+
+			if ( hasDuplicate ) {
+				for ( var i = 1; i < results.length; i++ ) {
+					if ( results[i] === results[i-1] ) {
+						results.splice(i--, 1);
+					}
+				}
+			}
+		}
+	}
+
+	return results;
+};
+
+Sizzle.matches = function(expr, set){ // run expr with set handed to Sizzle as the seed
+	return Sizzle(expr, null, null, set);
+};
+
+Sizzle.find = function(expr, context, isXML){
+	var set, match;
+
+	if ( !expr ) {
+		return [];
+	}
+
+	for ( var i = 0, l = Expr.order.length; i < l; i++ ) {
+		var type = Expr.order[i], match;
+		
+		if ( (match = Expr.match[ type ].exec( expr )) ) {
+			var left = RegExp.leftContext;
+
+			if ( left.substr( left.length - 1 ) !== "\\" ) {
+				match[1] = (match[1] || "").replace(/\\/g, "");
+				set = Expr.find[ type ]( match, context, isXML );
+				if ( set != null ) {
+					expr = expr.replace( Expr.match[ type ], "" );
+					break;
+				}
+			}
+		}
+	}
+
+	if ( !set ) {
+		set = context.getElementsByTagName("*");
+	}
+
+	return {set: set, expr: expr};
+};
+
+Sizzle.filter = function(expr, set, inplace, not){ // returns the surviving items; with inplace, failed slots of set become false
+	var old = expr, result = [], curLoop = set, match, anyFound,
+		isXMLFilter = set && set[0] && isXML(set[0]);
+	// Keep applying Expr.filter types found in expr until expr or set is used up
+	while ( expr && set.length ) {
+		for ( var type in Expr.filter ) {
+			if ( (match = Expr.match[ type ].exec( expr )) != null ) {
+				var filter = Expr.filter[ type ], found, item;
+				anyFound = false;
+				// curLoop aliasing result means an earlier pass produced it: start a fresh result
+				if ( curLoop == result ) {
+					result = [];
+				}
+
+				if ( Expr.preFilter[ type ] ) {
+					match = Expr.preFilter[ type ]( match, curLoop, inplace, result, not, isXMLFilter );
+					// A falsy match: the preFilter did the filtering itself; true: skip this type
+					if ( !match ) {
+						anyFound = found = true;
+					} else if ( match === true ) {
+						continue;
+					}
+				}
+				// Test every live item: inplace blanks failures, otherwise passes are collected
+				if ( match ) {
+					for ( var i = 0; (item = curLoop[i]) != null; i++ ) {
+						if ( item ) {
+							found = filter( item, match, i, curLoop );
+							var pass = not ^ !!found;
+
+							if ( inplace && found != null ) {
+								if ( pass ) {
+									anyFound = true;
+								} else {
+									curLoop[i] = false;
+								}
+							} else if ( pass ) {
+								result.push( item );
+								anyFound = true;
+							}
+						}
+					}
+				}
+				// A defined found means this filter type was applied: consume it from expr
+				if ( found !== undefined ) {
+					if ( !inplace ) {
+						curLoop = result;
+					}
+
+					expr = expr.replace( Expr.match[ type ], "" );
+
+					if ( !anyFound ) {
+						return [];
+					}
+
+					break;
+				}
+			}
+		}
+
+		// Improper expression
+		if ( expr == old ) {
+			if ( anyFound == null ) {
+				throw "Syntax error, unrecognized expression: " + expr;
+			} else {
+				break;
+			}
+		}
+
+		old = expr;
+	}
+
+	return curLoop;
+};
+
+var Expr = Sizzle.selectors = {
+	order: [ "ID", "NAME", "TAG" ], // finder types tried, in this order, by Sizzle.find
+	match: { // one pattern per selector piece; keys mirror Expr.find / preFilter / filter
+		ID: /#((?:[\w\u00c0-\uFFFF_-]|\\.)+)/,
+		CLASS: /\.((?:[\w\u00c0-\uFFFF_-]|\\.)+)/,
+		NAME: /\[name=['"]*((?:[\w\u00c0-\uFFFF_-]|\\.)+)['"]*\]/,
+		ATTR: /\[\s*((?:[\w\u00c0-\uFFFF_-]|\\.)+)\s*(?:(\S?=)\s*(['"]*)(.*?)\3|)\s*\]/, // 1: name, 2: operator, 4: value
+		TAG: /^((?:[\w\u00c0-\uFFFF\*_-]|\\.)+)/,
+		CHILD: /:(only|nth|last|first)-child(?:\((even|odd|[\dn+-]*)\))?/,
+		POS: /:(nth|eq|gt|lt|first|last|even|odd)(?:\((\d*)\))?(?=[^-]|$)/,
+		PSEUDO: /:((?:[\w\u00c0-\uFFFF_-]|\\.)+)(?:\((['"]*)((?:\([^\)]+\)|[^\2\(\)]*)+)\2\))?/ // 1: name, 3: argument
+	},
+	attrMap: { // attribute name -> property name, applied by preFilter.ATTR outside XML
+		"class": "className",
+		"for": "htmlFor"
+	},
+	attrHandle: { // per-attribute getters consulted by filter.ATTR
+		href: function(elem){
+			return elem.getAttribute("href");
+		}
+	},
+	relative: { // combinator handlers: each rewrites checkSet[i] in place to the related node or false
+		"+": function(checkSet, part, isXML){
+			var isPartStr = typeof part === "string",
+				isTag = isPartStr && !/\W/.test(part),
+				isPartStrNotTag = isPartStr && !isTag;
+			// Outside XML a plain tag name is compared upper-cased against nodeName
+			if ( isTag && !isXML ) {
+				part = part.toUpperCase();
+			}
+
+			for ( var i = 0, l = checkSet.length, elem; i < l; i++ ) {
+				if ( (elem = checkSet[i]) ) {
+					while ( (elem = elem.previousSibling) && elem.nodeType !== 1 ) {}
+					// elem is now the nearest preceding element sibling, if any
+					checkSet[i] = isPartStrNotTag || elem && elem.nodeName === part ?
+						elem || false :
+						elem === part;
+				}
+			}
+			// A non-tag selector string still has to be tested against those siblings
+			if ( isPartStrNotTag ) {
+				Sizzle.filter( part, checkSet, true );
+			}
+		},
+		">": function(checkSet, part, isXML){
+			var isPartStr = typeof part === "string";
+			// Plain tag name: compare each parent's nodeName directly
+			if ( isPartStr && !/\W/.test(part) ) {
+				part = isXML ? part : part.toUpperCase();
+
+				for ( var i = 0, l = checkSet.length; i < l; i++ ) {
+					var elem = checkSet[i];
+					if ( elem ) {
+						var parent = elem.parentNode;
+						checkSet[i] = parent.nodeName === part ? parent : false;
+					}
+				}
+			} else {
+				for ( var i = 0, l = checkSet.length; i < l; i++ ) {
+					var elem = checkSet[i];
+					if ( elem ) {
+						checkSet[i] = isPartStr ?
+							elem.parentNode :
+							elem.parentNode === part;
+					}
+				}
+				// Selector string: the parents collected above are filtered in place
+				if ( isPartStr ) {
+					Sizzle.filter( part, checkSet, true );
+				}
+			}
+		},
+		"": function(checkSet, part, isXML){ // no combinator symbol: walk up parentNode
+			var doneName = done++, checkFn = dirCheck;
+			// A plain tag name can use the cheaper nodeName comparison
+			if ( !part.match(/\W/) ) {
+				var nodeCheck = part = isXML ? part : part.toUpperCase();
+				checkFn = dirNodeCheck;
+			}
+
+			checkFn("parentNode", part, doneName, checkSet, nodeCheck, isXML);
+		},
+		"~": function(checkSet, part, isXML){ // walk back through previousSibling
+			var doneName = done++, checkFn = dirCheck;
+
+			if ( typeof part === "string" && !part.match(/\W/) ) {
+				var nodeCheck = part = isXML ? part : part.toUpperCase();
+				checkFn = dirNodeCheck;
+			}
+
+			checkFn("previousSibling", part, doneName, checkSet, nodeCheck, isXML);
+		}
+	},
+	find: { // finders called by Sizzle.find; a null/undefined result makes it try the next type
+		ID: function(match, context, isXML){
+			if ( typeof context.getElementById !== "undefined" && !isXML ) {
+				var m = context.getElementById(match[1]);
+				return m ? [m] : [];
+			}
+		},
+		NAME: function(match, context, isXML){
+			if ( typeof context.getElementsByName !== "undefined" ) {
+				var ret = [], results = context.getElementsByName(match[1]);
+				// Keep only nodes whose name attribute really equals the requested name
+				for ( var i = 0, l = results.length; i < l; i++ ) {
+					if ( results[i].getAttribute("name") === match[1] ) {
+						ret.push( results[i] );
+					}
+				}
+
+				return ret.length === 0 ? null : ret;
+			}
+		},
+		TAG: function(match, context){
+			return context.getElementsByTagName(match[1]);
+		}
+	},
+	preFilter: { // run by Sizzle.filter before Expr.filter; return the (rewritten) match, false when done here, true to skip
+		CLASS: function(match, curLoop, inplace, result, not, isXML){
+			match = " " + match[1].replace(/\\/g, "") + " ";
+			// XML: hand the padded class name on to filter.CLASS
+			if ( isXML ) {
+				return match;
+			}
+			// Otherwise test className right here and report the work as done
+			for ( var i = 0, elem; (elem = curLoop[i]) != null; i++ ) {
+				if ( elem ) {
+					if ( not ^ (elem.className && (" " + elem.className + " ").indexOf(match) >= 0) ) {
+						if ( !inplace )
+							result.push( elem );
+					} else if ( inplace ) {
+						curLoop[i] = false;
+					}
+				}
+			}
+
+			return false;
+		},
+		ID: function(match){
+			return match[1].replace(/\\/g, "");
+		},
+		TAG: function(match, curLoop){
+			for ( var i = 0; curLoop[i] === false; i++ ){} // skip slots already blanked to false
+			return curLoop[i] && isXML(curLoop[i]) ? match[1] : match[1].toUpperCase();
+		},
+		CHILD: function(match){
+			if ( match[1] == "nth" ) {
+				// parse equations like 'even', 'odd', '5', '2n', '3n+2', '4n-1', '-n+6'
+				var test = /(-?)(\d*)n((?:\+|-)?\d*)/.exec(
+					match[2] == "even" && "2n" || match[2] == "odd" && "2n+1" ||
+					!/\D/.test( match[2] ) && "0n+" + match[2] || match[2]);
+
+				// calculate the numbers (first)n+(last) including if they are negative
+				match[2] = (test[1] + (test[2] || 1)) - 0;
+				match[3] = test[3] - 0;
+			}
+
+			// TODO: Move to normal caching system
+			match[0] = done++;
+
+			return match;
+		},
+		ATTR: function(match, curLoop, inplace, result, not, isXML){
+			var name = match[1].replace(/\\/g, "");
+			// Outside XML, mapped attributes are looked up under their property name
+			if ( !isXML && Expr.attrMap[name] ) {
+				match[1] = Expr.attrMap[name];
+			}
+			// "~=" is a whole-word test, so the value is padded with spaces
+			if ( match[2] === "~=" ) {
+				match[4] = " " + match[4] + " ";
+			}
+
+			return match;
+		},
+		PSEUDO: function(match, curLoop, inplace, result, not){
+			if ( match[1] === "not" ) {
+				// If we're dealing with a complex expression, or a simple one
+				if ( match[3].match(chunker).length > 1 || /^\w/.test(match[3]) ) {
+					match[3] = Sizzle(match[3], null, null, curLoop);
+				} else {
+					var ret = Sizzle.filter(match[3], curLoop, inplace, true ^ not);
+					if ( !inplace ) {
+						result.push.apply( result, ret );
+					}
+					return false;
+				}
+			} else if ( Expr.match.POS.test( match[0] ) || Expr.match.CHILD.test( match[0] ) ) {
+				return true;
+			}
+			// Any other pseudo is passed through unchanged to filter.PSEUDO
+			return match;
+		},
+		POS: function(match){
+			match.unshift( true ); // shifts the captures up by one index
+			return match;
+		}
+	},
+	filters: {
+		enabled: function(elem){
+			return elem.disabled === false && elem.type !== "hidden";
+		},
+		disabled: function(elem){
+			return elem.disabled === true;
+		},
+		checked: function(elem){
+			return elem.checked === true;
+		},
+		selected: function(elem){
+			// Accessing this property makes selected-by-default
+			// options in Safari work properly
+			elem.parentNode.selectedIndex;
+			return elem.selected === true;
+		},
+		parent: function(elem){
+			return !!elem.firstChild;
+		},
+		empty: function(elem){
+			return !elem.firstChild;
+		},
+		has: function(elem, i, match){
+			return !!Sizzle( match[3], elem ).length;
+		},
+		header: function(elem){
+			return /h\d/i.test( elem.nodeName );
+		},
+		text: function(elem){
+			return "text" === elem.type;
+		},
+		radio: function(elem){
+			return "radio" === elem.type;
+		},
+		checkbox: function(elem){
+			return "checkbox" === elem.type;
+		},
+		file: function(elem){
+			return "file" === elem.type;
+		},
+		password: function(elem){
+			return "password" === elem.type;
+		},
+		submit: function(elem){
+			return "submit" === elem.type;
+		},
+		image: function(elem){
+			return "image" === elem.type;
+		},
+		reset: function(elem){
+			return "reset" === elem.type;
+		},
+		button: function(elem){
+			return "button" === elem.type || elem.nodeName.toUpperCase() === "BUTTON";
+		},
+		input: function(elem){
+			return /input|select|textarea|button/i.test(elem.nodeName);
+		}
+	},
+	setFilters: { // positional filters, called by filter.POS; i is the item's index in the set
+		first: function(elem, i){
+			return i === 0;
+		},
+		last: function(elem, i, match, array){
+			return i === array.length - 1;
+		},
+		even: function(elem, i){
+			return i % 2 === 0;
+		},
+		odd: function(elem, i){
+			return i % 2 === 1;
+		},
+		lt: function(elem, i, match){
+			return i < match[3] - 0; // "- 0" coerces the captured text to a number
+		},
+		gt: function(elem, i, match){
+			return i > match[3] - 0;
+		},
+		nth: function(elem, i, match){
+			return match[3] - 0 == i;
+		},
+		eq: function(elem, i, match){
+			return match[3] - 0 == i;
+		}
+	},
+	filter: {
+		PSEUDO: function(elem, match, i, array){
+			var name = match[1], filter = Expr.filters[ name ];
+
+			if ( filter ) {
+				return filter( elem, i, match, array );
+			} else if ( name === "contains" ) {
+				return (elem.textContent || elem.innerText || "").indexOf(match[3]) >= 0;
+			} else if ( name === "not" ) {
+				var not = match[3];
+
+				for ( var i = 0, l = not.length; i < l; i++ ) {
+					if ( not[i] === elem ) {
+						return false;
+					}
+				}
+
+				return true;
+			}
+		},
+		CHILD: function(elem, match){
+			var type = match[1], node = elem;
+			switch (type) {
+				case 'only':
+				case 'first':
+					while (node = node.previousSibling)  {
+						if ( node.nodeType === 1 ) return false;
+					}
+					if ( type == 'first') return true;
+					node = elem;
+				case 'last':
+					while (node = node.nextSibling)  {
+						if ( node.nodeType === 1 ) return false;
+					}
+					return true;
+				case 'nth':
+					var first = match[2], last = match[3];
+
+					if ( first == 1 && last == 0 ) {
+						return true;
+					}
+					
+					var doneName = match[0],
+						parent = elem.parentNode;
+	
+					if ( parent && (parent.sizcache !== doneName || !elem.nodeIndex) ) {
+						var count = 0;
+						for ( node = parent.firstChild; node; node = node.nextSibling ) {
+							if ( node.nodeType === 1 ) {
+								node.nodeIndex = ++count;
+							}
+						} 
+						parent.sizcache = doneName;
+					}
+					
+					var diff = elem.nodeIndex - last;
+					if ( first == 0 ) {
+						return diff == 0;
+					} else {
+						return ( diff % first == 0 && diff / first >= 0 );
+					}
+			}
+		},
+		ID: function(elem, match){
+			return elem.nodeType === 1 && elem.getAttribute("id") === match;
+		},
+		TAG: function(elem, match){
+			return (match === "*" && elem.nodeType === 1) || elem.nodeName === match;
+		},
+		CLASS: function(elem, match){
+			return (" " + (elem.className || elem.getAttribute("class")) + " ")
+				.indexOf( match ) > -1;
+		},
+		ATTR: function(elem, match){
+			var name = match[1],
+				result = Expr.attrHandle[ name ] ?
+					Expr.attrHandle[ name ]( elem ) :
+					elem[ name ] != null ?
+						elem[ name ] :
+						elem.getAttribute( name ),
+				value = result + "",
+				type = match[2],
+				check = match[4];
+
+			return result == null ?
+				type === "!=" :
+				type === "=" ?
+				value === check :
+				type === "*=" ?
+				value.indexOf(check) >= 0 :
+				type === "~=" ?
+				(" " + value + " ").indexOf(check) >= 0 :
+				!check ?
+				value && result !== false :
+				type === "!=" ?
+				value != check :
+				type === "^=" ?
+				value.indexOf(check) === 0 :
+				type === "$=" ?
+				value.substr(value.length - check.length) === check :
+				type === "|=" ?
+				value === check || value.substr(0, check.length + 1) === check + "-" :
+				false;
+		},
+		POS: function(elem, match, i, array){
+			var name = match[2], filter = Expr.setFilters[ name ];
+
+			if ( filter ) {
+				return filter( elem, i, match, array );
+			}
+		}
+	}
+};
+
+var origPOS = Expr.match.POS; // the POS pattern as written, before the loop below rewrites it
+// Extend every pattern with lookaheads that reject a match followed by a closing ] or )
+for ( var type in Expr.match ) {
+	Expr.match[ type ] = RegExp( Expr.match[ type ].source + /(?![^\[]*\])(?![^\(]*\))/.source );
+}
+
+var makeArray = function(array, results) {
+	array = Array.prototype.slice.call( array );
+
+	if ( results ) {
+		results.push.apply( results, array );
+		return results;
+	}
+	
+	return array;
+};
+
+// Perform a simple check to determine if the browser is capable of
+// converting a NodeList to an array using builtin methods.
+try {
+	Array.prototype.slice.call( document.documentElement.childNodes );
+
+// Provide a fallback method if it does not work
+} catch(e){
+	makeArray = function(array, results) {
+		var ret = results || [];
+
+		if ( toString.call(array) === "[object Array]" ) {
+			Array.prototype.push.apply( ret, array );
+		} else {
+			if ( typeof array.length === "number" ) {
+				for ( var i = 0, l = array.length; i < l; i++ ) {
+					ret.push( array[i] );
+				}
+			} else {
+				for ( var i = 0; array[i]; i++ ) {
+					ret.push( array[i] );
+				}
+			}
+		}
+
+		return ret;
+	};
+}
+
+var sortOrder;
+
+if ( document.documentElement.compareDocumentPosition ) {
+	sortOrder = function( a, b ) {
+		var ret = a.compareDocumentPosition(b) & 4 ? -1 : a === b ? 0 : 1;
+		if ( ret === 0 ) {
+			hasDuplicate = true;
+		}
+		return ret;
+	};
+} else if ( "sourceIndex" in document.documentElement ) {
+	sortOrder = function( a, b ) {
+		var ret = a.sourceIndex - b.sourceIndex;
+		if ( ret === 0 ) {
+			hasDuplicate = true;
+		}
+		return ret;
+	};
+} else if ( document.createRange ) {
+	sortOrder = function( a, b ) {
+		var aRange = a.ownerDocument.createRange(), bRange = b.ownerDocument.createRange();
+		aRange.selectNode(a);
+		aRange.collapse(true);
+		bRange.selectNode(b);
+		bRange.collapse(true);
+		var ret = aRange.compareBoundaryPoints(Range.START_TO_END, bRange);
+		if ( ret === 0 ) {
+			hasDuplicate = true;
+		}
+		return ret;
+	};
+}
+
+// Check to see if the browser returns elements by name when
+// querying by getElementById (and provide a workaround)
+(function(){
+	// We're going to inject a fake input element with a specified name
+	var form = document.createElement("form"),
+		id = "script" + (new Date).getTime();
+	form.innerHTML = "<input name='" + id + "'/>";
+
+	// Inject it into the root element, check its status, and remove it quickly
+	var root = document.documentElement;
+	root.insertBefore( form, root.firstChild );
+
+	// The workaround has to do additional checks after a getElementById
+	// Which slows things down for other browsers (hence the branching)
+	if ( !!document.getElementById( id ) ) {
+		Expr.find.ID = function(match, context, isXML){
+			if ( typeof context.getElementById !== "undefined" && !isXML ) {
+				var m = context.getElementById(match[1]);
+				return m ? m.id === match[1] || typeof m.getAttributeNode !== "undefined" && m.getAttributeNode("id").nodeValue === match[1] ? [m] : undefined : []; // undefined (id mismatch) sends Sizzle.find on to the next finder
+			}
+		};
+		// Compare against the id attribute node itself
+		Expr.filter.ID = function(elem, match){
+			var node = typeof elem.getAttributeNode !== "undefined" && elem.getAttributeNode("id");
+			return elem.nodeType === 1 && node && node.nodeValue === match;
+		};
+	}
+
+	root.removeChild( form );
+})();
+
+(function(){
+	// Check to see if the browser returns only elements
+	// when doing getElementsByTagName("*")
+
+	// Create a fake element
+	var div = document.createElement("div");
+	div.appendChild( document.createComment("") );
+
+	// Make sure no comments are found
+	if ( div.getElementsByTagName("*").length > 0 ) {
+		Expr.find.TAG = function(match, context){
+			var results = context.getElementsByTagName(match[1]);
+
+			// Filter out possible comments
+			if ( match[1] === "*" ) {
+				var tmp = [];
+				// Keep element nodes (nodeType 1) only
+				for ( var i = 0; results[i]; i++ ) {
+					if ( results[i].nodeType === 1 ) {
+						tmp.push( results[i] );
+					}
+				}
+
+				results = tmp;
+			}
+
+			return results;
+		};
+	}
+
+	// Check to see if an attribute returns normalized href attributes
+	div.innerHTML = "<a href='#'></a>";
+	if ( div.firstChild && typeof div.firstChild.getAttribute !== "undefined" &&
+			div.firstChild.getAttribute("href") !== "#" ) {
+		Expr.attrHandle.href = function(elem){
+			return elem.getAttribute("href", 2); // NOTE(review): presumably IE's flag for the value as written - confirm
+		};
+	}
+})();
+
+if ( document.querySelectorAll ) (function(){
+	var oldSizzle = Sizzle, div = document.createElement("div");
+	div.innerHTML = "<p class='TEST'></p>";
+
+	// Safari can't handle uppercase or unicode characters when
+	// in quirks mode.
+	if ( div.querySelectorAll && div.querySelectorAll(".TEST").length === 0 ) {
+		return;
+	}
+	// Replace Sizzle with a wrapper that tries the native engine first
+	Sizzle = function(query, context, extra, seed){
+		context = context || document;
+
+		// Only use querySelectorAll on non-XML documents
+		// (ID selectors don't work in non-HTML documents)
+		if ( !seed && context.nodeType === 9 && !isXML(context) ) {
+			try {
+				return makeArray( context.querySelectorAll(query), extra );
+			} catch(e){} // a selector the native engine rejects falls through to oldSizzle
+		}
+		
+		return oldSizzle(query, context, extra, seed);
+	};
+	// Carry the public members over to the wrapper
+	Sizzle.find = oldSizzle.find;
+	Sizzle.filter = oldSizzle.filter;
+	Sizzle.selectors = oldSizzle.selectors;
+	Sizzle.matches = oldSizzle.matches;
+})();
+
+if ( document.getElementsByClassName && document.documentElement.getElementsByClassName ) (function(){
+	var div = document.createElement("div");
+	div.innerHTML = "<div class='test e'></div><div class='test'></div>";
+
+	// Opera can't find a second classname (in 9.6)
+	if ( div.getElementsByClassName("e").length === 0 )
+		return;
+
+	// Safari caches class attributes, doesn't catch changes (in 3.2)
+	div.lastChild.className = "e";
+
+	if ( div.getElementsByClassName("e").length === 1 )
+		return;
+	// Both probes passed: register CLASS as a finder, tried right after ID
+	Expr.order.splice(1, 0, "CLASS");
+	Expr.find.CLASS = function(match, context, isXML) {
+		if ( typeof context.getElementsByClassName !== "undefined" && !isXML ) {
+			return context.getElementsByClassName(match[1]);
+		}
+	};
+})();
+
+function dirNodeCheck( dir, cur, doneName, checkSet, nodeCheck, isXML ) { // replaces checkSet[i] with the first node along dir whose nodeName is cur, else false
+	var sibDir = dir == "previousSibling" && !isXML;
+	for ( var i = 0, l = checkSet.length; i < l; i++ ) {
+		var elem = checkSet[i];
+		if ( elem ) {
+			if ( sibDir && elem.nodeType === 1 ){
+				elem.sizcache = doneName;
+				elem.sizset = i;
+			}
+			elem = elem[dir];
+			var match = false;
+			// Walk along dir; nodes visited in this run are tagged with doneName
+			while ( elem ) {
+				if ( elem.sizcache === doneName ) {
+					match = checkSet[elem.sizset];
+					break;
+				}
+				// Already tagged above? Then reuse the answer stored for that slot
+				if ( elem.nodeType === 1 && !isXML ){
+					elem.sizcache = doneName;
+					elem.sizset = i;
+				}
+
+				if ( elem.nodeName === cur ) {
+					match = elem;
+					break;
+				}
+
+				elem = elem[dir];
+			}
+
+			checkSet[i] = match;
+		}
+	}
+}
+
+function dirCheck( dir, cur, doneName, checkSet, nodeCheck, isXML ) { // like dirNodeCheck, but cur is a node or a selector string
+	var sibDir = dir == "previousSibling" && !isXML;
+	for ( var i = 0, l = checkSet.length; i < l; i++ ) {
+		var elem = checkSet[i];
+		if ( elem ) {
+			if ( sibDir && elem.nodeType === 1 ) {
+				elem.sizcache = doneName;
+				elem.sizset = i;
+			}
+			elem = elem[dir];
+			var match = false;
+			// Walk along dir; nodes visited in this run are tagged with doneName
+			while ( elem ) {
+				if ( elem.sizcache === doneName ) {
+					match = checkSet[elem.sizset];
+					break;
+				}
+
+				if ( elem.nodeType === 1 ) {
+					if ( !isXML ) {
+						elem.sizcache = doneName;
+						elem.sizset = i;
+					}
+					if ( typeof cur !== "string" ) { // node: identity test, the slot becomes true
+						if ( elem === cur ) {
+							match = true;
+							break;
+						}
+
+					} else if ( Sizzle.filter( cur, [elem] ).length > 0 ) { // selector: the slot becomes the matching node
+						match = elem;
+						break;
+					}
+				}
+
+				elem = elem[dir];
+			}
+
+			checkSet[i] = match;
+		}
+	}
+}
+
+var contains = document.compareDocumentPosition ?  function(a, b){
+	return a.compareDocumentPosition(b) & 16;
+} : function(a, b){
+	return a !== b && (a.contains ? a.contains(b) : true);
+};
+
+var isXML = function(elem){
+	return elem.nodeType === 9 && elem.documentElement.nodeName !== "HTML" ||
+		!!elem.ownerDocument && isXML( elem.ownerDocument );
+};
+
+var posProcess = function(selector, context){
+	var tmpSet = [], later = "", match,
+		root = context.nodeType ? [context] : context;
+
+	// Position selectors must be done after the filter
+	// And so must :not(positional) so we move all PSEUDOs to the end
+	while ( (match = Expr.match.PSEUDO.exec( selector )) ) {
+		later += match[0];
+		selector = selector.replace( Expr.match.PSEUDO, "" );
+	}
+
+	selector = Expr.relative[selector] ? selector + "*" : selector;
+
+	for ( var i = 0, l = root.length; i < l; i++ ) {
+		Sizzle( selector, root[i], tmpSet );
+	}
+
+	return Sizzle.filter( later, tmpSet );
+};
+
+// EXPOSE
+jQuery.find = Sizzle; // the selector engine itself
+jQuery.filter = Sizzle.filter;
+jQuery.expr = Sizzle.selectors;
+jQuery.expr[":"] = jQuery.expr.filters; // the pseudo filters are also reachable as jQuery.expr[":"]
+
+Sizzle.selectors.filters.hidden = function(elem){
+	return elem.offsetWidth === 0 || elem.offsetHeight === 0;
+};
+
+Sizzle.selectors.filters.visible = function(elem){
+	return elem.offsetWidth > 0 || elem.offsetHeight > 0;
+};
+
+Sizzle.selectors.filters.animated = function(elem){
+	return jQuery.grep(jQuery.timers, function(fn){
+		return elem === fn.elem;
+	}).length;
+};
+
+jQuery.multiFilter = function( expr, elems, not ) {
+	if ( not ) {
+		expr = ":not(" + expr + ")";
+	}
+
+	return Sizzle.matches(expr, elems);
+};
+
+jQuery.dir = function( elem, dir ){
+	var matched = [], cur = elem[dir];
+	while ( cur && cur != document ) {
+		if ( cur.nodeType == 1 )
+			matched.push( cur );
+		cur = cur[dir];
+	}
+	return matched;
+};
+
+jQuery.nth = function(cur, result, dir, elem){
+	result = result || 1;
+	var num = 0;
+
+	for ( ; cur; cur = cur[dir] )
+		if ( cur.nodeType == 1 && ++num == result )
+			break;
+
+	return cur;
+};
+
+jQuery.sibling = function(n, elem){
+	var r = [];
+
+	for ( ; n; n = n.nextSibling ) {
+		if ( n.nodeType == 1 && n != elem )
+			r.push( n );
+	}
+
+	return r;
+};
+
+return; // the assignment below is unreachable, so Sizzle is never set on window
+
+window.Sizzle = Sizzle;
+
+})();
+/*
+ * A number of helper functions used for managing events.
+ * Many of the ideas behind this code originated from
+ * Dean Edwards' addEvent library.
+ */
+jQuery.event = {
+
+	// Bind an event to an element
+	// Original by Dean Edwards
+	add: function(elem, types, handler, data) { // types: whitespace-separated event names, each optionally followed by .namespaces
+		if ( elem.nodeType == 3 || elem.nodeType == 8 )
+			return;
+
+		// For whatever reason, IE has trouble passing the window object
+		// around, causing it to be cloned in the process
+		if ( elem.setInterval && elem != window )
+			elem = window;
+
+		// Make sure that the function being executed has a unique ID
+		if ( !handler.guid )
+			handler.guid = this.guid++;
+
+		// if data is passed, bind to handler
+		if ( data !== undefined ) {
+			// Create temporary function pointer to original handler
+			var fn = handler;
+
+			// Create unique handler function, wrapped around original handler
+			handler = this.proxy( fn );
+
+			// Store data in unique handler
+			handler.data = data;
+		}
+
+		// Init the element's event structure
+		var events = jQuery.data(elem, "events") || jQuery.data(elem, "events", {}),
+			handle = jQuery.data(elem, "handle") || jQuery.data(elem, "handle", function(){
+				// Handle the second event of a trigger and when
+				// an event is called after a page has unloaded
+				return typeof jQuery !== "undefined" && !jQuery.event.triggered ?
+					jQuery.event.handle.apply(arguments.callee.elem, arguments) :
+					undefined;
+			});
+		// Add elem as a property of the handle function
+		// This is to prevent a memory leak with non-native
+		// event in IE.
+		handle.elem = elem;
+
+		// Handle multiple events separated by a space
+		// jQuery(...).bind("mouseover mouseout", fn);
+		jQuery.each(types.split(/\s+/), function(index, type) {
+			// Namespaced event handlers
+			var namespaces = type.split(".");
+			type = namespaces.shift();
+			handler.type = namespaces.slice().sort().join(".");
+			// NOTE(review): handler.type is overwritten for every name in types - confirm that is intended
+			// Get the current list of functions bound to this event
+			var handlers = events[type];
+			
+			if ( jQuery.event.specialAll[type] )
+				jQuery.event.specialAll[type].setup.call(elem, data, namespaces);
+
+			// Init the event handler queue
+			if (!handlers) {
+				handlers = events[type] = {};
+
+				// Check for a special event handler
+				// Only use addEventListener/attachEvent if the special
+				// events handler returns false
+				if ( !jQuery.event.special[type] || jQuery.event.special[type].setup.call(elem, data, namespaces) === false ) {
+					// Bind the global event handler to the element
+					if (elem.addEventListener)
+						elem.addEventListener(type, handle, false);
+					else if (elem.attachEvent)
+						elem.attachEvent("on" + type, handle);
+				}
+			}
+
+			// Add the function to the element's handler list
+			handlers[handler.guid] = handler;
+
+			// Keep track of which events have been used, for global triggering
+			jQuery.event.global[type] = true;
+		});
+
+		// Nullify elem to prevent memory leaks in IE
+		elem = null;
+	},
+
+	guid: 1,
+	global: {},
+
+	// Detach an event or set of events from an element
+	remove: function(elem, types, handler) {
+		// don't do events on text and comment nodes
+		if ( elem.nodeType == 3 || elem.nodeType == 8 )
+			return;
+
+		var events = jQuery.data(elem, "events"), ret, index;
+
+		if ( events ) {
+			// Unbind all events for the element
+			if ( types === undefined || (typeof types === "string" && types.charAt(0) == ".") )
+				for ( var type in events )
+					this.remove( elem, type + (types || "") );
+			else {
+				// types is actually an event object here
+				if ( types.type ) {
+					handler = types.handler;
+					types = types.type;
+				}
+
+				// Handle multiple events seperated by a space
+				// jQuery(...).unbind("mouseover mouseout", fn);
+				jQuery.each(types.split(/\s+/), function(index, type){
+					// Namespaced event handlers
+					var namespaces = type.split(".");
+					type = namespaces.shift();
+					var namespace = RegExp("(^|\\.)" + namespaces.slice().sort().join(".*\\.") + "(\\.|$)");
+
+					if ( events[type] ) {
+						// remove the given handler for the given type
+						if ( handler )
+							delete events[type][handler.guid];
+
+						// remove all handlers for the given type
+						else
+							for ( var handle in events[type] )
+								// Handle the removal of namespaced events
+								if ( namespace.test(events[type][handle].type) )
+									delete events[type][handle];
+									
+						if ( jQuery.event.specialAll[type] )
+							jQuery.event.specialAll[type].teardown.call(elem, namespaces);
+
+						// remove generic event handler if no more handlers exist
+						for ( ret in events[type] ) break;
+						if ( !ret ) {
+							if ( !jQuery.event.special[type] || jQuery.event.special[type].teardown.call(elem, namespaces) === false ) {
+								if (elem.removeEventListener)
+									elem.removeEventListener(type, jQuery.data(elem, "handle"), false);
+								else if (elem.detachEvent)
+									elem.detachEvent("on" + type, jQuery.data(elem, "handle"));
+							}
+							ret = null;
+							delete events[type];
+						}
+					}
+				});
+			}
+
+			// Remove the expando if it's no longer used
+			for ( ret in events ) break;
+			if ( !ret ) {
+				var handle = jQuery.data( elem, "handle" );
+				if ( handle ) handle.elem = null;
+				jQuery.removeData( elem, "events" );
+				jQuery.removeData( elem, "handle" );
+			}
+		}
+	},
+
+	// Trigger an event on elem, or (when elem is omitted) on every cached element that has handlers for the type. event: type string, object literal or jQuery.Event; data: extra arguments passed to handlers after the event object. bubbling is internal: it is true only on the recursive call that walks up to the parent.
+	trigger: function( event, data, elem, bubbling ) {
+		// Event object or event type
+		var type = event.type || event;
+
+		if( !bubbling ){
+			event = typeof event === "object" ?
+				// jQuery.Event object
+				event[expando] ? event :
+				// Object literal
+				jQuery.extend( jQuery.Event(type), event ) :
+				// Just the event type (string)
+				jQuery.Event(type);
+
+			if ( type.indexOf("!") >= 0 ) { // a "!" marks an exclusive trigger; the last character is dropped from the type
+				event.type = type = type.slice(0, -1);
+				event.exclusive = true;
+			}
+
+			// Handle a global trigger
+			if ( !elem ) {
+				// Don't bubble custom events when global (to avoid too much overhead)
+				event.stopPropagation();
+				// Only trigger if we've ever bound an event for it
+				if ( this.global[type] )
+					jQuery.each( jQuery.cache, function(){
+						if ( this.events && this.events[type] )
+							jQuery.event.trigger( event, data, this.handle.elem );
+					});
+			}
+
+			// Handle triggering a single element
+
+			// don't do events on text and comment nodes (a global trigger, which has no elem, also ends here)
+			if ( !elem || elem.nodeType == 3 || elem.nodeType == 8 )
+				return undefined;
+			
+			// Clean up in case it is reused
+			event.result = undefined;
+			event.target = elem;
+			
+			// Clone the incoming data, if any, and put the event object in front of it
+			data = jQuery.makeArray(data);
+			data.unshift( event );
+		}
+
+		event.currentTarget = elem;
+
+		// Trigger the event, it is assumed that "handle" is a function
+		var handle = jQuery.data(elem, "handle");
+		if ( handle )
+			handle.apply( elem, data );
+
+		// Handle triggering native .onfoo handlers (and on links since we don't call .click() for links)
+		if ( (!elem[type] || (jQuery.nodeName(elem, 'a') && type == "click")) && elem["on"+type] && elem["on"+type].apply( elem, data ) === false )
+			event.result = false;
+
+		// Trigger the native events (except for clicks on links); only on the original target, never while bubbling
+		if ( !bubbling && elem[type] && !event.isDefaultPrevented() && !(jQuery.nodeName(elem, 'a') && type == "click") ) {
+			this.triggered = true;
+			try {
+				elem[ type ]();
+			// prevent IE from throwing an error for some hidden elements
+			} catch (e) {}
+		}
+
+		this.triggered = false;
+
+		if ( !event.isPropagationStopped() ) { // bubble manually: re-trigger on the parent node, or on the owner document at the top
+			var parent = elem.parentNode || elem.ownerDocument;
+			if ( parent )
+				jQuery.event.trigger(event, data, parent, true);
+		}
+	},
+
+	handle: function(event) {
+		// Runs with this = the element: normalizes the event through fix(), then calls the handlers stored for event.type whose namespace matches
+		var all, handlers;
+
+		event = arguments[0] = jQuery.event.fix( event || window.event );
+		event.currentTarget = this;
+		
+		// Namespaced event handlers
+		var namespaces = event.type.split(".");
+		event.type = namespaces.shift();
+
+		// Cache this now, all = true means, any handler
+		all = !namespaces.length && !event.exclusive;
+		
+		var namespace = RegExp("(^|\\.)" + namespaces.slice().sort().join(".*\\.") + "(\\.|$)");
+
+		handlers = ( jQuery.data(this, "events") || {} )[event.type];
+
+		for ( var j in handlers ) {
+			var handler = handlers[j];
+
+			// Filter the functions by class
+			if ( all || namespace.test(handler.type) ) {
+				// Pass in a reference to the handler function itself
+				// So that we can later remove it
+				event.handler = handler;
+				event.data = handler.data;
+
+				var ret = handler.apply(this, arguments);
+
+				if( ret !== undefined ){ // any defined return value becomes event.result
+					event.result = ret;
+					if ( ret === false ) { // returning false both prevents the default and stops propagation
+						event.preventDefault();
+						event.stopPropagation();
+					}
+				}
+
+				if( event.isImmediatePropagationStopped() ) // skip the remaining handlers on this element
+					break;
+
+			}
+		}
+	},
+
+	props: "altKey attrChange attrName bubbles button cancelable charCode clientX clientY ctrlKey currentTarget data detail eventPhase fromElement handler keyCode metaKey newValue originalTarget pageX pageY prevValue relatedNode relatedTarget screenX screenY shiftKey srcElement target toElement view wheelDelta which".split(" "), // property names fix() copies from the native event
+
+	fix: function(event) {
+		if ( event[expando] ) // already a jQuery.Event (the constructor marks instances with the expando)
+			return event;
+
+		// store a copy of the original event object
+		// and "clone" to set read-only properties
+		var originalEvent = event;
+		event = jQuery.Event( originalEvent );
+
+		for ( var i = this.props.length, prop; i; ){ // walk props from last to first
+			prop = this.props[ --i ];
+			event[ prop ] = originalEvent[ prop ];
+		}
+
+		// Fix target property, if necessary
+		if ( !event.target )
+			event.target = event.srcElement || document; // Fixes #1925 where srcElement might not be defined either
+
+		// check if target is a textnode (safari)
+		if ( event.target.nodeType == 3 )
+			event.target = event.target.parentNode;
+
+		// Add relatedTarget, if necessary
+		if ( !event.relatedTarget && event.fromElement )
+			event.relatedTarget = event.fromElement == event.target ? event.toElement : event.fromElement;
+
+		// Calculate pageX/Y if missing and clientX/Y available
+		if ( event.pageX == null && event.clientX != null ) {
+			var doc = document.documentElement, body = document.body;
+			event.pageX = event.clientX + (doc && doc.scrollLeft || body && body.scrollLeft || 0) - (doc.clientLeft || 0);
+			event.pageY = event.clientY + (doc && doc.scrollTop || body && body.scrollTop || 0) - (doc.clientTop || 0);
+		}
+
+		// Add which for key events (charCode wins when it is non-zero, otherwise keyCode)
+		if ( !event.which && ((event.charCode || event.charCode === 0) ? event.charCode : event.keyCode) )
+			event.which = event.charCode || event.keyCode;
+
+		// Add metaKey to non-Mac browsers (use ctrl for PC's and Meta for Macs)
+		if ( !event.metaKey && event.ctrlKey )
+			event.metaKey = event.ctrlKey;
+
+		// Add which for click: 1 == left; 2 == middle; 3 == right
+		// Note: button is not normalized, so don't use it
+		if ( !event.which && event.button )
+			event.which = (event.button & 1 ? 1 : ( event.button & 2 ? 3 : ( event.button & 4 ? 2 : 0 ) ));
+
+		return event;
+	},
+
+	proxy: function( fn, proxy ){ // proxy is optional; the default wrapper forwards this and arguments to fn
+		proxy = proxy || function(){ return fn.apply(this, arguments); };
+		// Give proxy and fn the same guid (reusing an existing one, else allocating a new one) so the proxy can be removed through the original handler
+		proxy.guid = fn.guid = fn.guid || proxy.guid || this.guid++;
+		// So proxy can be declared as an argument
+		return proxy;
+	},
+
+	special: { // per-type hooks; remove() calls teardown once the last handler of the type is gone
+		ready: {
+			// Make sure the ready event is setup
+			setup: bindReady,
+			teardown: function() {} // nothing to undo; returns undefined, so remove() skips its own native-listener removal
+		}
+	},
+	
+	specialAll: { // per-type hooks whose teardown remove() calls on every removal of that type, not only the last one
+		live: {
+			setup: function( selector, namespaces ){ // this = element; namespaces[0] is the real event type to listen for
+				jQuery.event.add( this, namespaces[0], liveHandler );
+			},
+			teardown:  function( namespaces ){
+				if ( namespaces.length ) {
+					var remove = 0, name = RegExp("(^|\\.)" + namespaces[0] + "(\\.|$)"); // remove counts the live handlers still registered for this event type
+					
+					jQuery.each( (jQuery.data(this, "events").live || {}), function(){
+						if ( name.test(this.type) )
+							remove++;
+					});
+					
+					if ( remove < 1 ) // none left: drop the shared liveHandler for that type
+						jQuery.event.remove( this, namespaces[0], liveHandler );
+				}
+			}
+		}
+	}
+};
+
+jQuery.Event = function( src ){ // src: an event object (anything with a .type) or an event type string
+	// Allow instantiation without the 'new' keyword
+	if( !this.preventDefault )
+		return new jQuery.Event(src);
+	
+	// Event object
+	if( src && src.type ){
+		this.originalEvent = src;
+		this.type = src.type;
+	// Event type
+	}else
+		this.type = src;
+
+	// timeStamp is buggy for some events on Firefox(#3843)
+	// So we won't rely on the native value
+	this.timeStamp = now();
+	
+	// Mark it as fixed (fix() and trigger() test this flag to recognise a jQuery.Event)
+	this[expando] = true;
+};
+
+function returnFalse(){ // prototype default for the is*() predicates of jQuery.Event
+	return false;
+}
+function returnTrue(){ // installed on an event instance by preventDefault/stopPropagation/stopImmediatePropagation
+	return true;
+}
+
+// jQuery.Event is based on DOM3 Events as specified by the ECMAScript Language Binding
+// http://www.w3.org/TR/2003/WD-DOM-Level-3-Events-20030331/ecma-script-binding.html
+jQuery.Event.prototype = {
+	preventDefault: function() {
+		this.isDefaultPrevented = returnTrue;
+
+		var e = this.originalEvent;
+		if( !e ) // synthetic event: there is no native event to update
+			return;
+		// if preventDefault exists run it on the original event
+		if (e.preventDefault)
+			e.preventDefault();
+		// also set the returnValue property of the original event to false (IE); this runs whether or not preventDefault exists
+		e.returnValue = false;
+	},
+	stopPropagation: function() {
+		this.isPropagationStopped = returnTrue;
+
+		var e = this.originalEvent;
+		if( !e ) // synthetic event: there is no native event to update
+			return;
+		// if stopPropagation exists run it on the original event
+		if (e.stopPropagation)
+			e.stopPropagation();
+		// also set the cancelBubble property of the original event to true (IE); this runs whether or not stopPropagation exists
+		e.cancelBubble = true;
+	},
+	stopImmediatePropagation:function(){ // handle() checks the flag after each handler and stops calling the rest
+		this.isImmediatePropagationStopped = returnTrue;
+		this.stopPropagation();
+	},
+	isDefaultPrevented: returnFalse,
+	isPropagationStopped: returnFalse,
+	isImmediatePropagationStopped: returnFalse
+};
+// Checks if an event happened on an element within another element
+// Used in jQuery.event.special.mouseenter and mouseleave handlers (bound to mouseover/mouseout with the fixed type as event.data)
+var withinElement = function(event) {
+	// Check if mouse(over|out) are still within the same parent element
+	var parent = event.relatedTarget;
+	// Traverse up the tree until we reach this element or run out of ancestors
+	while ( parent && parent != this )
+		try { parent = parent.parentNode; }
+		catch(e) { parent = this; } // reading parentNode threw: treat the related target as being inside this element
+	
+	if( parent != this ){
+		// set the correct event type
+		event.type = event.data;
+		// handle event if we actually just moused on to a non sub-element
+		jQuery.event.handle.apply( this, arguments );
+	}
+};
+	
+jQuery.each({ // native event -> emulated event registered under jQuery.event.special
+	mouseover: 'mouseenter', 
+	mouseout: 'mouseleave'
+}, function( orig, fix ){
+	jQuery.event.special[ fix ] = {
+		setup: function(){ // listen to the native event; the emulated type travels as handler data
+			jQuery.event.add( this, orig, withinElement, fix );
+		},
+		teardown: function(){
+			jQuery.event.remove( this, orig, withinElement );
+		}
+	};			   
+});
+
+jQuery.fn.extend({
+	bind: function( type, data, fn ) { // data is optional: with two arguments the second one is the handler; "unload" is routed through one()
+		return type == "unload" ? this.one(type, data, fn) : this.each(function(){
+			jQuery.event.add( this, type, fn || data, fn && data );
+		});
+	},
+
+	one: function( type, data, fn ) { // like bind, but the wrapper unbinds itself before calling the handler
+		var one = jQuery.event.proxy( fn || data, function(event) {
+			jQuery(this).unbind(event, one); // the event object is passed as "types"; remove() reads type and handler from it
+			return (fn || data).apply( this, arguments );
+		});
+		return this.each(function(){
+			jQuery.event.add( this, type, one, fn && data);
+		});
+	},
+
+	unbind: function( type, fn ) {
+		return this.each(function(){
+			jQuery.event.remove( this, type, fn );
+		});
+	},
+
+	trigger: function( type, data ) {
+		return this.each(function(){
+			jQuery.event.trigger( type, data, this );
+		});
+	},
+
+	triggerHandler: function( type, data ) { // first matched element only, with default action and propagation cancelled up front; returns event.result (undefined for an empty set)
+		if( this[0] ){
+			var event = jQuery.Event(type);
+			event.preventDefault();
+			event.stopPropagation();
+			jQuery.event.trigger( event, data, this[0] );
+			return event.result;
+		}		
+	},
+
+	toggle: function( fn ) { // click handler that cycles through all the functions passed as arguments
+		// Save reference to arguments for access in closure
+		var args = arguments, i = 1;
+
+		// link all the functions, so any of them can unbind this click handler
+		while( i < args.length )
+			jQuery.event.proxy( fn, args[i++] );
+
+		return this.click( jQuery.event.proxy( fn, function(event) {
+			// Figure out which function to execute (i now equals args.length, so the index wraps around)
+			this.lastToggle = ( this.lastToggle || 0 ) % i;
+
+			// Make sure that clicks stop
+			event.preventDefault();
+
+			// and execute the function
+			return args[ this.lastToggle++ ].apply( this, arguments ) || false;
+		}));
+	},
+
+	hover: function(fnOver, fnOut) {
+		return this.mouseenter(fnOver).mouseleave(fnOut);
+	},
+
+	ready: function(fn) {
+		// Attach the listeners
+		bindReady();
+
+		// If the DOM is already ready
+		if ( jQuery.isReady )
+			// Execute the function immediately
+			fn.call( document, jQuery );
+
+		// Otherwise, remember the function for later
+		else
+			// Add the function to the wait list
+			jQuery.readyList.push( fn );
+
+		return this;
+	},
+	
+	live: function( type, fn ){ // binds on document under the namespaced type built by liveConvert, with the selector as event data
+		var proxy = jQuery.event.proxy( fn );
+		proxy.guid += this.selector + type; // die() rebuilds this same composite guid to find the handler
+
+		jQuery(document).bind( liveConvert(type, this.selector), this.selector, proxy );
+
+		return this;
+	},
+	
+	die: function( type, fn ){ // without fn, every live handler for this selector/type is unbound
+		jQuery(document).unbind( liveConvert(type, this.selector), fn ? { guid: fn.guid + this.selector + type } : null );
+		return this;
+	}
+});
+
+function liveHandler( event ){ // handler installed by specialAll.live.setup; dispatches to the live handlers whose selector matches event.target or one of its ancestors
+	var check = RegExp("(^|\\.)" + event.type + "(\\.|$)"),
+		stop = true,
+		elems = [];
+
+	jQuery.each(jQuery.data(this, "events").live || [], function(i, fn){
+		if ( check.test(fn.type) ) {
+			var elem = jQuery(event.target).closest(fn.data)[0]; // fn.data is the selector passed as event data by live()
+			if ( elem )
+				elems.push({ elem: elem, fn: fn });
+		}
+	});
+
+	elems.sort(function(a,b) { // order by the "closest" value stored on each element (presumably written by .closest() - confirm)
+		return jQuery.data(a.elem, "closest") - jQuery.data(b.elem, "closest");
+	});
+	
+	jQuery.each(elems, function(){
+		if ( this.fn.call(this.elem, event, this.fn.data) === false )
+			return (stop = false); // a handler returned false: stop calling the rest and return false ourselves
+	});
+
+	return stop; // despite the name: true unless some handler returned false
+}
+
+function liveConvert(type, selector){ // builds "live.<type>.<selector>", with every "." in the selector replaced by "`" and every space by "|"
+	return ["live", type, selector.replace(/\./g, "`").replace(/ /g, "|")].join(".");
+}
+
+jQuery.extend({
+	isReady: false, // set to true by ready() the first time it runs
+	readyList: [], // callbacks queued by jQuery.fn.ready; replaced by null once they have run
+	// Handle when the DOM is ready (later calls are no-ops)
+	ready: function() {
+		// Make sure that the DOM is not already loaded
+		if ( !jQuery.isReady ) {
+			// Remember that the DOM is ready
+			jQuery.isReady = true;
+
+			// If there are functions bound, to execute
+			if ( jQuery.readyList ) {
+				// Execute all of them with this = document and jQuery as the argument
+				jQuery.each( jQuery.readyList, function(){
+					this.call( document, jQuery );
+				});
+
+				// Reset the list of functions
+				jQuery.readyList = null;
+			}
+
+			// Trigger any bound ready events
+			jQuery(document).triggerHandler("ready");
+		}
+	}
+});
+
+var readyBound = false; // guards bindReady so the listeners are attached only once
+
+function bindReady(){
+	if ( readyBound ) return;
+	readyBound = true;
+
+	// Mozilla, Opera and webkit nightlies currently support this event
+	if ( document.addEventListener ) {
+		// Use the handy event callback (the listener removes itself via arguments.callee)
+		document.addEventListener( "DOMContentLoaded", function(){
+			document.removeEventListener( "DOMContentLoaded", arguments.callee, false );
+			jQuery.ready();
+		}, false );
+
+	// If IE event model is used
+	} else if ( document.attachEvent ) {
+		// ensure firing before onload,
+		// maybe late but safe also for iframes
+		document.attachEvent("onreadystatechange", function(){
+			if ( document.readyState === "complete" ) {
+				document.detachEvent( "onreadystatechange", arguments.callee );
+				jQuery.ready();
+			}
+		});
+
+		// If IE and not an iframe
+		// continually check to see if the document is ready
+		if ( document.documentElement.doScroll && window == window.top ) (function(){
+			if ( jQuery.isReady ) return;
+
+			try {
+				// If IE is used, use the trick by Diego Perini
+				// http://javascript.nwbox.com/IEContentLoaded/
+				document.documentElement.doScroll("left");
+			} catch( error ) {
+				setTimeout( arguments.callee, 0 ); // doScroll threw: retry on the next timer tick
+				return;
+			}
+
+			// and execute any waiting functions
+			jQuery.ready();
+		})();
+	}
+
+	// A fallback to window.onload, that will always work
+	jQuery.event.add( window, "load", jQuery.ready );
+}
+
+jQuery.each( ("blur,focus,load,resize,scroll,unload,click,dblclick," +
+	"mousedown,mouseup,mousemove,mouseover,mouseout,mouseenter,mouseleave," +
+	"change,select,submit,keydown,keypress,keyup,error").split(","), function(i, name){
+
+	// Handle event binding: with a function the shortcut binds it, without one it triggers the event
+	jQuery.fn[name] = function(fn){
+		return fn ? this.bind(name, fn) : this.trigger(name);
+	};
+});
+
+// Prevent memory leaks in IE
+// And prevent errors on refresh with events like mouseover in other browsers
+// Window isn't included so as not to unbind existing unload events
+jQuery( window ).bind( 'unload', function(){ 
+	for ( var id in jQuery.cache )
+		// Skip the window
+		if ( id != 1 && jQuery.cache[ id ].handle )
+			jQuery.event.remove( jQuery.cache[ id ].handle.elem ); // no types argument: removes every handler bound on that element
+}); 
+(function(){
+
+	jQuery.support = {}; // stays empty if the basic test markup below cannot be built
+
+	var root = document.documentElement,
+		script = document.createElement("script"),
+		div = document.createElement("div"),
+		id = "script" + (new Date).getTime(); // name of the window property the injected script will set
+
+	div.style.display = "none";
+	div.innerHTML = '   <link/><table></table><a href="/a" style="color:red;float:left;opacity:.5;">a</a><select><option>text</option></select><object><param/></object>';
+
+	var all = div.getElementsByTagName("*"),
+		a = div.getElementsByTagName("a")[0];
+
+	// Can't get basic test support
+	if ( !all || !all.length || !a ) {
+		return;
+	}
+
+	jQuery.support = {
+		// IE strips leading whitespace when .innerHTML is used
+		leadingWhitespace: div.firstChild.nodeType == 3,
+		
+		// Make sure that tbody elements aren't automatically inserted
+		// IE will insert them into empty tables
+		tbody: !div.getElementsByTagName("tbody").length,
+		
+		// Make sure that you can get all elements in an <object> element
+		// IE 7 always returns no results
+		objectAll: !!div.getElementsByTagName("object")[0]
+			.getElementsByTagName("*").length,
+		
+		// Make sure that link elements get serialized correctly by innerHTML
+		// This requires a wrapper element in IE
+		htmlSerialize: !!div.getElementsByTagName("link").length,
+		
+		// Get the style information from getAttribute
+		// (IE uses .cssText instead)
+		style: /red/.test( a.getAttribute("style") ),
+		
+		// Make sure that URLs aren't manipulated
+		// (IE normalizes it by default)
+		hrefNormalized: a.getAttribute("href") === "/a",
+		
+		// Make sure that element opacity exists
+		// (IE uses filter instead)
+		opacity: a.style.opacity === "0.5",
+		
+		// Verify style float existence
+		// (IE uses styleFloat instead of cssFloat)
+		cssFloat: !!a.style.cssFloat,
+
+		// Will be defined later
+		scriptEval: false,
+		noCloneEvent: true,
+		boxModel: null
+	};
+	
+	script.type = "text/javascript";
+	try {
+		script.appendChild( document.createTextNode( "window." + id + "=1;" ) );
+	} catch(e){}
+
+	root.insertBefore( script, root.firstChild );
+	
+	// Make sure that the execution of code works by injecting a script
+	// tag with appendChild/createTextNode
+	// (IE doesn't support this, fails, and uses .text instead)
+	if ( window[ id ] ) {
+		jQuery.support.scriptEval = true;
+		delete window[ id ];
+	}
+
+	root.removeChild( script );
+
+	if ( div.attachEvent && div.fireEvent ) {
+		div.attachEvent("onclick", function(){
+			// Cloning a node shouldn't copy over any
+			// bound event handlers (IE does this)
+			jQuery.support.noCloneEvent = false;
+			div.detachEvent("onclick", arguments.callee);
+		});
+		div.cloneNode(true).fireEvent("onclick"); // if the clone fires the handler attached to the original, handlers were copied
+	}
+
+	// Figure out if the W3C box model works as expected
+	// document.body must exist before we can do this
+	jQuery(function(){
+		var div = document.createElement("div");
+		div.style.width = div.style.paddingLeft = "1px";
+
+		document.body.appendChild( div );
+		jQuery.boxModel = jQuery.support.boxModel = div.offsetWidth === 2; // 1px width + 1px padding measures 2px when padding is added to the width
+		document.body.removeChild( div ).style.display = 'none';
+	});
+})();
+
+var styleFloat = jQuery.support.cssFloat ? "cssFloat" : "styleFloat"; // whichever float style property the feature test above found
+
+jQuery.props = { // attribute/style name -> the DOM property name to use for it
+	"for": "htmlFor",
+	"class": "className",
+	"float": styleFloat,
+	cssFloat: styleFloat,
+	styleFloat: styleFloat,
+	readonly: "readOnly",
+	maxlength: "maxLength",
+	cellspacing: "cellSpacing",
+	rowspan: "rowSpan",
+	tabindex: "tabIndex"
+};
+jQuery.fn.extend({
+	// Keep a copy of the old load
+	_load: jQuery.fn.load,
+
+	load: function( url, params, callback ) {
+		if ( typeof url !== "string" )
+			return this._load( url );
+
+		var off = url.indexOf(" ");
+		if ( off >= 0 ) {
+			var selector = url.slice(off, url.length);
+			url = url.slice(0, off);
+		}
+
+		// Default to a GET request
+		var type = "GET";
+
+		// If the second parameter was provided
+		if ( params )
+			// If it's a function
+			if ( jQuery.isFunction( params ) ) {
+				// We assume that it's the callback
+				callback = params;
+				params = null;
+
+			// Otherwise, build a param string
+			} else if( typeof params === "object" ) {
+				params = jQuery.param( params );
+				type = "POST";
+			}
+
+		var self = this;
+
+		// Request the remote document
+		jQuery.ajax({
+			url: url,
+			type: type,
+			dataType: "html",
+			data: params,
+			complete: function(res, status){
+				// If successful, inject the HTML into all the matched elements
+				if ( status == "success" || status == "notmodified" )
+					// See if a selector was specified
+					self.html( selector ?
+						// Create a dummy div to hold the results
+						jQuery("<div/>")
+							// inject the contents of the document in, removing the scripts
+							// to avoid any 'Permission Denied' errors in IE
+							.append(res.responseText.replace(/<script(.|\s)*?\/script>/g, ""))
+
+							// Locate the specified elements
+							.find(selector) :
+
+						// If not, just inject the full result
+						res.responseText );
+
+				if( callback )
+					self.each( callback, [res.responseText, status, res] );
+			}
+		});
+		return this;
+	},
+
+	serialize: function() {
+		return jQuery.param(this.serializeArray());
+	},
+	serializeArray: function() {
+		return this.map(function(){
+			return this.elements ? jQuery.makeArray(this.elements) : this;
+		})
+		.filter(function(){
+			return this.name && !this.disabled &&
+				(this.checked || /select|textarea/i.test(this.nodeName) ||
+					/text|hidden|password|search/i.test(this.type));
+		})
+		.map(function(i, elem){
+			var val = jQuery(this).val();
+			return val == null ? null :
+				jQuery.isArray(val) ?
+					jQuery.map( val, function(val, i){
+						return {name: elem.name, value: val};
+					}) :
+					{name: elem.name, value: val};
+		}).get();
+	}
+});
+
+// Attach a bunch of functions for handling common AJAX events (each one simply binds the handler under that event name)
+jQuery.each( "ajaxStart,ajaxStop,ajaxComplete,ajaxError,ajaxSuccess,ajaxSend".split(","), function(i,o){
+	jQuery.fn[o] = function(f){
+		return this.bind(o, f);
+	};
+});
+
+var jsc = now(); // counter used by jQuery.ajax to name JSONP callbacks ("jsonp" + jsc++)
+
+jQuery.extend({
+  
+	get: function( url, data, callback, type ) { // GET shorthand for jQuery.ajax; type is passed on as dataType
+		// shift arguments if data argument was omitted
+		if ( jQuery.isFunction( data ) ) {
+			callback = data;
+			data = null;
+		}
+
+		return jQuery.ajax({
+			type: "GET",
+			url: url,
+			data: data,
+			success: callback,
+			dataType: type
+		});
+	},
+
+	getScript: function( url, callback ) { // jQuery.get with no data and dataType "script"
+		return jQuery.get(url, null, callback, "script");
+	},
+
+	getJSON: function( url, data, callback ) { // jQuery.get with dataType "json"
+		return jQuery.get(url, data, callback, "json");
+	},
+
+	post: function( url, data, callback, type ) { // POST shorthand for jQuery.ajax; type is passed on as dataType
+		if ( jQuery.isFunction( data ) ) { // data omitted: shift the arguments
+			callback = data;
+			data = {};
+		}
+
+		return jQuery.ajax({
+			type: "POST",
+			url: url,
+			data: data,
+			success: callback,
+			dataType: type
+		});
+	},
+
+	ajaxSetup: function( settings ) { // merges settings into the shared jQuery.ajaxSettings defaults
+		jQuery.extend( jQuery.ajaxSettings, settings );
+	},
+
+	ajaxSettings: { // defaults that jQuery.ajax merges under each request's own settings
+		url: location.href,
+		global: true,
+		type: "GET",
+		contentType: "application/x-www-form-urlencoded",
+		processData: true,
+		async: true,
+		/*
+		timeout: 0,
+		data: null,
+		username: null,
+		password: null,
+		*/
+		// Create the request object; Microsoft failed to properly
+		// implement the XMLHttpRequest in IE7, so we use the ActiveXObject when it is available
+		// This function can be overridden by calling jQuery.ajaxSetup
+		xhr:function(){
+			return window.ActiveXObject ? new ActiveXObject("Microsoft.XMLHTTP") : new XMLHttpRequest();
+		},
+		accepts: { // Accept header value per dataType; jQuery.ajax appends ", */*" to the one it picks
+			xml: "application/xml, text/xml",
+			html: "text/html",
+			script: "text/javascript, application/javascript",
+			json: "application/json, text/javascript",
+			text: "text/plain",
+			_default: "*/*"
+		}
+	},
+
+	// Last-Modified header cache for next request, keyed by request URL; written by jQuery.ajax when s.ifModified is set
+	lastModified: {},
+
+	ajax: function( s ) { // s: settings object. Returns the xhr, false when beforeSend cancels, or undefined when the <script> transport is used.
+		// Extend the settings, but re-extend 's' so that it can be
+		// checked again later (in the test suite, specifically)
+		s = jQuery.extend(true, s, jQuery.extend(true, {}, jQuery.ajaxSettings, s));
+
+		var jsonp, jsre = /=\?(&|$)/g, status, data, // jsre matches the "=?" placeholder for the JSONP callback name
+			type = s.type.toUpperCase();
+
+		// convert data if not already a string
+		if ( s.data && s.processData && typeof s.data !== "string" )
+			s.data = jQuery.param(s.data);
+
+		// Handle JSONP Parameter Callbacks (make sure a "<name>=?" placeholder exists in the url or the data)
+		if ( s.dataType == "jsonp" ) {
+			if ( type == "GET" ) {
+				if ( !s.url.match(jsre) )
+					s.url += (s.url.match(/\?/) ? "&" : "?") + (s.jsonp || "callback") + "=?";
+			} else if ( !s.data || !s.data.match(jsre) )
+				s.data = (s.data ? s.data + "&" : "") + (s.jsonp || "callback") + "=?";
+			s.dataType = "json";
+		}
+
+		// Build temporary JSONP function
+		if ( s.dataType == "json" && (s.data && s.data.match(jsre) || s.url.match(jsre)) ) {
+			jsonp = "jsonp" + jsc++;
+
+			// Replace the =? sequence both in the query string and the data
+			if ( s.data )
+				s.data = (s.data + "").replace(jsre, "=" + jsonp + "$1");
+			s.url = s.url.replace(jsre, "=" + jsonp + "$1");
+
+			// We need to make sure
+			// that a JSONP style response is executed properly
+			s.dataType = "script";
+
+			// Handle JSONP-style loading
+			window[ jsonp ] = function(tmp){
+				data = tmp;
+				success();
+				complete();
+				// Garbage collect
+				window[ jsonp ] = undefined;
+				try{ delete window[ jsonp ]; } catch(e){}
+				if ( head ) // head/script are only assigned when the <script> transport below is used
+					head.removeChild( script );
+			};
+		}
+
+		if ( s.dataType == "script" && s.cache == null ) // scripts are not cached unless the caller says otherwise
+			s.cache = false;
+
+		if ( s.cache === false && type == "GET" ) {
+			var ts = now();
+			// try replacing _= if it is there
+			var ret = s.url.replace(/(\?|&)_=.*?(&|$)/, "$1_=" + ts + "$2");
+			// if nothing was replaced, add timestamp to the end
+			s.url = ret + ((ret == s.url) ? (s.url.match(/\?/) ? "&" : "?") + "_=" + ts : "");
+		}
+
+		// If data is available, append data to url for get requests
+		if ( s.data && type == "GET" ) {
+			s.url += (s.url.match(/\?/) ? "&" : "?") + s.data;
+
+			// IE likes to send both get and post data, prevent this
+			s.data = null;
+		}
+
+		// Watch for a new set of requests (ajaxStart fires when the active counter goes from 0 to 1)
+		if ( s.global && ! jQuery.active++ )
+			jQuery.event.trigger( "ajaxStart" );
+
+		// Matches an absolute URL, and saves the domain
+		var parts = /^(\w+:)?\/\/([^\/?#]+)/.exec( s.url );
+
+		// If we're requesting a remote document
+		// and trying to load JSON or Script with a GET
+		if ( s.dataType == "script" && type == "GET" && parts
+			&& ( parts[1] && parts[1] != location.protocol || parts[2] != location.host )){
+
+			var head = document.getElementsByTagName("head")[0];
+			var script = document.createElement("script");
+			script.src = s.url;
+			if (s.scriptCharset)
+				script.charset = s.scriptCharset;
+
+			// Handle Script loading (for JSONP the window[jsonp] callback above fires success/complete instead)
+			if ( !jsonp ) {
+				var done = false;
+
+				// Attach handlers for all browsers
+				script.onload = script.onreadystatechange = function(){
+					if ( !done && (!this.readyState ||
+							this.readyState == "loaded" || this.readyState == "complete") ) {
+						done = true;
+						success();
+						complete();
+
+						// Handle memory leak in IE
+						script.onload = script.onreadystatechange = null;
+						head.removeChild( script );
+					}
+				};
+			}
+
+			head.appendChild(script);
+
+			// We handle everything using the script element injection
+			return undefined;
+		}
+
+		var requestDone = false;
+
+		// Create the request object
+		var xhr = s.xhr();
+
+		// Open the socket
+		// Passing null username, generates a login popup on Opera (#2865)
+		if( s.username )
+			xhr.open(type, s.url, s.async, s.username, s.password);
+		else
+			xhr.open(type, s.url, s.async);
+
+		// Need an extra try/catch for cross domain requests in Firefox 3
+		try {
+			// Set the correct header, if data is being sent
+			if ( s.data )
+				xhr.setRequestHeader("Content-Type", s.contentType);
+
+			// Set the If-Modified-Since header, if ifModified mode.
+			if ( s.ifModified )
+				xhr.setRequestHeader("If-Modified-Since",
+					jQuery.lastModified[s.url] || "Thu, 01 Jan 1970 00:00:00 GMT" );
+
+			// Set header so the called script knows that it's an XMLHttpRequest
+			xhr.setRequestHeader("X-Requested-With", "XMLHttpRequest");
+
+			// Set the Accepts header for the server, depending on the dataType
+			xhr.setRequestHeader("Accept", s.dataType && s.accepts[ s.dataType ] ?
+				s.accepts[ s.dataType ] + ", */*" :
+				s.accepts._default );
+		} catch(e){}
+
+		// Allow custom headers/mimetypes and early abort
+		if ( s.beforeSend && s.beforeSend(xhr, s) === false ) {
+			// Handle the global AJAX counter
+			if ( s.global && ! --jQuery.active )
+				jQuery.event.trigger( "ajaxStop" );
+			// close opened socket
+			xhr.abort();
+			return false;
+		}
+
+		if ( s.global )
+			jQuery.event.trigger("ajaxSend", [xhr, s]);
+
+		// Wait for a response to come back (isTimeout is the string "timeout" when invoked by the timeout checker)
+		var onreadystatechange = function(isTimeout){
+			// The request was aborted, clear the interval and decrement jQuery.active
+			if (xhr.readyState == 0) {
+				if (ival) {
+					// clear poll interval
+					clearInterval(ival);
+					ival = null;
+					// Handle the global AJAX counter
+					if ( s.global && ! --jQuery.active )
+						jQuery.event.trigger( "ajaxStop" );
+				}
+			// The transfer is complete and the data is available, or the request timed out
+			} else if ( !requestDone && xhr && (xhr.readyState == 4 || isTimeout == "timeout") ) {
+				requestDone = true;
+
+				// clear poll interval
+				if (ival) {
+					clearInterval(ival);
+					ival = null;
+				}
+
+				status = isTimeout == "timeout" ? "timeout" :
+					!jQuery.httpSuccess( xhr ) ? "error" :
+					s.ifModified && jQuery.httpNotModified( xhr, s.url ) ? "notmodified" :
+					"success";
+
+				if ( status == "success" ) {
+					// Watch for, and catch, XML document parse errors
+					try {
+						// process the data (runs the xml through httpData regardless of callback)
+						data = jQuery.httpData( xhr, s.dataType, s );
+					} catch(e) {
+						status = "parsererror";
+					}
+				}
+
+				// Make sure that the request was successful (a "notmodified" status takes the error branch below)
+				if ( status == "success" ) {
+					// Cache Last-Modified header, if ifModified mode.
+					var modRes;
+					try {
+						modRes = xhr.getResponseHeader("Last-Modified");
+					} catch(e) {} // swallow exception thrown by FF if header is not available
+
+					if ( s.ifModified && modRes )
+						jQuery.lastModified[s.url] = modRes;
+
+					// JSONP handles its own success callback
+					if ( !jsonp )
+						success();
+				} else
+					jQuery.handleError(s, xhr, status);
+
+				// Fire the complete handlers
+				complete();
+
+				if ( isTimeout )
+					xhr.abort();
+
+				// Stop memory leaks
+				if ( s.async )
+					xhr = null;
+			}
+		};
+
+		if ( s.async ) {
+			// don't attach the handler to the request, just poll it instead (every 13ms)
+			var ival = setInterval(onreadystatechange, 13);
+
+			// Timeout checker
+			if ( s.timeout > 0 )
+				setTimeout(function(){
+					// Check to see if the request is still happening
+					if ( xhr && !requestDone )
+						onreadystatechange( "timeout" );
+				}, s.timeout);
+		}
+
+		// Send the data
+		try {
+			xhr.send(s.data);
+		} catch(e) {
+			jQuery.handleError(s, xhr, null, e);
+		}
+
+		// firefox 1.5 doesn't fire statechange for sync requests
+		if ( !s.async )
+			onreadystatechange();
+
+		function success(){ // hoisted function declaration, so the callbacks defined above can call it
+			// If a local callback was specified, fire it and pass it the data
+			if ( s.success )
+				s.success( data, status );
+
+			// Fire the global callback
+			if ( s.global )
+				jQuery.event.trigger( "ajaxSuccess", [xhr, s] );
+		}
+
+		function complete(){ // hoisted function declaration, so the callbacks defined above can call it
+			// Process result
+			if ( s.complete )
+				s.complete(xhr, status);
+
+			// The request was completed
+			if ( s.global )
+				jQuery.event.trigger( "ajaxComplete", [xhr, s] );
+
+			// Handle the global AJAX counter
+			if ( s.global && ! --jQuery.active )
+				jQuery.event.trigger( "ajaxStop" );
+		}
+
+		// return XMLHttpRequest to allow aborting the request etc.
+		return xhr;
+	},
+
+	handleError: function( s, xhr, status, e ) {
+		// Report a failed request. Fire the local s.error callback, if one was specified.
+		if ( s.error ) s.error( xhr, status, e );
+
+		// Fire the global "ajaxError" event (handlers get xhr, s and e, but not status)
+		if ( s.global )
+			jQuery.event.trigger( "ajaxError", [xhr, s, e] );
+	},
+
+	// Counter for holding the number of active queries
+	active: 0,
+
+	// Determines if an XMLHttpRequest was successful or not
+	httpSuccess: function( xhr ) {
+		try { // the status check is guarded: any exception falls through to "return false"
+			// Success: no status on a file: page, any 2xx, 304, or 1223 (IE sometimes reports 1223 instead of 204, see #1450)
+			return !xhr.status && location.protocol == "file:" ||
+				( xhr.status >= 200 && xhr.status < 300 ) || xhr.status == 304 || xhr.status == 1223;
+		} catch(e){}
+		return false;
+	},
+
+	// Determines if an XMLHttpRequest returns NotModified
+	httpNotModified: function( xhr, url ) {
+		try {
+			var xhrRes = xhr.getResponseHeader("Last-Modified");
+			// NOTE(review): if the header is absent and nothing is cached for url, null == undefined matches below; confirm intended
+			// Firefox always returns 200. check Last-Modified date
+			return xhr.status == 304 || xhrRes == jQuery.lastModified[url];
+		} catch(e){} // an exception while reading the header or status counts as "modified"
+		return false;
+	},
+
+	httpData: function( xhr, type, s ) { // turn the raw response of xhr into data according to type
+		var ct = xhr.getResponseHeader("content-type"),
+			xml = type == "xml" || !type && ct && ct.indexOf("xml") >= 0, // explicit "xml" type, or no type and an xml content-type
+			data = xml ? xhr.responseXML : xhr.responseText;
+		// A document whose root element is <parsererror> is reported by throwing
+		if ( xml && data.documentElement.tagName == "parsererror" )
+			throw "parsererror";
+			
+		// Allow a pre-filtering function to sanitize the response
+		// s != null is checked to keep backwards compatibility
+		if( s && s.dataFilter )
+			data = s.dataFilter( data, type );
+
+		// The filter can actually parse the response
+		if( typeof data === "string" ){
+
+			// If the type is "script", eval it in global context
+			if ( type == "script" )
+				jQuery.globalEval( data );
+			// NOTE(review): the response text is eval'd as-is below; only safe for trusted endpoints
+			// Get the JavaScript object, if JSON is used.
+			if ( type == "json" )
+				data = window["eval"]("(" + data + ")");
+		}
+		// Result: the XML document, the filtered value, or the (possibly eval'd) response text
+		return data;
+	},
+
+	// Serialize an array of form elements or a set of
+	// key/values into a query string
+	param: function( a ) { // a: array/jQuery set of form elements, or a plain object of key/value pairs
+		var s = [ ];
+		// Append one URL-encoded "key=value" pair to s
+		function add( key, value ){
+			s[ s.length ] = encodeURIComponent(key) + '=' + encodeURIComponent(value);
+		};
+
+		// If an array was passed in, assume that it is an array
+		// of form elements
+		if ( jQuery.isArray(a) || a.jquery )
+			// Serialize the form elements
+			jQuery.each( a, function(){
+				add( this.name, this.value );
+			});
+
+		// Otherwise, assume that it's an object of key/value pairs
+		else
+			// Serialize the key/values
+			for ( var j in a )
+				// If the value is an array then the key names need to be repeated
+				if ( jQuery.isArray(a[j]) )
+					jQuery.each( a[j], function(){
+						add( j, this );
+					});
+				else
+					add( j, jQuery.isFunction(a[j]) ? a[j]() : a[j] ); // function values are called and their result is serialized
+
+		// Return the pairs joined with "&", with every encoded space (%20) turned into "+"
+		return s.join("&").replace(/%20/g, "+");
+	}
+
+});
+var elemdisplay = {},
+	timerId,
+	fxAttrs = [
+		// height animations
+		[ "height", "marginTop", "marginBottom", "paddingTop", "paddingBottom" ],
+		// width animations
+		[ "width", "marginLeft", "marginRight", "paddingLeft", "paddingRight" ],
+		// opacity animations
+		[ "opacity" ]
+	];
+
+function genFx( type, num ){
+	var obj = {};
+	jQuery.each( fxAttrs.concat.apply([], fxAttrs.slice(0,num)), function(){
+		obj[ this ] = type;
+	});
+	return obj;
+}
+
+jQuery.fn.extend({
+	show: function(speed,callback){
+		if ( speed ) {
+			return this.animate( genFx("show", 3), speed, callback);
+		} else {
+			for ( var i = 0, l = this.length; i < l; i++ ){
+				var old = jQuery.data(this[i], "olddisplay");
+				
+				this[i].style.display = old || "";
+				
+				if ( jQuery.css(this[i], "display") === "none" ) {
+					var tagName = this[i].tagName, display;
+					
+					if ( elemdisplay[ tagName ] ) {
+						display = elemdisplay[ tagName ];
+					} else {
+						var elem = jQuery("<" + tagName + " />").appendTo("body");
+						
+						display = elem.css("display");
+						if ( display === "none" )
+							display = "block";
+						
+						elem.remove();
+						
+						elemdisplay[ tagName ] = display;
+					}
+					
+					jQuery.data(this[i], "olddisplay", display);
+				}
+			}
+
+			// Set the display of the elements in a second loop
+			// to avoid the constant reflow
+			for ( var i = 0, l = this.length; i < l; i++ ){
+				this[i].style.display = jQuery.data(this[i], "olddisplay") || "";
+			}
+			
+			return this;
+		}
+	},
+
+	hide: function(speed,callback){
+		if ( speed ) {
+			return this.animate( genFx("hide", 3), speed, callback);
+		} else {
+			for ( var i = 0, l = this.length; i < l; i++ ){
+				var old = jQuery.data(this[i], "olddisplay");
+				if ( !old && old !== "none" )
+					jQuery.data(this[i], "olddisplay", jQuery.css(this[i], "display"));
+			}
+
+			// Set the display of the elements in a second loop
+			// to avoid the constant reflow
+			for ( var i = 0, l = this.length; i < l; i++ ){
+				this[i].style.display = "none";
+			}
+
+			return this;
+		}
+	},
+
+	// Save the old toggle function
+	_toggle: jQuery.fn.toggle,
+
+	toggle: function( fn, fn2 ){
+		var bool = typeof fn === "boolean";
+
+		return jQuery.isFunction(fn) && jQuery.isFunction(fn2) ?
+			this._toggle.apply( this, arguments ) :
+			fn == null || bool ?
+				this.each(function(){
+					var state = bool ? fn : jQuery(this).is(":hidden");
+					jQuery(this)[ state ? "show" : "hide" ]();
+				}) :
+				this.animate(genFx("toggle", 3), fn, fn2);
+	},
+
+	fadeTo: function(speed,to,callback){
+		return this.animate({opacity: to}, speed, callback);
+	},
+
+	animate: function( prop, speed, easing, callback ) {
+		var optall = jQuery.speed(speed, easing, callback);
+
+		return this[ optall.queue === false ? "each" : "queue" ](function(){
+		
+			var opt = jQuery.extend({}, optall), p,
+				hidden = this.nodeType == 1 && jQuery(this).is(":hidden"),
+				self = this;
+	
+			for ( p in prop ) {
+				if ( prop[p] == "hide" && hidden || prop[p] == "show" && !hidden )
+					return opt.complete.call(this);
+
+				if ( ( p == "height" || p == "width" ) && this.style ) {
+					// Store display property
+					opt.display = jQuery.css(this, "display");
+
+					// Make sure that nothing sneaks out
+					opt.overflow = this.style.overflow;
+				}
+			}
+
+			if ( opt.overflow != null )
+				this.style.overflow = "hidden";
+
+			opt.curAnim = jQuery.extend({}, prop);
+
+			jQuery.each( prop, function(name, val){
+				var e = new jQuery.fx( self, opt, name );
+
+				if ( /toggle|show|hide/.test(val) )
+					e[ val == "toggle" ? hidden ? "show" : "hide" : val ]( prop );
+				else {
+					var parts = val.toString().match(/^([+-]=)?([\d+-.]+)(.*)$/),
+						start = e.cur(true) || 0;
+
+					if ( parts ) {
+						var end = parseFloat(parts[2]),
+							unit = parts[3] || "px";
+
+						// We need to compute starting value
+						if ( unit != "px" ) {
+							self.style[ name ] = (end || 1) + unit;
+							start = ((end || 1) / e.cur(true)) * start;
+							self.style[ name ] = start + unit;
+						}
+
+						// If a +=/-= token was provided, we're doing a relative animation
+						if ( parts[1] )
+							end = ((parts[1] == "-=" ? -1 : 1) * end) + start;
+
+						e.custom( start, end, unit );
+					} else
+						e.custom( start, val, "" );
+				}
+			});
+
+			// For JS strict compliance
+			return true;
+		});
+	},
+
+	stop: function(clearQueue, gotoEnd){
+		var timers = jQuery.timers;
+		// clearQueue: replace the pending queue with an empty one
+		if (clearQueue)
+			this.queue([]);
+		// Remove every running timer whose element is one of the matched elements
+		this.each(function(){
+			// go in reverse order so anything added to the queue during the loop is ignored
+			for ( var i = timers.length - 1; i >= 0; i-- )
+				if ( timers[i].elem == this ) {
+					if (gotoEnd)
+						// force the next step to be the last
+						timers[i](true);
+					timers.splice(i, 1);
+				}
+		});
+
+		// start the next in the queue if the last step wasn't forced
+		if (!gotoEnd)
+			this.dequeue();
+		// Return the set itself so calls can be chained
+		return this;
+	}
+
+});
+
+// Generate shortcuts for custom animations
+jQuery.each({
+	slideDown: genFx("show", 1),
+	slideUp: genFx("hide", 1),
+	slideToggle: genFx("toggle", 1),
+	fadeIn: { opacity: "show" },
+	fadeOut: { opacity: "hide" }
+}, function( name, props ){
+	jQuery.fn[ name ] = function( speed, callback ){
+		return this.animate( props, speed, callback );
+	};
+});
+
+jQuery.extend({
+
+	speed: function(speed, easing, fn) { // fold the (speed, easing, callback) arguments into one options object
+		var opt = typeof speed === "object" ? speed : { // an options object is used as-is (and modified below)
+			complete: fn || !fn && easing ||
+				jQuery.isFunction( speed ) && speed,
+			duration: speed,
+			easing: fn && easing || easing && !jQuery.isFunction(easing) && easing
+		};
+		// Duration: 0 when jQuery.fx.off is set, a number as given, otherwise a named speed or the default
+		opt.duration = jQuery.fx.off ? 0 : typeof opt.duration === "number" ? opt.duration :
+			jQuery.fx.speeds[opt.duration] || jQuery.fx.speeds._default;
+
+		// Queueing: wrap the completion callback so it first dequeues the element (unless queue === false)
+		opt.old = opt.complete;
+		opt.complete = function(){
+			if ( opt.queue !== false )
+				jQuery(this).dequeue();
+			if ( jQuery.isFunction( opt.old ) )
+				opt.old.call( this );
+		};
+
+		return opt;
+	},
+
+	easing: {
+		linear: function( p, n, firstNum, diff ) {
+			return firstNum + diff * p;
+		},
+		swing: function( p, n, firstNum, diff ) {
+			return ((-Math.cos(p*Math.PI)/2) + 0.5) * diff + firstNum;
+		}
+	},
+
+	timers: [],
+
+	fx: function( elem, options, prop ){
+		this.options = options;
+		this.elem = elem;
+		this.prop = prop;
+
+		if ( !options.orig )
+			options.orig = {};
+	}
+
+});
+
+jQuery.fx.prototype = {
+
+	// Simple function for setting a style value
+	update: function(){
+		if ( this.options.step )
+			this.options.step.call( this.elem, this.now, this );
+
+		(jQuery.fx.step[this.prop] || jQuery.fx.step._default)( this );
+
+		// Set display property to block for height/width animations
+		if ( ( this.prop == "height" || this.prop == "width" ) && this.elem.style )
+			this.elem.style.display = "block";
+	},
+
+	// Get the current size
+	cur: function(force){
+		if ( this.elem[this.prop] != null && (!this.elem.style || this.elem.style[this.prop] == null) )
+			return this.elem[ this.prop ];
+
+		var r = parseFloat(jQuery.css(this.elem, this.prop, force));
+		return r && r > -10000 ? r : parseFloat(jQuery.curCSS(this.elem, this.prop)) || 0;
+	},
+
+	// Start an animation from one number to another
+	custom: function(from, to, unit){
+		this.startTime = now();
+		this.start = from;
+		this.end = to;
+		this.unit = unit || this.unit || "px";
+		this.now = this.start;
+		this.pos = this.state = 0;
+
+		var self = this;
+		function t(gotoEnd){
+			return self.step(gotoEnd);
+		}
+
+		t.elem = this.elem;
+
+		if ( t() && jQuery.timers.push(t) && !timerId ) {
+			timerId = setInterval(function(){
+				var timers = jQuery.timers;
+
+				for ( var i = 0; i < timers.length; i++ )
+					if ( !timers[i]() )
+						timers.splice(i--, 1);
+
+				if ( !timers.length ) {
+					clearInterval( timerId );
+					timerId = undefined;
+				}
+			}, 13);
+		}
+	},
+
+	// Simple 'show' function
+	show: function(){
+		// Remember where we started, so that we can go back to it later
+		this.options.orig[this.prop] = jQuery.attr( this.elem.style, this.prop );
+		this.options.show = true;
+
+		// Begin the animation
+		// Make sure that we start at a small width/height to avoid any
+		// flash of content
+		this.custom(this.prop == "width" || this.prop == "height" ? 1 : 0, this.cur());
+
+		// Start by showing the element
+		jQuery(this.elem).show();
+	},
+
+	// Simple 'hide' function
+	hide: function(){
+		// Remember where we started, so that we can go back to it later
+		this.options.orig[this.prop] = jQuery.attr( this.elem.style, this.prop );
+		this.options.hide = true;
+
+		// Begin the animation
+		this.custom(this.cur(), 0);
+	},
+
+	// Each step of an animation
+	step: function(gotoEnd){
+		var t = now();
+
+		if ( gotoEnd || t >= this.options.duration + this.startTime ) {
+			this.now = this.end;
+			this.pos = this.state = 1;
+			this.update();
+
+			this.options.curAnim[ this.prop ] = true;
+
+			var done = true;
+			for ( var i in this.options.curAnim )
+				if ( this.options.curAnim[i] !== true )
+					done = false;
+
+			if ( done ) {
+				if ( this.options.display != null ) {
+					// Reset the overflow
+					this.elem.style.overflow = this.options.overflow;
+
+					// Reset the display
+					this.elem.style.display = this.options.display;
+					if ( jQuery.css(this.elem, "display") == "none" )
+						this.elem.style.display = "block";
+				}
+
+				// Hide the element if the "hide" operation was done
+				if ( this.options.hide )
+					jQuery(this.elem).hide();
+
+				// Reset the properties, if the item has been hidden or shown
+				if ( this.options.hide || this.options.show )
+					for ( var p in this.options.curAnim )
+						jQuery.attr(this.elem.style, p, this.options.orig[p]);
+					
+				// Execute the complete function
+				this.options.complete.call( this.elem );
+			}
+
+			return false;
+		} else {
+			var n = t - this.startTime;
+			this.state = n / this.options.duration;
+
+			// Perform the easing function, defaults to swing
+			this.pos = jQuery.easing[this.options.easing || (jQuery.easing.swing ? "swing" : "linear")](this.state, n, 0, 1, this.options.duration);
+			this.now = this.start + ((this.end - this.start) * this.pos);
+
+			// Perform the next step of the animation
+			this.update();
+		}
+
+		return true;
+	}
+
+};
+
+jQuery.extend( jQuery.fx, {
+	speeds:{
+		slow: 600,
+ 		fast: 200,
+ 		// Default speed
+ 		_default: 400
+	},
+	step: {
+
+		opacity: function(fx){
+			jQuery.attr(fx.elem.style, "opacity", fx.now);
+		},
+
+		_default: function(fx){
+			if ( fx.elem.style && fx.elem.style[ fx.prop ] != null )
+				fx.elem.style[ fx.prop ] = fx.now + fx.unit;
+			else
+				fx.elem[ fx.prop ] = fx.now;
+		}
+	}
+});
+if ( document.documentElement["getBoundingClientRect"] )
+	jQuery.fn.offset = function() {
+		if ( !this[0] ) return { top: 0, left: 0 };
+		if ( this[0] === this[0].ownerDocument.body ) return jQuery.offset.bodyOffset( this[0] );
+		var box  = this[0].getBoundingClientRect(), doc = this[0].ownerDocument, body = doc.body, docElem = doc.documentElement,
+			clientTop = docElem.clientTop || body.clientTop || 0, clientLeft = docElem.clientLeft || body.clientLeft || 0,
+			top  = box.top  + (self.pageYOffset || jQuery.boxModel && docElem.scrollTop  || body.scrollTop ) - clientTop,
+			left = box.left + (self.pageXOffset || jQuery.boxModel && docElem.scrollLeft || body.scrollLeft) - clientLeft;
+		return { top: top, left: left };
+	};
+else 
+	jQuery.fn.offset = function() {
+		if ( !this[0] ) return { top: 0, left: 0 };
+		if ( this[0] === this[0].ownerDocument.body ) return jQuery.offset.bodyOffset( this[0] );
+		jQuery.offset.initialized || jQuery.offset.initialize();
+
+		var elem = this[0], offsetParent = elem.offsetParent, prevOffsetParent = elem,
+			doc = elem.ownerDocument, computedStyle, docElem = doc.documentElement,
+			body = doc.body, defaultView = doc.defaultView,
+			prevComputedStyle = defaultView.getComputedStyle(elem, null),
+			top = elem.offsetTop, left = elem.offsetLeft;
+
+		while ( (elem = elem.parentNode) && elem !== body && elem !== docElem ) {
+			computedStyle = defaultView.getComputedStyle(elem, null);
+			top -= elem.scrollTop, left -= elem.scrollLeft;
+			if ( elem === offsetParent ) {
+				top += elem.offsetTop, left += elem.offsetLeft;
+				if ( jQuery.offset.doesNotAddBorder && !(jQuery.offset.doesAddBorderForTableAndCells && /^t(able|d|h)$/i.test(elem.tagName)) )
+					top  += parseInt( computedStyle.borderTopWidth,  10) || 0,
+					left += parseInt( computedStyle.borderLeftWidth, 10) || 0;
+				prevOffsetParent = offsetParent, offsetParent = elem.offsetParent;
+			}
+			if ( jQuery.offset.subtractsBorderForOverflowNotVisible && computedStyle.overflow !== "visible" )
+				top  += parseInt( computedStyle.borderTopWidth,  10) || 0,
+				left += parseInt( computedStyle.borderLeftWidth, 10) || 0;
+			prevComputedStyle = computedStyle;
+		}
+
+		if ( prevComputedStyle.position === "relative" || prevComputedStyle.position === "static" )
+			top  += body.offsetTop,
+			left += body.offsetLeft;
+
+		if ( prevComputedStyle.position === "fixed" )
+			top  += Math.max(docElem.scrollTop, body.scrollTop),
+			left += Math.max(docElem.scrollLeft, body.scrollLeft);
+
+		return { top: top, left: left };
+	};
+
+jQuery.offset = {
+	initialize: function() {
+		if ( this.initialized ) return;
+		var body = document.body, container = document.createElement('div'), innerDiv, checkDiv, table, td, rules, prop, bodyMarginTop = body.style.marginTop,
+			html = '<div style="position:absolute;top:0;left:0;margin:0;border:5px solid #000;padding:0;width:1px;height:1px;"><div></div></div><table style="position:absolute;top:0;left:0;margin:0;border:5px solid #000;padding:0;width:1px;height:1px;" cellpadding="0" cellspacing="0"><tr><td></td></tr></table>';
+
+		rules = { position: 'absolute', top: 0, left: 0, margin: 0, border: 0, width: '1px', height: '1px', visibility: 'hidden' };
+		for ( prop in rules ) container.style[prop] = rules[prop];
+
+		container.innerHTML = html;
+		body.insertBefore(container, body.firstChild);
+		innerDiv = container.firstChild, checkDiv = innerDiv.firstChild, td = innerDiv.nextSibling.firstChild.firstChild;
+
+		this.doesNotAddBorder = (checkDiv.offsetTop !== 5);
+		this.doesAddBorderForTableAndCells = (td.offsetTop === 5);
+
+		innerDiv.style.overflow = 'hidden', innerDiv.style.position = 'relative';
+		this.subtractsBorderForOverflowNotVisible = (checkDiv.offsetTop === -5);
+
+		body.style.marginTop = '1px';
+		this.doesNotIncludeMarginInBodyOffset = (body.offsetTop === 0);
+		body.style.marginTop = bodyMarginTop;
+
+		body.removeChild(container);
+		this.initialized = true;
+	},
+
+	bodyOffset: function(body) {
+		jQuery.offset.initialized || jQuery.offset.initialize();
+		var top = body.offsetTop, left = body.offsetLeft;
+		if ( jQuery.offset.doesNotIncludeMarginInBodyOffset )
+			top  += parseInt( jQuery.curCSS(body, 'marginTop',  true), 10 ) || 0,
+			left += parseInt( jQuery.curCSS(body, 'marginLeft', true), 10 ) || 0;
+		return { top: top, left: left };
+	}
+};
+
+
+jQuery.fn.extend({
+	position: function() {
+		var left = 0, top = 0, results;
+
+		if ( this[0] ) {
+			// Get *real* offsetParent
+			var offsetParent = this.offsetParent(),
+
+			// Get correct offsets
+			offset       = this.offset(),
+			parentOffset = /^body|html$/i.test(offsetParent[0].tagName) ? { top: 0, left: 0 } : offsetParent.offset();
+
+			// Subtract element margins
+			// note: when an element has margin: auto the offsetLeft and marginLeft 
+			// are the same in Safari causing offset.left to incorrectly be 0
+			offset.top  -= num( this, 'marginTop'  );
+			offset.left -= num( this, 'marginLeft' );
+
+			// Add offsetParent borders
+			parentOffset.top  += num( offsetParent, 'borderTopWidth'  );
+			parentOffset.left += num( offsetParent, 'borderLeftWidth' );
+
+			// Subtract the two offsets
+			results = {
+				top:  offset.top  - parentOffset.top,
+				left: offset.left - parentOffset.left
+			};
+		}
+
+		return results;
+	},
+
+	offsetParent: function() {
+		var offsetParent = this[0].offsetParent || document.body;
+		while ( offsetParent && (!/^body|html$/i.test(offsetParent.tagName) && jQuery.css(offsetParent, 'position') == 'static') )
+			offsetParent = offsetParent.offsetParent;
+		return jQuery(offsetParent);
+	}
+});
+
+
+// Create scrollLeft and scrollTop methods
+jQuery.each( ['Left', 'Top'], function(i, name) {
+	var method = 'scroll' + name;
+	
+	jQuery.fn[ method ] = function(val) {
+		if (!this[0]) return null;
+
+		return val !== undefined ?
+
+			// Set the scroll offset
+			this.each(function() {
+				this == window || this == document ?
+					window.scrollTo(
+						!i ? val : jQuery(window).scrollLeft(),
+						 i ? val : jQuery(window).scrollTop()
+					) :
+					this[ method ] = val;
+			}) :
+
+			// Return the scroll offset
+			this[0] == window || this[0] == document ?
+				self[ i ? 'pageYOffset' : 'pageXOffset' ] ||
+					jQuery.boxModel && document.documentElement[ method ] ||
+					document.body[ method ] :
+				this[0][ method ];
+	};
+});
+// Create innerHeight, innerWidth, outerHeight and outerWidth methods
+jQuery.each([ "Height", "Width" ], function(i, name){
+
+	var tl = i ? "Left"  : "Top",  // top or left
+		br = i ? "Right" : "Bottom", // bottom or right
+		lower = name.toLowerCase();
+
+	// innerHeight and innerWidth
+	jQuery.fn["inner" + name] = function(){
+		return this[0] ?
+			jQuery.css( this[0], lower, false, "padding" ) :
+			null;
+	};
+
+	// outerHeight and outerWidth
+	jQuery.fn["outer" + name] = function(margin) {
+		return this[0] ?
+			jQuery.css( this[0], lower, false, margin ? "margin" : "border" ) :
+			null;
+	};
+	
+	var type = name.toLowerCase();
+
+	jQuery.fn[ type ] = function( size ) {
+		// Get window width or height
+		return this[0] == window ?
+			// Everyone else use document.documentElement or document.body depending on Quirks vs Standards mode
+			document.compatMode == "CSS1Compat" && document.documentElement[ "client" + name ] ||
+			document.body[ "client" + name ] :
+
+			// Get document width or height
+			this[0] == document ?
+				// Either scroll[Width/Height] or offset[Width/Height], whichever is greater
+				Math.max(
+					document.documentElement["client" + name],
+					document.body["scroll" + name], document.documentElement["scroll" + name],
+					document.body["offset" + name], document.documentElement["offset" + name]
+				) :
+
+				// Get or set width or height on the element
+				size === undefined ?
+					// Get width or height on the element
+					(this.length ? jQuery.css( this[0], type ) : null) :
+
+					// Set the width or height on the element (default to pixels if value is unitless)
+					this.css( type, typeof size === "string" ? size : size + "px" );
+	};
+
+});
+})();
diff --git a/main.py b/main.py
new file mode 100644
index 00000000..9a9cbf31
--- /dev/null
+++ b/main.py
@@ -0,0 +1,316 @@
+#!/usr/bin/env python
+#
+# Copyright 2007 Google Inc.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+#
+
+import os
+import sys
+import logging
+import traceback
+import StringIO
+
+from google.appengine.runtime import DeadlineExceededError
+
+from google.appengine.ext.webapp import template
+from google.appengine.api import users
+from google.appengine.ext import webapp
+from google.appengine.ext.webapp import util
+
+from fanficdownloader.downloader import *
+from fanficdownloader.ffnet import *
+from fanficdownloader.output import *
+from fanficdownloader import twilighted
+
+from google.appengine.ext import db
+
+from fanficdownloader.zipdir import *
+
+from ffstorage import *
+
+
+
+class LoginRequired(webapp.RequestHandler):
+	def get(self):
+		user = users.get_current_user()
+		if user:
+			self.redirect('/')
+		else:
+			logging.debug(users.create_login_url('/'))
+			url = users.create_login_url(self.request.uri)
+			template_values = {'login_url' : url}
+			path = os.path.join(os.path.dirname(__file__), 'index-nonlogin.html')
+			self.response.out.write(template.render(path, template_values))
+
+class MainHandler(webapp.RequestHandler):
+	def get(self):
+		user = users.get_current_user()
+		if user:
+			error = self.request.get('error')
+			template_values = {'nickname' : user.nickname(), 'authorized': True}
+			url = self.request.get('url')
+			template_values['url'] = url
+			
+			if error != None and len(error) > 1:
+				if error == 'login_required':
+					template_values['error_message'] = 'This story (or one of the chapters) requires you to be logged in.'
+				elif error == 'bad_url':
+					template_values['error_message'] = 'Unsupported URL: ' + url
+				elif error == 'custom':
+					template_values['error_message'] = 'Error happened: ' + self.request.get('errtext')
+			
+			filename = self.request.get('file')
+			if len(filename) > 1:
+				template_values['yourfile'] = '''<div id='yourfile'><a href='/file?id=%s'>"%s" by %s</a></div>''' % (filename, self.request.get('name'), self.request.get('author'))
+			
+			self.response.headers['Content-Type'] = 'text/html'
+			path = os.path.join(os.path.dirname(__file__), 'index.html')
+
+			self.response.out.write(template.render(path, template_values))
+		else:
+#			self.redirect(users.create_login_url(self.request.uri))
+#			self.redirect('/login')
+			logging.debug(users.create_login_url('/'))
+			url = users.create_login_url(self.request.uri)
+			template_values = {'login_url' : url, 'authorized': False}
+			path = os.path.join(os.path.dirname(__file__), 'index.html')
+			self.response.out.write(template.render(path, template_values))
+
+
+class FileServer(webapp.RequestHandler):
+	def get(self):
+#		user  = users.get_current_user()
+		fileId = self.request.get('id')
+		
+		if fileId == None or len(fileId) < 3:
+			self.redirect('/')
+		
+		key = db.Key(fileId)
+		fanfic = db.get(key)
+		
+		name = fanfic.name.encode('utf-8')
+		
+		name = makeAcceptableFilename(name)
+		
+		logging.info("Serving file: %s" % name)
+
+		if fanfic.format == 'epub':
+			self.response.headers['Content-Type'] = 'application/epub+zip'
+			self.response.headers['Content-disposition'] = 'attachment; filename=' + name + '.epub'
+		elif fanfic.format == 'html':
+			self.response.headers['Content-Type'] = 'text/html'
+			self.response.headers['Content-disposition'] = 'attachment; filename=' + name + '.html.zip'
+		elif fanfic.format == 'text':
+			self.response.headers['Content-Type'] = 'text/plain'
+			self.response.headers['Content-disposition'] = 'attachment; filename=' +name + '.txt.zip'
+		
+		self.response.out.write(fanfic.blob)
+
+class RecentFilesServer(webapp.RequestHandler):
+	def get(self):
+		user = users.get_current_user()
+		if not user:
+			self.redirect('/login')
+		
+#		fics = db.GqlQuery("Select * From DownloadedFanfic WHERE user = :1 and cleared = :2", user)
+		q = DownloadedFanfic.all()
+		q.filter('user =', user)
+		q.filter('cleared =', False)
+		fics = q.fetch(100)
+		
+		template_values = dict(fics = fics, nickname = user.nickname())
+		path = os.path.join(os.path.dirname(__file__), 'recent.html')
+		self.response.out.write(template.render(path, template_values))
+		
+class RecentAllFilesServer(webapp.RequestHandler):
+	def get(self):
+		user = users.get_current_user()
+		if user.nickname() != 'sigizmund':
+			return
+			
+		fics = db.GqlQuery("Select * From DownloadedFanfic")
+		template_values = dict(fics = fics, nickname = user.nickname())
+		path = os.path.join(os.path.dirname(__file__), 'recent.html')
+		self.response.out.write(template.render(path, template_values))	
+
+class FanfictionDownloader(webapp.RequestHandler):
+	def _printableVersion(self, text):
+		text = removeEntities(text)
+		try:
+			d = text.decode('utf-8')
+		except:
+			d = text
+		return d
+	
+
+	def post(self):
+		logging.getLogger().setLevel(logging.DEBUG)
+		
+		user = users.get_current_user()
+		if not user:
+			self.redirect(users.create_login_url('/'))
+		
+		format = self.request.get('format')
+		url = self.request.get('url')
+		login = self.request.get('login')
+		password = self.request.get('password')
+		
+		logging.info("Downloading: " + url)
+		
+		adapter = None
+		writerClass = None
+
+		download = OneDownload()
+		download.user = user
+		download.url = url
+		download.login = login
+		download.password = password
+		download.format = format
+		logging.info('Creating adapter...')
+		
+		try:
+			if url.find('fictionalley') != -1:
+				adapter = fictionalley.FictionAlley(url)
+			elif url.find('ficwad') != -1:
+				adapter = ficwad.FicWad(url)
+			elif url.find('fanfiction.net') != -1:
+				adapter = ffnet.FFNet(url)
+			elif url.find('fictionpress.com') != -1:
+				adapter = fpcom.FPCom(url)
+			elif url.find('harrypotterfanfiction.com') != -1:
+				adapter = hpfiction.HPFiction(url)
+			elif url.find('twilighted.net') != -1:
+				adapter = twilighted.Twilighted(url)
+			elif url.find('potionsandsnitches.net') != -1:
+				adapter = potionsNsnitches.PotionsNSnitches(url)
+			elif url.find('mediaminer.org') != -1:
+				adapter = mediaminer.MediaMiner(url)
+			else:
+				logging.debug("Bad URL detected")
+				self.redirect('/?error=bad_url&url=' + urlEscape(url) )
+				return
+		except Exception, e:
+			logging.exception(e)
+			download.failure = "Adapter was not created: " + str(e)
+			download.put()
+			
+			self.redirect('/?error=custom&url=' + urlEscape(url) + '&errtext=' + urlEscape(str(traceback.format_exc())) )
+			return
+		
+		logging.info('Created an adaper: %s' % adapter)
+		
+		if len(login) > 1:
+			adapter.setLogin(login)
+			adapter.setPassword(password)
+
+		if format == 'epub':
+			writerClass = output.EPubFanficWriter
+		elif format == 'html':
+			writerClass = output.HTMLWriter
+		else:
+			writerClass = output.TextWriter
+		
+		loader = FanficLoader(adapter, writerClass, quiet = True, inmemory=True, compress=False)
+		try:
+			data = loader.download()
+			
+			if format == 'html' or format == 'text':
+				# data is uncompressed hence huge
+				ext = '.html'
+				if format == 'text':
+					ext = '.txt'
+				logging.debug(data)
+				files = {makeAcceptableFilename(str(adapter.getOutputName())) + ext : StringIO.StringIO(data.decode('utf-8')) }
+				d = inMemoryZip(files)
+				data = d.getvalue()
+			
+		
+		except LoginRequiredException, e:
+			logging.exception(e)
+			download.failure = 'Login problem detected'
+			download.put()
+			
+			self.redirect('/?error=login_required&url=' + urlEscape(url))
+			return
+		except:
+			e = sys.exc_info()[0]
+			
+			logging.exception(e)
+			download.failure = 'Some exception happened in downloader: ' + str(e)
+			download.put()
+			
+			self.redirect('/?error=custom&url=' + urlEscape(url) + '&errtext=' + urlEscape(str(traceback.format_exc())) )
+			return
+			
+		if data == None:
+			if loader.badLogin:
+				logging.debug("Bad login detected")
+				
+				download.failure = 'Login problem detected'
+				download.put()
+				
+				self.redirect('/?error=login_required&url=' + urlEscape(url))
+		else:
+			fic = DownloadedFanfic()
+			fic.user = user
+			fic.url = url
+			fic.format = format
+			fic.name = self._printableVersion(adapter.getOutputName())
+			fic.author = self._printableVersion(adapter.getAuthorName())
+			fic.blob = data
+			
+			try:
+				fic.put()
+				
+				key = fic.key()
+				
+				download.put()
+				self.redirect('/?file='+str(key)+'&name=' + urlEscape(fic.name) + '&author=' + urlEscape(fic.author))
+				
+				logging.info("Download finished OK")
+			except Exception, e:
+				logging.exception(e)
+				# it was too large, won't save it
+				name = str(makeAcceptableFilename(adapter.getStoryName()))
+				if format == 'epub':
+					self.response.headers['Content-Type'] = 'application/epub+zip'
+					self.response.headers['Content-disposition'] = 'attachment; filename=' + name + '.epub'
+				elif format == 'html':
+					self.response.headers['Content-Type'] = 'application/zip'
+					self.response.headers['Content-disposition'] = 'attachment; filename=' + name + '.html.zip'
+				elif format == 'text':
+					self.response.headers['Content-Type'] = 'application/zip'
+					self.response.headers['Content-disposition'] = 'attachment; filename=' + name + '.txt.zip'
+				
+				self.response.out.write(data)
+				
+def toPercentDecimal(match): 
+	"Return the %decimal number for the character for url escaping"
+	s = match.group(1)
+	return "%%%02x" % ord(s)
+
+def urlEscape(data):
+	"Escape text, including unicode, for use in URLs"
+	p = re.compile(r'([^\w])')
+	return p.sub(toPercentDecimal, data.encode("utf-8"))
+
+def main():
+  application = webapp.WSGIApplication([('/', MainHandler), ('/fdown', FanfictionDownloader), ('/file', FileServer), ('/recent', RecentFilesServer), ('/r2d2', RecentAllFilesServer), ('/login', LoginRequired)],
+                                       debug=False)
+  util.run_wsgi_app(application)
+
+
+if __name__ == '__main__':
+	logging.getLogger().setLevel(logging.DEBUG)  # set the root logger to DEBUG before serving
+	main()
diff --git a/queue.yaml b/queue.yaml
new file mode 100644
index 00000000..0bfb85d0
--- /dev/null
+++ b/queue.yaml
@@ -0,0 +1,5 @@
+queue:
+- name: default
+  rate: 1/s
+- name: download
+  rate: 10/s
\ No newline at end of file
diff --git a/recent.html b/recent.html
new file mode 100644
index 00000000..1b199e5e
--- /dev/null
+++ b/recent.html
@@ -0,0 +1,69 @@
+<!DOCTYPE html PUBLIC "-//W3C//DTD HTML 4.01//EN">
+<html>
+	<head>
+		<link href="css/index.css" rel="stylesheet" type="text/css">
+		<title>Fanfiction Downloader (fanfiction.net, fanficauthors, fictionalley, ficwad to epub and HTML)</title>
+		<meta http-equiv="Content-Type" content="text/html; charset=UTF-8">
+	</head>
+	<body>
+		<div id='main'>
+			<h1>
+				<a href="/" style="text-decoration: none; color: black;">FanFiction Downloader</a>
+			</h1>
+			
+			
+			<script type="text/javascript"><!--
+			google_ad_client = "pub-2027714004231956";
+			/* 468x60, created 6/9/10 */
+			google_ad_slot = "8817097473";
+			google_ad_width = 468;
+			google_ad_height = 60;
+			//-->
+			</script>
+			<script type="text/javascript"
+			src="http://pagead2.googlesyndication.com/pagead/show_ads.js">
+			</script>			
+			
+			
+			
+<!--			<div id='yourfile'> -->
+			{{yourfile}}
+<!--			</div> -->
+			
+				<div id='urlbox'>
+					<div id='greeting'>
+						Hi, {{ nickname }}! These are the fanfics you've downloaded previously.
+					</div>
+				</div>
+				
+				<div id='helpbox'>
+					{% for fic in fics %}
+					<p> <a href="/file?id={{ fic.key }}">{{ fic.name }}</a> by {{ fic.author }} ({{ fic.format }})<br/><small><a href="{{ fic.url }}">{{ fic.url }}</a></small></p>
+					{% endfor %}
+				</div>
+				
+				<script type="text/javascript"><!--
+				google_ad_client = "pub-2027714004231956";
+				/* 468x60, created 6/9/10 */
+				google_ad_slot = "2009456648";
+				google_ad_width = 468;
+				google_ad_height = 60;
+				//-->
+				</script>
+				<script type="text/javascript"
+				src="http://pagead2.googlesyndication.com/pagead/show_ads.js">
+				</script>
+				
+				
+		</div>
+		<script type="text/javascript">
+		var gaJsHost = (("https:" == document.location.protocol) ? "https://ssl." : "http://www.");
+		document.write(unescape("%3Cscript src='" + gaJsHost + "google-analytics.com/ga.js' type='text/javascript'%3E%3C/script%3E"));
+		</script>
+		<script type="text/javascript">
+		try {
+		var pageTracker = _gat._getTracker("UA-12136939-1");
+		pageTracker._trackPageview();
+		} catch(err) {}</script>
+	</body>
+</html>
diff --git a/simplejson/__init__.py b/simplejson/__init__.py
new file mode 100644
index 00000000..d5b4d399
--- /dev/null
+++ b/simplejson/__init__.py
@@ -0,0 +1,318 @@
+r"""JSON (JavaScript Object Notation) <http://json.org> is a subset of
+JavaScript syntax (ECMA-262 3rd edition) used as a lightweight data
+interchange format.
+
+:mod:`simplejson` exposes an API familiar to users of the standard library
+:mod:`marshal` and :mod:`pickle` modules. It is the externally maintained
+version of the :mod:`json` library contained in Python 2.6, but maintains
+compatibility with Python 2.4 and Python 2.5 and (currently) has
+significant performance advantages, even without using the optional C
+extension for speedups.
+
+Encoding basic Python object hierarchies::
+
+    >>> import simplejson as json
+    >>> json.dumps(['foo', {'bar': ('baz', None, 1.0, 2)}])
+    '["foo", {"bar": ["baz", null, 1.0, 2]}]'
+    >>> print json.dumps("\"foo\bar")
+    "\"foo\bar"
+    >>> print json.dumps(u'\u1234')
+    "\u1234"
+    >>> print json.dumps('\\')
+    "\\"
+    >>> print json.dumps({"c": 0, "b": 0, "a": 0}, sort_keys=True)
+    {"a": 0, "b": 0, "c": 0}
+    >>> from StringIO import StringIO
+    >>> io = StringIO()
+    >>> json.dump(['streaming API'], io)
+    >>> io.getvalue()
+    '["streaming API"]'
+
+Compact encoding::
+
+    >>> import simplejson as json
+    >>> json.dumps([1,2,3,{'4': 5, '6': 7}], separators=(',',':'))
+    '[1,2,3,{"4":5,"6":7}]'
+
+Pretty printing::
+
+    >>> import simplejson as json
+    >>> s = json.dumps({'4': 5, '6': 7}, sort_keys=True, indent=4)
+    >>> print '\n'.join([l.rstrip() for l in  s.splitlines()])
+    {
+        "4": 5,
+        "6": 7
+    }
+
+Decoding JSON::
+
+    >>> import simplejson as json
+    >>> obj = [u'foo', {u'bar': [u'baz', None, 1.0, 2]}]
+    >>> json.loads('["foo", {"bar":["baz", null, 1.0, 2]}]') == obj
+    True
+    >>> json.loads('"\\"foo\\bar"') == u'"foo\x08ar'
+    True
+    >>> from StringIO import StringIO
+    >>> io = StringIO('["streaming API"]')
+    >>> json.load(io)[0] == 'streaming API'
+    True
+
+Specializing JSON object decoding::
+
+    >>> import simplejson as json
+    >>> def as_complex(dct):
+    ...     if '__complex__' in dct:
+    ...         return complex(dct['real'], dct['imag'])
+    ...     return dct
+    ...
+    >>> json.loads('{"__complex__": true, "real": 1, "imag": 2}',
+    ...     object_hook=as_complex)
+    (1+2j)
+    >>> import decimal
+    >>> json.loads('1.1', parse_float=decimal.Decimal) == decimal.Decimal('1.1')
+    True
+
+Specializing JSON object encoding::
+
+    >>> import simplejson as json
+    >>> def encode_complex(obj):
+    ...     if isinstance(obj, complex):
+    ...         return [obj.real, obj.imag]
+    ...     raise TypeError(repr(obj) + " is not JSON serializable")
+    ...
+    >>> json.dumps(2 + 1j, default=encode_complex)
+    '[2.0, 1.0]'
+    >>> json.JSONEncoder(default=encode_complex).encode(2 + 1j)
+    '[2.0, 1.0]'
+    >>> ''.join(json.JSONEncoder(default=encode_complex).iterencode(2 + 1j))
+    '[2.0, 1.0]'
+
+
+Using simplejson.tool from the shell to validate and pretty-print::
+
+    $ echo '{"json":"obj"}' | python -m simplejson.tool
+    {
+        "json": "obj"
+    }
+    $ echo '{ 1.2:3.4}' | python -m simplejson.tool
+    Expecting property name: line 1 column 2 (char 2)
+"""
+__version__ = '2.0.9'
+__all__ = [
+    'dump', 'dumps', 'load', 'loads',
+    'JSONDecoder', 'JSONEncoder',
+]
+
+__author__ = 'Bob Ippolito <bob@redivi.com>'
+
+from decoder import JSONDecoder
+from encoder import JSONEncoder
+
+_default_encoder = JSONEncoder(  # shared instance that dump() and dumps() reuse when called with all-default options
+    skipkeys=False,
+    ensure_ascii=True,
+    check_circular=True,
+    allow_nan=True,
+    indent=None,
+    separators=None,
+    encoding='utf-8',
+    default=None,
+)
+
+def dump(obj, fp, skipkeys=False, ensure_ascii=True, check_circular=True,
+        allow_nan=True, cls=None, indent=None, separators=None,
+        encoding='utf-8', default=None, **kw):
+    """Serialize ``obj`` as a JSON formatted stream to ``fp`` (a
+    ``.write()``-supporting file-like object).
+
+    If ``skipkeys`` is true then ``dict`` keys that are not basic types
+    (``str``, ``unicode``, ``int``, ``long``, ``float``, ``bool``, ``None``)
+    will be skipped instead of raising a ``TypeError``.
+
+    If ``ensure_ascii`` is false, then the some chunks written to ``fp``
+    may be ``unicode`` instances, subject to normal Python ``str`` to
+    ``unicode`` coercion rules. Unless ``fp.write()`` explicitly
+    understands ``unicode`` (as in ``codecs.getwriter()``) this is likely
+    to cause an error.
+
+    If ``check_circular`` is false, then the circular reference check
+    for container types will be skipped and a circular reference will
+    result in an ``OverflowError`` (or worse).
+
+    If ``allow_nan`` is false, then it will be a ``ValueError`` to
+    serialize out of range ``float`` values (``nan``, ``inf``, ``-inf``)
+    in strict compliance of the JSON specification, instead of using the
+    JavaScript equivalents (``NaN``, ``Infinity``, ``-Infinity``).
+
+    If ``indent`` is a non-negative integer, then JSON array elements and object
+    members will be pretty-printed with that indent level. An indent level
+    of 0 will only insert newlines. ``None`` is the most compact representation.
+
+    If ``separators`` is an ``(item_separator, dict_separator)`` tuple
+    then it will be used instead of the default ``(', ', ': ')`` separators.
+    ``(',', ':')`` is the most compact JSON representation.
+
+    ``encoding`` is the character encoding for str instances, default is UTF-8.
+
+    ``default(obj)`` is a function that should return a serializable version
+    of obj or raise TypeError. The default simply raises TypeError.
+
+    To use a custom ``JSONEncoder`` subclass (e.g. one that overrides the
+    ``.default()`` method to serialize additional types), specify it with
+    the ``cls`` kwarg.
+
+    """
+    # cached encoder
+    if (not skipkeys and ensure_ascii and
+        check_circular and allow_nan and
+        cls is None and indent is None and separators is None and
+        encoding == 'utf-8' and default is None and not kw):
+        iterable = _default_encoder.iterencode(obj)
+    else:
+        if cls is None:
+            cls = JSONEncoder
+        iterable = cls(skipkeys=skipkeys, ensure_ascii=ensure_ascii,
+            check_circular=check_circular, allow_nan=allow_nan, indent=indent,
+            separators=separators, encoding=encoding,
+            default=default, **kw).iterencode(obj)
+    # could accelerate with writelines in some versions of Python, at
+    # a debuggability cost
+    for chunk in iterable:
+        fp.write(chunk)
+
+
+def dumps(obj, skipkeys=False, ensure_ascii=True, check_circular=True,
+        allow_nan=True, cls=None, indent=None, separators=None,
+        encoding='utf-8', default=None, **kw):
+    """Serialize ``obj`` to a JSON formatted ``str``.
+
+    If ``skipkeys`` is false then ``dict`` keys that are not basic types
+    (``str``, ``unicode``, ``int``, ``long``, ``float``, ``bool``, ``None``)
+    will be skipped instead of raising a ``TypeError``.
+
+    If ``ensure_ascii`` is false, then the return value will be a
+    ``unicode`` instance subject to normal Python ``str`` to ``unicode``
+    coercion rules instead of being escaped to an ASCII ``str``.
+
+    If ``check_circular`` is false, then the circular reference check
+    for container types will be skipped and a circular reference will
+    result in an ``OverflowError`` (or worse).
+
+    If ``allow_nan`` is false, then it will be a ``ValueError`` to
+    serialize out of range ``float`` values (``nan``, ``inf``, ``-inf``) in
+    strict compliance of the JSON specification, instead of using the
+    JavaScript equivalents (``NaN``, ``Infinity``, ``-Infinity``).
+
+    If ``indent`` is a non-negative integer, then JSON array elements and
+    object members will be pretty-printed with that indent level. An indent
+    level of 0 will only insert newlines. ``None`` is the most compact
+    representation.
+
+    If ``separators`` is an ``(item_separator, dict_separator)`` tuple
+    then it will be used instead of the default ``(', ', ': ')`` separators.
+    ``(',', ':')`` is the most compact JSON representation.
+
+    ``encoding`` is the character encoding for str instances, default is UTF-8.
+
+    ``default(obj)`` is a function that should return a serializable version
+    of obj or raise TypeError. The default simply raises TypeError.
+
+    To use a custom ``JSONEncoder`` subclass (e.g. one that overrides the
+    ``.default()`` method to serialize additional types), specify it with
+    the ``cls`` kwarg.
+
+    """
+    # cached encoder
+    if (not skipkeys and ensure_ascii and
+        check_circular and allow_nan and
+        cls is None and indent is None and separators is None and
+        encoding == 'utf-8' and default is None and not kw):
+        return _default_encoder.encode(obj)
+    if cls is None:
+        cls = JSONEncoder
+    return cls(
+        skipkeys=skipkeys, ensure_ascii=ensure_ascii,
+        check_circular=check_circular, allow_nan=allow_nan, indent=indent,
+        separators=separators, encoding=encoding, default=default,
+        **kw).encode(obj)
+
+
+_default_decoder = JSONDecoder(encoding=None, object_hook=None)  # shared instance that loads() reuses when called with all-default options
+
+
+def load(fp, encoding=None, cls=None, object_hook=None, parse_float=None,
+        parse_int=None, parse_constant=None, **kw):
+    """Deserialize ``fp`` (a ``.read()``-supporting file-like object containing
+    a JSON document) to a Python object.
+
+    If the contents of ``fp`` is encoded with an ASCII based encoding other
+    than utf-8 (e.g. latin-1), then an appropriate ``encoding`` name must
+    be specified. Encodings that are not ASCII based (such as UCS-2) are
+    not allowed, and should be wrapped with
+    ``codecs.getreader(fp)(encoding)``, or simply decoded to a ``unicode``
+    object and passed to ``loads()``
+
+    ``object_hook`` is an optional function that will be called with the
+    result of any object literal decode (a ``dict``). The return value of
+    ``object_hook`` will be used instead of the ``dict``. This feature
+    can be used to implement custom decoders (e.g. JSON-RPC class hinting).
+
+    To use a custom ``JSONDecoder`` subclass, specify it with the ``cls``
+    kwarg.
+
+    """
+    return loads(fp.read(),
+        encoding=encoding, cls=cls, object_hook=object_hook,
+        parse_float=parse_float, parse_int=parse_int,
+        parse_constant=parse_constant, **kw)
+
+
+def loads(s, encoding=None, cls=None, object_hook=None, parse_float=None,
+        parse_int=None, parse_constant=None, **kw):
+    """Deserialize ``s`` (a ``str`` or ``unicode`` instance containing a JSON
+    document) to a Python object.
+
+    If ``s`` is a ``str`` instance and is encoded with an ASCII based encoding
+    other than utf-8 (e.g. latin-1) then an appropriate ``encoding`` name
+    must be specified. Encodings that are not ASCII based (such as UCS-2)
+    are not allowed and should be decoded to ``unicode`` first.
+
+    ``object_hook`` is an optional function that will be called with the
+    result of any object literal decode (a ``dict``). The return value of
+    ``object_hook`` will be used instead of the ``dict``. This feature
+    can be used to implement custom decoders (e.g. JSON-RPC class hinting).
+
+    ``parse_float``, if specified, will be called with the string
+    of every JSON float to be decoded. By default this is equivalent to
+    float(num_str). This can be used to use another datatype or parser
+    for JSON floats (e.g. decimal.Decimal).
+
+    ``parse_int``, if specified, will be called with the string
+    of every JSON int to be decoded. By default this is equivalent to
+    int(num_str). This can be used to use another datatype or parser
+    for JSON integers (e.g. float).
+
+    ``parse_constant``, if specified, will be called with one of the
+    following strings: -Infinity, Infinity, NaN, null, true, false.
+    This can be used to raise an exception if invalid JSON numbers
+    are encountered.
+
+    To use a custom ``JSONDecoder`` subclass, specify it with the ``cls``
+    kwarg.
+
+    """
+    if (cls is None and encoding is None and object_hook is None and
+            parse_int is None and parse_float is None and
+            parse_constant is None and not kw):
+        return _default_decoder.decode(s)
+    if cls is None:
+        cls = JSONDecoder
+    if object_hook is not None:
+        kw['object_hook'] = object_hook
+    if parse_float is not None:
+        kw['parse_float'] = parse_float
+    if parse_int is not None:
+        kw['parse_int'] = parse_int
+    if parse_constant is not None:
+        kw['parse_constant'] = parse_constant
+    return cls(encoding=encoding, **kw).decode(s)
diff --git a/simplejson/__init__.pyc b/simplejson/__init__.pyc
new file mode 100644
index 0000000000000000000000000000000000000000..f01003d4f81d37513d0f8a2a5fb857b8448ae2bd
GIT binary patch
literal 12071
zcmeHNL37+jc5aXoC5<V`wpPhnPEuV{TLC6J1Wiho9hRuFEorN`sg+zqX}5}`Y6b)J
za3Ep;7!8P|C7!%jANIcgVlVj{xu+`sAvx?Z`QGaWW`?31S@tGXTb4L8Xmt1M?$@v1
z`@RSK=|3;Ge(}dYZiT}ByN2J-@X<FMAtE7m@a>2lM??!ES`^Va5uF#&l87#d{Ux!3
zn-|3n?q3p7OB|dN$$7DJUN}^KM;t7P<bv3_ARKi;M9V^56wzg&P<MsDuk!c1BDx`>
z_xSsL5nU6}&*=IaadGDz>Vo#>kD8f3w86!7@%u|+hsD0O&EIev42oGpIC}l95x%f<
zrIyx+#l_FX@3E|_XH|W`RXp2m??ckj2g^eIdi&8s>HRu*9&Cq2oR{*^@R<rr`7kSk
zGS1SDyfZG#d}DR>na)x_EB5coSj#}_YN%Byvr%iNvp!DC;7EE8?)~QTmG#@}@@5f9
z6~#tUrBx&Y>YT*;<ML3^w~T@^XvJx%if|mH`$~?oViJ^otF<x7qK$!$CwZc1^np}I
zd8QR4r1JAGx8x|8#7P_!vdkoe7aG%%<yc8w25A&v>?9r*L2+zFO@cy?gJgjIku=it
zI6O$yKw_vWQQDVVC9RKys3XiN4U*(oP6A929~HHpV;JbA9?3{Cv$KQAFtd$ioXRhc
z%Q2d-`?tGtSe1<^-3qfw4jm7%gz{J(#^re0_!dvG>H9Gky|5|@m6pkIM~(yC((!&8
zkK!;$OPQ;J^_GT82GMie3ig%mO7&c&EIY&4m5$SWUR##amIR5s*P>;nyd(&aI#(*H
zat-xANW(0m4#PmlVLi9Z*vB|lP;7`Fy|K}1N&LHe7p5`Ev!ayKJ)`|5?KCaejG}6i
zYj4*bWtrQRFWg~JxEs>L@7E|l%u>~rYyL-Fx!yT>+Tp(LZX2!JXx&EZ_J-WW@7E}&
zRg%=LpPoE*o00MYo5q9tX1w+uiP)p=M&`_o*Y~R2y=ra!<}J7G!=?7?JGgs$P20Wi
zX!oKWVi{OuduV?H`aS7N4ITCm)Un=tTvW=8`=ZUYGp)JzNi&a8kxk@wiAC>kJ*qdN
zE;p^>Ol~%<JR_PmuGtpsiY^O<lZBnfA#<O0Wt>eL#+kpb%I85+Dcc=8GuNYyJ!st{
z<Axtm)`;HTNY=XR-J9JP?k!lz$6e{(#_uO5n3Yy}Py}UG=uOY<;{S%*G4phHZKw9F
z_QuEE_U-ltdSF&x7OKQqW6Qw$zTc!YG}ov}d#7h~dfTA3G{R}!yfsyxF-dnXb^T{q
zoO-*7UqE+p?sdrR$%H(H)V|K)6B76v?RBjEzu+yTb4H7TCZ=U9PkzG1lUD1#vZt0j
z`}bQQjy9IKTh+(1vgZ<aUOkvNYK>8`R+21;w0HWLzV4KE<mRTtfGmTo{7hl(J#%FF
z%(~pCa`_M+ee@}O#;d*G<`kS^z|$>j*5=_9?0)o==6&jfOlQ&B&Q%x(N&GdP9*(Wn
zUq*IYzTb{SY6J(`r$~{gBQFZe&IXU>`#zb1j7QS#*Y*9rOZJ0S^Npw>48JN;gr-K)
zu8UKi(D6oxT{oTt`>wUMTDt9o`g&0QZTyAZ@)zxyDZmy>Y$yB_iAQM-mn0mQ>nE-;
z+j;<_oc=h=4mPLjG|KnZe!2c^x(_z8K#vfXoH>s*e+|(CPC={w2y-hpZEGKgf_kw5
zox10_)Xj{;cKG@|d^=x8d&oUiy-yyN{pvo(2+o9CLPho6daF(~oY~7=H1kQxT{=iU
z>DU~}TDwIMYb75a=juUGWQA9#yzsJ){H1IY#!0i%m?)4F+iWmQl#PrKF|T41LD$iD
z4Rgbqf+{ID=htPF=<cpl<VN_OiN$=1=sY~2c%TaJH4=Oy(K7>mhd|eQ&^Hzw1I*0}
zKSO$}^@JhP6u<aomL-zC3IofrN)m#b2!Jt=E5H_@WX@q_g}r-yz<(iCIL@T|qD@n5
zZ?v&T?GsnNl(|8KE0Y<R#KW-0XZ*bBD7h!snPA^YhK|=aZu+<0K<a}dIHr=EQeI@h
ziU@*fFi{%-$f=TRFt((c0HsO~AiMzVYU%T!2-r#gpUZQ&qWv%F78?TJqSMc}*bS8L
zppteNXN`8aDcc>_e~<bvvZ36{^9<1~lXr&M@UsH!;CbxBFWrs*8~;4;HqoOI%@qw<
zUc{F^h;xEOB}j_^V66((4|EvE<rUlr$0|JNhj9^BNl=uRa0|daJM5=G!b>QbSX{Pn
zImHbun2iFO;RRRaXyw!L0$N!E4QW|4!u$CA3qJbK_<Fe@mb0&f^KwyS&+v0jWFdae
zi);@+pqDN2?4rmXp#bJ+3SXcA0%-~#qW~W1h-V8T^H6BjH6Nnz4y0cbPU(nvLA(^=
z8%LZhi}Wd~8rdz>FN%{Tkvir!S~ADQoIrCiB`{sg2xOP$a6!=E7X^)aNnkh(@~yZy
zEC1+2@p4(*e|k-vTox}eHl$ppv7N8}UHlFc-}Xou`VUagwsjdw4hAsn0VoymI*xdT
zzm?#61{TtB84N}_8hHWR@nGN|7C4YzXE0dN6%3+a+Z@G-T1nyqMGg)2+5rn8hqpC?
zfZ6~ch6oyB3^AD$HBlUvxJ%Z7TR|y<La}!<#HEA-)GWt?l(HBMy69A;G1;jpfGC)Y
zBun?r6$cP=IfM%^SHw&P1LHUjV|aogxF!rU$70EQs~{p`NRF4zT7YpH_lrf(tY+4N
z&5A}rq7gQEP3&s2iIU;CN)NOoZGojtHOb4F1jjUinYHjFD1?CdfuJ*!hxSuq)Je_Y
ztP&v1ZbqXDxB;+mVz-4M!%tFhVvP|-`E<vKg(q<cfO^aVD!^QzSU5szIThx?BmhSS
z1JZM-i8k=A7qsmiEEL;_KiY3A2~!ON5P3LNsVHR4YHa?9pRKdn0RZld*xi!`;Td?I
z1h8vrj+6me1(@;tCXzP~<QZb9AxkNgM&zS~VUmNvBjf{MDu*0lF)0s&9D<UlIooY~
z(W}#r%VrW}F25yWRSUB_RL5r=3y^rWFUpf(R|w=lB(pIsVcu|e#!};SWG+_t%9t!B
zO>6_SjB#L0mQp7&_~?TDhn!KM>;Ms%#-y9n0V`o9<)gl;VvG->!xMNIJT&8OrK31S
zV#Cg2TAWjiamz+40qitgN!31*BF_~DFV(&(?1|v%1w{dqSBaYNaI{&*QShWDYBHo8
zP`#(KQ5olx6D;f=%%CzsZY1&L=P8CFqGoQeDCqbjBPUCd{(&A4&}6C(nUncYz3~Kf
zs%VmFqf?^11hbTeKu(~|n(#F8*cFond2oc2ep3Z-g$<gPaaLqm0siyE*gMRa45!p)
zwuu~vja(!eaG3r!q)TF&F_7IMx5^E;o~y~LqWj!hSnX#nXfUV)r&$YiCF}qVsG_0$
z%xYnCY)aNK)$_x6Pagkj<x{I6_;G_O86H~&$x)R8x4<Lu&gpShB~eXg0<36?T&2y-
z)f))QkT{H|K(H?#&!~uT-mz(;r%2h(=rLy%$sbg@L~>;?Aaz(gL;9?SVG_VUddlDT
zC1Qh_Wrmp)aRm1QrC3e-_2OtFCJH&hh`f2d0Jyx!q)FkY*)?_G!TB`8{K!R=<Jtf)
zk1){?b8r|G`*yBV^wJ}^(<2DeBiz&@EYu_1)1&C!Bly(2jIW0tV=IDMWX$Eexaiwi
z_IYn%^VDyOoO|4ZzD)QgTm%pz1aw_4;CGatH99xJl+T(4cRM&_Bt`=f2Vqdjk<Wun
z!C(3_T&+HVzVzxrT)-P=&sXmQ%MP=n)%$dkvwU?F!0CjCYPdQD@T>hk`JsN_&yRZ~
z?rVJX-_cd~s&mD0owjpr;j+_m-pBuC=lbFWvE+obaMD);`~D3DfTHCr1Ka{=8{-G)
zFTfAb-wu9&wG6oX4GIlT`wWE!1KvadFwDTde?$Rj%=GyHg%+g0HxK)^8QnFKE$BOM
zKp$=c^x@gYB11pGH9$XrK0rT!K7PnSLj&|-On^SdeY2p?0=hrLVzyrabg<4>0G)*n
zb3V=Da&urA#E{vOXZ!2KWi~0oF}H~|HLjhaA9BhZU*7<SL03&jKIQW`jGd>2mP19r
zQt2=t%t?EMM<LtywzeRHvF+^M`~;bP2xNlVc{BdXAQP|2z$OHu9|oCN7UL*_k#7x|
zSj?Fy!!W-l(Qlj#1Mi<;lVOuT!6tsX{C^0W2r=~t`t+{ii?d4xE-^gf97&I0!&y+M
z_cN+E1C8~rqvFSgJCsZNSA6u(@g@GLhCA;$1b3DIcHVccI-IC8{(uwlAwfq%j<h<?
zczuG466gm|&=KG88x@2)z9ZqpIj3)(rEQOd=^PmGJ}8j^>&#qDHV8qBGT71omI$hO
zJ7ORE3JXl4EUbtMBAGy7#Xc@KYnjGDW+r$f&zuo%%I2a#Kg_mSYS;u)WQ`D7xsGCO
zhW-VQ3JQ`+&JbF}pMc?|D{Fx2jCfER<dk2<I*}QkV@Q;3l@ss?mPBbIL$y`p%Ln!u
z>8b3M3F~Gyp02_%<=CFw+g@4kP=<>IQ4XJz3o7aY3LxcX7!n3JEHD|%d%5jwB8HTX
zEc__%c=bX-Oz<E9ZvfEy7RO+bl(sPt15265CpLW0fH??|X*L*eBAE8Fc1<&8)wu5F
z)q{CzSF`pI%dxX==#$O4VDEzT*iwGvjfgHJcA`ivVwMJRb_~gz18R6r#Zcb)Db=H%
z#iMI+Bn`$gQUM;J8MWh;3(CB4FPI*`p+bgOGex63<RT0+B-*&r`|_SNba9N-1}v*i
zggiczX4*75)K=5XR|p~L2a9Gh$g7(rgofy`yZM05FOiv<M`N5KH)YI*bLggo3>g8}
z(jz|C!@(7t?B`QTUZF>?Se+8yyFvHpouVEQtG|dZqv`w?KAI*Wu3u%c*7z#&$?U5Z
z;qxdDzQhT5qGj+@ra-i8u`UoT<K#Hy>4}yxX`%wrGH@r;hiKV_*U_?O7)#3*3@tNb
zToTz8bOtp81#`q5CURyFTLr#`ss&qRCS$8W;!w3{tITX{l}YEHvsIV^+B($yTj4a>
zeCv1r15|z9?^4=;PYQDdI_@(^yGhc_xLdeYvR*c?H*>e(A@;08wi%}3LgX;s(C_ky
z?0aG6ukpKY=5|>Uxn9oJ{}8v!lIn*G*6p71x-)KbR<olR8FCwv_=yRgZg8}<s>1tZ
z^&43~xy3qq%(yFxO?cO#37Xx8d7p|GoZz-70r3Kfq2ky+mZD@i0R=d2yGy?Of&v{s
z%Z4q%GRZibgf<%Uj&qvbODkk)%YuUonw<&(2nDbNW3Ti^Bjxbuc<~wxe4ytKoKIzW
zb!@;?=+y)t{+?e^XpE$B&OgH1;o{$F<>>b#t{c)QqhGI_)ldh)!C*f8yxF2D<%(TK
z95fr1(KBBHZN%B}NOwc7)DIrIa(ab_6!m+9=3Ny|TbZOd$NE#7YjVhNLh2|~d``(2
z;}kidI5K+*>!61ZjfWsqRnbeW0C>ip|3YD&g8S+COF7<$Uc*!7Q@h6Y3+656+B|Nj
zxQZvvh_L?;(VcL{6%4Nb0T-g}Iyao_j^Qbnk))mdJoMf}6MjbD?;|Aj`;2Y+eVhMB
znMg;!4+o8F;##<_kZ~_;mDK<*o7*x3R>d^E{VRGF%eaSL37V2UP9XP4Nj;iqufa$j
zN<TJzW2AG(yqJ79gnWGqUrWx?!m_ixxU}%D^X>vlbN??bUIMMVdWXMnUth%ajb-P5
E0OpUxq5uE@

literal 0
HcmV?d00001

diff --git a/simplejson/_speedups.c b/simplejson/_speedups.c
new file mode 100644
index 00000000..23b5f4a6
--- /dev/null
+++ b/simplejson/_speedups.c
@@ -0,0 +1,2329 @@
+#include "Python.h"
+#include "structmember.h"
+#if PY_VERSION_HEX < 0x02060000 && !defined(Py_TYPE) /* Python older than 2.6 that lacks Py_TYPE: supply it */
+#define Py_TYPE(ob)     (((PyObject*)(ob))->ob_type)
+#endif
+#if PY_VERSION_HEX < 0x02050000 && !defined(PY_SSIZE_T_MIN) /* Python older than 2.5: map Py_ssize_t and its helpers onto int */
+typedef int Py_ssize_t;
+#define PY_SSIZE_T_MAX INT_MAX
+#define PY_SSIZE_T_MIN INT_MIN
+#define PyInt_FromSsize_t PyInt_FromLong
+#define PyInt_AsSsize_t PyInt_AsLong
+#endif
+#ifndef Py_IS_FINITE /* fallback definition: finite means neither infinite nor NaN */
+#define Py_IS_FINITE(X) (!Py_IS_INFINITY(X) && !Py_IS_NAN(X))
+#endif
+
+#ifdef __GNUC__ /* UNUSED tags deliberately unused parameters (e.g. self in py_encode_basestring_ascii); empty on non-GNU compilers */
+#define UNUSED __attribute__((__unused__))
+#else
+#define UNUSED
+#endif
+
+#define DEFAULT_ENCODING "utf-8"
+
+#define PyScanner_Check(op) PyObject_TypeCheck(op, &PyScannerType)
+#define PyScanner_CheckExact(op) (Py_TYPE(op) == &PyScannerType)
+#define PyEncoder_Check(op) PyObject_TypeCheck(op, &PyEncoderType)
+#define PyEncoder_CheckExact(op) (Py_TYPE(op) == &PyEncoderType)
+
+static PyTypeObject PyScannerType;
+static PyTypeObject PyEncoderType;
+
+typedef struct _PyScannerObject { /* scanner state; each field is exposed read-only under the same name by scanner_members */
+    PyObject_HEAD
+    PyObject *encoding;
+    PyObject *strict;
+    PyObject *object_hook;
+    PyObject *parse_float;
+    PyObject *parse_int;
+    PyObject *parse_constant;
+} PyScannerObject;
+
+static PyMemberDef scanner_members[] = { /* attribute table: read-only object views of the PyScannerObject fields */
+    {"encoding", T_OBJECT, offsetof(PyScannerObject, encoding), READONLY, "encoding"},
+    {"strict", T_OBJECT, offsetof(PyScannerObject, strict), READONLY, "strict"},
+    {"object_hook", T_OBJECT, offsetof(PyScannerObject, object_hook), READONLY, "object_hook"},
+    {"parse_float", T_OBJECT, offsetof(PyScannerObject, parse_float), READONLY, "parse_float"},
+    {"parse_int", T_OBJECT, offsetof(PyScannerObject, parse_int), READONLY, "parse_int"},
+    {"parse_constant", T_OBJECT, offsetof(PyScannerObject, parse_constant), READONLY, "parse_constant"},
+    {NULL} /* sentinel entry ending the table */
+};
+
+typedef struct _PyEncoderObject { /* encoder state; the PyObject* fields are exposed read-only by encoder_members */
+    PyObject_HEAD
+    PyObject *markers;
+    PyObject *defaultfn; /* exposed under the attribute name "default" */
+    PyObject *encoder;
+    PyObject *indent;
+    PyObject *key_separator;
+    PyObject *item_separator;
+    PyObject *sort_keys;
+    PyObject *skipkeys;
+    int fast_encode; /* plain C int, not listed in encoder_members */
+    int allow_nan; /* plain C int, not listed in encoder_members */
+} PyEncoderObject;
+
+static PyMemberDef encoder_members[] = { /* attribute table: read-only object views of the PyEncoderObject pointer fields */
+    {"markers", T_OBJECT, offsetof(PyEncoderObject, markers), READONLY, "markers"},
+    {"default", T_OBJECT, offsetof(PyEncoderObject, defaultfn), READONLY, "default"}, /* field is named defaultfn in the struct */
+    {"encoder", T_OBJECT, offsetof(PyEncoderObject, encoder), READONLY, "encoder"},
+    {"indent", T_OBJECT, offsetof(PyEncoderObject, indent), READONLY, "indent"},
+    {"key_separator", T_OBJECT, offsetof(PyEncoderObject, key_separator), READONLY, "key_separator"},
+    {"item_separator", T_OBJECT, offsetof(PyEncoderObject, item_separator), READONLY, "item_separator"},
+    {"sort_keys", T_OBJECT, offsetof(PyEncoderObject, sort_keys), READONLY, "sort_keys"},
+    {"skipkeys", T_OBJECT, offsetof(PyEncoderObject, skipkeys), READONLY, "skipkeys"},
+    {NULL} /* sentinel entry ending the table */
+};
+
+static Py_ssize_t
+ascii_escape_char(Py_UNICODE c, char *output, Py_ssize_t chars);
+static PyObject *
+ascii_escape_unicode(PyObject *pystr);
+static PyObject *
+ascii_escape_str(PyObject *pystr);
+static PyObject *
+py_encode_basestring_ascii(PyObject* self UNUSED, PyObject *pystr);
+void init_speedups(void);
+static PyObject *
+scan_once_str(PyScannerObject *s, PyObject *pystr, Py_ssize_t idx, Py_ssize_t *next_idx_ptr);
+static PyObject *
+scan_once_unicode(PyScannerObject *s, PyObject *pystr, Py_ssize_t idx, Py_ssize_t *next_idx_ptr);
+static PyObject *
+_build_rval_index_tuple(PyObject *rval, Py_ssize_t idx);
+static PyObject *
+scanner_new(PyTypeObject *type, PyObject *args, PyObject *kwds);
+static int
+scanner_init(PyObject *self, PyObject *args, PyObject *kwds);
+static void
+scanner_dealloc(PyObject *self);
+static int
+scanner_clear(PyObject *self);
+static PyObject *
+encoder_new(PyTypeObject *type, PyObject *args, PyObject *kwds);
+static int
+encoder_init(PyObject *self, PyObject *args, PyObject *kwds);
+static void
+encoder_dealloc(PyObject *self);
+static int
+encoder_clear(PyObject *self);
+static int
+encoder_listencode_list(PyEncoderObject *s, PyObject *rval, PyObject *seq, Py_ssize_t indent_level);
+static int
+encoder_listencode_obj(PyEncoderObject *s, PyObject *rval, PyObject *obj, Py_ssize_t indent_level);
+static int
+encoder_listencode_dict(PyEncoderObject *s, PyObject *rval, PyObject *dct, Py_ssize_t indent_level);
+static PyObject *
+_encoded_const(PyObject *const);
+static void
+raise_errmsg(char *msg, PyObject *s, Py_ssize_t end);
+static PyObject *
+encoder_encode_string(PyEncoderObject *s, PyObject *obj);
+static int
+_convertPyInt_AsSsize_t(PyObject *o, Py_ssize_t *size_ptr);
+static PyObject *
+_convertPyInt_FromSsize_t(Py_ssize_t *size_ptr);
+static PyObject *
+encoder_encode_float(PyEncoderObject *s, PyObject *obj);
+
+#define S_CHAR(c) (c >= ' ' && c <= '~' && c != '\\' && c != '"') /* true for ' '..'~' except backslash and double quote; the escape functions copy such chars verbatim */
+#define IS_WHITESPACE(c) (((c) == ' ') || ((c) == '\t') || ((c) == '\n') || ((c) == '\r')) /* space, tab, newline or carriage return */
+
+#define MIN_EXPANSION 6 /* length of one "\uXXXX" escape */
+#ifdef Py_UNICODE_WIDE /* wide builds may need a surrogate pair, i.e. two "\uXXXX" escapes per input char */
+#define MAX_EXPANSION (2 * MIN_EXPANSION)
+#else
+#define MAX_EXPANSION MIN_EXPANSION
+#endif
+
+static int
+_convertPyInt_AsSsize_t(PyObject *o, Py_ssize_t *size_ptr)
+{
+    /* PyObject to Py_ssize_t converter in the "O&" argument-parsing style: stores the value in *size_ptr, returns 1 on success and 0 with the exception left set on failure */
+    *size_ptr = PyInt_AsSsize_t(o);
+    if (*size_ptr == -1 && PyErr_Occurred()) /* -1 alone can be a real value; a stray ';' here used to turn this check into a no-op */
+        return 0;
+    return 1;
+}
+
+static PyObject *
+_convertPyInt_FromSsize_t(Py_ssize_t *size_ptr)
+{
+    /* Py_ssize_t to PyObject converter (passed for "O&" in raise_errmsg): boxes the value size_ptr points at */
+    return PyInt_FromSsize_t(size_ptr[0]);
+}
+
+static Py_ssize_t
+ascii_escape_char(Py_UNICODE c, char *output, Py_ssize_t chars)
+{
+    /* Append the backslash escape for code point c to output, starting at
+    index chars, and return the index just past it. The caller must leave
+    at least 12 free bytes: room for a surrogate pair "\uXXXX\uXXXX" */
+    static const char hexdigits[] = "0123456789abcdef";
+    output[chars++] = '\\';
+    switch (c) {
+        case '\\': case '"': output[chars++] = (char)c; break;
+        case '\b': output[chars++] = 'b'; break;
+        case '\f': output[chars++] = 'f'; break;
+        case '\n': output[chars++] = 'n'; break;
+        case '\r': output[chars++] = 'r'; break;
+        case '\t': output[chars++] = 't'; break;
+        default:
+#ifdef Py_UNICODE_WIDE
+            if (c >= 0x10000) {
+                /* Beyond the BMP: emit the high surrogate, then fall through to the low one */
+                Py_UNICODE v = c - 0x10000;
+                c = 0xd800 | ((v >> 10) & 0x3ff);
+                output[chars++] = 'u';
+                output[chars++] = hexdigits[(c >> 12) & 0xf];
+                output[chars++] = hexdigits[(c >>  8) & 0xf];
+                output[chars++] = hexdigits[(c >>  4) & 0xf];
+                output[chars++] = hexdigits[(c      ) & 0xf];
+                c = 0xdc00 | (v & 0x3ff);
+                output[chars++] = '\\';
+            }
+#endif
+            output[chars++] = 'u';
+            output[chars++] = hexdigits[(c >> 12) & 0xf];
+            output[chars++] = hexdigits[(c >>  8) & 0xf];
+            output[chars++] = hexdigits[(c >>  4) & 0xf];
+            output[chars++] = hexdigits[(c      ) & 0xf];
+    }
+    return chars;
+}
+
+static PyObject *
+ascii_escape_unicode(PyObject *pystr)
+{
+    /* Take a PyUnicode pystr and return a new double-quoted, ASCII-only escaped PyString (NULL if allocating or resizing the result fails) */
+    Py_ssize_t i;
+    Py_ssize_t input_chars;
+    Py_ssize_t output_size;
+    Py_ssize_t max_output_size;
+    Py_ssize_t chars; /* number of bytes written to output so far */
+    PyObject *rval;
+    char *output;
+    Py_UNICODE *input_unicode;
+
+    input_chars = PyUnicode_GET_SIZE(pystr);
+    input_unicode = PyUnicode_AS_UNICODE(pystr);
+
+    /* One char input can be up to 6 chars output, estimate 4 of these */
+    output_size = 2 + (MIN_EXPANSION * 4) + input_chars; /* the 2 covers the opening and closing quotes */
+    max_output_size = 2 + (input_chars * MAX_EXPANSION); /* both quotes plus every char at worst-case expansion */
+    rval = PyString_FromStringAndSize(NULL, output_size);
+    if (rval == NULL) {
+        return NULL;
+    }
+    output = PyString_AS_STRING(rval);
+    chars = 0;
+    output[chars++] = '"';
+    for (i = 0; i < input_chars; i++) {
+        Py_UNICODE c = input_unicode[i];
+        if (S_CHAR(c)) {
+            output[chars++] = (char)c; /* safe char: copied as-is */
+        }
+        else {
+            chars = ascii_escape_char(c, output, chars);
+        }
+        if (output_size - chars < (1 + MAX_EXPANSION)) { /* fewer than 1 + MAX_EXPANSION bytes left: grow before the next char */
+            /* There's more than four, so let's resize by a lot */
+            Py_ssize_t new_output_size = output_size * 2;
+            /* This is an upper bound */
+            if (new_output_size > max_output_size) {
+                new_output_size = max_output_size;
+            }
+            /* Make sure that the output size changed before resizing */
+            if (new_output_size != output_size) {
+                output_size = new_output_size;
+                if (_PyString_Resize(&rval, output_size) == -1) {
+                    return NULL;
+                }
+                output = PyString_AS_STRING(rval); /* re-fetch the buffer pointer after the resize */
+            }
+        }
+    }
+    output[chars++] = '"';
+    if (_PyString_Resize(&rval, chars) == -1) { /* final resize to the number of bytes actually written */
+        return NULL;
+    }
+    return rval;
+}
+
+static PyObject *
+ascii_escape_str(PyObject *pystr)
+{
+    /* Take a PyString pystr and return a new double-quoted, ASCII-only escaped PyString (NULL on failure); input with bytes above 0x7f is decoded as UTF-8 and handed to ascii_escape_unicode */
+    Py_ssize_t i;
+    Py_ssize_t input_chars;
+    Py_ssize_t output_size;
+    Py_ssize_t chars; /* number of bytes written to output so far */
+    PyObject *rval;
+    char *output;
+    char *input_str;
+
+    input_chars = PyString_GET_SIZE(pystr);
+    input_str = PyString_AS_STRING(pystr);
+
+    /* Fast path for a string that's already ASCII */
+    for (i = 0; i < input_chars; i++) {
+        Py_UNICODE c = (Py_UNICODE)(unsigned char)input_str[i];
+        if (!S_CHAR(c)) {
+            /* If we have to escape something, scan the string for unicode */
+            Py_ssize_t j;
+            for (j = i; j < input_chars; j++) {
+                c = (Py_UNICODE)(unsigned char)input_str[j];
+                if (c > 0x7f) {
+                    /* We hit a non-ASCII character, bail to unicode mode */
+                    PyObject *uni;
+                    uni = PyUnicode_DecodeUTF8(input_str, input_chars, "strict"); /* the whole input is decoded, not just the tail */
+                    if (uni == NULL) {
+                        return NULL;
+                    }
+                    rval = ascii_escape_unicode(uni);
+                    Py_DECREF(uni); /* the temporary unicode object is no longer needed */
+                    return rval;
+                }
+            }
+            break; /* leave with i at the first char that needs escaping */
+        }
+    }
+
+    if (i == input_chars) {
+        /* Input is already ASCII */
+        output_size = 2 + input_chars; /* exact size: the input plus both quotes */
+    }
+    else {
+        /* One char input can be up to 6 chars output, estimate 4 of these */
+        output_size = 2 + (MIN_EXPANSION * 4) + input_chars;
+    }
+    rval = PyString_FromStringAndSize(NULL, output_size);
+    if (rval == NULL) {
+        return NULL;
+    }
+    output = PyString_AS_STRING(rval);
+    output[0] = '"';
+
+    /* We know that everything up to i is ASCII already */
+    chars = i + 1; /* the opening quote plus the i bytes copied verbatim below */
+    memcpy(&output[1], input_str, i);
+
+    for (; i < input_chars; i++) {
+        Py_UNICODE c = (Py_UNICODE)(unsigned char)input_str[i];
+        if (S_CHAR(c)) {
+            output[chars++] = (char)c; /* safe char: copied as-is */
+        }
+        else {
+            chars = ascii_escape_char(c, output, chars);
+        }
+        /* An ASCII char can't possibly expand to a surrogate! */
+        if (output_size - chars < (1 + MIN_EXPANSION)) {
+            /* There's more than four, so let's resize by a lot */
+            output_size *= 2;
+            if (output_size > 2 + (input_chars * MIN_EXPANSION)) {
+                output_size = 2 + (input_chars * MIN_EXPANSION); /* cap at both quotes plus every char escaped as \uXXXX */
+            }
+            if (_PyString_Resize(&rval, output_size) == -1) {
+                return NULL;
+            }
+            output = PyString_AS_STRING(rval); /* re-fetch the buffer pointer after the resize */
+        }
+    }
+    output[chars++] = '"';
+    if (_PyString_Resize(&rval, chars) == -1) { /* final resize to the number of bytes actually written */
+        return NULL;
+    }
+    return rval;
+}
+
+static void
+raise_errmsg(char *msg, PyObject *s, Py_ssize_t end)
+{
+    /* Set a ValueError whose value is simplejson.decoder.errmsg(msg, s, end).
+    No ValueError is set here if looking up or calling errmsg fails. */
+    static PyObject *errmsg_fn = NULL;  /* looked up once, then reused */
+    PyObject *text;
+    if (!errmsg_fn) {
+        PyObject *mod = PyImport_ImportModule("simplejson.decoder");
+        if (!mod)
+            return;
+        errmsg_fn = PyObject_GetAttrString(mod, "errmsg");
+        Py_DECREF(mod);
+        if (!errmsg_fn)
+            return;
+    }
+    text = PyObject_CallFunction(errmsg_fn, "(zOO&)", msg, s, _convertPyInt_FromSsize_t, &end);
+    if (text == NULL)
+        return;
+    PyErr_SetObject(PyExc_ValueError, text);
+    Py_DECREF(text);
+}
+
+static PyObject *
+join_list_unicode(PyObject *lst)
+{
+    /* Equivalent of u''.join(lst); the bound join method is cached */
+    static PyObject *joinfn = NULL;
+    if (!joinfn) {
+        PyObject *empty = PyUnicode_FromUnicode(NULL, 0);
+        if (!empty)
+            return NULL;
+        /* keep only the bound method, not the empty string itself */
+        joinfn = PyObject_GetAttrString(empty, "join");
+        Py_DECREF(empty);
+        if (!joinfn)
+            return NULL;
+    }
+    return PyObject_CallFunctionObjArgs(joinfn, lst, NULL);
+}
+
+static PyObject *
+join_list_string(PyObject *lst)
+{
+    /* Equivalent of ''.join(lst); the bound join method is cached */
+    static PyObject *joinfn = NULL;
+    if (!joinfn) {
+        PyObject *empty = PyString_FromStringAndSize(NULL, 0);
+        if (!empty)
+            return NULL;
+        /* keep only the bound method, not the empty string itself */
+        joinfn = PyObject_GetAttrString(empty, "join");
+        Py_DECREF(empty);
+        if (!joinfn)
+            return NULL;
+    }
+    return PyObject_CallFunctionObjArgs(joinfn, lst, NULL);
+}
+
+static PyObject *
+_build_rval_index_tuple(PyObject *rval, Py_ssize_t idx) {
+    /* Build the 2-tuple (rval, idx).
+    The reference to rval is consumed on success and on failure alike.
+    A NULL rval is passed straight through as NULL. */
+    PyObject *pair;
+    PyObject *index_obj;
+    if (!rval)
+        return NULL;
+
+    index_obj = PyInt_FromSsize_t(idx);
+    if (!index_obj) {
+        Py_DECREF(rval);
+        return NULL;
+    }
+    pair = PyTuple_New(2);
+    if (pair != NULL) {
+        /* the tuple takes over both references */
+        PyTuple_SET_ITEM(pair, 0, rval);
+        PyTuple_SET_ITEM(pair, 1, index_obj);
+        return pair;
+    }
+    Py_DECREF(index_obj);
+    Py_DECREF(rval);
+    return NULL;
+}
+
+static PyObject *
+scanstring_str(PyObject *pystr, Py_ssize_t end, char *encoding, int strict, Py_ssize_t *next_end_ptr)
+{
+    /* Read the JSON string from PyString pystr.
+    end is the index of the first character after the quote.
+    encoding is the encoding of pystr (must be an ASCII superset)
+    if strict is zero then literal control characters are allowed
+    *next_end_ptr is a return-by-reference index of the character
+        after the end quote, or -1 on failure
+
+    Return value is a new PyString (if ASCII-only) or PyUnicode; NULL on error
+    */
+    PyObject *rval;
+    Py_ssize_t len = PyString_GET_SIZE(pystr);
+    Py_ssize_t begin = end - 1;  /* index of the opening quote, used in error messages */
+    Py_ssize_t next = begin;
+    int has_unicode = 0;  /* sticky: set once a byte or escape above 0x7f has been seen */
+    char *buf = PyString_AS_STRING(pystr);
+    PyObject *chunks = PyList_New(0);  /* decoded pieces, joined at the end */
+    if (chunks == NULL) {
+        goto bail;
+    }
+    if (end < 0 || len <= end) {
+        PyErr_SetString(PyExc_ValueError, "end is out of bounds");
+        goto bail;
+    }
+    while (1) {
+        /* Find the end of the string or the next escape */
+        Py_UNICODE c = 0;
+        PyObject *chunk = NULL;
+        for (next = end; next < len; next++) {
+            c = (unsigned char)buf[next];
+            if (c == '"' || c == '\\') {
+                break;
+            }
+            else if (strict && c <= 0x1f) {
+                raise_errmsg("Invalid control character at", pystr, next);
+                goto bail;
+            }
+            else if (c > 0x7f) {
+                has_unicode = 1;
+            }
+        }
+        /* Ran off the end of the buffer without finding a quote or backslash */
+        if (!(c == '"' || c == '\\')) {
+            raise_errmsg("Unterminated string starting at", pystr, begin);
+            goto bail;
+        }
+        /* Pick up this chunk if it's not zero length */
+        if (next != end) {
+            PyObject *strchunk = PyString_FromStringAndSize(&buf[end], next - end);
+            if (strchunk == NULL) {
+                goto bail;
+            }
+            if (has_unicode) {
+                chunk = PyUnicode_FromEncodedObject(strchunk, encoding, NULL);
+                Py_DECREF(strchunk);
+                if (chunk == NULL) {
+                    goto bail;
+                }
+            }
+            else {
+                chunk = strchunk;
+            }
+            if (PyList_Append(chunks, chunk)) {
+                Py_DECREF(chunk);
+                goto bail;
+            }
+            Py_DECREF(chunk);
+        }
+        next++;
+        if (c == '"') {
+            end = next;
+            break;
+        }
+        if (next == len) {
+            raise_errmsg("Unterminated string starting at", pystr, begin);
+            goto bail;
+        }
+        c = buf[next];
+        if (c != 'u') {
+            /* Non-unicode backslash escapes */
+            end = next + 1;
+            switch (c) {
+                case '"': break;
+                case '\\': break;
+                case '/': break;
+                case 'b': c = '\b'; break;
+                case 'f': c = '\f'; break;
+                case 'n': c = '\n'; break;
+                case 'r': c = '\r'; break;
+                case 't': c = '\t'; break;
+                default: c = 0;
+            }
+            if (c == 0) {
+                raise_errmsg("Invalid \\escape", pystr, end - 2);
+                goto bail;
+            }
+        }
+        else {
+            c = 0;
+            next++;
+            end = next + 4;
+            if (end >= len) {
+                raise_errmsg("Invalid \\uXXXX escape", pystr, next - 1);
+                goto bail;
+            }
+            /* Decode 4 hex digits */
+            for (; next < end; next++) {
+                Py_UNICODE digit = buf[next];
+                c <<= 4;
+                switch (digit) {
+                    case '0': case '1': case '2': case '3': case '4':
+                    case '5': case '6': case '7': case '8': case '9':
+                        c |= (digit - '0'); break;
+                    case 'a': case 'b': case 'c': case 'd': case 'e':
+                    case 'f':
+                        c |= (digit - 'a' + 10); break;
+                    case 'A': case 'B': case 'C': case 'D': case 'E':
+                    case 'F':
+                        c |= (digit - 'A' + 10); break;
+                    default:
+                        raise_errmsg("Invalid \\uXXXX escape", pystr, end - 5);
+                        goto bail;
+                }
+            }
+#ifdef Py_UNICODE_WIDE
+            /* Surrogate pair */
+            if ((c & 0xfc00) == 0xd800) {
+                Py_UNICODE c2 = 0;
+                if (end + 6 >= len) {
+                    raise_errmsg("Unpaired high surrogate", pystr, end - 5);
+                    goto bail;
+                }
+                if (buf[next++] != '\\' || buf[next++] != 'u') {
+                    raise_errmsg("Unpaired high surrogate", pystr, end - 5);
+                    goto bail;
+                }
+                end += 6;
+                /* Decode 4 hex digits (declaration first, as C89 requires) */
+                for (; next < end; next++) {
+                    Py_UNICODE digit = buf[next];
+                    c2 <<= 4;
+                    switch (digit) {
+                        case '0': case '1': case '2': case '3': case '4':
+                        case '5': case '6': case '7': case '8': case '9':
+                            c2 |= (digit - '0'); break;
+                        case 'a': case 'b': case 'c': case 'd': case 'e':
+                        case 'f':
+                            c2 |= (digit - 'a' + 10); break;
+                        case 'A': case 'B': case 'C': case 'D': case 'E':
+                        case 'F':
+                            c2 |= (digit - 'A' + 10); break;
+                        default:
+                            raise_errmsg("Invalid \\uXXXX escape", pystr, end - 5);
+                            goto bail;
+                    }
+                }
+                if ((c2 & 0xfc00) != 0xdc00) {
+                    raise_errmsg("Unpaired high surrogate", pystr, end - 5);
+                    goto bail;
+                }
+                c = 0x10000 + (((c - 0xd800) << 10) | (c2 - 0xdc00));
+            }
+            else if ((c & 0xfc00) == 0xdc00) {
+                raise_errmsg("Unpaired low surrogate", pystr, end - 5);
+                goto bail;
+            }
+#endif
+        }
+        if (c > 0x7f) {
+            has_unicode = 1;
+        }
+        /* Append the unescaped character as unicode or as a one-byte str */
+        if (has_unicode) {
+            chunk = PyUnicode_FromUnicode(&c, 1);
+            if (chunk == NULL) {
+                goto bail;
+            }
+        }
+        else {
+            char c_char = Py_CHARMASK(c);
+            chunk = PyString_FromStringAndSize(&c_char, 1);
+            if (chunk == NULL) {
+                goto bail;
+            }
+        }
+        if (PyList_Append(chunks, chunk)) {
+            Py_DECREF(chunk);
+            goto bail;
+        }
+        Py_DECREF(chunk);
+    }
+
+    rval = join_list_string(chunks);
+    if (rval == NULL) {
+        goto bail;
+    }
+    Py_CLEAR(chunks);
+    *next_end_ptr = end;
+    return rval;
+bail:
+    *next_end_ptr = -1;
+    Py_XDECREF(chunks);
+    return NULL;
+}
+
+
+static PyObject *
+scanstring_unicode(PyObject *pystr, Py_ssize_t end, int strict, Py_ssize_t *next_end_ptr)
+{
+    /* Read the JSON string from PyUnicode pystr.
+    end is the index of the first character after the quote.
+    if strict is zero then literal control characters are allowed
+    *next_end_ptr is a return-by-reference index of the character
+        after the end quote, or -1 on failure
+
+    Return value is a new PyUnicode; NULL on error
+    */
+    PyObject *rval;
+    Py_ssize_t len = PyUnicode_GET_SIZE(pystr);
+    Py_ssize_t begin = end - 1;  /* index of the opening quote, used in error messages */
+    Py_ssize_t next = begin;
+    const Py_UNICODE *buf = PyUnicode_AS_UNICODE(pystr);
+    PyObject *chunks = PyList_New(0);  /* decoded pieces, joined at the end */
+    if (chunks == NULL) {
+        goto bail;
+    }
+    if (end < 0 || len <= end) {
+        PyErr_SetString(PyExc_ValueError, "end is out of bounds");
+        goto bail;
+    }
+    while (1) {
+        /* Find the end of the string or the next escape */
+        Py_UNICODE c = 0;
+        PyObject *chunk = NULL;
+        for (next = end; next < len; next++) {
+            c = buf[next];
+            if (c == '"' || c == '\\') {
+                break;
+            }
+            else if (strict && c <= 0x1f) {
+                raise_errmsg("Invalid control character at", pystr, next);
+                goto bail;
+            }
+        }
+        /* Ran off the end of the buffer without finding a quote or backslash */
+        if (!(c == '"' || c == '\\')) {
+            raise_errmsg("Unterminated string starting at", pystr, begin);
+            goto bail;
+        }
+        /* Pick up this chunk if it's not zero length */
+        if (next != end) {
+            chunk = PyUnicode_FromUnicode(&buf[end], next - end);
+            if (chunk == NULL) {
+                goto bail;
+            }
+            if (PyList_Append(chunks, chunk)) {
+                Py_DECREF(chunk);
+                goto bail;
+            }
+            Py_DECREF(chunk);
+        }
+        next++;
+        if (c == '"') {
+            end = next;
+            break;
+        }
+        if (next == len) {
+            raise_errmsg("Unterminated string starting at", pystr, begin);
+            goto bail;
+        }
+        c = buf[next];
+        if (c != 'u') {
+            /* Non-unicode backslash escapes */
+            end = next + 1;
+            switch (c) {
+                case '"': break;
+                case '\\': break;
+                case '/': break;
+                case 'b': c = '\b'; break;
+                case 'f': c = '\f'; break;
+                case 'n': c = '\n'; break;
+                case 'r': c = '\r'; break;
+                case 't': c = '\t'; break;
+                default: c = 0;
+            }
+            if (c == 0) {
+                raise_errmsg("Invalid \\escape", pystr, end - 2);
+                goto bail;
+            }
+        }
+        else {
+            c = 0;
+            next++;
+            end = next + 4;
+            if (end >= len) {
+                raise_errmsg("Invalid \\uXXXX escape", pystr, next - 1);
+                goto bail;
+            }
+            /* Decode 4 hex digits */
+            for (; next < end; next++) {
+                Py_UNICODE digit = buf[next];
+                c <<= 4;
+                switch (digit) {
+                    case '0': case '1': case '2': case '3': case '4':
+                    case '5': case '6': case '7': case '8': case '9':
+                        c |= (digit - '0'); break;
+                    case 'a': case 'b': case 'c': case 'd': case 'e':
+                    case 'f':
+                        c |= (digit - 'a' + 10); break;
+                    case 'A': case 'B': case 'C': case 'D': case 'E':
+                    case 'F':
+                        c |= (digit - 'A' + 10); break;
+                    default:
+                        raise_errmsg("Invalid \\uXXXX escape", pystr, end - 5);
+                        goto bail;
+                }
+            }
+#ifdef Py_UNICODE_WIDE
+            /* Surrogate pair */
+            if ((c & 0xfc00) == 0xd800) {
+                Py_UNICODE c2 = 0;
+                if (end + 6 >= len) {
+                    raise_errmsg("Unpaired high surrogate", pystr, end - 5);
+                    goto bail;
+                }
+                if (buf[next++] != '\\' || buf[next++] != 'u') {
+                    raise_errmsg("Unpaired high surrogate", pystr, end - 5);
+                    goto bail;
+                }
+                end += 6;
+                /* Decode 4 hex digits (declaration first, as C89 requires) */
+                for (; next < end; next++) {
+                    Py_UNICODE digit = buf[next];
+                    c2 <<= 4;
+                    switch (digit) {
+                        case '0': case '1': case '2': case '3': case '4':
+                        case '5': case '6': case '7': case '8': case '9':
+                            c2 |= (digit - '0'); break;
+                        case 'a': case 'b': case 'c': case 'd': case 'e':
+                        case 'f':
+                            c2 |= (digit - 'a' + 10); break;
+                        case 'A': case 'B': case 'C': case 'D': case 'E':
+                        case 'F':
+                            c2 |= (digit - 'A' + 10); break;
+                        default:
+                            raise_errmsg("Invalid \\uXXXX escape", pystr, end - 5);
+                            goto bail;
+                    }
+                }
+                if ((c2 & 0xfc00) != 0xdc00) {
+                    raise_errmsg("Unpaired high surrogate", pystr, end - 5);
+                    goto bail;
+                }
+                c = 0x10000 + (((c - 0xd800) << 10) | (c2 - 0xdc00));
+            }
+            else if ((c & 0xfc00) == 0xdc00) {
+                raise_errmsg("Unpaired low surrogate", pystr, end - 5);
+                goto bail;
+            }
+#endif
+        }
+        chunk = PyUnicode_FromUnicode(&c, 1);  /* the single unescaped character */
+        if (chunk == NULL) {
+            goto bail;
+        }
+        if (PyList_Append(chunks, chunk)) {
+            Py_DECREF(chunk);
+            goto bail;
+        }
+        Py_DECREF(chunk);
+    }
+
+    rval = join_list_unicode(chunks);
+    if (rval == NULL) {
+        goto bail;
+    }
+    Py_DECREF(chunks);
+    *next_end_ptr = end;
+    return rval;
+bail:
+    *next_end_ptr = -1;
+    Py_XDECREF(chunks);
+    return NULL;
+}
+
+PyDoc_STRVAR(pydoc_scanstring,
+    "scanstring(basestring, end, encoding, strict=True) -> (str, end)\n"
+    "\n"
+    "Scan the string s for a JSON string. End is the index of the\n"
+    "character in s after the quote that started the JSON string.\n"
+    "Unescapes all valid JSON string escape sequences and raises ValueError\n"
+    "on attempt to decode an invalid string. If strict is False then literal\n"
+    "control characters are allowed in the string.\n"
+    "\n"
+    "Returns a tuple of the decoded string and the index of the character in s\n"
+    "after the end quote."
+);
+
+static PyObject *
+py_scanstring(PyObject* self UNUSED, PyObject *args)
+{
+    /* Python entry point: dispatch on the type of the first argument and
+    return the (decoded string, index after the end quote) tuple */
+    PyObject *pystr;
+    PyObject *decoded;
+    Py_ssize_t end;
+    Py_ssize_t after_quote = -1;
+    char *encoding = NULL;
+    int strict = 1;
+    if (!PyArg_ParseTuple(args, "OO&|zi:scanstring", &pystr, _convertPyInt_AsSsize_t, &end, &encoding, &strict))
+        return NULL;
+    if (!encoding)
+        encoding = DEFAULT_ENCODING;
+
+    if (PyString_Check(pystr))
+        decoded = scanstring_str(pystr, end, encoding, strict, &after_quote);
+    else if (PyUnicode_Check(pystr))
+        decoded = scanstring_unicode(pystr, end, strict, &after_quote);
+    else {
+        PyErr_Format(PyExc_TypeError,
+                     "first argument must be a string, not %.80s",
+                     Py_TYPE(pystr)->tp_name);
+        return NULL;
+    }
+    /* a NULL result from the scanner comes back out of the helper as NULL */
+    return _build_rval_index_tuple(decoded, after_quote);
+}
+
+PyDoc_STRVAR(pydoc_encode_basestring_ascii,
+    "encode_basestring_ascii(basestring) -> str\n"
+    "\n"
+    "Return an ASCII-only JSON representation of a Python string"
+);
+
+static PyObject *
+py_encode_basestring_ascii(PyObject* self UNUSED, PyObject *pystr)
+{
+    /* METH_O entry point: pystr is the single argument.
+    Dispatches to the str or unicode escaper; TypeError for anything else. */
+    if (PyString_Check(pystr)) {
+        return ascii_escape_str(pystr);
+    }
+    if (PyUnicode_Check(pystr)) {
+        return ascii_escape_unicode(pystr);
+    }
+
+    /* neither str nor unicode */
+    PyErr_Format(PyExc_TypeError,
+                 "first argument must be a string, not %.80s",
+                 Py_TYPE(pystr)->tp_name);
+    return NULL;
+}
+
+static void
+scanner_dealloc(PyObject *self)
+{
+    /* Destructor: drop the held references, then free self via its type's tp_free */
+    (void)scanner_clear(self);
+    Py_TYPE(self)->tp_free(self);
+}
+
+static int
+scanner_traverse(PyObject *self, visitproc visit, void *arg)
+{
+    /* Report every object reference held by the scanner to the visit callback */
+    PyScannerObject *scanner = (PyScannerObject *)self;
+    assert(PyScanner_Check(self));
+    Py_VISIT(scanner->encoding);
+    Py_VISIT(scanner->strict);
+    Py_VISIT(scanner->object_hook);
+    Py_VISIT(scanner->parse_float);
+    Py_VISIT(scanner->parse_int);
+    Py_VISIT(scanner->parse_constant);
+    return 0;
+}
+
+static int
+scanner_clear(PyObject *self)
+{
+    /* Release every object reference held by the scanner; always returns 0 */
+    PyScannerObject *scanner = (PyScannerObject *)self;
+    assert(PyScanner_Check(self));
+    Py_CLEAR(scanner->encoding);
+    Py_CLEAR(scanner->strict);
+    Py_CLEAR(scanner->object_hook);
+    Py_CLEAR(scanner->parse_float);
+    Py_CLEAR(scanner->parse_int);
+    Py_CLEAR(scanner->parse_constant);
+    return 0;
+}
+
+static PyObject *
+_parse_object_str(PyScannerObject *s, PyObject *pystr, Py_ssize_t idx, Py_ssize_t *next_idx_ptr) {
+    /* Read a JSON object from PyString pystr.
+    idx is the index of the first character after the opening curly brace.
+    *next_idx_ptr is a return-by-reference index to the first character after
+        the closing curly brace; it is written only on success.
+
+    Returns a new PyObject (usually a dict, but object_hook can change that),
+    or NULL on error */
+    char *str = PyString_AS_STRING(pystr);
+    Py_ssize_t end_idx = PyString_GET_SIZE(pystr) - 1;  /* index of the last character */
+    PyObject *rval = PyDict_New();
+    PyObject *key = NULL;
+    PyObject *val = NULL;
+    char *encoding = PyString_AS_STRING(s->encoding);
+    int strict = PyObject_IsTrue(s->strict);  /* NOTE(review): a -1 error result is not checked here */
+    Py_ssize_t next_idx;
+    if (rval == NULL)
+        return NULL;
+
+    /* skip whitespace after { */
+    while (idx <= end_idx && IS_WHITESPACE(str[idx])) idx++;
+
+    /* only loop if the object is non-empty */
+    if (idx <= end_idx && str[idx] != '}') {
+        while (idx <= end_idx) {
+            /* read key, which must start with a double quote */
+            if (str[idx] != '"') {
+                raise_errmsg("Expecting property name", pystr, idx);
+                goto bail;
+            }
+            key = scanstring_str(pystr, idx + 1, encoding, strict, &next_idx);
+            if (key == NULL)
+                goto bail;
+            idx = next_idx;
+
+            /* skip whitespace between key and : delimiter, read :, skip whitespace */
+            while (idx <= end_idx && IS_WHITESPACE(str[idx])) idx++;
+            if (idx > end_idx || str[idx] != ':') {
+                raise_errmsg("Expecting : delimiter", pystr, idx);
+                goto bail;
+            }
+            idx++;
+            while (idx <= end_idx && IS_WHITESPACE(str[idx])) idx++;
+
+            /* read any JSON data type */
+            val = scan_once_str(s, pystr, idx, &next_idx);
+            if (val == NULL)
+                goto bail;
+
+            if (PyDict_SetItem(rval, key, val) == -1)
+                goto bail;
+
+            Py_CLEAR(key);  /* drop our references to the pair just stored */
+            Py_CLEAR(val);
+            idx = next_idx;
+
+            /* skip whitespace before } or , */
+            while (idx <= end_idx && IS_WHITESPACE(str[idx])) idx++;
+
+            /* bail if the object is closed or we didn't get the , delimiter */
+            if (idx > end_idx) break;
+            if (str[idx] == '}') {
+                break;
+            }
+            else if (str[idx] != ',') {
+                raise_errmsg("Expecting , delimiter", pystr, idx);
+                goto bail;
+            }
+            idx++;
+
+            /* skip whitespace after , delimiter */
+            while (idx <= end_idx && IS_WHITESPACE(str[idx])) idx++;
+        }
+    }
+    /* verify that idx <= end_idx, str[idx] should be '}' */
+    if (idx > end_idx || str[idx] != '}') {
+        raise_errmsg("Expecting object", pystr, end_idx);
+        goto bail;
+    }
+    /* if object_hook is not None: rval = object_hook(rval) */
+    if (s->object_hook != Py_None) {
+        val = PyObject_CallFunctionObjArgs(s->object_hook, rval, NULL);
+        if (val == NULL)
+            goto bail;
+        Py_DECREF(rval);  /* the hook's result replaces the dict */
+        rval = val;
+        val = NULL;
+    }
+    *next_idx_ptr = idx + 1;
+    return rval;
+bail:
+    Py_XDECREF(key);  /* key and val may still be NULL here */
+    Py_XDECREF(val);
+    Py_DECREF(rval);
+    return NULL;
+}
+
+static PyObject *
+_parse_object_unicode(PyScannerObject *s, PyObject *pystr, Py_ssize_t idx, Py_ssize_t *next_idx_ptr) {
+    /* Read a JSON object from PyUnicode pystr.
+    idx is the index of the first character after the opening curly brace.
+    *next_idx_ptr is a return-by-reference index to the first character after
+        the closing curly brace; it is written only on success.
+
+    Returns a new PyObject (usually a dict, but object_hook can change that),
+    or NULL on error */
+    Py_UNICODE *str = PyUnicode_AS_UNICODE(pystr);
+    Py_ssize_t end_idx = PyUnicode_GET_SIZE(pystr) - 1;  /* index of the last character */
+    PyObject *val = NULL;
+    PyObject *rval = PyDict_New();
+    PyObject *key = NULL;
+    int strict = PyObject_IsTrue(s->strict);  /* NOTE(review): a -1 error result is not checked here */
+    Py_ssize_t next_idx;
+    if (rval == NULL)
+        return NULL;
+
+    /* skip whitespace after { */
+    while (idx <= end_idx && IS_WHITESPACE(str[idx])) idx++;
+
+    /* only loop if the object is non-empty */
+    if (idx <= end_idx && str[idx] != '}') {
+        while (idx <= end_idx) {
+            /* read key, which must start with a double quote */
+            if (str[idx] != '"') {
+                raise_errmsg("Expecting property name", pystr, idx);
+                goto bail;
+            }
+            key = scanstring_unicode(pystr, idx + 1, strict, &next_idx);
+            if (key == NULL)
+                goto bail;
+            idx = next_idx;
+
+            /* skip whitespace between key and : delimiter, read :, skip whitespace */
+            while (idx <= end_idx && IS_WHITESPACE(str[idx])) idx++;
+            if (idx > end_idx || str[idx] != ':') {
+                raise_errmsg("Expecting : delimiter", pystr, idx);
+                goto bail;
+            }
+            idx++;
+            while (idx <= end_idx && IS_WHITESPACE(str[idx])) idx++;
+
+            /* read any JSON term */
+            val = scan_once_unicode(s, pystr, idx, &next_idx);
+            if (val == NULL)
+                goto bail;
+
+            if (PyDict_SetItem(rval, key, val) == -1)
+                goto bail;
+
+            Py_CLEAR(key);  /* drop our references to the pair just stored */
+            Py_CLEAR(val);
+            idx = next_idx;
+
+            /* skip whitespace before } or , */
+            while (idx <= end_idx && IS_WHITESPACE(str[idx])) idx++;
+
+            /* bail if the object is closed or we didn't get the , delimiter */
+            if (idx > end_idx) break;
+            if (str[idx] == '}') {
+                break;
+            }
+            else if (str[idx] != ',') {
+                raise_errmsg("Expecting , delimiter", pystr, idx);
+                goto bail;
+            }
+            idx++;
+
+            /* skip whitespace after , delimiter */
+            while (idx <= end_idx && IS_WHITESPACE(str[idx])) idx++;
+        }
+    }
+
+    /* verify that idx <= end_idx, str[idx] should be '}' */
+    if (idx > end_idx || str[idx] != '}') {
+        raise_errmsg("Expecting object", pystr, end_idx);
+        goto bail;
+    }
+
+    /* if object_hook is not None: rval = object_hook(rval) */
+    if (s->object_hook != Py_None) {
+        val = PyObject_CallFunctionObjArgs(s->object_hook, rval, NULL);
+        if (val == NULL)
+            goto bail;
+        Py_DECREF(rval);  /* the hook's result replaces the dict */
+        rval = val;
+        val = NULL;
+    }
+    *next_idx_ptr = idx + 1;
+    return rval;
+bail:
+    Py_XDECREF(key);  /* key and val may still be NULL here */
+    Py_XDECREF(val);
+    Py_DECREF(rval);
+    return NULL;
+}
+
+static PyObject *
+_parse_array_str(PyScannerObject *s, PyObject *pystr, Py_ssize_t idx, Py_ssize_t *next_idx_ptr) {
+    /* Read a JSON array from PyString pystr.
+    idx is the index of the first character after the opening bracket.
+    *next_idx_ptr is a return-by-reference index to the first character after
+        the closing bracket; it is written only on success.
+
+    Returns a new PyList, or NULL on error
+    */
+    char *str = PyString_AS_STRING(pystr);
+    Py_ssize_t end_idx = PyString_GET_SIZE(pystr) - 1;  /* index of the last character */
+    PyObject *val = NULL;
+    PyObject *rval = PyList_New(0);
+    Py_ssize_t next_idx;
+    if (rval == NULL)
+        return NULL;
+
+    /* skip whitespace after [ */
+    while (idx <= end_idx && IS_WHITESPACE(str[idx])) idx++;
+
+    /* only loop if the array is non-empty */
+    if (idx <= end_idx && str[idx] != ']') {
+        while (idx <= end_idx) {
+
+            /* read any JSON term; next_idx receives the index after it */
+            val = scan_once_str(s, pystr, idx, &next_idx);
+            if (val == NULL)
+                goto bail;
+
+            if (PyList_Append(rval, val) == -1)
+                goto bail;
+
+            Py_CLEAR(val);  /* drop our reference to the element just appended */
+            idx = next_idx;
+
+            /* skip whitespace between term and , */
+            while (idx <= end_idx && IS_WHITESPACE(str[idx])) idx++;
+
+            /* bail if the array is closed or we didn't get the , delimiter */
+            if (idx > end_idx) break;
+            if (str[idx] == ']') {
+                break;
+            }
+            else if (str[idx] != ',') {
+                raise_errmsg("Expecting , delimiter", pystr, idx);
+                goto bail;
+            }
+            idx++;
+
+            /* skip whitespace after , */
+            while (idx <= end_idx && IS_WHITESPACE(str[idx])) idx++;
+        }
+    }
+
+    /* verify that idx <= end_idx, str[idx] should be ']' */
+    if (idx > end_idx || str[idx] != ']') {
+        raise_errmsg("Expecting object", pystr, end_idx);
+        goto bail;
+    }
+    *next_idx_ptr = idx + 1;
+    return rval;
+bail:
+    Py_XDECREF(val);  /* val may still be NULL here */
+    Py_DECREF(rval);
+    return NULL;
+}
+
+static PyObject *
+_parse_array_unicode(PyScannerObject *s, PyObject *pystr, Py_ssize_t idx, Py_ssize_t *next_idx_ptr) {
+    /* Read a JSON array from PyUnicode pystr.
+    idx is the index of the first character after the opening bracket.
+    *next_idx_ptr is a return-by-reference index to the first character after
+        the closing bracket; it is written only on success.
+
+    Returns a new PyList, or NULL on error
+    */
+    Py_UNICODE *str = PyUnicode_AS_UNICODE(pystr);
+    Py_ssize_t end_idx = PyUnicode_GET_SIZE(pystr) - 1;  /* index of the last character */
+    PyObject *val = NULL;
+    PyObject *rval = PyList_New(0);
+    Py_ssize_t next_idx;
+    if (rval == NULL)
+        return NULL;
+
+    /* skip whitespace after [ */
+    while (idx <= end_idx && IS_WHITESPACE(str[idx])) idx++;
+
+    /* only loop if the array is non-empty */
+    if (idx <= end_idx && str[idx] != ']') {
+        while (idx <= end_idx) {
+
+            /* read any JSON term; next_idx receives the index after it */
+            val = scan_once_unicode(s, pystr, idx, &next_idx);
+            if (val == NULL)
+                goto bail;
+
+            if (PyList_Append(rval, val) == -1)
+                goto bail;
+
+            Py_CLEAR(val);  /* drop our reference to the element just appended */
+            idx = next_idx;
+
+            /* skip whitespace between term and , */
+            while (idx <= end_idx && IS_WHITESPACE(str[idx])) idx++;
+
+            /* bail if the array is closed or we didn't get the , delimiter */
+            if (idx > end_idx) break;
+            if (str[idx] == ']') {
+                break;
+            }
+            else if (str[idx] != ',') {
+                raise_errmsg("Expecting , delimiter", pystr, idx);
+                goto bail;
+            }
+            idx++;
+
+            /* skip whitespace after , */
+            while (idx <= end_idx && IS_WHITESPACE(str[idx])) idx++;
+        }
+    }
+
+    /* verify that idx <= end_idx, str[idx] should be ']' */
+    if (idx > end_idx || str[idx] != ']') {
+        raise_errmsg("Expecting object", pystr, end_idx);
+        goto bail;
+    }
+    *next_idx_ptr = idx + 1;
+    return rval;
+bail:
+    Py_XDECREF(val);  /* val may still be NULL here */
+    Py_DECREF(rval);
+    return NULL;
+}
+
+static PyObject *
+_parse_constant(PyScannerObject *s, char *constant, Py_ssize_t idx, Py_ssize_t *next_idx_ptr) {
+    /* Hand a JSON constant to the scanner's parse_constant callable.
+    constant is the text that was matched
+        ("NaN", "Infinity", "-Infinity").
+    idx is the index of the first character of the constant
+    *next_idx_ptr receives idx plus the length of constant; it is written
+        even when the call fails, but not when interning fails.
+
+    Returns the result of parse_constant (NULL when the call fails)
+    */
+    PyObject *name;
+    PyObject *result;
+    name = PyString_InternFromString(constant);
+    if (!name)
+        return NULL;
+
+    /* result = parse_constant(constant) */
+    result = PyObject_CallFunctionObjArgs(s->parse_constant, name, NULL);
+
+    /* advance past the constant before dropping the interned string */
+    *next_idx_ptr = idx + PyString_GET_SIZE(name);
+    Py_DECREF(name);
+    return result;
+}
+
+static PyObject *
+_match_number_str(PyScannerObject *s, PyObject *pystr, Py_ssize_t start, Py_ssize_t *next_idx_ptr) {
+    /* Read a JSON number from PyString pystr.
+    start is the index of the first character of the number
+    *next_idx_ptr is a return-by-reference index to the first character after
+        the number. It is only written once a number has been matched.
+
+    Returns a new PyObject representation of that number:
+        PyInt, PyLong, or PyFloat.
+        May return other types if parse_int or parse_float are set
+
+    Sets StopIteration and returns NULL if no number starts at start
+    (a lone '-' at the end of the string, or no integer digit).
+    */
+    char *str = PyString_AS_STRING(pystr);
+    /* end_idx is the index of the LAST character, not one past it */
+    Py_ssize_t end_idx = PyString_GET_SIZE(pystr) - 1;
+    Py_ssize_t idx = start;
+    int is_float = 0;
+    PyObject *rval;
+    PyObject *numstr;
+
+    /* read a sign if it's there, make sure it's not the end of the string */
+    if (str[idx] == '-') {
+        idx++;
+        if (idx > end_idx) {
+            PyErr_SetNone(PyExc_StopIteration);
+            return NULL;
+        }
+    }
+
+    /* read as many integer digits as we find as long as it doesn't start with 0 */
+    if (str[idx] >= '1' && str[idx] <= '9') {
+        idx++;
+        while (idx <= end_idx && str[idx] >= '0' && str[idx] <= '9') idx++;
+    }
+    /* if it starts with 0 we only expect one integer digit */
+    else if (str[idx] == '0') {
+        idx++;
+    }
+    /* no integer digits, error */
+    else {
+        PyErr_SetNone(PyExc_StopIteration);
+        return NULL;
+    }
+
+    /* if the next char is '.' followed by a digit then read all float digits */
+    /* (idx < end_idx guarantees str[idx + 1] is still inside the string) */
+    if (idx < end_idx && str[idx] == '.' && str[idx + 1] >= '0' && str[idx + 1] <= '9') {
+        is_float = 1;
+        idx += 2;
+        while (idx <= end_idx && str[idx] >= '0' && str[idx] <= '9') idx++;
+    }
+
+    /* if the next char is 'e' or 'E' then maybe read the exponent (or backtrack) */
+    if (idx < end_idx && (str[idx] == 'e' || str[idx] == 'E')) {
+
+        /* save the index of the 'e' or 'E' just in case we need to backtrack */
+        Py_ssize_t e_start = idx;
+        idx++;
+
+        /* read an exponent sign if present */
+        if (idx < end_idx && (str[idx] == '-' || str[idx] == '+')) idx++;
+
+        /* read all digits */
+        while (idx <= end_idx && str[idx] >= '0' && str[idx] <= '9') idx++;
+
+        /* if we got a digit, then parse as float. if not, backtrack */
+        /* (str[idx - 1] is the last character consumed: 'e'/'E', a sign, or a digit) */
+        if (str[idx - 1] >= '0' && str[idx - 1] <= '9') {
+            is_float = 1;
+        }
+        else {
+            idx = e_start;
+        }
+    }
+
+    /* copy the section we determined to be a number */
+    numstr = PyString_FromStringAndSize(&str[start], idx - start);
+    if (numstr == NULL)
+        return NULL;
+    if (is_float) {
+        /* parse as a float using a fast path if available, otherwise call user defined method */
+        if (s->parse_float != (PyObject *)&PyFloat_Type) {
+            rval = PyObject_CallFunctionObjArgs(s->parse_float, numstr, NULL);
+        }
+        else {
+            rval = PyFloat_FromDouble(PyOS_ascii_atof(PyString_AS_STRING(numstr)));
+        }
+    }
+    else {
+        /* parse as an int using a fast path if available, otherwise call user defined method */
+        if (s->parse_int != (PyObject *)&PyInt_Type) {
+            rval = PyObject_CallFunctionObjArgs(s->parse_int, numstr, NULL);
+        }
+        else {
+            rval = PyInt_FromString(PyString_AS_STRING(numstr), NULL, 10);
+        }
+    }
+    Py_DECREF(numstr);
+    /* the end index is reported even if the conversion above failed (rval == NULL) */
+    *next_idx_ptr = idx;
+    return rval;
+}
+
+static PyObject *
+_match_number_unicode(PyScannerObject *s, PyObject *pystr, Py_ssize_t start, Py_ssize_t *next_idx_ptr) {
+    /* Read a JSON number from PyUnicode pystr.
+    start is the index of the first character of the number
+    *next_idx_ptr is a return-by-reference index to the first character after
+        the number. It is only written once a number has been matched.
+
+    Returns a new PyObject representation of that number:
+        PyInt, PyLong, or PyFloat.
+        May return other types if parse_int or parse_float are set
+
+    Sets StopIteration and returns NULL if no number starts at start
+    (a lone '-' at the end of the string, or no integer digit).
+    */
+    Py_UNICODE *str = PyUnicode_AS_UNICODE(pystr);
+    /* end_idx is the index of the LAST character, not one past it */
+    Py_ssize_t end_idx = PyUnicode_GET_SIZE(pystr) - 1;
+    Py_ssize_t idx = start;
+    int is_float = 0;
+    PyObject *rval;
+    PyObject *numstr;
+
+    /* read a sign if it's there, make sure it's not the end of the string */
+    if (str[idx] == '-') {
+        idx++;
+        if (idx > end_idx) {
+            PyErr_SetNone(PyExc_StopIteration);
+            return NULL;
+        }
+    }
+
+    /* read as many integer digits as we find as long as it doesn't start with 0 */
+    if (str[idx] >= '1' && str[idx] <= '9') {
+        idx++;
+        while (idx <= end_idx && str[idx] >= '0' && str[idx] <= '9') idx++;
+    }
+    /* if it starts with 0 we only expect one integer digit */
+    else if (str[idx] == '0') {
+        idx++;
+    }
+    /* no integer digits, error */
+    else {
+        PyErr_SetNone(PyExc_StopIteration);
+        return NULL;
+    }
+
+    /* if the next char is '.' followed by a digit then read all float digits */
+    /* (idx < end_idx guarantees str[idx + 1] is still inside the string) */
+    if (idx < end_idx && str[idx] == '.' && str[idx + 1] >= '0' && str[idx + 1] <= '9') {
+        is_float = 1;
+        idx += 2;
+        /* must be <= end_idx, as in _match_number_str: with < the final
+           fractional digit of a number that ends the input was left
+           unconsumed (u"1.25" was read as 1.2 followed by a stray "5") */
+        while (idx <= end_idx && str[idx] >= '0' && str[idx] <= '9') idx++;
+    }
+
+    /* if the next char is 'e' or 'E' then maybe read the exponent (or backtrack) */
+    if (idx < end_idx && (str[idx] == 'e' || str[idx] == 'E')) {
+
+        /* save the index of the 'e' or 'E' just in case we need to backtrack */
+        Py_ssize_t e_start = idx;
+        idx++;
+
+        /* read an exponent sign if present */
+        if (idx < end_idx && (str[idx] == '-' || str[idx] == '+')) idx++;
+
+        /* read all digits */
+        while (idx <= end_idx && str[idx] >= '0' && str[idx] <= '9') idx++;
+
+        /* if we got a digit, then parse as float. if not, backtrack */
+        /* (str[idx - 1] is the last character consumed: 'e'/'E', a sign, or a digit) */
+        if (str[idx - 1] >= '0' && str[idx - 1] <= '9') {
+            is_float = 1;
+        }
+        else {
+            idx = e_start;
+        }
+    }
+
+    /* copy the section we determined to be a number */
+    numstr = PyUnicode_FromUnicode(&str[start], idx - start);
+    if (numstr == NULL)
+        return NULL;
+    if (is_float) {
+        /* parse as a float using a fast path if available, otherwise call user defined method */
+        if (s->parse_float != (PyObject *)&PyFloat_Type) {
+            rval = PyObject_CallFunctionObjArgs(s->parse_float, numstr, NULL);
+        }
+        else {
+            rval = PyFloat_FromString(numstr, NULL);
+        }
+    }
+    else {
+        /* no fast path for unicode -> int, just call */
+        rval = PyObject_CallFunctionObjArgs(s->parse_int, numstr, NULL);
+    }
+    Py_DECREF(numstr);
+    /* the end index is reported even if the conversion above failed (rval == NULL) */
+    *next_idx_ptr = idx;
+    return rval;
+}
+
+static PyObject *
+scan_once_str(PyScannerObject *s, PyObject *pystr, Py_ssize_t idx, Py_ssize_t *next_idx_ptr)
+{
+    /* Read one JSON term (of any kind) from PyString pystr.
+    idx is the index of the first character of the term
+    *next_idx_ptr is a return-by-reference index to the first character after
+        the term.
+
+    Returns a new PyObject representation of the term.
+    Sets StopIteration and returns NULL if idx is at or past the end of
+    the string; other failures come from the helper that was dispatched to.
+    */
+    char *str = PyString_AS_STRING(pystr);
+    Py_ssize_t length = PyString_GET_SIZE(pystr);
+    if (idx >= length) {
+        PyErr_SetNone(PyExc_StopIteration);
+        return NULL;
+    }
+    /* dispatch on the first character; each literal check first verifies
+       that the whole literal fits inside the string (idx + k < length) */
+    switch (str[idx]) {
+        case '"':
+            /* string */
+            return scanstring_str(pystr, idx + 1,
+                PyString_AS_STRING(s->encoding),
+                PyObject_IsTrue(s->strict),
+                next_idx_ptr);
+        case '{':
+            /* object */
+            return _parse_object_str(s, pystr, idx + 1, next_idx_ptr);
+        case '[':
+            /* array */
+            return _parse_array_str(s, pystr, idx + 1, next_idx_ptr);
+        case 'n':
+            /* null */
+            if ((idx + 3 < length) && str[idx + 1] == 'u' && str[idx + 2] == 'l' && str[idx + 3] == 'l') {
+                Py_INCREF(Py_None);
+                *next_idx_ptr = idx + 4;
+                return Py_None;
+            }
+            break;
+        case 't':
+            /* true */
+            if ((idx + 3 < length) && str[idx + 1] == 'r' && str[idx + 2] == 'u' && str[idx + 3] == 'e') {
+                Py_INCREF(Py_True);
+                *next_idx_ptr = idx + 4;
+                return Py_True;
+            }
+            break;
+        case 'f':
+            /* false */
+            if ((idx + 4 < length) && str[idx + 1] == 'a' && str[idx + 2] == 'l' && str[idx + 3] == 's' && str[idx + 4] == 'e') {
+                Py_INCREF(Py_False);
+                *next_idx_ptr = idx + 5;
+                return Py_False;
+            }
+            break;
+        case 'N':
+            /* NaN */
+            if ((idx + 2 < length) && str[idx + 1] == 'a' && str[idx + 2] == 'N') {
+                return _parse_constant(s, "NaN", idx, next_idx_ptr);
+            }
+            break;
+        case 'I':
+            /* Infinity */
+            if ((idx + 7 < length) && str[idx + 1] == 'n' && str[idx + 2] == 'f' && str[idx + 3] == 'i' && str[idx + 4] == 'n' && str[idx + 5] == 'i' && str[idx + 6] == 't' && str[idx + 7] == 'y') {
+                return _parse_constant(s, "Infinity", idx, next_idx_ptr);
+            }
+            break;
+        case '-':
+            /* -Infinity; any other '-' falls through to the number matcher below */
+            if ((idx + 8 < length) && str[idx + 1] == 'I' && str[idx + 2] == 'n' && str[idx + 3] == 'f' && str[idx + 4] == 'i' && str[idx + 5] == 'n' && str[idx + 6] == 'i' && str[idx + 7] == 't' && str[idx + 8] == 'y') {
+                return _parse_constant(s, "-Infinity", idx, next_idx_ptr);
+            }
+            break;
+    }
+    /* Didn't find a string, object, array, or named constant. Look for a number. */
+    return _match_number_str(s, pystr, idx, next_idx_ptr);
+}
+
+static PyObject *
+scan_once_unicode(PyScannerObject *s, PyObject *pystr, Py_ssize_t idx, Py_ssize_t *next_idx_ptr)
+{
+    /* Read one JSON term (of any kind) from PyUnicode pystr.
+    idx is the index of the first character of the term
+    *next_idx_ptr is a return-by-reference index to the first character after
+        the term.
+
+    Returns a new PyObject representation of the term.
+    Sets StopIteration and returns NULL if idx is at or past the end of
+    the string; other failures come from the helper that was dispatched to.
+    */
+    Py_UNICODE *str = PyUnicode_AS_UNICODE(pystr);
+    Py_ssize_t length = PyUnicode_GET_SIZE(pystr);
+    if (idx >= length) {
+        PyErr_SetNone(PyExc_StopIteration);
+        return NULL;
+    }
+    /* dispatch on the first character; each literal check first verifies
+       that the whole literal fits inside the string (idx + k < length) */
+    switch (str[idx]) {
+        case '"':
+            /* string (no encoding argument is needed for unicode input) */
+            return scanstring_unicode(pystr, idx + 1,
+                PyObject_IsTrue(s->strict),
+                next_idx_ptr);
+        case '{':
+            /* object */
+            return _parse_object_unicode(s, pystr, idx + 1, next_idx_ptr);
+        case '[':
+            /* array */
+            return _parse_array_unicode(s, pystr, idx + 1, next_idx_ptr);
+        case 'n':
+            /* null */
+            if ((idx + 3 < length) && str[idx + 1] == 'u' && str[idx + 2] == 'l' && str[idx + 3] == 'l') {
+                Py_INCREF(Py_None);
+                *next_idx_ptr = idx + 4;
+                return Py_None;
+            }
+            break;
+        case 't':
+            /* true */
+            if ((idx + 3 < length) && str[idx + 1] == 'r' && str[idx + 2] == 'u' && str[idx + 3] == 'e') {
+                Py_INCREF(Py_True);
+                *next_idx_ptr = idx + 4;
+                return Py_True;
+            }
+            break;
+        case 'f':
+            /* false */
+            if ((idx + 4 < length) && str[idx + 1] == 'a' && str[idx + 2] == 'l' && str[idx + 3] == 's' && str[idx + 4] == 'e') {
+                Py_INCREF(Py_False);
+                *next_idx_ptr = idx + 5;
+                return Py_False;
+            }
+            break;
+        case 'N':
+            /* NaN */
+            if ((idx + 2 < length) && str[idx + 1] == 'a' && str[idx + 2] == 'N') {
+                return _parse_constant(s, "NaN", idx, next_idx_ptr);
+            }
+            break;
+        case 'I':
+            /* Infinity */
+            if ((idx + 7 < length) && str[idx + 1] == 'n' && str[idx + 2] == 'f' && str[idx + 3] == 'i' && str[idx + 4] == 'n' && str[idx + 5] == 'i' && str[idx + 6] == 't' && str[idx + 7] == 'y') {
+                return _parse_constant(s, "Infinity", idx, next_idx_ptr);
+            }
+            break;
+        case '-':
+            /* -Infinity; any other '-' falls through to the number matcher below */
+            if ((idx + 8 < length) && str[idx + 1] == 'I' && str[idx + 2] == 'n' && str[idx + 3] == 'f' && str[idx + 4] == 'i' && str[idx + 5] == 'n' && str[idx + 6] == 'i' && str[idx + 7] == 't' && str[idx + 8] == 'y') {
+                return _parse_constant(s, "-Infinity", idx, next_idx_ptr);
+            }
+            break;
+    }
+    /* Didn't find a string, object, array, or named constant. Look for a number. */
+    return _match_number_unicode(s, pystr, idx, next_idx_ptr);
+}
+
+static PyObject *
+scanner_call(PyObject *self, PyObject *args, PyObject *kwds)
+{
+    /* tp_call for Scanner: scanner(string, idx).
+    Dispatches to scan_once_str or scan_once_unicode depending on the type
+    of the first argument and hands the scanned term plus the index that
+    follows it to _build_rval_index_tuple. Raises TypeError for any other
+    argument type.
+    */
+    static char *kwlist[] = {"string", "idx", NULL};
+    PyScannerObject *scanner;
+    PyObject *text;
+    PyObject *term;
+    Py_ssize_t start;
+    Py_ssize_t after = -1;
+
+    assert(PyScanner_Check(self));
+    scanner = (PyScannerObject *)self;
+    if (!PyArg_ParseTupleAndKeywords(args, kwds, "OO&:scan_once", kwlist, &text, _convertPyInt_AsSsize_t, &start))
+        return NULL;
+
+    /* reject anything that is neither a byte string nor a unicode string */
+    if (!PyString_Check(text) && !PyUnicode_Check(text)) {
+        PyErr_Format(PyExc_TypeError,
+                 "first argument must be a string, not %.80s",
+                 Py_TYPE(text)->tp_name);
+        return NULL;
+    }
+
+    if (PyString_Check(text))
+        term = scan_once_str(scanner, text, start, &after);
+    else
+        term = scan_once_unicode(scanner, text, start, &after);
+    return _build_rval_index_tuple(term, after);
+}
+
+static PyObject *
+scanner_new(PyTypeObject *type, PyObject *args, PyObject *kwds)
+{
+    /* Allocate a Scanner with every object slot empty; scanner_init fills them in */
+    PyScannerObject *scanner = (PyScannerObject *)type->tp_alloc(type, 0);
+    if (scanner == NULL)
+        return NULL;
+
+    scanner->encoding = NULL;
+    scanner->strict = NULL;
+    scanner->object_hook = NULL;
+    scanner->parse_float = NULL;
+    scanner->parse_int = NULL;
+    scanner->parse_constant = NULL;
+    return (PyObject *)scanner;
+}
+
+static int
+scanner_init(PyObject *self, PyObject *args, PyObject *kwds)
+{
+    /* Initialize Scanner object from a context object.
+    The single argument ("context") must provide the attributes encoding,
+    strict, object_hook, parse_float, parse_int and parse_constant; a new
+    reference to each is stored on the scanner.
+
+    encoding may be None (DEFAULT_ENCODING is used), a unicode object
+    (encoded to a byte string) or a byte string.
+
+    Returns 0 on success. On failure returns -1 with an exception set and
+    every slot of the scanner cleared.
+    */
+    PyObject *ctx;
+    static char *kwlist[] = {"context", NULL};
+    PyScannerObject *s;
+
+    assert(PyScanner_Check(self));
+    s = (PyScannerObject *)self;
+
+    if (!PyArg_ParseTupleAndKeywords(args, kwds, "O:make_scanner", kwlist, &ctx))
+        return -1;
+
+    /* PyString_AS_STRING is used on encoding */
+    s->encoding = PyObject_GetAttrString(ctx, "encoding");
+    /* a missing attribute must be caught here: the type checks below
+       dereference the pointer */
+    if (s->encoding == NULL)
+        goto bail;
+    if (s->encoding == Py_None) {
+        Py_DECREF(Py_None);
+        s->encoding = PyString_InternFromString(DEFAULT_ENCODING);
+    }
+    else if (PyUnicode_Check(s->encoding)) {
+        PyObject *tmp = PyUnicode_AsEncodedString(s->encoding, NULL, NULL);
+        Py_DECREF(s->encoding);
+        s->encoding = tmp;
+    }
+    /* NULL here means one of the conversions above failed and already set
+       an exception */
+    if (s->encoding == NULL)
+        goto bail;
+    if (!PyString_Check(s->encoding)) {
+        /* never return -1 without an exception set */
+        PyErr_Format(PyExc_TypeError,
+                 "encoding must be a string, not %.80s",
+                 Py_TYPE(s->encoding)->tp_name);
+        goto bail;
+    }
+
+    /* The remaining attributes are stored as-is; only their presence is checked */
+    s->strict = PyObject_GetAttrString(ctx, "strict");
+    if (s->strict == NULL)
+        goto bail;
+    s->object_hook = PyObject_GetAttrString(ctx, "object_hook");
+    if (s->object_hook == NULL)
+        goto bail;
+    s->parse_float = PyObject_GetAttrString(ctx, "parse_float");
+    if (s->parse_float == NULL)
+        goto bail;
+    s->parse_int = PyObject_GetAttrString(ctx, "parse_int");
+    if (s->parse_int == NULL)
+        goto bail;
+    s->parse_constant = PyObject_GetAttrString(ctx, "parse_constant");
+    if (s->parse_constant == NULL)
+        goto bail;
+
+    return 0;
+
+bail:
+    /* Py_CLEAR tolerates slots that were never filled */
+    Py_CLEAR(s->encoding);
+    Py_CLEAR(s->strict);
+    Py_CLEAR(s->object_hook);
+    Py_CLEAR(s->parse_float);
+    Py_CLEAR(s->parse_int);
+    Py_CLEAR(s->parse_constant);
+    return -1;
+}
+
+PyDoc_STRVAR(scanner_doc, "JSON scanner object");
+
+/* Type object for the JSON scanner. init_speedups registers it in the module
+ * under the name "make_scanner" and overwrites tp_new with PyType_GenericNew
+ * before calling PyType_Ready. Instances are callable (scanner_call) and take
+ * part in cyclic garbage collection (scanner_traverse / scanner_clear). */
+static
+PyTypeObject PyScannerType = {
+    PyObject_HEAD_INIT(NULL)
+    0,                    /* tp_internal */
+    "simplejson._speedups.Scanner",       /* tp_name */
+    sizeof(PyScannerObject), /* tp_basicsize */
+    0,                    /* tp_itemsize */
+    scanner_dealloc, /* tp_dealloc */
+    0,                    /* tp_print */
+    0,                    /* tp_getattr */
+    0,                    /* tp_setattr */
+    0,                    /* tp_compare */
+    0,                    /* tp_repr */
+    0,                    /* tp_as_number */
+    0,                    /* tp_as_sequence */
+    0,                    /* tp_as_mapping */
+    0,                    /* tp_hash */
+    scanner_call,         /* tp_call */
+    0,                    /* tp_str */
+    0,/* PyObject_GenericGetAttr, */                    /* tp_getattro */
+    0,/* PyObject_GenericSetAttr, */                    /* tp_setattro */
+    0,                    /* tp_as_buffer */
+    Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,   /* tp_flags */
+    scanner_doc,          /* tp_doc */
+    scanner_traverse,                    /* tp_traverse */
+    scanner_clear,                    /* tp_clear */
+    0,                    /* tp_richcompare */
+    0,                    /* tp_weaklistoffset */
+    0,                    /* tp_iter */
+    0,                    /* tp_iternext */
+    0,                    /* tp_methods */
+    scanner_members,                    /* tp_members */
+    0,                    /* tp_getset */
+    0,                    /* tp_base */
+    0,                    /* tp_dict */
+    0,                    /* tp_descr_get */
+    0,                    /* tp_descr_set */
+    0,                    /* tp_dictoffset */
+    scanner_init,                    /* tp_init */
+    0,/* PyType_GenericAlloc, */        /* tp_alloc */
+    scanner_new,          /* tp_new */
+    0,/* PyObject_GC_Del, */              /* tp_free */
+};
+
+static PyObject *
+encoder_new(PyTypeObject *type, PyObject *args, PyObject *kwds)
+{
+    /* Allocate an Encoder with every object slot empty; encoder_init fills them in */
+    PyEncoderObject *enc = (PyEncoderObject *)type->tp_alloc(type, 0);
+    if (enc == NULL)
+        return NULL;
+
+    enc->markers = NULL;
+    enc->defaultfn = NULL;
+    enc->encoder = NULL;
+    enc->indent = NULL;
+    enc->key_separator = NULL;
+    enc->item_separator = NULL;
+    enc->sort_keys = NULL;
+    enc->skipkeys = NULL;
+    return (PyObject *)enc;
+}
+
+static int
+encoder_init(PyObject *self, PyObject *args, PyObject *kwds)
+{
+    /* Initialize Encoder object.
+    Takes nine arguments (positional or keyword): markers, default, encoder,
+    indent, key_separator, item_separator, sort_keys, skipkeys, allow_nan.
+    The first eight are stored on the encoder as new references; allow_nan
+    is reduced to its truth value.
+
+    Returns 0 on success, -1 with an exception set on failure. On failure
+    the encoder's slots are left untouched.
+    */
+    static char *kwlist[] = {"markers", "default", "encoder", "indent", "key_separator", "item_separator", "sort_keys", "skipkeys", "allow_nan", NULL};
+
+    PyEncoderObject *s;
+    PyObject *markers, *defaultfn, *encoder, *indent, *key_separator;
+    PyObject *item_separator, *sort_keys, *skipkeys, *allow_nan;
+    int allow_nan_flag;
+
+    assert(PyEncoder_Check(self));
+    s = (PyEncoderObject *)self;
+
+    /* Parse into locals, not into the object's slots: the parsed pointers
+       are borrowed, and a failed parse must not leave borrowed pointers
+       where encoder_clear would later DECREF them. */
+    if (!PyArg_ParseTupleAndKeywords(args, kwds, "OOOOOOOOO:make_encoder", kwlist,
+        &markers, &defaultfn, &encoder, &indent, &key_separator, &item_separator, &sort_keys, &skipkeys, &allow_nan))
+        return -1;
+
+    /* truth testing can run arbitrary code and fail; do it before storing anything */
+    allow_nan_flag = PyObject_IsTrue(allow_nan);
+    if (allow_nan_flag < 0)
+        return -1;
+
+    Py_INCREF(markers);
+    s->markers = markers;
+    Py_INCREF(defaultfn);
+    s->defaultfn = defaultfn;
+    Py_INCREF(encoder);
+    s->encoder = encoder;
+    Py_INCREF(indent);
+    s->indent = indent;
+    Py_INCREF(key_separator);
+    s->key_separator = key_separator;
+    Py_INCREF(item_separator);
+    s->item_separator = item_separator;
+    Py_INCREF(sort_keys);
+    s->sort_keys = sort_keys;
+    Py_INCREF(skipkeys);
+    s->skipkeys = skipkeys;
+    /* remember whether the string encoder is the C implementation from this
+       module so encoder_encode_string can call it directly */
+    s->fast_encode = (PyCFunction_Check(s->encoder) && PyCFunction_GetFunction(s->encoder) == (PyCFunction)py_encode_basestring_ascii);
+    s->allow_nan = allow_nan_flag;
+    return 0;
+}
+
+static PyObject *
+encoder_call(PyObject *self, PyObject *args, PyObject *kwds)
+{
+    /* tp_call for Encoder: encoder(obj, _current_indent_level).
+    Encodes obj through encoder_listencode_obj into a fresh list and
+    returns that list, or NULL if parsing, allocation or encoding fails.
+    */
+    static char *kwlist[] = {"obj", "_current_indent_level", NULL};
+    PyEncoderObject *enc;
+    PyObject *target;
+    PyObject *chunks;
+    Py_ssize_t level;
+
+    assert(PyEncoder_Check(self));
+    enc = (PyEncoderObject *)self;
+    if (!PyArg_ParseTupleAndKeywords(args, kwds, "OO&:_iterencode", kwlist,
+        &target, _convertPyInt_AsSsize_t, &level))
+        return NULL;
+
+    chunks = PyList_New(0);
+    if (chunks == NULL)
+        return NULL;
+
+    if (encoder_listencode_obj(enc, chunks, target, level) == 0)
+        return chunks;
+
+    /* encoding failed: discard the partial output */
+    Py_DECREF(chunks);
+    return NULL;
+}
+
+static PyObject *
+_encoded_const(PyObject *obj)
+{
+    /* Return the JSON string representation of None, True, False.
+    The three strings are interned once and cached in function-local
+    statics; each call returns a new reference to the cached string.
+    Returns NULL with ValueError set for any other object, or with the
+    interning error set if a string could not be created.
+    */
+    if (obj == Py_None) {
+        static PyObject *s_null = NULL;
+        if (s_null == NULL) {
+            s_null = PyString_InternFromString("null");
+            /* must not Py_INCREF a NULL pointer if interning failed */
+            if (s_null == NULL)
+                return NULL;
+        }
+        Py_INCREF(s_null);
+        return s_null;
+    }
+    else if (obj == Py_True) {
+        static PyObject *s_true = NULL;
+        if (s_true == NULL) {
+            s_true = PyString_InternFromString("true");
+            if (s_true == NULL)
+                return NULL;
+        }
+        Py_INCREF(s_true);
+        return s_true;
+    }
+    else if (obj == Py_False) {
+        static PyObject *s_false = NULL;
+        if (s_false == NULL) {
+            s_false = PyString_InternFromString("false");
+            if (s_false == NULL)
+                return NULL;
+        }
+        Py_INCREF(s_false);
+        return s_false;
+    }
+    else {
+        PyErr_SetString(PyExc_ValueError, "not a const");
+        return NULL;
+    }
+}
+
+static PyObject *
+encoder_encode_float(PyEncoderObject *s, PyObject *obj)
+{
+    /* Return the JSON representation of a PyFloat.
+    Finite values use repr(obj). Non-finite values become "Infinity",
+    "-Infinity" or "NaN", unless allow_nan is off, in which case
+    ValueError is raised.
+    */
+    const char *special;
+    double value = PyFloat_AS_DOUBLE(obj);
+
+    if (Py_IS_FINITE(value)) {
+        /* Use a better float format here? */
+        return PyObject_Repr(obj);
+    }
+    if (!s->allow_nan) {
+        PyErr_SetString(PyExc_ValueError, "Out of range float values are not JSON compliant");
+        return NULL;
+    }
+
+    /* NaN compares false against everything, so it ends up in the last branch */
+    if (value > 0)
+        special = "Infinity";
+    else if (value < 0)
+        special = "-Infinity";
+    else
+        special = "NaN";
+    return PyString_FromString(special);
+}
+
+static PyObject *
+encoder_encode_string(PyEncoderObject *s, PyObject *obj)
+{
+    /* Return the JSON representation of a string: call the configured
+       encoder object, or the C py_encode_basestring_ascii directly when
+       fast_encode is set */
+    if (!s->fast_encode)
+        return PyObject_CallFunctionObjArgs(s->encoder, obj, NULL);
+    return py_encode_basestring_ascii(NULL, obj);
+}
+
+static int
+_steal_list_append(PyObject *lst, PyObject *stolen)
+{
+    /* Append stolen to lst and release the caller's reference to it,
+       whether or not the append succeeded; returns PyList_Append's result */
+    int status;
+
+    status = PyList_Append(lst, stolen);
+    Py_DECREF(stolen);
+    return status;
+}
+
+static int
+encoder_listencode_obj(PyEncoderObject *s, PyObject *rval, PyObject *obj, Py_ssize_t indent_level)
+{
+    /* Encode Python object obj to a JSON term, rval is a PyList.
+    The encoded pieces are appended to rval. Dispatch is by type:
+    None/True/False, str/unicode, int/long, float, list/tuple and dict are
+    handled directly; anything else is passed to s->defaultfn and the
+    object it returns is encoded recursively.
+
+    Returns 0 on success, -1 on failure.
+    */
+    PyObject *newobj;
+    int rv;
+
+    if (obj == Py_None || obj == Py_True || obj == Py_False) {
+        PyObject *cstr = _encoded_const(obj);
+        if (cstr == NULL)
+            return -1;
+        return _steal_list_append(rval, cstr);
+    }
+    else if (PyString_Check(obj) || PyUnicode_Check(obj))
+    {
+        PyObject *encoded = encoder_encode_string(s, obj);
+        if (encoded == NULL)
+            return -1;
+        return _steal_list_append(rval, encoded);
+    }
+    else if (PyInt_Check(obj) || PyLong_Check(obj)) {
+        PyObject *encoded = PyObject_Str(obj);
+        if (encoded == NULL)
+            return -1;
+        return _steal_list_append(rval, encoded);
+    }
+    else if (PyFloat_Check(obj)) {
+        PyObject *encoded = encoder_encode_float(s, obj);
+        if (encoded == NULL)
+            return -1;
+        return _steal_list_append(rval, encoded);
+    }
+    else if (PyList_Check(obj) || PyTuple_Check(obj)) {
+        return encoder_listencode_list(s, rval, obj, indent_level);
+    }
+    else if (PyDict_Check(obj)) {
+        return encoder_listencode_dict(s, rval, obj, indent_level);
+    }
+    else {
+        /* Unknown type: convert it with the user-supplied default function.
+           When markers is not None it is used as a dict keyed by the
+           object's address to detect circular references: the entry is
+           added before the conversion and removed after the converted
+           object has been encoded. */
+        PyObject *ident = NULL;
+        if (s->markers != Py_None) {
+            int has_key;
+            ident = PyLong_FromVoidPtr(obj);
+            if (ident == NULL)
+                return -1;
+            has_key = PyDict_Contains(s->markers, ident);
+            if (has_key) {
+                /* has_key == -1 means the lookup itself failed; only a
+                   real hit is reported as a circular reference */
+                if (has_key != -1)
+                    PyErr_SetString(PyExc_ValueError, "Circular reference detected");
+                Py_DECREF(ident);
+                return -1;
+            }
+            if (PyDict_SetItem(s->markers, ident, obj)) {
+                Py_DECREF(ident);
+                return -1;
+            }
+        }
+        newobj = PyObject_CallFunctionObjArgs(s->defaultfn, obj, NULL);
+        if (newobj == NULL) {
+            Py_XDECREF(ident);
+            return -1;
+        }
+        rv = encoder_listencode_obj(s, rval, newobj, indent_level);
+        Py_DECREF(newobj);
+        if (rv) {
+            Py_XDECREF(ident);
+            return -1;
+        }
+        if (ident != NULL) {
+            if (PyDict_DelItem(s->markers, ident)) {
+                Py_XDECREF(ident);
+                return -1;
+            }
+            Py_XDECREF(ident);
+        }
+        /* rv is 0 here: the nonzero case returned above */
+        return rv;
+    }
+}
+
+static int
+encoder_listencode_dict(PyEncoderObject *s, PyObject *rval, PyObject *dct, Py_ssize_t indent_level)
+{
+    /* Encode Python dict dct a JSON term, rval is a PyList.
+    Appends "{", then key / key_separator / value pieces joined by
+    item_separator, then "}" to rval. An empty dict appends "{}" only.
+
+    Keys that are str/unicode are used as-is; float, int/long and
+    True/False/None keys are first converted to their JSON text. Every key
+    is then run through encoder_encode_string. Any other key type is
+    skipped when skipkeys is true and raises ValueError otherwise.
+
+    Indentation and sort_keys are not implemented here (see the TODOs).
+
+    Returns 0 on success, -1 on failure.
+    */
+    /* interned punctuation strings, created on first use and kept for the
+       lifetime of the process */
+    static PyObject *open_dict = NULL;
+    static PyObject *close_dict = NULL;
+    static PyObject *empty_dict = NULL;
+    PyObject *kstr = NULL;
+    PyObject *ident = NULL;
+    PyObject *key, *value;
+    Py_ssize_t pos;
+    int skipkeys;
+    Py_ssize_t idx;
+
+    if (open_dict == NULL || close_dict == NULL || empty_dict == NULL) {
+        open_dict = PyString_InternFromString("{");
+        close_dict = PyString_InternFromString("}");
+        empty_dict = PyString_InternFromString("{}");
+        if (open_dict == NULL || close_dict == NULL || empty_dict == NULL)
+            return -1;
+    }
+    if (PyDict_Size(dct) == 0)
+        return PyList_Append(rval, empty_dict);
+
+    /* circular reference check: markers is a dict keyed by the address of
+       each container currently being encoded */
+    if (s->markers != Py_None) {
+        int has_key;
+        ident = PyLong_FromVoidPtr(dct);
+        if (ident == NULL)
+            goto bail;
+        has_key = PyDict_Contains(s->markers, ident);
+        if (has_key) {
+            /* has_key == -1 means the lookup itself failed */
+            if (has_key != -1)
+                PyErr_SetString(PyExc_ValueError, "Circular reference detected");
+            goto bail;
+        }
+        if (PyDict_SetItem(s->markers, ident, dct)) {
+            goto bail;
+        }
+    }
+
+    if (PyList_Append(rval, open_dict))
+        goto bail;
+
+    if (s->indent != Py_None) {
+        /* TODO: DOES NOT RUN */
+        indent_level += 1;
+        /*
+            newline_indent = '\n' + (' ' * (_indent * _current_indent_level))
+            separator = _item_separator + newline_indent
+            buf += newline_indent
+        */
+    }
+
+    /* TODO: C speedup not implemented for sort_keys */
+
+    pos = 0;
+    skipkeys = PyObject_IsTrue(s->skipkeys);
+    /* idx counts the items actually emitted, so the separator is only
+       written between emitted items (skipped keys do not count) */
+    idx = 0;
+    while (PyDict_Next(dct, &pos, &key, &value)) {
+        PyObject *encoded;
+
+        /* kstr ends up holding a new (owned) reference in every branch */
+        if (PyString_Check(key) || PyUnicode_Check(key)) {
+            Py_INCREF(key);
+            kstr = key;
+        }
+        else if (PyFloat_Check(key)) {
+            kstr = encoder_encode_float(s, key);
+            if (kstr == NULL)
+                goto bail;
+        }
+        else if (PyInt_Check(key) || PyLong_Check(key)) {
+            kstr = PyObject_Str(key);
+            if (kstr == NULL)
+                goto bail;
+        }
+        else if (key == Py_True || key == Py_False || key == Py_None) {
+            kstr = _encoded_const(key);
+            if (kstr == NULL)
+                goto bail;
+        }
+        else if (skipkeys) {
+            continue;
+        }
+        else {
+            /* TODO: include repr of key */
+            PyErr_SetString(PyExc_ValueError, "keys must be a string");
+            goto bail;
+        }
+
+        if (idx) {
+            if (PyList_Append(rval, s->item_separator))
+                goto bail;
+        }
+
+        encoded = encoder_encode_string(s, kstr);
+        /* release kstr and reset it to NULL so bail does not release it again */
+        Py_CLEAR(kstr);
+        if (encoded == NULL)
+            goto bail;
+        if (PyList_Append(rval, encoded)) {
+            Py_DECREF(encoded);
+            goto bail;
+        }
+        Py_DECREF(encoded);
+        if (PyList_Append(rval, s->key_separator))
+            goto bail;
+        if (encoder_listencode_obj(s, rval, value, indent_level))
+            goto bail;
+        idx += 1;
+    }
+    /* done with this dict: remove it from the set of containers in progress */
+    if (ident != NULL) {
+        if (PyDict_DelItem(s->markers, ident))
+            goto bail;
+        Py_CLEAR(ident);
+    }
+    if (s->indent != Py_None) {
+        /* TODO: DOES NOT RUN */
+        indent_level -= 1;
+        /*
+            yield '\n' + (' ' * (_indent * _current_indent_level))
+        */
+    }
+    if (PyList_Append(rval, close_dict))
+        goto bail;
+    return 0;
+
+bail:
+    /* both may be NULL depending on how far encoding got */
+    Py_XDECREF(kstr);
+    Py_XDECREF(ident);
+    return -1;
+}
+
+
+static int
+encoder_listencode_list(PyEncoderObject *s, PyObject *rval, PyObject *seq, Py_ssize_t indent_level)
+{
+    /* Encode Python list seq to a JSON term, rval is a PyList.
+    Appends "[", the encoded items joined by item_separator, then "]" to
+    rval. An empty sequence appends "[]" only.
+
+    Indentation is not implemented here (see the TODOs).
+
+    Returns 0 on success, -1 on failure.
+    */
+    /* interned punctuation strings, created on first use and kept for the
+       lifetime of the process */
+    static PyObject *open_array = NULL;
+    static PyObject *close_array = NULL;
+    static PyObject *empty_array = NULL;
+    PyObject *ident = NULL;
+    PyObject *s_fast = NULL;
+    Py_ssize_t num_items;
+    PyObject **seq_items;
+    Py_ssize_t i;
+
+    if (open_array == NULL || close_array == NULL || empty_array == NULL) {
+        open_array = PyString_InternFromString("[");
+        close_array = PyString_InternFromString("]");
+        empty_array = PyString_InternFromString("[]");
+        if (open_array == NULL || close_array == NULL || empty_array == NULL)
+            return -1;
+    }
+    ident = NULL;
+    /* s_fast is an owned reference and must be released on every path below */
+    s_fast = PySequence_Fast(seq, "_iterencode_list needs a sequence");
+    if (s_fast == NULL)
+        return -1;
+    num_items = PySequence_Fast_GET_SIZE(s_fast);
+    if (num_items == 0) {
+        Py_DECREF(s_fast);
+        return PyList_Append(rval, empty_array);
+    }
+
+    /* circular reference check: markers is a dict keyed by the address of
+       each container currently being encoded (the original seq, not s_fast) */
+    if (s->markers != Py_None) {
+        int has_key;
+        ident = PyLong_FromVoidPtr(seq);
+        if (ident == NULL)
+            goto bail;
+        has_key = PyDict_Contains(s->markers, ident);
+        if (has_key) {
+            /* has_key == -1 means the lookup itself failed */
+            if (has_key != -1)
+                PyErr_SetString(PyExc_ValueError, "Circular reference detected");
+            goto bail;
+        }
+        if (PyDict_SetItem(s->markers, ident, seq)) {
+            goto bail;
+        }
+    }
+
+    seq_items = PySequence_Fast_ITEMS(s_fast);
+    if (PyList_Append(rval, open_array))
+        goto bail;
+    if (s->indent != Py_None) {
+        /* TODO: DOES NOT RUN */
+        indent_level += 1;
+        /*
+            newline_indent = '\n' + (' ' * (_indent * _current_indent_level))
+            separator = _item_separator + newline_indent
+            buf += newline_indent
+        */
+    }
+    for (i = 0; i < num_items; i++) {
+        PyObject *obj = seq_items[i];
+        /* separator goes before every item except the first */
+        if (i) {
+            if (PyList_Append(rval, s->item_separator))
+                goto bail;
+        }
+        if (encoder_listencode_obj(s, rval, obj, indent_level))
+            goto bail;
+    }
+    /* done with this sequence: remove it from the set of containers in progress */
+    if (ident != NULL) {
+        if (PyDict_DelItem(s->markers, ident))
+            goto bail;
+        Py_CLEAR(ident);
+    }
+    if (s->indent != Py_None) {
+        /* TODO: DOES NOT RUN */
+        indent_level -= 1;
+        /*
+            yield '\n' + (' ' * (_indent * _current_indent_level))
+        */
+    }
+    if (PyList_Append(rval, close_array))
+        goto bail;
+    Py_DECREF(s_fast);
+    return 0;
+
+bail:
+    /* ident may be NULL; s_fast is always set when control reaches here */
+    Py_XDECREF(ident);
+    Py_DECREF(s_fast);
+    return -1;
+}
+
+static void
+encoder_dealloc(PyObject *self)
+{
+    /* Deallocate Encoder: release every held reference, then free the
+       object through the type's tp_free slot */
+
+    /* The type is declared with Py_TPFLAGS_HAVE_GC, so the object has to
+       leave the collector's tracking list before its fields are torn
+       down; releasing the references below can run arbitrary code that
+       triggers a collection. */
+    PyObject_GC_UnTrack(self);
+    encoder_clear(self);
+    Py_TYPE(self)->tp_free(self);
+}
+
+static int
+encoder_traverse(PyObject *self, visitproc visit, void *arg)
+{
+    /* tp_traverse for Encoder: visit every object reference the encoder
+       holds. Py_VISIT uses the parameters named visit and arg. */
+    PyEncoderObject *s;
+    assert(PyEncoder_Check(self));
+    s = (PyEncoderObject *)self;
+    Py_VISIT(s->markers);
+    Py_VISIT(s->defaultfn);
+    Py_VISIT(s->encoder);
+    Py_VISIT(s->indent);
+    Py_VISIT(s->key_separator);
+    Py_VISIT(s->item_separator);
+    Py_VISIT(s->sort_keys);
+    Py_VISIT(s->skipkeys);
+    return 0;
+}
+
+static int
+encoder_clear(PyObject *self)
+{
+    /* tp_clear for Encoder: drop every object reference the encoder holds
+       and reset the slots to NULL. Does not free the object itself; that
+       is done by encoder_dealloc, which calls this first. */
+    PyEncoderObject *s;
+    assert(PyEncoder_Check(self));
+    s = (PyEncoderObject *)self;
+    Py_CLEAR(s->markers);
+    Py_CLEAR(s->defaultfn);
+    Py_CLEAR(s->encoder);
+    Py_CLEAR(s->indent);
+    Py_CLEAR(s->key_separator);
+    Py_CLEAR(s->item_separator);
+    Py_CLEAR(s->sort_keys);
+    Py_CLEAR(s->skipkeys);
+    return 0;
+}
+
+PyDoc_STRVAR(encoder_doc, "_iterencode(obj, _current_indent_level) -> iterable");
+
+/* Type object for the JSON encoder. init_speedups registers it in the module
+ * under the name "make_encoder" and overwrites tp_new with PyType_GenericNew
+ * before calling PyType_Ready. Instances are callable (encoder_call) and take
+ * part in cyclic garbage collection (encoder_traverse / encoder_clear). */
+static
+PyTypeObject PyEncoderType = {
+    PyObject_HEAD_INIT(NULL)
+    0,                    /* tp_internal */
+    "simplejson._speedups.Encoder",       /* tp_name */
+    sizeof(PyEncoderObject), /* tp_basicsize */
+    0,                    /* tp_itemsize */
+    encoder_dealloc, /* tp_dealloc */
+    0,                    /* tp_print */
+    0,                    /* tp_getattr */
+    0,                    /* tp_setattr */
+    0,                    /* tp_compare */
+    0,                    /* tp_repr */
+    0,                    /* tp_as_number */
+    0,                    /* tp_as_sequence */
+    0,                    /* tp_as_mapping */
+    0,                    /* tp_hash */
+    encoder_call,         /* tp_call */
+    0,                    /* tp_str */
+    0,                    /* tp_getattro */
+    0,                    /* tp_setattro */
+    0,                    /* tp_as_buffer */
+    Py_TPFLAGS_DEFAULT | Py_TPFLAGS_HAVE_GC,   /* tp_flags */
+    encoder_doc,          /* tp_doc */
+    encoder_traverse,     /* tp_traverse */
+    encoder_clear,        /* tp_clear */
+    0,                    /* tp_richcompare */
+    0,                    /* tp_weaklistoffset */
+    0,                    /* tp_iter */
+    0,                    /* tp_iternext */
+    0,                    /* tp_methods */
+    encoder_members,      /* tp_members */
+    0,                    /* tp_getset */
+    0,                    /* tp_base */
+    0,                    /* tp_dict */
+    0,                    /* tp_descr_get */
+    0,                    /* tp_descr_set */
+    0,                    /* tp_dictoffset */
+    encoder_init,         /* tp_init */
+    0,                    /* tp_alloc */
+    encoder_new,          /* tp_new */
+    0,                    /* tp_free */
+};
+
+/* Module-level functions exported by _speedups; the table is terminated by
+ * the all-NULL sentinel entry. */
+static PyMethodDef speedups_methods[] = {
+    {"encode_basestring_ascii",
+        (PyCFunction)py_encode_basestring_ascii,
+        METH_O,
+        pydoc_encode_basestring_ascii},
+    {"scanstring",
+        (PyCFunction)py_scanstring,
+        METH_VARARGS,
+        pydoc_scanstring},
+    {NULL, NULL, 0, NULL}
+};
+
+PyDoc_STRVAR(module_doc,
+"simplejson speedups\n");
+
+void
+init_speedups(void)
+{
+    /* Module initialisation for _speedups: ready the Scanner and Encoder
+       types, create the module with its function table, and publish the
+       two types as "make_scanner" and "make_encoder". On any failure the
+       function returns early, leaving the exception set for the import
+       machinery. */
+    PyObject *m;
+    /* note: this replaces the tp_new given in the static type definition */
+    PyScannerType.tp_new = PyType_GenericNew;
+    if (PyType_Ready(&PyScannerType) < 0)
+        return;
+    PyEncoderType.tp_new = PyType_GenericNew;
+    if (PyType_Ready(&PyEncoderType) < 0)
+        return;
+    m = Py_InitModule3("_speedups", speedups_methods, module_doc);
+    /* module creation can fail; do not hand a NULL module to PyModule_AddObject */
+    if (m == NULL)
+        return;
+    /* PyModule_AddObject steals the reference only on success, so the
+       extra reference is given back when it fails */
+    Py_INCREF((PyObject*)&PyScannerType);
+    if (PyModule_AddObject(m, "make_scanner", (PyObject*)&PyScannerType) < 0) {
+        Py_DECREF((PyObject*)&PyScannerType);
+        return;
+    }
+    Py_INCREF((PyObject*)&PyEncoderType);
+    if (PyModule_AddObject(m, "make_encoder", (PyObject*)&PyEncoderType) < 0) {
+        Py_DECREF((PyObject*)&PyEncoderType);
+        return;
+    }
+}
diff --git a/simplejson/decoder.py b/simplejson/decoder.py
new file mode 100644
index 00000000..b769ea48
--- /dev/null
+++ b/simplejson/decoder.py
@@ -0,0 +1,354 @@
+"""Implementation of JSONDecoder
+"""
+import re
+import sys
+import struct
+
+from simplejson.scanner import make_scanner
+try:
+    from simplejson._speedups import scanstring as c_scanstring
+except ImportError:
+    c_scanstring = None
+
+__all__ = ['JSONDecoder']
+
+FLAGS = re.VERBOSE | re.MULTILINE | re.DOTALL
+
+def _floatconstants():
+    _BYTES = '7FF80000000000007FF0000000000000'.decode('hex')
+    if sys.byteorder != 'big':
+        _BYTES = _BYTES[:8][::-1] + _BYTES[8:][::-1]
+    nan, inf = struct.unpack('dd', _BYTES)
+    return nan, inf, -inf
+
+NaN, PosInf, NegInf = _floatconstants()
+
+
+def linecol(doc, pos):
+    lineno = doc.count('\n', 0, pos) + 1
+    if lineno == 1:
+        colno = pos
+    else:
+        colno = pos - doc.rindex('\n', 0, pos)
+    return lineno, colno
+
+
+def errmsg(msg, doc, pos, end=None):
+    # Note that this function is called from _speedups
+    lineno, colno = linecol(doc, pos)
+    if end is None:
+        #fmt = '{0}: line {1} column {2} (char {3})'
+        #return fmt.format(msg, lineno, colno, pos)
+        fmt = '%s: line %d column %d (char %d)'
+        return fmt % (msg, lineno, colno, pos)
+    endlineno, endcolno = linecol(doc, end)
+    #fmt = '{0}: line {1} column {2} - line {3} column {4} (char {5} - {6})'
+    #return fmt.format(msg, lineno, colno, endlineno, endcolno, pos, end)
+    fmt = '%s: line %d column %d - line %d column %d (char %d - %d)'
+    return fmt % (msg, lineno, colno, endlineno, endcolno, pos, end)
+
+
+_CONSTANTS = {  # non-standard JSON literals mapped to their float values
+    '-Infinity': NegInf,
+    'Infinity': PosInf,
+    'NaN': NaN,
+}
+
+STRINGCHUNK = re.compile(r'(.*?)(["\\\x00-\x1f])', FLAGS)  # lazy run of text, then a quote, backslash or control char
+BACKSLASH = {  # character following a backslash -> the character it denotes
+    '"': u'"', '\\': u'\\', '/': u'/',
+    'b': u'\b', 'f': u'\f', 'n': u'\n', 'r': u'\r', 't': u'\t',
+}
+
+DEFAULT_ENCODING = "utf-8"  # used by py_scanstring when encoding is None
+
+def py_scanstring(s, end, encoding=None, strict=True, _b=BACKSLASH, _m=STRINGCHUNK.match):
+    """Scan the string s for a JSON string. End is the index of the
+    character in s after the quote that started the JSON string.
+    Unescapes all valid JSON string escape sequences and raises ValueError
+    on attempt to decode an invalid string. If strict is False then literal
+    control characters are allowed in the string.
+    
+    Returns a tuple of the decoded string and the index of the character in s
+    after the end quote."""
+    if encoding is None:
+        encoding = DEFAULT_ENCODING
+    chunks = []
+    _append = chunks.append
+    begin = end - 1  # index of the opening quote, reported in error messages
+    while 1:
+        chunk = _m(s, end)
+        if chunk is None:
+            raise ValueError(
+                errmsg("Unterminated string starting at", s, begin))
+        end = chunk.end()
+        content, terminator = chunk.groups()
+        # Content contains zero or more unescaped string characters
+        if content:
+            if not isinstance(content, unicode):
+                content = unicode(content, encoding)
+            _append(content)
+        # Terminator is the end of string, a literal control character,
+        # or a backslash denoting that an escape sequence follows
+        if terminator == '"':
+            break
+        elif terminator != '\\':
+            if strict:
+                msg = "Invalid control character %r at" % (terminator,)
+                #msg = "Invalid control character {0!r} at".format(terminator)
+                raise ValueError(errmsg(msg, s, end))
+            else:
+                _append(terminator)
+                continue
+        try:
+            esc = s[end]  # the character right after the backslash
+        except IndexError:
+            raise ValueError(
+                errmsg("Unterminated string starting at", s, begin))
+        # If not a unicode escape sequence, must be in the lookup table
+        if esc != 'u':
+            try:
+                char = _b[esc]
+            except KeyError:
+                msg = "Invalid \\escape: " + repr(esc)
+                raise ValueError(errmsg(msg, s, end))
+            end += 1
+        else:
+            # Unicode escape sequence
+            esc = s[end + 1:end + 5]  # the four hex digits after "\u"
+            next_end = end + 5
+            if len(esc) != 4:
+                msg = "Invalid \\uXXXX escape"
+                raise ValueError(errmsg(msg, s, end))
+            uni = int(esc, 16)  # int() itself raises ValueError on non-hex digits
+            # Check for surrogate pair on UCS-4 systems
+            if 0xd800 <= uni <= 0xdbff and sys.maxunicode > 65535:
+                msg = "Invalid \\uXXXX\\uXXXX surrogate pair"
+                if not s[end + 5:end + 7] == '\\u':
+                    raise ValueError(errmsg(msg, s, end))
+                esc2 = s[end + 7:end + 11]
+                if len(esc2) != 4:
+                    raise ValueError(errmsg(msg, s, end))
+                uni2 = int(esc2, 16)  # NOTE(review): not checked to lie in 0xdc00-0xdfff
+                uni = 0x10000 + (((uni - 0xd800) << 10) | (uni2 - 0xdc00))
+                next_end += 6  # also consume the second \uXXXX escape
+            char = unichr(uni)
+            end = next_end
+        # Append the unescaped character
+        _append(char)
+    return u''.join(chunks), end
+
+
+# Use speedup if available
+scanstring = c_scanstring or py_scanstring
+
+WHITESPACE = re.compile(r'[ \t\n\r]*', FLAGS)
+WHITESPACE_STR = ' \t\n\r'
+
+def JSONObject((s, end), encoding, strict, scan_once, object_hook, _w=WHITESPACE.match, _ws=WHITESPACE_STR):  # s[end] is the first character after '{'
+    pairs = {}
+    # Use a slice to prevent IndexError from being raised, the following
+    # check will raise a more specific ValueError if the string is empty
+    nextchar = s[end:end + 1]
+    # Normally we expect nextchar == '"'
+    if nextchar != '"':
+        if nextchar in _ws:
+            end = _w(s, end).end()
+            nextchar = s[end:end + 1]
+        # Trivial empty object
+        if nextchar == '}':
+            return pairs, end + 1  # note: object_hook is not applied on this path
+        elif nextchar != '"':
+            raise ValueError(errmsg("Expecting property name", s, end))
+    end += 1  # step past the opening quote of the first key
+    while True:
+        key, end = scanstring(s, end, encoding, strict)
+
+        # To skip some function call overhead we optimize the fast paths where
+        # the JSON key separator is ": " or just ":".
+        if s[end:end + 1] != ':':
+            end = _w(s, end).end()
+            if s[end:end + 1] != ':':
+                raise ValueError(errmsg("Expecting : delimiter", s, end))
+
+        end += 1  # step past the ':'
+
+        try:
+            if s[end] in _ws:
+                end += 1
+                if s[end] in _ws:
+                    end = _w(s, end + 1).end()
+        except IndexError:
+            pass  # ran off the end of s; scan_once below reports the problem
+
+        try:
+            value, end = scan_once(s, end)
+        except StopIteration:
+            raise ValueError(errmsg("Expecting object", s, end))
+        pairs[key] = value  # a repeated key keeps the last value seen
+
+        try:
+            nextchar = s[end]
+            if nextchar in _ws:
+                end = _w(s, end + 1).end()
+                nextchar = s[end]
+        except IndexError:
+            nextchar = ''
+        end += 1  # step past the ',' or '}' (errors below use end - 1)
+
+        if nextchar == '}':
+            break
+        elif nextchar != ',':
+            raise ValueError(errmsg("Expecting , delimiter", s, end - 1))
+
+        try:
+            nextchar = s[end]
+            if nextchar in _ws:
+                end += 1
+                nextchar = s[end]
+                if nextchar in _ws:
+                    end = _w(s, end + 1).end()
+                    nextchar = s[end]
+        except IndexError:
+            nextchar = ''
+
+        end += 1  # step past the opening quote of the next key
+        if nextchar != '"':
+            raise ValueError(errmsg("Expecting property name", s, end - 1))
+
+    if object_hook is not None:
+        pairs = object_hook(pairs)
+    return pairs, end
+
+def JSONArray((s, end), scan_once, _w=WHITESPACE.match, _ws=WHITESPACE_STR):
+    values = []
+    nextchar = s[end:end + 1]
+    if nextchar in _ws:
+        end = _w(s, end + 1).end()
+        nextchar = s[end:end + 1]
+    # Look-ahead for trivial empty array
+    if nextchar == ']':
+        return values, end + 1
+    _append = values.append
+    while True:
+        try:
+            value, end = scan_once(s, end)
+        except StopIteration:
+            raise ValueError(errmsg("Expecting object", s, end))
+        _append(value)
+        nextchar = s[end:end + 1]
+        if nextchar in _ws:
+            end = _w(s, end + 1).end()
+            nextchar = s[end:end + 1]
+        end += 1
+        if nextchar == ']':
+            break
+        elif nextchar != ',':
+            raise ValueError(errmsg("Expecting , delimiter", s, end))
+
+        try:
+            if s[end] in _ws:
+                end += 1
+                if s[end] in _ws:
+                    end = _w(s, end + 1).end()
+        except IndexError:
+            pass
+
+    return values, end
+
+class JSONDecoder(object):
+    """Simple JSON <http://json.org> decoder
+
+    Performs the following translations in decoding by default:
+
+    +---------------+-------------------+
+    | JSON          | Python            |
+    +===============+===================+
+    | object        | dict              |
+    +---------------+-------------------+
+    | array         | list              |
+    +---------------+-------------------+
+    | string        | unicode           |
+    +---------------+-------------------+
+    | number (int)  | int, long         |
+    +---------------+-------------------+
+    | number (real) | float             |
+    +---------------+-------------------+
+    | true          | True              |
+    +---------------+-------------------+
+    | false         | False             |
+    +---------------+-------------------+
+    | null          | None              |
+    +---------------+-------------------+
+
+    It also understands ``NaN``, ``Infinity``, and ``-Infinity`` as
+    their corresponding ``float`` values, which is outside the JSON spec.
+
+    """
+
+    def __init__(self, encoding=None, object_hook=None, parse_float=None,
+            parse_int=None, parse_constant=None, strict=True):
+        """``encoding`` determines the encoding used to interpret any ``str``
+        objects decoded by this instance (utf-8 by default).  It has no
+        effect when decoding ``unicode`` objects.
+
+        Note that currently only encodings that are a superset of ASCII work,
+        strings of other encodings should be passed in as ``unicode``.
+
+        ``object_hook``, if specified, will be called with the result
+        of every JSON object decoded and its return value will be used in
+        place of the given ``dict``.  This can be used to provide custom
+        deserializations (e.g. to support JSON-RPC class hinting).
+
+        ``parse_float``, if specified, will be called with the string
+        of every JSON float to be decoded. By default this is equivalent to
+        float(num_str). This can be used to use another datatype or parser
+        for JSON floats (e.g. decimal.Decimal).
+
+        ``parse_int``, if specified, will be called with the string
+        of every JSON int to be decoded. By default this is equivalent to
+        int(num_str). This can be used to use another datatype or parser
+        for JSON integers (e.g. float).
+
+        ``parse_constant``, if specified, will be called with one of the
+        following strings: -Infinity, Infinity, NaN.
+        This can be used to raise an exception if invalid JSON numbers
+        are encountered.
+
+        """
+        self.encoding = encoding
+        self.object_hook = object_hook
+        self.parse_float = parse_float or float
+        self.parse_int = parse_int or int
+        self.parse_constant = parse_constant or _CONSTANTS.__getitem__
+        self.strict = strict
+        self.parse_object = JSONObject
+        self.parse_array = JSONArray
+        self.parse_string = scanstring
+        self.scan_once = make_scanner(self)
+
+    def decode(self, s, _w=WHITESPACE.match):
+        """Return the Python representation of ``s`` (a ``str`` or ``unicode``
+        instance containing a JSON document)
+
+        """
+        obj, end = self.raw_decode(s, idx=_w(s, 0).end())
+        end = _w(s, end).end()
+        if end != len(s):
+            raise ValueError(errmsg("Extra data", s, end, len(s)))
+        return obj
+
+    def raw_decode(self, s, idx=0):
+        """Decode a JSON document from ``s`` (a ``str`` or ``unicode`` beginning
+        with a JSON document) and return a 2-tuple of the Python
+        representation and the index in ``s`` where the document ended.
+
+        This can be used to decode a JSON document from a string that may
+        have extraneous data at the end.
+
+        """
+        try:
+            obj, end = self.scan_once(s, idx)
+        except StopIteration:
+            raise ValueError("No JSON object could be decoded")
+        return obj, end
diff --git a/simplejson/decoder.pyc b/simplejson/decoder.pyc
new file mode 100644
index 0000000000000000000000000000000000000000..2ae9b3591ee9c6400d5cd09eb0a05999ef680bdc
GIT binary patch
literal 11292
zcmcIq&2tmkcE2sjACi&37_iM}!weOf0h^grg(*VjJp*RO4@U6XFwFBak=p8(-B{|D
zyIWwr$eTbG*{8C4o2;@-Ro*I9S){Vde~_xAD%-5H%x3cYo!i}#{XArtI09eY&vVZ`
z=iKvk^}GKnmp=LJZ`T?s`IPbfbNogBXei|<wSm%5PEPF_Y6BHr&#8@ETF<MEywvk*
zx1d@hYGXthy^o};pms-9YfNp7E8~T~pbBnLy(+1otPFer6$5@w8Q(c0Y8x9&DA!Ql
zDJje99vhSD-o})2M%6nYGp*cd^;W4(Y&xShX4S@N<&4P?HUvuJ>K(wGQ9BBIomM%g
zsO}crSyW1_%%C!%?rxlw9p;pSt)|pl;4v>toH8a%Vx}{N$}}rnGRq2~eZ<NcRL-(8
zhsr!F3#go9<vc1E0DnO_7uCi&qU4@e?t*gXm3Kiom(;t0+PJ9Pan&g(!^Nbr6qU;<
zDwmXFstq(RagBRfIaky>plA;DT$P?H3UqU?swTMdF{uF3{A%N4Zo6Ljgj~FYVy)e2
zxoy{v?br)^GiaK>SbtJ|;5Gus4NKnl_*5(4wu(=oXxqDPEo#`l?}oa!L_p|>;?VQA
z;|Vl}0Epz|(Km*_`<&WE0Xgwd=G0q59RM<#;7(q>%B$d(GWr-RC=>F<|0C)z@@hf%
zT|U$|hqb<;j5x2n0)+sRz^%=kIsn|9>Km$$GN&e*c^sK2RAUq6?S~J)xHa@ad#H8m
z762-><L=A%mbdMVqb;O}bEr8^WdvXGDC<HfnHcq=xQMQ;UhD=Ts3#LZmu@4LYS-`B
zjok`?OS^XOSI<`0Wvy@f^6mM}3Wk*w(a%s@ejd4Dw7lzuUaJ+nUVab;ovmPh`GNb|
zZ3Ug>rtLSq#v6BQIr7NLS5e?EYplYhPA{GUj9Rl5*l{BOldw-TgRY2tQ^u4rZQL^E
zjRwzEz#k7Ld|F2Z^dz6;R)d&tag+0Ej+E8x%Bi3Pc7fP=<)4!pmtg+Tl6ef04SCh1
z;Bk{`M1d*+w#>$HxqZyN8$s9C)PguU?!L?y(l|jwzB@rA)N6UZ>j%lAmLHrj-6$>G
zq7k&tqnglb!6+N0+=9{IG01F6hR|ytl^7%wnM<UwpbkcOa7gW|aTQ!r1_*NiITcau
z7gQg^In^wvv+E+rdVM~X;xTnF&TDdX$(ZVor!*bIS`n#gbQvgIi|&|2+q~wOK)u`c
zS*tX5>=2d3=!+kmbMrmx%$r;+T(Zvcpu)w#cPpfUu%#VsTeE0br_&zScdU=tb0+O+
zwqv;=7)iKC@}UJxPn?0goo*NcuTM~mCQ+!|8KayZg}k3Z84>rJYq&nX7x!YKk~Mfo
zt9CUa>XoJIKU=K)`s(K9=Kif)H#he`Yrb6UQi88SbD@;_rpWZB)R(1yS?c3b-;(+%
zsW+uwlDaSTveZMV7o{FYybRsAdGm_~4??0+wTh_y9N6&&&Wlvx24V>=B_(KECBg!Q
zdH^wzt2hrS+W+qyg-rwu(s@u+{bCB?f~ZjN6r#o%<Gkrm&3|qPOic7fXgr`*Ss!J6
z6EI5ZU_$j_us;I;Y*tbrB7k>JqYVKq5le1X(r{!7;2OlVKOq_)Dg+L}Q~!zXDTobN
zK?9~>5%&c+Ptby$Jvc=<1Csqy=`m6y_pTU5AHXMww6XVxvRiL5nYM6HRxkWdRRN+$
z@8Ys}7aG<v2d2N#FVmXP8g0N?0U+#JRtpD{0QAQIR1!eT+D#c#FnSoq-gECkQXCo0
zkJ})m{}MP0H=q*c*gvl3t^n1fdN4(UtHHueAud-z4v_qZ=^!cu5P&^M0lH7qh3QYL
zLjIK@su~^)YCt7t1pfjiO)3xG)1-P;P{BU{{1m|_XaOJMG7Yrg=DY%1GdcNv76?c6
zaj<~vW_g?$Im8TUlN{oIfe{1!nH2q51-A<5;}G+3uD<M}<BXcWH;04uf%jQ;8)TAG
zqXVuVt^t^ZLqJd=50j}pz!&posC6*|xQQKFz-@~D9`|>>Vf$vh<C@xoF(b1Xgr+TS
zP|~+#uKJGYMKVpy68$8sDVg|Cx7v-^4NcF-YP-oQ0q%8!*hS5b0mlww*O6|zM=4+d
z@Z5LdL3LcLZMDqTcFS{ycQ^H@8M%91*KcqdunBE1LiJm_)pb|HFbD+{JUBa!-F7E7
z<G|Ez0Hy;o4OX9V$y{p+2921fdT6&I;_3P@0YKhv>2n2s90sky`LJ>5635^Tj)KDu
zsJ0|4q_Et$8~T`Q#$EU$38fNToaEqg1TG(@=3pnGq(B=`6J|nFbO{ayct>mZ+y}aC
z&$mh2lz${OTu~6hGC7g6H)Z--LIrq2hfii+1IJ_0yj^jR(wUo@_IFHZK=>*&dtwu^
z@$Pr{BpmXlIY<2~itqo8#rK%~G5QYA-qdTNF1WT0%*~Ds=Z^kHL^o)&>rvCgIf7eE
zFU?c`j)GQzzO$-U#LUj28gs)3s}EP6KYmtQt=@m~V6FO<I7fD;1A0MGDK(G~>mr&K
z1z+ZDhe5X!$s8~8#5ZiX(Bs(0_vrr1&>Fok5iqfkkKCSakQAZY3B~xg5I^M6;rX#e
zJ1Q&N_I?UTkO$D6P&|iMf#+AmPY_OOl(Z{=eHlh@0r?5fnKY?w>94j7G<LfFZX}r2
zl7o^vTkbaY7blVvWSpD^Zh}uLDnV$?6GtKp_6kP4!*V_!UVn|G<0#OVQOx>WD(LvU
zf`JqC&lys8dJ<D<0bW5z)Zr#Y_?pJ3QAC-Cr(Q<6V4N~$b7Sz@PaBi@vN3|*F{7Nj
zkSpOkZ%pD}-Z+=zT-K+Ji<ox?5KaTq1!F3=B;OZ|Gw4CvIEPuMj8Uu*7x&lZX1wWd
zhA*#2<gi&Rl^YZZqDjy1KK`P=2612|=mUt0x&z+;4h2*$tUf$eShOoJ`fvbXU}?JE
z!l0uKn>wn3>uA8N%WPOF2>M&B$I7GY#i#%V0z<e7vsi{rG<d4;z26DcWD6P=LqSXs
zIwr6){{RyOmaM%^Z|LuGU~uraIRk7>_SKGiK~6RC`}n{U;Yq&vQOGBg2ROmu*XPY}
z`pP(hQ}36_oP~r=cd=E5v0k1IT^z!K)E*||-rs1*FZ|PRRe&{oo-uJ%#0BXsFd|8?
z(ZTX5o>sd^;LyND(&Pl*hf&v_4EzLe1L>09y%cZF@&x-ocn^xnVG_SkQa=fzN$O`@
zd`5A_1{BC7K^(><z(<dEjm(VskTSs*RGB~I#rC$3Mf347ME(iq*gKmSc7DKF^vxJx
zo(ke2%=i8Y4lVv(zy);>MHW>s4U93jDDF;Cd)9I<#I2#}sEUCU<0mHVAfmBY-S4;!
zF^nCg5RjednZDh2WyT#bYJ(YfV6IzUo6bN)8#5RQwq5}W0$nIjD(@RdR^Aw_tWcwi
zZnv(pM(ZP5^jX+-EiSf}*hST{9tWK@x*kkISwy$OZqfQnx2)T!TMS(#e1x;)*8+G#
zl5Nr$)pmklR~v~pqPuHvBI}R1Oza)40?llcDS6TORPwuSPmBf}q^^6y%ANL??%orj
z+Fzj+?W4%6qA{AEfzB;M51+yJENUk8yc#pk7Z9H!Mm2M#T;7;L?~HK`T6zSn1$<vb
z1|pB%GFr1}PoS+WftmD|lF_pqg=Huk*DzyRXDx^mgJIF+{|PoEnp~0<N&E=;f`%SR
zG`ZFQ(85sOymp8ZWx`?2g9S&IiP9YtBakR?=s^vY!Yad~%okB5KR3X>;2XoBhJrE{
zU{GwdGDRj*w1xs20}WMR(g^k;nVc$Dt)XC1<dVpBIkDpi`nQ?a$qpv^h*k|fI)J6(
z*SMurIjoDI>g9L~P{pJwRs8_)p&_dJA0qhPKPRew?=PY1weHrc9v#MaEM7nz1GMM{
zI#pUX$kly$?A5j&Vb*&tHJt%{sTWy$%;Fms*&UZ#U7?s+RTfWJ{E~&mVsI&mkKDS*
zdd88vEWSl?!ncrl9^S&0FtmIBfkt!>g<L{hEnXvi1&eb1vP+hZ$z`IWb>Yx;Eae)2
zA|KL(AfpE;T)ade+(ijr1WX<J??Q<i>fI<GL0kyFNYFbxNx;Y<OIVQSiK4RBE8_p2
zg9o-QNnITd-rb4g&Yk6Drg)cvaQn+7s0vFGDm`^WM6PWer8WbGX$*tn5Xt$LDAtH^
zl>~(x*y^F)w7aeNjt21Q&BLFgZH|5_TlF<UjDF?QH=p+69R#04pT5le^iK|dj<z|P
z!ql2P1<^Mhxc_NOe<v^xqj~dvc-rK72BePwH~K%rOajdWYTrzvoNO1<{BS(|ZhH%9
zg9;*;MXU#-;u~fw0Gra!Plp-0c54wZ<rN?WC*L0q6R#QW07T!UEg!U5`*4^|$v>n}
z`bj<_ZT~cweix~f?9(@^NLFV}seA~YBFbwqavxCucH?b_FDXuB*6YX;*XuV>Npr_+
zF+o$WXSwBi-LxZtfs}_AA~7F^Zqx~U#=4j&jKL(W3~!ikb`UBvGZS><$a5q&qi<XU
zA8twCRtd|fc^DvzF^3@+%ZYdy70Kn+U`X@wnh4{H@tW95zAiHGL0jx%2Sx+t1Nw+v
zu$%HeQ7bZzXU~MB@lYu%qzu`E>?Bfdh}-}lO{DA$yzLN^s0m-IUPq!zB6*w&i3CZ~
zAX~+ZPdZ|DBPPTGin<$iLKo!qd!PocSG_LOBA>KUh!R!jP;13IAWfREFe{QJAJS%v
zOQs24?bwm&2N@i<*@WW?(jv>1sla+Yxw}9!*(jkdx2|UCy9RPKNF%g*X5gbpkH7;V
zxhGjMGwQ;rj&KU323OYaudSJHf^hdnhJe-@;AztgK!<P$O0*MnTR0k1K@q6}H4W^C
zup7dvUe}n4$4g=JkjsNucumiBAUk*_B%}uNbb$26i+6<V5IAW13>#p92gI<a#VXOf
zI$!9B_<C_<f+tAjX|c=z3)?(DgVbr+jV#Nz?Y#zl>vgK`dL4{-Mqa^RCrT;95r4d<
zR5!X&9JDh)j*FL0582P(B*v=ZE^RMSLO|M15XOS*P3!4>v(W;b%pFJ$F3{p3;&f~<
zK|gr@c;aZ@WSAT#j#isM14l?Gv}E4PjAtT_k%{!IhZ_tz0nQmLSzUp8uVE92=5Yi8
zVL)>&6^@OU_+AGT4IvFUi%#rP9+{Vx<gvhvOidr4<hAYA(gXc{95q0v6QTtmks&{c
z5?Fh}bO1zm8<#GjgplR9^QSN0KaL2r6p#Si(E$@PZz{RPcg#$=-!N0nf5U_^(3x<u
z>o`tJ)*iez-Tj8!kzZWk`g%!TT9~Un0c|b_hT4S+2k+u;=sH8fo@9b0IDQJ%D`Bh<
zK?38Un_zv;Vfw+k6NHnLXzl)!>iV;l>a%rOQLAmcF@pYftp+`xPEM&O0l4*okoZ#&
z4M}Sb3qJ(nGg#UyUYCUULsK>B7z5~-Kz@)R34zFMHFb>7V_2IkUb3jOVBCMg5dkw3
zwHn`jYqcu~fg`?Ct4l@XTBjwq${PPQm?2>DfQD9#?4O|mlZUJ&U%6oZU{_I*hfYMY
zZ)p<^#;kdD023>t2=<tvlTmgeG?ac=Pv#V_!TQS6CL>uu92$O$m4k;^{)z=Lfr@^E
zLcg<!Zcm(VrsJVQhknWfV+zYwu~Vx`r7~nyGWpJoDf8tv=mNJSc>%-EF1q}A(4zJ_
zD3Ow1@tl3o0Jt#FTir*LVN!MJU&gR6wBOXUy42y~XXqOQi89YZl#~R7j1L7a1WM+g
zEXOVK?-%4WQBxz=CI5ZRkRxPFX4EB2{u-6ug#n+z#v~IVTz%nRM!XH?ArpbOZhXK`
z$U?#@$y<t}C1JOCMUSyJG&EjSjuO^vhC!PQdLO5taq+l8zGOTT%YKweV!9KvZJVFp
zJoE&o#Uul8L|o{z(m&HLa_~SjN^qE<fH;s!0<@8HNDm#S=rre#KdYTS)rt4iwtE>$
zJN9cRI|`HU23<IPkSILN$@bWFNcYKmUNt!6zCcH6FG_Fj$j@SQ`XS3u9F@B!IBo5)
zV4m=Vg>D-lpJzf>%;Ujj5?O_+Bu69@S*tMz3w2Aetkv3q(`~Uyajn%r@mfu?p*qik
z)PjCmd-3%eemVAZ<^HPZ{5F2vwId>Kam&Feq;?WNBeN*P`Sd8G7e;eMW41CiA-^NE
zc8M2fgswdQSv*b5XUf5E(w3OD#jgfM|Hss~Lt`~Ku&#sG$brph3_Xd7Wx)>>;RDL!
zqmU$_5!~E_Uf-@-_nxe;ikbTcFQRLY*Q%@XVEEw4vz5n>g;Wn8uY9#`@kenMACP7E
zX%NALOSS55qbk2~(yyg|%1Pu#BWQQLmQFdZKeO=AdjIR^)km`1y_Nfq)*r8|e{GTA
znpbVszGBfrA?9?zwHhFZCDn$LdM7cYq~iYr|Dtigy{pCROHoL7(J_jbKm5y0<F)W3
s$rTrKbGhQ!Y`$1LHB}G`IFX+<3dVV3IX{}4ua<MOcq^QJH2cZ_08a|RG5`Po

literal 0
HcmV?d00001

diff --git a/simplejson/encoder.py b/simplejson/encoder.py
new file mode 100644
index 00000000..cf582903
--- /dev/null
+++ b/simplejson/encoder.py
@@ -0,0 +1,440 @@
+"""Implementation of JSONEncoder
+"""
+import re
+
+try:
+    from simplejson._speedups import encode_basestring_ascii as c_encode_basestring_ascii
+except ImportError:
+    c_encode_basestring_ascii = None
+try:
+    from simplejson._speedups import make_encoder as c_make_encoder
+except ImportError:
+    c_make_encoder = None
+
+ESCAPE = re.compile(r'[\x00-\x1f\\"\b\f\n\r\t]')  # control characters, backslash and double quote
+ESCAPE_ASCII = re.compile(r'([\\"]|[^\ -~])')  # backslash, quote, or anything outside space..tilde
+HAS_UTF8 = re.compile(r'[\x80-\xff]')  # any character in the \x80-\xff range
+ESCAPE_DCT = {  # character -> its JSON escape sequence
+    '\\': '\\\\',
+    '"': '\\"',
+    '\b': '\\b',
+    '\f': '\\f',
+    '\n': '\\n',
+    '\r': '\\r',
+    '\t': '\\t',
+}
+for i in range(0x20):  # remaining control characters get a \u00XX escape
+    #ESCAPE_DCT.setdefault(chr(i), '\\u{0:04x}'.format(i))
+    ESCAPE_DCT.setdefault(chr(i), '\\u%04x' % (i,))
+
+# Assume this produces an infinity on all machines (probably not guaranteed)
+INFINITY = float('1e66666')
+FLOAT_REPR = repr  # formatter used for ordinary (finite) floats
+
+def encode_basestring(s):
+    """Return a JSON representation of a Python string
+
+    """
+    def replace(match):
+        return ESCAPE_DCT[match.group(0)]
+    return '"' + ESCAPE.sub(replace, s) + '"'
+
+
+def py_encode_basestring_ascii(s):
+    """Return an ASCII-only JSON representation of a Python string
+
+    """
+    if isinstance(s, str) and HAS_UTF8.search(s) is not None:
+        s = s.decode('utf-8')
+    def replace(match):
+        s = match.group(0)
+        try:
+            return ESCAPE_DCT[s]
+        except KeyError:
+            n = ord(s)
+            if n < 0x10000:
+                #return '\\u{0:04x}'.format(n)
+                return '\\u%04x' % (n,)
+            else:
+                # surrogate pair
+                n -= 0x10000
+                s1 = 0xd800 | ((n >> 10) & 0x3ff)
+                s2 = 0xdc00 | (n & 0x3ff)
+                #return '\\u{0:04x}\\u{1:04x}'.format(s1, s2)
+                return '\\u%04x\\u%04x' % (s1, s2)
+    return '"' + str(ESCAPE_ASCII.sub(replace, s)) + '"'
+
+
+encode_basestring_ascii = c_encode_basestring_ascii or py_encode_basestring_ascii
+
+class JSONEncoder(object):
+    """Extensible JSON <http://json.org> encoder for Python data structures.
+
+    Supports the following objects and types by default:
+
+    +-------------------+---------------+
+    | Python            | JSON          |
+    +===================+===============+
+    | dict              | object        |
+    +-------------------+---------------+
+    | list, tuple       | array         |
+    +-------------------+---------------+
+    | str, unicode      | string        |
+    +-------------------+---------------+
+    | int, long, float  | number        |
+    +-------------------+---------------+
+    | True              | true          |
+    +-------------------+---------------+
+    | False             | false         |
+    +-------------------+---------------+
+    | None              | null          |
+    +-------------------+---------------+
+
+    To extend this to recognize other objects, subclass and implement a
+    ``.default()`` method with another method that returns a serializable
+    object for ``o`` if possible, otherwise it should call the superclass
+    implementation (to raise ``TypeError``).
+
+    """
+    item_separator = ', '
+    key_separator = ': '
+    def __init__(self, skipkeys=False, ensure_ascii=True,
+            check_circular=True, allow_nan=True, sort_keys=False,
+            indent=None, separators=None, encoding='utf-8', default=None):
+        """Constructor for JSONEncoder, with sensible defaults.
+
+        If skipkeys is false, then it is a TypeError to attempt
+        encoding of keys that are not str, int, long, float or None.  If
+        skipkeys is True, such items are simply skipped.
+
+        If ensure_ascii is true, the output is guaranteed to be str
+        objects with all incoming unicode characters escaped.  If
+        ensure_ascii is false, the output will be unicode object.
+
+        If check_circular is true, then lists, dicts, and custom encoded
+        objects will be checked for circular references during encoding to
+        prevent an infinite recursion (which would cause an OverflowError).
+        Otherwise, no such check takes place.
+
+        If allow_nan is true, then NaN, Infinity, and -Infinity will be
+        encoded as such.  This behavior is not JSON specification compliant,
+        but is consistent with most JavaScript based encoders and decoders.
+        Otherwise, it will be a ValueError to encode such floats.
+
+        If sort_keys is true, then the output of dictionaries will be
+        sorted by key; this is useful for regression tests to ensure
+        that JSON serializations can be compared on a day-to-day basis.
+
+        If indent is a non-negative integer, then JSON array
+        elements and object members will be pretty-printed with that
+        indent level.  An indent level of 0 will only insert newlines.
+        None is the most compact representation.
+
+        If specified, separators should be a (item_separator, key_separator)
+        tuple.  The default is (', ', ': ').  To get the most compact JSON
+        representation you should specify (',', ':') to eliminate whitespace.
+
+        If specified, default is a function that gets called for objects
+        that can't otherwise be serialized.  It should return a JSON encodable
+        version of the object or raise a ``TypeError``.
+
+        If encoding is not None, then all input strings will be
+        transformed into unicode using that encoding prior to JSON-encoding.
+        The default is UTF-8.
+
+        """
+
+        self.skipkeys = skipkeys
+        self.ensure_ascii = ensure_ascii
+        self.check_circular = check_circular
+        self.allow_nan = allow_nan
+        self.sort_keys = sort_keys
+        self.indent = indent
+        if separators is not None:
+            self.item_separator, self.key_separator = separators
+        if default is not None:
+            self.default = default
+        self.encoding = encoding
+
+    def default(self, o):
+        """Implement this method in a subclass such that it returns
+        a serializable object for ``o``, or calls the base implementation
+        (to raise a ``TypeError``).
+
+        For example, to support arbitrary iterators, you could
+        implement default like this::
+
+            def default(self, o):
+                try:
+                    iterable = iter(o)
+                except TypeError:
+                    pass
+                else:
+                    return list(iterable)
+                return JSONEncoder.default(self, o)
+
+        """
+        raise TypeError(repr(o) + " is not JSON serializable")
+
+    def encode(self, o):
+        """Return a JSON string representation of a Python data structure.
+
+        >>> JSONEncoder().encode({"foo": ["bar", "baz"]})
+        '{"foo": ["bar", "baz"]}'
+
+        """
+        # This is for extremely simple cases and benchmarks.
+        if isinstance(o, basestring):
+            if isinstance(o, str):
+                _encoding = self.encoding
+                if (_encoding is not None
+                        and not (_encoding == 'utf-8')):
+                    o = o.decode(_encoding)
+            if self.ensure_ascii:
+                return encode_basestring_ascii(o)
+            else:
+                return encode_basestring(o)
+        # This doesn't pass the iterator directly to ''.join() because the
+        # exceptions aren't as detailed.  The list call should be roughly
+        # equivalent to the PySequence_Fast that ''.join() would do.
+        chunks = self.iterencode(o, _one_shot=True)
+        if not isinstance(chunks, (list, tuple)):
+            chunks = list(chunks)
+        return ''.join(chunks)
+
+    def iterencode(self, o, _one_shot=False):
+        """Encode the given object and yield each string
+        representation as available.
+
+        For example::
+
+            for chunk in JSONEncoder().iterencode(bigobject):
+                mysocket.write(chunk)
+
+        """
+        if self.check_circular:
+            markers = {}
+        else:
+            markers = None
+        if self.ensure_ascii:
+            _encoder = encode_basestring_ascii
+        else:
+            _encoder = encode_basestring
+        if self.encoding != 'utf-8':
+            def _encoder(o, _orig_encoder=_encoder, _encoding=self.encoding):
+                if isinstance(o, str):
+                    o = o.decode(_encoding)
+                return _orig_encoder(o)
+
+        def floatstr(o, allow_nan=self.allow_nan, _repr=FLOAT_REPR, _inf=INFINITY, _neginf=-INFINITY):
+            # Check for specials.  Note that this type of test is processor- and/or
+            # platform-specific, so do tests which don't depend on the internals.
+
+            if o != o:
+                text = 'NaN'
+            elif o == _inf:
+                text = 'Infinity'
+            elif o == _neginf:
+                text = '-Infinity'
+            else:
+                return _repr(o)
+
+            if not allow_nan:
+                raise ValueError(
+                    "Out of range float values are not JSON compliant: " +
+                    repr(o))
+
+            return text
+
+
+        if _one_shot and c_make_encoder is not None and not self.indent and not self.sort_keys:
+            _iterencode = c_make_encoder(
+                markers, self.default, _encoder, self.indent,
+                self.key_separator, self.item_separator, self.sort_keys,
+                self.skipkeys, self.allow_nan)
+        else:
+            _iterencode = _make_iterencode(
+                markers, self.default, _encoder, self.indent, floatstr,
+                self.key_separator, self.item_separator, self.sort_keys,
+                self.skipkeys, _one_shot)
+        return _iterencode(o, 0)
+
+def _make_iterencode(markers, _default, _encoder, _indent, _floatstr, _key_separator, _item_separator, _sort_keys, _skipkeys, _one_shot,
+        ## HACK: hand-optimized bytecode; turn globals into locals
+        False=False,
+        True=True,
+        ValueError=ValueError,
+        basestring=basestring,
+        dict=dict,
+        float=float,
+        id=id,
+        int=int,
+        isinstance=isinstance,
+        list=list,
+        long=long,
+        str=str,
+        tuple=tuple,
+    ):
+
+    def _iterencode_list(lst, _current_indent_level):
+        if not lst:
+            yield '[]'
+            return
+        if markers is not None:
+            markerid = id(lst)
+            if markerid in markers:
+                raise ValueError("Circular reference detected")
+            markers[markerid] = lst
+        buf = '['
+        if _indent is not None:
+            _current_indent_level += 1
+            newline_indent = '\n' + (' ' * (_indent * _current_indent_level))
+            separator = _item_separator + newline_indent
+            buf += newline_indent
+        else:
+            newline_indent = None
+            separator = _item_separator
+        first = True
+        for value in lst:
+            if first:
+                first = False
+            else:
+                buf = separator
+            if isinstance(value, basestring):
+                yield buf + _encoder(value)
+            elif value is None:
+                yield buf + 'null'
+            elif value is True:
+                yield buf + 'true'
+            elif value is False:
+                yield buf + 'false'
+            elif isinstance(value, (int, long)):
+                yield buf + str(value)
+            elif isinstance(value, float):
+                yield buf + _floatstr(value)
+            else:
+                yield buf
+                if isinstance(value, (list, tuple)):
+                    chunks = _iterencode_list(value, _current_indent_level)
+                elif isinstance(value, dict):
+                    chunks = _iterencode_dict(value, _current_indent_level)
+                else:
+                    chunks = _iterencode(value, _current_indent_level)
+                for chunk in chunks:
+                    yield chunk
+        if newline_indent is not None:
+            _current_indent_level -= 1
+            yield '\n' + (' ' * (_indent * _current_indent_level))
+        yield ']'
+        if markers is not None:
+            del markers[markerid]
+
+    def _iterencode_dict(dct, _current_indent_level):  # generator: yields the JSON object text for dct piece by piece
+        if not dct:
+            yield '{}'  # empty mapping: nothing to track or indent
+            return
+        if markers is not None:  # cycle detection only runs when a markers dict is available
+            markerid = id(dct)
+            if markerid in markers:  # dct is still being encoded by an outer call
+                raise ValueError("Circular reference detected")
+            markers[markerid] = dct
+        yield '{'
+        if _indent is not None:  # pretty-printing: every item starts on its own indented line
+            _current_indent_level += 1
+            newline_indent = '\n' + (' ' * (_indent * _current_indent_level))
+            item_separator = _item_separator + newline_indent
+            yield newline_indent
+        else:  # single-line output
+            newline_indent = None
+            item_separator = _item_separator
+        first = True  # no separator is written before the first emitted item
+        if _sort_keys:
+            items = dct.items()
+            items.sort(key=lambda kv: kv[0])  # order by the original key only; values are never compared
+        else:
+            items = dct.iteritems()
+        for key, value in items:
+            if isinstance(key, basestring):
+                pass
+            # JavaScript is weakly typed for these, so it makes sense to
+            # also allow them.  Many encoders seem to do something like this.
+            elif isinstance(key, float):
+                key = _floatstr(key)
+            elif key is True:  # True/False are tested before the int branch because bool is an int subclass
+                key = 'true'
+            elif key is False:
+                key = 'false'
+            elif key is None:
+                key = 'null'
+            elif isinstance(key, (int, long)):
+                key = str(key)
+            elif _skipkeys:  # unsupported key type: drop the whole item silently
+                continue
+            else:
+                raise TypeError("key " + repr(key) + " is not a string")
+            if first:  # checked after the skip above, so skipped items never add a separator
+                first = False
+            else:
+                yield item_separator
+            yield _encoder(key)
+            yield _key_separator
+            if isinstance(value, basestring):
+                yield _encoder(value)
+            elif value is None:
+                yield 'null'
+            elif value is True:
+                yield 'true'
+            elif value is False:
+                yield 'false'
+            elif isinstance(value, (int, long)):
+                yield str(value)
+            elif isinstance(value, float):
+                yield _floatstr(value)
+            else:  # container or other type: stream the chunks of the matching sub-generator
+                if isinstance(value, (list, tuple)):
+                    chunks = _iterencode_list(value, _current_indent_level)
+                elif isinstance(value, dict):
+                    chunks = _iterencode_dict(value, _current_indent_level)
+                else:
+                    chunks = _iterencode(value, _current_indent_level)
+                for chunk in chunks:
+                    yield chunk
+        if newline_indent is not None:
+            _current_indent_level -= 1
+            yield '\n' + (' ' * (_indent * _current_indent_level))  # closing brace sits on its own line, one level out
+        yield '}'
+        if markers is not None:
+            del markers[markerid]  # finished with dct; it may appear again elsewhere without being a cycle
+
+    def _iterencode(o, _current_indent_level):  # generator: dispatches on the type of o and yields its JSON text
+        if isinstance(o, basestring):
+            yield _encoder(o)
+        elif o is None:
+            yield 'null'
+        elif o is True:  # identity tests for True/False come before the int branch (bool is an int subclass)
+            yield 'true'
+        elif o is False:
+            yield 'false'
+        elif isinstance(o, (int, long)):
+            yield str(o)
+        elif isinstance(o, float):
+            yield _floatstr(o)
+        elif isinstance(o, (list, tuple)):
+            for chunk in _iterencode_list(o, _current_indent_level):
+                yield chunk
+        elif isinstance(o, dict):
+            for chunk in _iterencode_dict(o, _current_indent_level):
+                yield chunk
+        else:  # unsupported type: ask _default for a substitute and encode that instead
+            if markers is not None:
+                markerid = id(o)
+                if markerid in markers:  # encoding the substitute has led back to o itself
+                    raise ValueError("Circular reference detected")
+                markers[markerid] = o
+            o = _default(o)
+            for chunk in _iterencode(o, _current_indent_level):  # the substitute goes through the same dispatch
+                yield chunk
+            if markers is not None:
+                del markers[markerid]  # markerid still refers to the original object, not the substitute
+
+    return _iterencode
diff --git a/simplejson/encoder.pyc b/simplejson/encoder.pyc
new file mode 100644
index 0000000000000000000000000000000000000000..e59d372a7ab88749c287a7a2a77dfad41ebd616b
GIT binary patch
literal 13938
zcmcgz%WoV<das@tK4$ooM3ItguUoX&8m>u6UVGPCtt?yCBhuPSIZfHJC2EJw=^C=d
zVfU!JM<i`B*u+A}<Q6131Tc_W@&{}V0dmVN2yzdC9C8T|Ag2Vm<dV(r_f>b#3`xaN
zKxe3_sjlZ&Rp0mf9@YBQzmHU2|K^)Jb(MZj<M#u6<3F^N@|1dj)KXqSty$`UrM4#I
zv8dJxs##PIO3Jz)oK_{>ryf^SIHD|k&>9s%L0O-t?Mu>rKs^|IUi(4QUR%m9E3Z#|
zjp-^Xee9RVq3m%$9*5PcQYCLt6}+;#Qt~Ru3^6l|%m_21$c!;Fj?6J;jw5q|nF(Z0
zsw)ph)aF}Ck1B7HW8Qf5ntCv%^oa7ul|H8Q7)!k=W*U~7{2EJo@^9+CKCZk|Lc|HB
zC)9(J$~&!|VY4QccSbVkQc^AKj-FBvipqOQ=~EoSdzsZ=EA_>L(@LLF8Wk@q{fg4x
zQy5jhs<f^2S*53yeog7umHxi+UQy3R)Ppy83JcZm@o<>jS#LG<x(*UI@x#Cl8}`o@
z?#|x~>Y=BjivMeT=BqeFl}sVgQeInjV;v`vAFR~exbFL=!7v)EyKA~;T1D|G6g*tq
zym)bLar3Rl;^Oq;@?v8#Sd12vNAVacs}E85X#3$W7VWv;dNdOcnGToOq0x907x28e
z7<2kX^Dv$8VcI+_OU<BpXvo8`c?jg8Vjd!S7%>ltJd}MK!^Hg@xc&W$?`$Rm$iAh2
z%uk(DaOx7i*YS<dA_4zm&v%526Qz7hZQ~zKp`fO)rBe&lBAfmQiKCNt6xgn8r5)*3
zq~q=#cI{8Ll2z=s*~3c3#z$u5%p7KcLmfkcnJ@<?!}MUH(+gD+Ht!=*l1(be-CVeS
z?US3e8`tk8eRy1n!gkA?2_M(pq`q23MoALCkKBb%V;#j8*8IqCHp8bEZbV^gIo!N(
zLqFBcuyvu~1`WTyp_ebjJ~`xZ90nKCb3NbMlI_C6nr>acf#GCtmF18)Ll(Ezkd?^3
zw3kgeR~S3o?IWg$yLEs)r#TysQI*Pt{9L&y*IBcK#OyHG3I`d^C@U!_zbFTbO)sg(
zWfh)K77w8>J%k;l0!tB}QidohbWi$~KhWU`9M+UqBwKK{_!^RoEdu-6!u30M=E9)4
z^+GHXbEtOGn7brP;S;~YEPsp)i4;b~<Y3gTVbTRIJ-u*0h*b$IBf72#y5dw&!-fU5
zT_7ktRw^9BvQSYFoLYGD2Uxh&T|z5t1|Ry=`(D5L;KLo@5!Q<mc`7Mj=r;P6RHL9K
z7X-IG5LYdOGQ+SS&gvFAU;RBOCIkDw29x;eAF)$J5hIf(t@8LBuG3*I8AS4t-ntn@
zVI-^-MxN}kLzZ(mnqWkL<zl$E%+C*xmfM7Z-{Sa_NR%~Z6|G@w6yK4;Sg~Rqw?+#h
z4D(geD?;kWeh?>aP}fExl1SEa``SY7(|flrfqyWZcBA@g!iCO<ftE5)6N?k>ODgBW
zJ`VR)WJ=cjU5L~f%+T6O;rsyTzlqwIt5c;ntP@swJRy8{X^%SV_~Ds+h;O`zL_@(r
zvXFvxpq{}-qUfRfb$|8`qBbc1P>W1SJu6e|gZZAJBUF38WT4v7azH)9I77-YycWZ1
zP&YRd9mM`}QyU4pvYI5V%NH&X$Ige*%2hiBGrJK+8610V;u4eFb>O#-&l_M~Xt!Em
zwb)KpHCh8MH=y|JaQU&Wqtp#NJK1XK*k0bUJ>78I&E&G_`R3fg&;GJE1^l-&5~vB%
z&$gjFd$hNu<(uyv{Om8w#`OGpl6RNPc1m_unvQvp%(>^$+4SRN)=t{c3F#o)wi`w6
zRyJft=L?L9EuXd9flod+!)&LjF&p&7>GT7T*$jh~S-a5;UF^fQ9kkb%b@YE9^Ip`>
z7M%{VZG&67%3hq#TW&M%8UW*N+l`*G7ax<*k*(7Fa_!A#r|d<>6t=q;+L|H-USIVg
z3L(szdbkq!UurvqU__Zb%-V5#x!!bRBN<{m(7d!=8E0wfd@3W=nWZIrUBeFY><vFz
zg&>)M(z0X~hZcz?g`sSiE56(GzjPteGLn%$5#Oby5M%ibyA{SF^RtGg4If+UCw9CV
zwws<^cd-Q&;<(+?k<ch3<un=-xXQ)3?7Fmc4}vY4W@%|Ag#$5luu5u|%XXJaCd%;(
zO=hf%Um{~{#2PYCvr5&VkHxsC;Su^2C3x(U3?BO>gU10vBTbJ<Xy5_0XgWjPq62&!
zSRdN}LDK}@5*}DnHZ{=0c&M=6n2Yg6!1VPH+K12vyd&my0rjjo0NAJoG1C*u0FZ2R
zr(wryerru{#Wv1gI216jssnB?N?beND{_aMBznD-$o{gwpsm1W!<Iqhc-=_bICTp9
ztbIUYK_of(JZH}b>ZXG7NPerYf(X41A~2rVt6M^COMB^|rAxp90qn+SA<-0GS%n?8
zlU7?6veI@VH%PPwtB3Y7227%S_6+n5!-AcBI7I7QR|a48RdlZ>Fs^MK*Ikm(L;rpf
zIy;%sumOvl^JXKOIeQmUU)A-sTHTN8?WP;`EG4iB(ebQJ^v4hNQ@tH0;d-j_yhB!F
zW|UE}Zn8%{cBC6R!tp`Dd2PCUowH2Bd?>g$PesbX5AYlUoCgu29mVu2s~f964rwD5
z!!~5g4eYy5bp&kQ5CMaD@sRkrOFW_M&Vo72@d{;j0_QTe#p&qX4hVL*Q426;_n`*%
zygNT@-!b%TnXQ=19>Mdn>U>&b5O}s5%bYm2dxW}Wz3M*ou_MTnS1C7k+|qR)4w69(
zut2NngK1{-!Ilj()gg2^4epGv%z7AO1ox@CP>=jpV$+fKGE>ALrZM*-2%p)Fp8bHV
zW$fYFpSjJpK__ymA>VA5XuSR63mc}E$#2g1fdFF4{c!%tG&nIg^0CwVcPPdXAQyHH
z#`&qy1lScEXQSN|u8H&t3@17B1Q7yJ6o%vT)rjDmP0S#jGsb}DfNamrgdBS|_{Oz8
zcWW*Q=kUY5^7pOD4?J!yXmD{h!CatMa3W6u`Vin14Nwt;lG(&a$*IsL=wY@zRVC}1
z=0Uz}8$6vPTXQWiJ(n#9Nb2)J(&?M@nZYjC$ooQ&lrWZZ(d?mkda(X=l-PmZX!-%I
z%j|qbU1JSYO~N3u1u)%uBL}@KpK_q~0Du}B<^tEjxJJ`q8(q6fOswUVvplrU<4iui
z*mA<{I<sH7qt$b>Hve6=&&{wlv{!U;kVfupK2$Hk_Ey-=C^F=3aa0-f+>G#S(+7CE
zzzP5a7^a1A!gH6IY9({pjdmc63W8uJfHLw=vx#FOc%?9%(<P0-U+0o8!+_A9a-ad}
z+)yx92ewccM+7T3J9ucoEn#sSFwZPyAIxja2DjI6=v|PEMij*s6Ha*eDVx$f@dK(M
zs2nuOIkB@2Xr>qoT*o@WlwqzT+VCw`%wFUZfNwz(8gUhKS#gK$?t%2KJ%tZCcd3ik
z`6}HxaZxj!D?Vtq0!v2Gq*oUubW3wQmM6l7Adk4SMns&G9Gu;IxilF;Q4ga^s41mW
zsL57R6<43Ga;%#Tht8_=5|fviyuyS5PUlr5;(+I(5Ie82g2ADq4GRc;wHno5tp-Oo
z4G)|zTb;iVYtkCQU!4XdzeRknvn^MEXq1WBATk5{Z3;iXgB(M)Y!|<d9(l+X2M#Vu
z?PZ^EncLoC6baiyWu#Vg&PHgLK`$NTlz%BWVoAe#hW^JH8c3p!vU_dhe58)8ypQQK
zYnkG53&ZJ6mtjP3IyJgD)Uei;{UmauEn05|z-9$A>a-K`Ir6D<Zf*K&TGoC!b+kDP
zKVXxrQI$-AmCRhu2QqDJSbbXu3t1^-a7W&gY&GnFWY$-2);08YZtEUCPz&zQfoU}y
zy~CTQctg95pdArx4o;o6qBP$$;rZN^%GPSa4x}~a4NQhH0%P4rK5t^N6xDns5_BSf
zo0!t;WJU&S!=n`uk-9&{xZ*&m<01wWVtz#o{stKaWf4*}LD?q=%9`hb1ZjT?hX=S(
z%tDtYNP8Bg5>a|wP{R_k#U&72DfE$O=#z)a62}Q$`&BrKK_y&^+Jz^-jVHKG5)fU;
zTEVFj(F1sVZCQwSk_x0l3P6Y;Cj!Q;adaGFDJLnKxNuSVBWY0@{rxj6$?3TiFbKa-
z!_#8O?*@8<QC+}%_3G7b=dC((UJy}NznX4@;q+zu;q<Z_P0!l+`EvTvPKT4uJ*UOF
zF1}%)RYJ@H-8E>Z8jOkrOGikuO2BsHUV`9DWH1YHj<e!5CIoheQBecN$S6lN344&c
z4Yk5<bl@aI)|aabF-D~5ap(so_DfcDW{?<?GW-{9QeSNcYw^*ts0?hV{1s*uTvmhQ
z);Lgn1VP>@tAg<EXz3)7eB7!R(T4XKT%<6t4Y47ELUt<3TE(Ri7-ImD^*-iUgPR7_
zAPl^N3r^Hv!N{>j?id~yjpLse;ijP=ZRz-<Rlfr7f?@G*2=V%7=q{WdE@3RW_+;#0
z!8EQw9B!NJ5VG${6BC8-htntog76#{Y>RYMQgAi$W0K<Lw5)deRd5-d$I}o-PiF~X
z9Nr&-QekICHy}?X%FRMmqTLAptDAylVo0sPbjKB>1Xjgw-SRc!Hrj>nX!tA#)qR#G
zd^R{$ev`=AB`RH-XTPeTwiD)oA+=AOI!sz!_E!u!hp3VDtvIZ&>E!%IgdSBHZ00aY
z5)L7k@GF-!bI1@(1Y)rr*$tCi#Slr%4HLEtO$bnOnKv&cfQX-wH%gf)6X~GoR0|`2
zCA)xie#i#+9^u8`ASW@x5&aYLa)+uQ2PdpLv4iJID3^5-HLwEwBTIwjVbXw8gP#aH
zf(L=sQVi}!@w6!ho~OkS5EKugSOQ?&3G7Mh47d>YTqQA;WP?&WNszk_+eJ#|<(dT{
z0I|w4w?8hUDh~q0+@ZU$xPiQ|tyd7>mtgTzy4K*SG(IH?H23l^+eUp7&^kW2!;KcU
z7OWBjR3NQJUKL1#Vb~CJwgyL)d2UpKxaxOsMkWN1ME{H_<RV^`Mu1!Cw@@hz;L56K
zO%woAM0SF@v780K#gJx=V7Ebbn$%)Q-}?COwR<(^<|mHX+WA{|=I`A5!gvF<?pFZB
z_%>!Zt!?Kl6Pt+`yW_~2_FXbZEOm0scYc6J*|c>xT7%=|{FwDuSxUsMb@jyK(Q&#%
zA^kgi<2N{NrD9bI{n$aK<JM%~>61Ue{vF5PWT9xC#P66jU*#>GY)TE`sC8Yd$%fTx
z>!H_f@{y~n)x5A?tC@}9mI$B7O@MPAk4A@bTCtX#cbFqN9X^rVQQYJ^G!$>)8&ie%
zzua$`zp{1mQhB0$rq0(s_+>i+Sp2U@cJZ&Ec8hAaq;`kYZok?cP`iU_x2$$6YPV1A
zj;P&HwR=qM9#^|3)b51ZJ*jpl)$Wwq#Vag$)x}c3tJLqI3#zQH(a<*^4YQa5F~x8;
z=6Khz-D94jo5V3O@BctvPTSaX#=*NuMH%Om+B*d-p^(mtnM#50$M<b~<1gTe0oYmy
zzhf<*SspNt__K$baNr&E@4I-Ah&~ZrpdEFOVSB=8+{4R4Vwu9bOYKcm0_Lvp2?W4W
z*c;DAdItz7s`FjGe*zn!pOq+@n3#g$um?-Eq^4*C$OZhnG&o2XOb@9=&E5!g@aE^V
zA8tJQ#M*)J3sQi|d&fkz!wkVi1gFI?18Q$jY;C^!fFdkaUYDBs%zE;dD8l^&);K7y
zYM~xiu$>yr)KxRsU309vrkvHJ6IyDolA6_`4>9eD-f7c@VtHpxu;3obia3h2-Ep;t
z7q0Twdswlt_@QlZiSjm<Zk9TfEp-p}P<Im^)I?9wCP*5@1`eqmY<d}!J^4@TKKA53
zP9Qz^SF_W)bnvu36CVU`nSsi@0~DM&{P*PW`O*ZTZC+fYhmT@{@%1d$pU30j=_a^=
z)}FX&5Alu=xROal3T)9Xy!JC{hNd>vqFgvgi$`Kr2-uid3dOq#L!26*hS)t!^#nSL
zA<deEGzHlV4*Q;{*X4FYU_Xs&rmaobCksoOY5gcQ@kO^flp(1QyQwNlhsZ9YBDQ5Z
zQ5hSnKhtN<bu=<A2!kgeLzGBI3)JXKII|pzub5FkbVWgBFL*618AiJg^k<=g;h%7-
ziyTQ%JB?i3X6Xec;`H1=?X5u;7v5aVTJlr>=WS%Xm8c&`LXXB5~>1%6x{5QEbL
zsvoV4QaXX!&fg?VGMHtBKDa3+H)gRlTU4O1`tU2TMqbNd?KYU;P*@wz*qg8hArZSP
zg|*=v*6>Q>eprJ{bzlu_56jKq<AqF4x=;<18&rezi(gHA1HwRVQb3am!Wv*pU@d$N
z<A4+3yaVsV&wzskNWz;V&p;(!cVb^QftxN(Hm3>zzZ;Ln3X8yk0m1>18mI?XAGRmn
zxD5UR%QR)^g)(9RND;6>m*9^uBsv&KqiG8d3B^06ctVhl#qfPl+>l}}9H7Z!00@fj
z=93hNyD3<4s>!aY@Kze&J_JHP`4<(u1nU>jftR}ky`WsCypb$Y2nZKUpAgHrAG4MS
zHNYw%99ilrE(}XHi^V%%tOwq+3Nu*9r<9h3(!4ZXElUOZOj|%CSH)7|8b?Sc=w1}3
z!J@jRNgJ8%Wi__<VD(9=fi4tBn8rkEaB{ftCW@QYjOHi~r?tBYw{xneh$vn*C=SQh
z5M8(r!tYa=8SXp`#WU_qQGAqJnac%HTzI{M;shXr;$Q9juTcD}E);iuhTZ~)h=<n+
z?EDh+7VwofufWrw7B7XeMhtmDB6*be-qxO)0#vJ`uoguDTxq)N%bt7HB~Ec<=VK;6
zXYvsedEpW?+cBXz3qrc73ooi?r%J#vmjF~s1nF2HnU@8E_(XImcFwUW*I{lX08q*U
zM1R8K-(<r5aBL=@GFf3#XYv`7x0&2WQsw)|j*CQ87Ox~a_hHWGto(w>117&<B2Ljm
z<`$WV=RwWlJYsSki81f<8x99=dMIa!74$P}+0Ds5ed63^v+qiWaQcsVHouR|K^;Qe
zH#(#YSB8HB&@WSkVQ7b8XpB;kp{~?XlwXFq2CRX?8PPO-)(~{ZINY5P35YQ$R)&rl
zV_D%_bWI5q@ykPrzX6dn!H^njlOQ1KN1!P9(jsb89#eQBKn0$ZrdB3Fr@+#AQ#ziv
z6`gU(5*rT_z`87FFv4k$ry2}hPvnh^t;lML(-|uM1CNHtV_gO%l+NZqD5D6WvY;Wv
zC=@dv82Gp9e(+a$M+3C%^5>$~1V{FF`7d<YLzmnv?C~E!5Hw$p|A0uE+zxg54@KiY
z5QmI@R%-KQv7-;2@`-i7GhJ$h7F7qoB#a_5-4XF`!!ZFLV^s2>O)x}cl`<#-Tb*D|
zq-mejQKa@uod}$WV@J3K(XN(W3jV*!)(uSjCzLG)AQ<*KR0<dv7E23~#NR^4f`f#i
zgfc@!Q&qaw#-<IJlT9H+85CM$PQa$g+&U8mL=1pPtU!!Z*(2E=K`?<V*;+v`0UFss
zu~=!*n#oUdD49|w+IJX-L0~WXIYL!_ERHNei0qKY*#vYC1HGfrNzR9up`T|$u29E5
z`q90g-+r|!TH`lRAc_!|XJoq0e`Yve!z&5eYqw&Dy%KIk{duoCOQZ?cuFy^LvXTkV
zU`pj&W9I>O#(OJ%Q#&NWkyAav9A!X!83`|n^7BP$#5&1twW-nStC7(@AFvmX$9bO#
zjdSM|61kNy!DxxuJf8)={q$wa3=3f7qjO*61g@A^*Hv07@jWE{)-WPu6L4RK7;)rp
mVGM#ZW|bfaoxh>Ni0Ut#Ee>1#g>t!kdZaM<*Njmf_V?dj3=-%7

literal 0
HcmV?d00001

diff --git a/simplejson/scanner.py b/simplejson/scanner.py
new file mode 100644
index 00000000..adbc6ec9
--- /dev/null
+++ b/simplejson/scanner.py
@@ -0,0 +1,65 @@
+"""JSON token scanner
+"""
+import re
+try:
+    from simplejson._speedups import make_scanner as c_make_scanner
+except ImportError:
+    c_make_scanner = None
+
+__all__ = ['make_scanner']
+
+NUMBER_RE = re.compile(
+    r'(-?(?:0|[1-9]\d*))(\.\d+)?([eE][-+]?\d+)?',
+    (re.VERBOSE | re.MULTILINE | re.DOTALL))
+
+def py_make_scanner(context):  # build the pure-Python scan function from the hooks stored on context
+    parse_object = context.parse_object  # hooks are copied into locals that _scan_once closes over
+    parse_array = context.parse_array
+    parse_string = context.parse_string
+    match_number = NUMBER_RE.match
+    encoding = context.encoding
+    strict = context.strict
+    parse_float = context.parse_float
+    parse_int = context.parse_int
+    parse_constant = context.parse_constant
+    object_hook = context.object_hook
+
+    def _scan_once(string, idx):  # decode the single JSON value that starts at string[idx]
+        try:
+            nextchar = string[idx]
+        except IndexError:
+            raise StopIteration  # idx is past the end of the input
+
+        if nextchar == '"':
+            return parse_string(string, idx + 1, encoding, strict)  # idx + 1 skips the opening quote
+        elif nextchar == '{':
+            return parse_object((string, idx + 1), encoding, strict, _scan_once, object_hook)  # _scan_once is passed in for nested values
+        elif nextchar == '[':
+            return parse_array((string, idx + 1), _scan_once)
+        elif nextchar == 'n' and string[idx:idx + 4] == 'null':
+            return None, idx + 4  # literals return (value, index just past the token)
+        elif nextchar == 't' and string[idx:idx + 4] == 'true':
+            return True, idx + 4
+        elif nextchar == 'f' and string[idx:idx + 5] == 'false':
+            return False, idx + 5
+
+        m = match_number(string, idx)
+        if m is not None:
+            integer, frac, exp = m.groups()
+            if frac or exp:  # a fraction or an exponent makes the number a float
+                res = parse_float(integer + (frac or '') + (exp or ''))
+            else:
+                res = parse_int(integer)
+            return res, m.end()
+        elif nextchar == 'N' and string[idx:idx + 3] == 'NaN':  # constants outside NUMBER_RE go through parse_constant
+            return parse_constant('NaN'), idx + 3
+        elif nextchar == 'I' and string[idx:idx + 8] == 'Infinity':
+            return parse_constant('Infinity'), idx + 8
+        elif nextchar == '-' and string[idx:idx + 9] == '-Infinity':  # reached because NUMBER_RE needs a digit after '-'
+            return parse_constant('-Infinity'), idx + 9
+        else:
+            raise StopIteration  # no JSON value starts at this position
+
+    return _scan_once
+
+make_scanner = c_make_scanner or py_make_scanner
diff --git a/simplejson/scanner.pyc b/simplejson/scanner.pyc
new file mode 100644
index 0000000000000000000000000000000000000000..30d94445f0a0c941ee46b6c4fa3bd255e662f6ef
GIT binary patch
literal 2340
zcmb_dUvC>l5T8B&cj6S1v}wr$X-SKd%5~uhP(>h$k&IGTvRgn&D(iB$PA@s%o$fXz
z5y=AtVOzZO)Mvf`?|cM43}2x9X3kDsMZDG4&dtuw@3*rvb9;aNTPd%;dewAj{43%4
z6-F|IaEW#x6}c82DcVtVx+v2O9a-dOXeUeR``{L3b&d|p6jnX8C{7O5ZHEFAz?
zAg#zNlA9ByB(hAKY@MOa3jk)x&C{>gutGXZ5r}n#b~3zmr&{2M79hUuJZY_%@JI(M
ziDL(Wj?3O_{909oRWl3Gw~uspyx7K^k~N5GZKJyJ#ly4RPimh(-*ea3)~b6C_T2kx
z8`WLic)nY^|9nHH4ioX1!N_1FzeAi6c|@aBQ8X%x#iCJ>OoqHHjk03N(I_WMo<=26
z3N*4rDbh%ZQle2_lroJnG|16F(ZHfXi3VjFWN83no(4pN0u74Po8grIhTRJ^EFc*c
z;%PZ7ix_-l&P?(LET?l!e5UBuxkXYKLsNw@ihfaPVa_aOJ+vrXCN-4f0ET2Qq42{D
zU1X^fye7qd8Sz_%UvW&&em#p)*I|i<dAi5}@J|ZJUJ^@I#>5OL5o+BD{!IPQGzefF
z6A7CA^0ai@Er@-d6dG`B1h^A~DXjQEu+jvEl1#%sOJU`!uo>QM_7a9@5dw^|o5F#m
zm@p#hbC9APk<Su^9w<@w99<CYW#~Lh=Q%n@S#uN>u$HIr9^j}vIAKFOyA@i3eWG3{
zIxkRwH)e>o$Wl5#EAS>B(n%yi{GG-=Cow+6<T6v&IQI9%eiI}G!UQCI0xSvm=M?<@
zRq#B67pB1r6EKzpyp@6%uY#{L_{KE&#srKd0V4-#vmsxd>Js|1g*nk3Pu^1&KZ#*i
zWPmpauP=+>*!RU|WNPALEz=&74Hp(Y+fOta8&f7~dHkB9=1}c)n<nlWm{>G}o)>uL
zR9tHw-){+v+GIg47gH8jSD!TEIE+mN(~b$FrqQu&yfBbpT4A6?dCF07DBnmZd1wc5
zcpN1Xg$~@R?9cYZ#9nY9cF#SLkOF;ToELU1A@vPkZeC#YfsTc|7u!zCa}voj)=8Cb
zBLVBc30-F7Lqv9*=q|v9*V9?g4{c*6TRYQBb{yNM<4Y0|bc5smJ~m}+xPPb}(|r+!
zM`rGl%L#+T*r4ZICZ$guC0}yOcEiBYQ|sw@tMI2}1ET&c(Q#5g@?y{T!<Y4~IE?ng
zllqo^sr@jj_iPl%`BCrJ6R#in`Y;KD`uO^O5S_M}X_?6$L6FL*Is9j=idt3`wTiK<
z?yC98u&%*!9Uk|rS+xl3&B?GNh3$_)(*B6W8iXXV_3ZIxqup&cq@sNrnQ4E>9(P#W
zX0gKJ9*esW>9>Z<hWr>5Q%*a@zrvmZWcT(e3t<!r_Lkk#4LF#0ktuTxMA2z?`uoSG
z<R%2E($&9JTdi`fr31TNH*~sP!{3!yn?*d{6y!lSiL`dn;POS44sqVvNt&qHkMQou
z8`PeELu~s#h|_%aBhS~Of7fVlKIt^11dpF>KW%O|TMg;kttU^v-rjDngP~o6NYe`?
n)!s$2k|Nk1^+WgA*I)9HlN%6uHH!vYlm;tVdFUTlrBD9@kb}!4

literal 0
HcmV?d00001

diff --git a/simplejson/tests/__init__.py b/simplejson/tests/__init__.py
new file mode 100644
index 00000000..17c97963
--- /dev/null
+++ b/simplejson/tests/__init__.py
@@ -0,0 +1,23 @@
+import unittest
+import doctest
+
+def additional_tests():  # build a suite from the package's doctests plus the index.rst document
+    import simplejson
+    import simplejson.encoder
+    import simplejson.decoder
+    suite = unittest.TestSuite()
+    for mod in (simplejson, simplejson.encoder, simplejson.decoder):
+        suite.addTest(doctest.DocTestSuite(mod))  # docstring examples of each module
+    suite.addTest(doctest.DocFileSuite('../../index.rst'))  # DocFileSuite resolves this relative to this module by default
+    return suite
+
+def main():
+    # Collect the doctest suite first, then run it with the plain-text runner.
+    all_tests = additional_tests()
+    unittest.TextTestRunner().run(all_tests)
+
+if __name__ == '__main__':  # run the doctest suite when this file is executed directly
+    import os
+    import sys
+    sys.path.insert(0, os.path.dirname(os.path.dirname(os.path.dirname(os.path.abspath(__file__)))))  # directory that contains the simplejson package
+    main()
diff --git a/simplejson/tests/test_check_circular.py b/simplejson/tests/test_check_circular.py
new file mode 100644
index 00000000..af6463d6
--- /dev/null
+++ b/simplejson/tests/test_check_circular.py
@@ -0,0 +1,30 @@
+from unittest import TestCase
+import simplejson as json
+
+def default_iterable(obj):  # default= hook used by the tests: copy any iterable into a list
+    return [member for member in obj]
+
+class TestCheckCircular(TestCase):  # cycle detection and the default= hook of json.dumps
+    def test_circular_dict(self):
+        dct = {}
+        dct['a'] = dct  # dict that contains itself
+        self.assertRaises(ValueError, json.dumps, dct)
+
+    def test_circular_list(self):
+        lst = []
+        lst.append(lst)  # list that contains itself
+        self.assertRaises(ValueError, json.dumps, lst)
+
+    def test_circular_composite(self):
+        dct2 = {}
+        dct2['a'] = []
+        dct2['a'].append(dct2)  # cycle that passes through a nested list
+        self.assertRaises(ValueError, json.dumps, dct2)
+
+    def test_circular_default(self):
+        json.dumps([set()], default=default_iterable)  # must not raise: the hook turns the set into a list
+        self.assertRaises(TypeError, json.dumps, [set()])  # without a hook the set is expected to be rejected
+
+    def test_circular_off_default(self):
+        json.dumps([set()], default=default_iterable, check_circular=False)  # same checks with cycle detection off
+        self.assertRaises(TypeError, json.dumps, [set()], check_circular=False)
diff --git a/simplejson/tests/test_decode.py b/simplejson/tests/test_decode.py
new file mode 100644
index 00000000..1cd701d4
--- /dev/null
+++ b/simplejson/tests/test_decode.py
@@ -0,0 +1,22 @@
+import decimal
+from unittest import TestCase
+
+import simplejson as json
+
+class TestDecode(TestCase):  # decoder number hooks and whitespace handling
+    def test_decimal(self):
+        rval = json.loads('1.1', parse_float=decimal.Decimal)  # floats are built by the parse_float hook
+        self.assert_(isinstance(rval, decimal.Decimal))
+        self.assertEquals(rval, decimal.Decimal('1.1'))
+
+    def test_float(self):
+        rval = json.loads('1', parse_int=float)  # integers are built by the parse_int hook
+        self.assert_(isinstance(rval, float))
+        self.assertEquals(rval, 1.0)
+
+    def test_decoder_optimizations(self):
+        # Several optimizations were made that skip over calls to
+        # the whitespace regex, so this test is designed to try and
+        # exercise the uncommon cases. The array cases are already covered.
+        rval = json.loads('{   "key"    :    "value"    ,  "k":"v"    }')  # mixes padded and unpadded separators
+        self.assertEquals(rval, {"key":"value", "k":"v"})
diff --git a/simplejson/tests/test_default.py b/simplejson/tests/test_default.py
new file mode 100644
index 00000000..139e42bf
--- /dev/null
+++ b/simplejson/tests/test_default.py
@@ -0,0 +1,9 @@
+from unittest import TestCase
+
+import simplejson as json
+
+class TestDefault(TestCase):
+    def test_default(self):
+        # An object the encoder cannot handle is encoded as whatever default= returns for it.
+        via_hook = json.dumps(type, default=repr)
+        self.assertEquals(via_hook, json.dumps(repr(type)))
diff --git a/simplejson/tests/test_dump.py b/simplejson/tests/test_dump.py
new file mode 100644
index 00000000..4de37cf4
--- /dev/null
+++ b/simplejson/tests/test_dump.py
@@ -0,0 +1,21 @@
+from unittest import TestCase
+from cStringIO import StringIO
+
+import simplejson as json
+
+class TestDump(TestCase):  # json.dump / json.dumps basics and non-string dict keys
+    def test_dump(self):
+        sio = StringIO()
+        json.dump({}, sio)  # the file-object variant writes into sio
+        self.assertEquals(sio.getvalue(), '{}')
+
+    def test_dumps(self):
+        self.assertEquals(json.dumps({}), '{}')
+
+    def test_encode_truefalse(self):
+        self.assertEquals(json.dumps(
+                 {True: False, False: True}, sort_keys=True),
+                 '{"false": true, "true": false}')  # bool keys become the strings "true" / "false"
+        self.assertEquals(json.dumps(
+                {2: 3.0, 4.0: 5L, False: 1, 6L: True, "7": 0}, sort_keys=True),
+                '{"false": 1, "2": 3.0, "4.0": 5, "6": true, "7": 0}')  # numeric keys are emitted as strings as well
diff --git a/simplejson/tests/test_encode_basestring_ascii.py b/simplejson/tests/test_encode_basestring_ascii.py
new file mode 100644
index 00000000..7128495f
--- /dev/null
+++ b/simplejson/tests/test_encode_basestring_ascii.py
@@ -0,0 +1,38 @@
+from unittest import TestCase
+
+import simplejson.encoder
+
+CASES = [
+    (u'/\\"\ucafe\ubabe\uab98\ufcde\ubcda\uef4a\x08\x0c\n\r\t`1~!@#$%^&*()_+-=[]{}|;:\',./<>?', '"/\\\\\\"\\ucafe\\ubabe\\uab98\\ufcde\\ubcda\\uef4a\\b\\f\\n\\r\\t`1~!@#$%^&*()_+-=[]{}|;:\',./<>?"'),
+    (u'\u0123\u4567\u89ab\ucdef\uabcd\uef4a', '"\\u0123\\u4567\\u89ab\\ucdef\\uabcd\\uef4a"'),
+    (u'controls', '"controls"'),
+    (u'\x08\x0c\n\r\t', '"\\b\\f\\n\\r\\t"'),
+    (u'{"object with 1 member":["array with 1 element"]}', '"{\\"object with 1 member\\":[\\"array with 1 element\\"]}"'),
+    (u' s p a c e d ', '" s p a c e d "'),
+    (u'\U0001d120', '"\\ud834\\udd20"'),
+    (u'\u03b1\u03a9', '"\\u03b1\\u03a9"'),
+    ('\xce\xb1\xce\xa9', '"\\u03b1\\u03a9"'),
+    (u'\u03b1\u03a9', '"\\u03b1\\u03a9"'),
+    ('\xce\xb1\xce\xa9', '"\\u03b1\\u03a9"'),
+    (u'\u03b1\u03a9', '"\\u03b1\\u03a9"'),
+    (u'\u03b1\u03a9', '"\\u03b1\\u03a9"'),
+    (u"`1~!@#$%^&*()_+-={':[,]}|;.</>?", '"`1~!@#$%^&*()_+-={\':[,]}|;.</>?"'),
+    (u'\x08\x0c\n\r\t', '"\\b\\f\\n\\r\\t"'),
+    (u'\u0123\u4567\u89ab\ucdef\uabcd\uef4a', '"\\u0123\\u4567\\u89ab\\ucdef\\uabcd\\uef4a"'),
+]
+
+class TestEncodeBaseStringAscii(TestCase):  # runs every CASES pair through the string-escaping implementations
+    def test_py_encode_basestring_ascii(self):
+        self._test_encode_basestring_ascii(simplejson.encoder.py_encode_basestring_ascii)
+
+    def test_c_encode_basestring_ascii(self):
+        if not simplejson.encoder.c_encode_basestring_ascii:  # presumably unset when the C speedups are not built -- confirm in encoder.py
+            return
+        self._test_encode_basestring_ascii(simplejson.encoder.c_encode_basestring_ascii)
+
+    def _test_encode_basestring_ascii(self, encode_basestring_ascii):  # shared body; not collected as a test itself
+        fname = encode_basestring_ascii.__name__  # only used in the failure message
+        for input_string, expect in CASES:
+            result = encode_basestring_ascii(input_string)
+            self.assertEquals(result, expect,
+                '%r != %r for %s(%r)' % (result, expect, fname, input_string))
diff --git a/simplejson/tests/test_fail.py b/simplejson/tests/test_fail.py
new file mode 100644
index 00000000..002eea08
--- /dev/null
+++ b/simplejson/tests/test_fail.py
@@ -0,0 +1,76 @@
+from unittest import TestCase
+
+import simplejson as json
+
+# Fri Dec 30 18:57:26 2005
+JSONDOCS = [  # documents json.loads is expected to reject (TestFail exempts the positions listed in SKIPS)
+    # http://json.org/JSON_checker/test/fail1.json
+    '"A JSON payload should be an object or array, not a string."',
+    # http://json.org/JSON_checker/test/fail2.json
+    '["Unclosed array"',
+    # http://json.org/JSON_checker/test/fail3.json
+    '{unquoted_key: "keys must be quoted"}',
+    # http://json.org/JSON_checker/test/fail4.json
+    '["extra comma",]',
+    # http://json.org/JSON_checker/test/fail5.json
+    '["double extra comma",,]',
+    # http://json.org/JSON_checker/test/fail6.json
+    '[   , "<-- missing value"]',
+    # http://json.org/JSON_checker/test/fail7.json
+    '["Comma after the close"],',
+    # http://json.org/JSON_checker/test/fail8.json
+    '["Extra close"]]',
+    # http://json.org/JSON_checker/test/fail9.json
+    '{"Extra comma": true,}',
+    # http://json.org/JSON_checker/test/fail10.json
+    '{"Extra value after close": true} "misplaced quoted value"',
+    # http://json.org/JSON_checker/test/fail11.json
+    '{"Illegal expression": 1 + 2}',
+    # http://json.org/JSON_checker/test/fail12.json
+    '{"Illegal invocation": alert()}',
+    # http://json.org/JSON_checker/test/fail13.json
+    '{"Numbers cannot have leading zeroes": 013}',
+    # http://json.org/JSON_checker/test/fail14.json
+    '{"Numbers cannot be hex": 0x14}',
+    # http://json.org/JSON_checker/test/fail15.json
+    '["Illegal backslash escape: \\x15"]',
+    # http://json.org/JSON_checker/test/fail16.json
+    '["Illegal backslash escape: \\\'"]',
+    # http://json.org/JSON_checker/test/fail17.json
+    '["Illegal backslash escape: \\017"]',
+    # http://json.org/JSON_checker/test/fail18.json
+    '[[[[[[[[[[[[[[[[[[[["Too deep"]]]]]]]]]]]]]]]]]]]]',
+    # http://json.org/JSON_checker/test/fail19.json
+    '{"Missing colon" null}',
+    # http://json.org/JSON_checker/test/fail20.json
+    '{"Double colon":: null}',
+    # http://json.org/JSON_checker/test/fail21.json
+    '{"Comma instead of colon", null}',
+    # http://json.org/JSON_checker/test/fail22.json
+    '["Colon instead of comma": false]',
+    # http://json.org/JSON_checker/test/fail23.json
+    '["Bad value", truth]',
+    # http://json.org/JSON_checker/test/fail24.json
+    "['single quote']",
+    # http://code.google.com/p/simplejson/issues/detail?id=3
+    u'["A\u001FZ control characters in string"]',
+]
+
+SKIPS = {  # 1-based JSONDOCS positions that json.loads is expected to accept; the value records why
+    1: "why not have a string payload?",
+    18: "spec doesn't specify any nesting limitations",
+}
+
+class TestFail(TestCase):  # every JSONDOCS entry must be rejected, except the positions listed in SKIPS
+    def test_failures(self):
+        for idx, doc in enumerate(JSONDOCS):
+            idx = idx + 1  # 1-based, matching the fail<N>.json names and the SKIPS keys
+            if idx in SKIPS:
+                json.loads(doc)  # deliberately accepted; an exception here fails the test
+                continue
+            try:
+                json.loads(doc)
+            except ValueError:
+                pass  # rejected, as required
+            else:
+                self.fail("Expected failure for fail%d.json: %r" % (idx, doc))
diff --git a/simplejson/tests/test_float.py b/simplejson/tests/test_float.py
new file mode 100644
index 00000000..1a2b98a2
--- /dev/null
+++ b/simplejson/tests/test_float.py
@@ -0,0 +1,15 @@
+import math
+from unittest import TestCase
+
+import simplejson as json
+
+class TestFloat(TestCase):  # numbers must come back unchanged after encoding
+    def test_floats(self):
+        for num in [1617161771.7650001, math.pi, math.pi**100, math.pi**-100, 3.1]:
+            self.assertEquals(float(json.dumps(num)), num)  # the emitted text parses back to the same float
+            self.assertEquals(json.loads(json.dumps(num)), num)
+
+    def test_ints(self):
+        for num in [1, 1L, 1<<32, 1<<64]:  # int, long, 2**32 and 2**64
+            self.assertEquals(json.dumps(num), str(num))  # the text equals str(num), so no L suffix appears
+            self.assertEquals(int(json.dumps(num)), num)
diff --git a/simplejson/tests/test_indent.py b/simplejson/tests/test_indent.py
new file mode 100644
index 00000000..66e19b9e
--- /dev/null
+++ b/simplejson/tests/test_indent.py
@@ -0,0 +1,41 @@
+from unittest import TestCase
+
+import simplejson as json
+import textwrap
+
+class TestIndent(TestCase):  # indented output must match a fixed layout and still round-trip
+    def test_indent(self):
+        h = [['blorpie'], ['whoops'], [], 'd-shtaeou', 'd-nthiouh', 'i-vhbjkhnth',
+             {'nifty': 87}, {'field': 'yes', 'morefield': False} ]
+
+        expect = textwrap.dedent("""\
+        [
+          [
+            "blorpie"
+          ],
+          [
+            "whoops"
+          ],
+          [],
+          "d-shtaeou",
+          "d-nthiouh",
+          "i-vhbjkhnth",
+          {
+            "nifty": 87
+          },
+          {
+            "field": "yes",
+            "morefield": false
+          }
+        ]""")
+
+
+        d1 = json.dumps(h)  # default formatting, no indent
+        d2 = json.dumps(h, indent=2, sort_keys=True, separators=(',', ': '))  # the form compared with expect below
+
+        h1 = json.loads(d1)
+        h2 = json.loads(d2)
+
+        self.assertEquals(h1, h)  # both forms decode back to the input
+        self.assertEquals(h2, h)
+        self.assertEquals(d2, expect)  # exact text comparison, whitespace included
diff --git a/simplejson/tests/test_pass1.py b/simplejson/tests/test_pass1.py
new file mode 100644
index 00000000..c3d6302d
--- /dev/null
+++ b/simplejson/tests/test_pass1.py
@@ -0,0 +1,76 @@
+from unittest import TestCase
+
+import simplejson as json
+
+# from http://json.org/JSON_checker/test/pass1.json
+JSON = r'''
+[
+    "JSON Test Pattern pass1",
+    {"object with 1 member":["array with 1 element"]},
+    {},
+    [],
+    -42,
+    true,
+    false,
+    null,
+    {
+        "integer": 1234567890,
+        "real": -9876.543210,
+        "e": 0.123456789e-12,
+        "E": 1.234567890E+34,
+        "":  23456789012E666,
+        "zero": 0,
+        "one": 1,
+        "space": " ",
+        "quote": "\"",
+        "backslash": "\\",
+        "controls": "\b\f\n\r\t",
+        "slash": "/ & \/",
+        "alpha": "abcdefghijklmnopqrstuvwyz",
+        "ALPHA": "ABCDEFGHIJKLMNOPQRSTUVWYZ",
+        "digit": "0123456789",
+        "special": "`1~!@#$%^&*()_+-={':[,]}|;.</>?",
+        "hex": "\u0123\u4567\u89AB\uCDEF\uabcd\uef4A",
+        "true": true,
+        "false": false,
+        "null": null,
+        "array":[  ],
+        "object":{  },
+        "address": "50 St. James Street",
+        "url": "http://www.JSON.org/",
+        "comment": "// /* <!-- --",
+        "# -- --> */": " ",
+        " s p a c e d " :[1,2 , 3
+
+,
+
+4 , 5        ,          6           ,7        ],
+        "compact": [1,2,3,4,5,6,7],
+        "jsontext": "{\"object with 1 member\":[\"array with 1 element\"]}",
+        "quotes": "&#34; \u0022 %22 0x22 034 &#x22;",
+        "\/\\\"\uCAFE\uBABE\uAB98\uFCDE\ubcda\uef4A\b\f\n\r\t`1~!@#$%^&*()_+-=[]{}|;:',./<>?"
+: "A key can be any string"
+    },
+    0.5 ,98.6
+,
+99.44
+,
+
+1066
+
+
+,"rosebud"]
+'''
+
+class TestPass1(TestCase):  # round-trips the pass1.json fixture held in JSON
+    def test_parse(self):
+        # test in/out equivalence and parsing
+        res = json.loads(JSON)
+        out = json.dumps(res)
+        self.assertEquals(res, json.loads(out))
+        try:
+            json.dumps(res, allow_nan=False)  # the fixture's 23456789012E666 value must be refused here
+        except ValueError:
+            pass
+        else:
+            self.fail("23456789012E666 should be out of range")
diff --git a/simplejson/tests/test_pass2.py b/simplejson/tests/test_pass2.py
new file mode 100644
index 00000000..de4ee00b
--- /dev/null
+++ b/simplejson/tests/test_pass2.py
@@ -0,0 +1,14 @@
+from unittest import TestCase
+import simplejson as json
+
+# from http://json.org/JSON_checker/test/pass2.json
+JSON = r'''
+[[[[[[[[[[[[[[[[[[["Not too deep"]]]]]]]]]]]]]]]]]]]
+'''
+
+class TestPass2(TestCase):
+    def test_parse(self):
+        # Decode the fixture, re-encode it, and check that a second decode gives the same value.
+        decoded = json.loads(JSON)
+        encoded = json.dumps(decoded)
+        self.assertEquals(decoded, json.loads(encoded))
diff --git a/simplejson/tests/test_pass3.py b/simplejson/tests/test_pass3.py
new file mode 100644
index 00000000..f591aba9
--- /dev/null
+++ b/simplejson/tests/test_pass3.py
@@ -0,0 +1,20 @@
+from unittest import TestCase
+
+import simplejson as json
+
+# from http://json.org/JSON_checker/test/pass3.json
+JSON = r'''
+{
+    "JSON Test Pattern pass3": {
+        "The outermost value": "must be an object or array.",
+        "In this test": "It is an object."
+    }
+}
+'''
+
+class TestPass3(TestCase):
+    def test_parse(self):
+        # Parsing must succeed, and dumping then loading again must reproduce the parsed value.
+        parsed = json.loads(JSON)
+        dumped = json.dumps(parsed)
+        self.assertEquals(parsed, json.loads(dumped))
diff --git a/simplejson/tests/test_recursion.py b/simplejson/tests/test_recursion.py
new file mode 100644
index 00000000..97422a66
--- /dev/null
+++ b/simplejson/tests/test_recursion.py
@@ -0,0 +1,67 @@
+from unittest import TestCase
+
+import simplejson as json
+
+class JSONTestObject:  # marker type; the tests below encode the class object itself
+    pass
+
+
+class RecursiveJSONEncoder(json.JSONEncoder):  # encoder whose default() can be made to loop
+    recurse = False  # True: default() hands back a list holding the same object again
+    def default(self, o):  # called by the encoder for objects it cannot serialize itself
+        if o is JSONTestObject:
+            if self.recurse:
+                return [JSONTestObject]  # encoding this list re-enters default()
+            else:
+                return 'JSONTestObject'
+        return json.JSONEncoder.default(self, o)  # call through the class: self must be passed
+
+
+class TestRecursion(TestCase):  # cyclic input must raise ValueError; shared input must not
+    def test_listrecursion(self):
+        x = []
+        x.append(x)  # list that contains itself
+        try:
+            json.dumps(x)
+        except ValueError:
+            pass
+        else:
+            self.fail("didn't raise ValueError on list recursion")
+        x = []
+        y = [x]
+        x.append(y)  # two-step cycle: x -> y -> x
+        try:
+            json.dumps(x)
+        except ValueError:
+            pass
+        else:
+            self.fail("didn't raise ValueError on alternating list recursion")
+        y = []
+        x = [y, y]
+        # same object twice is sharing, not a cycle: this must encode without raising
+        json.dumps(x)
+
+    def test_dictrecursion(self):
+        x = {}
+        x["test"] = x  # dict that contains itself
+        try:
+            json.dumps(x)
+        except ValueError:
+            pass
+        else:
+            self.fail("didn't raise ValueError on dict recursion")
+        x = {}
+        y = {"a": x, "b": x}
+        # same object under two keys is sharing, not a cycle: dump the container, not x
+        json.dumps(y)
+
+    def test_defaultrecursion(self):
+        enc = RecursiveJSONEncoder()
+        self.assertEquals(enc.encode(JSONTestObject), '"JSONTestObject"')
+        enc.recurse = True  # default() now keeps returning the object it was given
+        try:
+            enc.encode(JSONTestObject)
+        except ValueError:
+            pass
+        else:
+            self.fail("didn't raise ValueError on default recursion")
diff --git a/simplejson/tests/test_scanstring.py b/simplejson/tests/test_scanstring.py
new file mode 100644
index 00000000..b08dec71
--- /dev/null
+++ b/simplejson/tests/test_scanstring.py
@@ -0,0 +1,111 @@
+import sys
+import decimal
+from unittest import TestCase
+
+import simplejson as json
+import simplejson.decoder
+
+class TestScanString(TestCase):  # runs one shared assertion table against each scanstring
+    def test_py_scanstring(self):  # pure-Python implementation
+        self._test_scanstring(simplejson.decoder.py_scanstring)
+
+    def test_c_scanstring(self):  # C implementation, when the decoder module exposes one
+        if not simplejson.decoder.c_scanstring:
+            return  # no C scanner present: nothing to check
+        self._test_scanstring(simplejson.decoder.c_scanstring)
+
+    def _test_scanstring(self, scanstring):  # expected value: (text, index after closing quote)
+        self.assertEquals(
+            scanstring('"z\\ud834\\udd20x"', 1, None, True),
+            (u'z\U0001d120x', 16))
+
+        if sys.maxunicode == 65535:  # here the non-BMP character counts as two, so the end index is 6
+            self.assertEquals(
+                scanstring(u'"z\U0001d120x"', 1, None, True),
+                (u'z\U0001d120x', 6))
+        else:
+            self.assertEquals(
+                scanstring(u'"z\U0001d120x"', 1, None, True),
+                (u'z\U0001d120x', 5))
+
+        self.assertEquals(
+            scanstring('"\\u007b"', 1, None, True),
+            (u'{', 8))
+
+        self.assertEquals(
+            scanstring('"A JSON payload should be an object or array, not a string."', 1, None, True),
+            (u'A JSON payload should be an object or array, not a string.', 60))
+
+        self.assertEquals(
+            scanstring('["Unclosed array"', 2, None, True),
+            (u'Unclosed array', 17))
+
+        self.assertEquals(
+            scanstring('["extra comma",]', 2, None, True),
+            (u'extra comma', 14))
+
+        self.assertEquals(
+            scanstring('["double extra comma",,]', 2, None, True),
+            (u'double extra comma', 21))
+
+        self.assertEquals(
+            scanstring('["Comma after the close"],', 2, None, True),
+            (u'Comma after the close', 24))
+
+        self.assertEquals(
+            scanstring('["Extra close"]]', 2, None, True),
+            (u'Extra close', 14))
+
+        self.assertEquals(
+            scanstring('{"Extra comma": true,}', 2, None, True),
+            (u'Extra comma', 14))
+
+        self.assertEquals(
+            scanstring('{"Extra value after close": true} "misplaced quoted value"', 2, None, True),
+            (u'Extra value after close', 26))
+
+        self.assertEquals(
+            scanstring('{"Illegal expression": 1 + 2}', 2, None, True),
+            (u'Illegal expression', 21))
+
+        self.assertEquals(
+            scanstring('{"Illegal invocation": alert()}', 2, None, True),
+            (u'Illegal invocation', 21))
+
+        self.assertEquals(
+            scanstring('{"Numbers cannot have leading zeroes": 013}', 2, None, True),
+            (u'Numbers cannot have leading zeroes', 37))
+
+        self.assertEquals(
+            scanstring('{"Numbers cannot be hex": 0x14}', 2, None, True),
+            (u'Numbers cannot be hex', 24))
+
+        self.assertEquals(
+            scanstring('[[[[[[[[[[[[[[[[[[[["Too deep"]]]]]]]]]]]]]]]]]]]]', 21, None, True),
+            (u'Too deep', 30))
+
+        self.assertEquals(
+            scanstring('{"Missing colon" null}', 2, None, True),
+            (u'Missing colon', 16))
+
+        self.assertEquals(
+            scanstring('{"Double colon":: null}', 2, None, True),
+            (u'Double colon', 15))
+
+        self.assertEquals(
+            scanstring('{"Comma instead of colon", null}', 2, None, True),
+            (u'Comma instead of colon', 25))
+
+        self.assertEquals(
+            scanstring('["Colon instead of comma": false]', 2, None, True),
+            (u'Colon instead of comma', 25))
+
+        self.assertEquals(
+            scanstring('["Bad value", truth]', 2, None, True),
+            (u'Bad value', 12))
+
+    def test_issue3623(self):  # bad input must raise the stated exception types
+        self.assertRaises(ValueError, json.decoder.scanstring, "xxx", 1,
+                          "xxx")
+        self.assertRaises(UnicodeDecodeError,
+                          json.encoder.encode_basestring_ascii, "xx\xff")
diff --git a/simplejson/tests/test_separators.py b/simplejson/tests/test_separators.py
new file mode 100644
index 00000000..8fa0dac6
--- /dev/null
+++ b/simplejson/tests/test_separators.py
@@ -0,0 +1,42 @@
+import textwrap
+from unittest import TestCase
+
+import simplejson as json
+
+
+class TestSeparators(TestCase):  # custom item/key separators combined with indent
+    def test_separators(self):
+        h = [['blorpie'], ['whoops'], [], 'd-shtaeou', 'd-nthiouh', 'i-vhbjkhnth',
+             {'nifty': 87}, {'field': 'yes', 'morefield': False} ]
+
+        expect = textwrap.dedent("""\
+        [
+          [
+            "blorpie"
+          ] ,
+          [
+            "whoops"
+          ] ,
+          [] ,
+          "d-shtaeou" ,
+          "d-nthiouh" ,
+          "i-vhbjkhnth" ,
+          {
+            "nifty" : 87
+          } ,
+          {
+            "field" : "yes" ,
+            "morefield" : false
+          }
+        ]""")
+
+
+        d1 = json.dumps(h)  # default formatting
+        d2 = json.dumps(h, indent=2, sort_keys=True, separators=(' ,', ' : '))
+
+        h1 = json.loads(d1)
+        h2 = json.loads(d2)
+
+        self.assertEquals(h1, h)  # both encodings decode back to the input
+        self.assertEquals(h2, h)
+        self.assertEquals(d2, expect)  # exact text check, whitespace included
diff --git a/simplejson/tests/test_unicode.py b/simplejson/tests/test_unicode.py
new file mode 100644
index 00000000..6f4384a5
--- /dev/null
+++ b/simplejson/tests/test_unicode.py
@@ -0,0 +1,64 @@
+from unittest import TestCase
+
+import simplejson as json
+
+class TestUnicode(TestCase):  # unicode vs. UTF-8 byte-string handling in dumps/loads
+    def test_encoding1(self):  # encoder object: unicode and its UTF-8 bytes encode alike
+        encoder = json.JSONEncoder(encoding='utf-8')
+        u = u'\N{GREEK SMALL LETTER ALPHA}\N{GREEK CAPITAL LETTER OMEGA}'
+        s = u.encode('utf-8')
+        ju = encoder.encode(u)
+        js = encoder.encode(s)
+        self.assertEquals(ju, js)
+
+    def test_encoding2(self):  # same check through the module-level dumps()
+        u = u'\N{GREEK SMALL LETTER ALPHA}\N{GREEK CAPITAL LETTER OMEGA}'
+        s = u.encode('utf-8')
+        ju = json.dumps(u, encoding='utf-8')
+        js = json.dumps(s, encoding='utf-8')
+        self.assertEquals(ju, js)
+
+    def test_encoding3(self):  # default output escapes non-ASCII as \uXXXX
+        u = u'\N{GREEK SMALL LETTER ALPHA}\N{GREEK CAPITAL LETTER OMEGA}'
+        j = json.dumps(u)
+        self.assertEquals(j, '"\\u03b1\\u03a9"')
+
+    def test_encoding4(self):  # same escaping inside a list
+        u = u'\N{GREEK SMALL LETTER ALPHA}\N{GREEK CAPITAL LETTER OMEGA}'
+        j = json.dumps([u])
+        self.assertEquals(j, '["\\u03b1\\u03a9"]')
+
+    def test_encoding5(self):  # ensure_ascii=False keeps the characters unescaped
+        u = u'\N{GREEK SMALL LETTER ALPHA}\N{GREEK CAPITAL LETTER OMEGA}'
+        j = json.dumps(u, ensure_ascii=False)
+        self.assertEquals(j, u'"%s"' % (u,))
+
+    def test_encoding6(self):  # same, inside a list
+        u = u'\N{GREEK SMALL LETTER ALPHA}\N{GREEK CAPITAL LETTER OMEGA}'
+        j = json.dumps([u], ensure_ascii=False)
+        self.assertEquals(j, u'["%s"]' % (u,))
+
+    def test_big_unicode_encode(self):  # non-BMP character is written as a surrogate pair
+        u = u'\U0001d120'
+        self.assertEquals(json.dumps(u), '"\\ud834\\udd20"')
+        self.assertEquals(json.dumps(u, ensure_ascii=False), u'"\U0001d120"')
+
+    def test_big_unicode_decode(self):  # literal character and escaped pair decode alike
+        u = u'z\U0001d120x'
+        self.assertEquals(json.loads('"' + u + '"'), u)
+        self.assertEquals(json.loads('"z\\ud834\\udd20x"'), u)
+
+    def test_unicode_decode(self):  # every \uXXXX escape in the range decodes to unichr(i)
+        for i in range(0, 0xd7ff):  # NOTE(review): stops at 0xd7fe, U+D7FF is not exercised
+            u = unichr(i)
+            s = '"\\u%04x"' % (i,)
+            self.assertEquals(json.loads(s), u)
+
+    def test_default_encoding(self):  # byte-string input without an encoding argument is read as UTF-8
+        self.assertEquals(json.loads(u'{"a": "\xe9"}'.encode('utf-8')),
+            {'a': u'\xe9'})
+
+    def test_unicode_preservation(self):  # unicode input yields unicode strings, even when ASCII-only
+        self.assertEquals(type(json.loads(u'""')), unicode)
+        self.assertEquals(type(json.loads(u'"a"')), unicode)
+        self.assertEquals(type(json.loads(u'["a"]')[0]), unicode)
\ No newline at end of file
diff --git a/simplejson/tool.py b/simplejson/tool.py
new file mode 100644
index 00000000..90443317
--- /dev/null
+++ b/simplejson/tool.py
@@ -0,0 +1,37 @@
+r"""Command-line tool to validate and pretty-print JSON
+
+Usage::
+
+    $ echo '{"json":"obj"}' | python -m simplejson.tool
+    {
+        "json": "obj"
+    }
+    $ echo '{ 1.2:3.4}' | python -m simplejson.tool
+    Expecting property name: line 1 column 2 (char 2)
+
+"""
+import sys
+import simplejson
+
+def main():  # load JSON from stdin or argv[1], write it indented to stdout or argv[2]
+    if len(sys.argv) == 1:
+        infile = sys.stdin
+        outfile = sys.stdout
+    elif len(sys.argv) == 2:
+        infile = open(sys.argv[1], 'rb')
+        outfile = sys.stdout
+    elif len(sys.argv) == 3:
+        infile = open(sys.argv[1], 'rb')
+        outfile = open(sys.argv[2], 'wb')  # NOTE(review): opened files are never closed explicitly
+    else:
+        raise SystemExit(sys.argv[0] + " [infile [outfile]]")  # usage line becomes the exit message
+    try:
+        obj = simplejson.load(infile)
+    except ValueError, e:
+        raise SystemExit(e)  # exit with the parse error as the message instead of a traceback
+    simplejson.dump(obj, outfile, sort_keys=True, indent=4)
+    outfile.write('\n')  # dump() output is followed by an explicit trailing newline
+
+
+if __name__ == '__main__':
+    main()
diff --git a/static/ajax-loader.gif b/static/ajax-loader.gif
new file mode 100644
index 0000000000000000000000000000000000000000..f16ebf7cbd4f28620c0daba2f4a36ae0196b3d4c
GIT binary patch
literal 10819
zcmb`NXHZjX->;L91QJksO9Fy4X^NnNiVC_BuprxlbVKhX^w84?z4u<FS4FB|0BI2r
z>7CGf5evn_!Tr3?d(NECJ2Pu0AJ)uTvu54bx_-a^t*&`j>8i;TfD`Z)060EAmb_Eg
z)wf#RL@#+W)ka%x?pW*}*_fIC+&j2FF}pLjxVO0SWp(}A+xH6{y(=4A-?w-72Szu)
zd^`O1{b+b%YyaTK$DxhUsqNjpgDLv%hfiy@)VYJh9~E^o`Bf9b$IM!4PoLaT)mD=~
zFUJ4`006?j5qF#|Ok6F@g*<Frt%Xc%O>p)Y6Z7*nj+PjJ@F5rmKRHY0<N*A+NdV+n
zNGQVGCd0b8+<v1OEA!FSVHQ`u<Fj*2&BAJcnV{r6=WhFJnf-;X_saAu#!B6<u~ma1
zq_*92B*wHVuc_&}+0L&izcj{nkoCA7>xC_AA8$W@FCrO7u?zADA-VZ`x<p1J2}EcZ
zJ|a0PAl4Oa2{D#7GUwptgTr&mLC8GBYo<3$NOP>?tC|{EeZ$+PS}L}+>0Lu3YulS{
zT4!^6L+^W9RZs87mhra9j_Iz!%2vK2CI%TW6b5HzImN~dVJ!O2!OQxY?dQ)g-}ZOc
zHbx@}1$YJ+?K<v)uqp|_zU|%BpV3C-hG@O#>z}{t&;P~OkgsY^BS?Vr*pM7Zz+VGy
zGfn8J#m3_yoX+b#a<TCrb(B1oHxD@r`?FU<W|XfHRzJQ}Pd_3{JuU9ddKP=Ly<xEU
zQ=xu=^YB`{?ej!wCX_BfbwySm`$RA4{%9-F9c$HHc75N`xQYAVdwZ(Kg%|JqPmQV>
zDpjI8oCMB@qx33`Xw_VU0cm=BragGsS+$bevLq%hnO&KCcBH=3mDfvuPp-Rdj{6&R
zHa8Kz$xJs|?B}2IQQUsp?)jr!!0=#iu`;qPU^}gDYqibg#q;S@SNLF|EZL!#x_2<U
z1j!tYLT^re+v?4Xtnl;mYTlg=t-X+0_xtCsCHEIbE4V-qjtkonGHF?P5s(66ai?ct
z*tNR!16WNpvcbKYNy34>db)8GULs#w(5+~toZv=1YdVas3W&uFU4AzBgx@vEBz#;l
z-pu9tZ)?LyrFGoG)7w(&W-(&|Hk`4;RUNspd=I*5q2ess%;1CmgIS<4v~VcVWaPQH
zANrnVeu}B%aK0|an0w{9^-)|O9DS)D9?uwbcai9O^ScC@pw(ezOGyY?wF-n!Sm#Ke
zZy3)y(6~018z!}0`0yn?_&rY+<>YT(f~^#{5m)wlacRx^dP!x6)JAFbi0ww11o>n&
z{9EsPXXod0%vV-{ohI1IX%fgQW4U^o;-lR1D2o$i=iuqZ>VxzPB9Jhr87P6lwqYLL
zzAmxh0lsOW7;-|8F98?s9psNE+IvPo(qi06Ws!-wc9~e{KMO$+^=Bn?AdpZ9E6B?F
z1A=K_u-m%NuW@h!26eF-W1SeBa_##tKQP?qva-5}9POT49d`BGnqS=b_~meVq;S`!
zgb_=kIvvv?GI&6n9GF3ujY-D@NP@D-pFf91Cy^u1oI&?!IJb}(xK)nDnXbl&f}s>;
z;#;8si@QnEH<n9nIF~!)gv54TZC)*WOqbQ1XE}<td>k&J3gSNcYVjbRBW<Eu>RIc(
zvKzVb5N~!MFj(-4jL_9=*-X>+JQKFctTLloj<B`(gsg2ci^t*WW%2Os*+zaa>)kA>
z9G&XPD<bDp=P=*pjr>ujY_f!g_$c1eN~62X^~Q5s<^MdWux&z|6ZtNq_x%Nv)pIs%
z<@aqc7|CWG#B)lO2<M5Bz}Tf7V4J(*rC&s;9PG~X<w$3u2}fU6;5YAOW>7spFDxV{
zdYr!DyZ`O|<bBM>uSUbIfsI>M$}+#ezuJX`W_;eY)V^^4y_63+2J*_W0U<oPIw?>%
zepJ^$z`V=Il-pRMH-O)ERX<>)`;978*j-52{u7^zX^6D`^EA)}O5Ge(0N%+LbVWZ3
z7{O(%Xc&Ih8OP#|MC*!1{kR+_8YV)k6N#2`rwV(Ym*O{JWIvY#0x~KwnK+*jILrpH
zgsEGa3u@KiQ+VRWO+tOg#nRJmpN$nKR4-XirTUoGoH4@A*S|=2kmW7Na^0?<&XIR7
zOh~8kdrd<lW+Vxo1&4|F#B+E_OJ^3UdJ;%lGSRf?HqkQ89pSDm6}n$kJnv0{T+M=%
zAei)VmF`g}HyOm2ze9vyd8He7o|U$<iP@U4EAPMhWAoUm;~v_M^7=fb7~FOGN6}v<
zH&;cfJAE{k!t<|Q1%};}*PM&nnNXUyLTISGq`=UXrNQ6M>pif%1ohd7+!_eVX}T-u
z5(Z#qmf?p!n&=XXnBierie$(vu4-qu#{&x`ScFc29Zax*vO;;4wG^3Ly>pi2dQBUe
zbn0P&ztrG*zPEG!kCk45uPjJ2c}{EBa&mFKYwyEbh)Y9wN5z&wFSW8F5PKN_dY3b9
z;`7C$R?X?Lu(C_}IaUiLI}_}`M=#WHpaA=gENGdp>e$%g{UTdV>#4Ev@4p1+=Eh|Y
zro1mdCCr%)mL1?cSM=v5Lq9Hsj%wJ?9j;^ro<BmY<~{kO#$H%Zezaa%yM44#*?IoQ
zX7#AwZKi(@7lDj6IHoJsU-1iAzKJbW;fF73PvL5nqgB3eqU>=bC<80f*9MQpkSM;v
zL4@!y?`T^T#xa7`-zO=YObN=sCp&rsK!P*uQ*+WYZ3q>q-g%jJaSkZK)98~=ryUBy
z2k%0_Pmlq!a)q!m4GqDWdi$e#2Zx7ykyeufGs7^bb-%U6(h%L%cXMWRWg-Z<_=RaD
z#O82mXO+I86OmbWX%C*m%p0DiNZOz0kJ1LV0C>PqrE_SsDg%>{>IpYgh~2Rqg2z5A
zl6$I}Fc>=JX*Y)`iIH17<*mx=<%c2iX8DHQdzM=1%E1)FU8;FN(#6;jGWN^Mz6`Zg
z&<)Aqf{`qahF9kBr`Ecq!X-Ie#WAW3V6YsIbQW-t+~{$LdQAb4@DSW*OFC&20rFy&
z2lu6B?cSk=GAiD6KiHjZ_Y_mQlBneTpfipWpo2P4u;}B|Sh(zvl(O1bEWwtawu#vs
zDoxa*pm3GTgXO|jcs36RP#Groh?);nb#dXA(O`Z1h~(A`%ekL<(?k`t@zKbxR*vAa
ze{vyYUvs+mw~hW<#_t);DWKTB-sc_>zRKTrezuR!80~y^%k=lqqYE7S#8-7r8!^k*
zu@c*hu!cZ3ZM2|$xRF&72sAaU>RIVf`2g2N9%~6ACNs@m=ChA#32CY?oRJsOQZWma
zc%1tn;!=!N3wm^FY!rGnMkz1+0<F$0_=XNoZiLKj{*237I>{;Ffh|Fz;WC!gr9iD1
zMbiLDHYx$kZmpCK5pN38^<Hk5%(ix&u_*AOy-hfi#(|eug|c+jrdaOk1+I`@341N&
zP_}JmEv7WB9!GA-M!oQK&!`K_jD|{CV?9Cej7Yes_A1FbM+MKoQr$gGtp3C~9diBd
zK{oWF9$-0y#r0rH{s02oG^Z(d3YLrLvz5AylHKhXG0+X0V-xX<p&PGnnMxCCIvvF`
zD(Y?rZQkLwwsSNokTocO9joTer&i}Yx()-gNlC{w=;f*;h&oE1mj^IQibH9xo}%$M
zS<eUZ#*g{Ub7A)n#X>Ko=!}~{zBHD+P|(rL2v)lL1JiZcvF1V8IYn<d2i=@B`iDJ^
zDS7+-6gj|UHc@LJlo8!v;7I|=e!ZD8aOl!s;0xD%d0+jiL@o#TR}R#lUn>36ul$2*
zPXmQA!6NM!`ns)A&3bQWMdGq~84qeH)gynuzVDvLTL$P*=d`W^bhACum14kqbeDh~
zp_|ifzbq4R#1?r$S+!ur`v(`>1h<z<VaoQn;mG^ESJfK3@Hgq6F_VY}A`&<AQZp5!
z*f1TD*{l>n)7e!bfAk@|=b<uQ___O@7o+?~M1Jn|DDM3H(yxBu*Vm!vm|x%iRS^la
zlH271r@9_>Iq{*e2U%I=tP_;ClNTT5apGYplxKjaubZEPcYqHo($AKNbHXsNM!Sbn
zpuPlK5683&f*%7Glan49m06IMkdz#S^YTh8!&k>)Q5LLLGDaR42)y$IEGJ~K4n6_P
zAQODB*FVbU)6jIUwO{nq^e7bh(SKoaEM{_GXoP8VZhQJOY<a>Ky0duT_T$K{jZrJ6
zfw0{Fa!$S6Q1uq;)Ke8XJcRIsl`4m)RxJ=gjG{p(&pB06gdp>A&;ucY1u;hA@7ub&
z=)8wX@>Vws`(G7+)8uU?3}IYiq!ez$5SjI=<^Du*7r}U{i|A0&xq$EHhYH0#xytqD
zzomRr?TY89xoC~Y<JC?>I5bFd*^bjJG7If(LTG|fBTfvJ%7Y=zzH|H1k()r@ou!h>
z^c2FBs_5;*M>-Ul@f1okzm#+hBjTc!zu%o>fp8Xr<zPtsvmcv$yVjT@;W{H#p=>gZ
zb5XdTUO|K~2l0yP-o+uH3!TxU&-#3XzQP71v?a<DZC%%RYGS?pln<TfdpQk1miypb
zPR+c2^oZV!JY01zQmoBy_L*Kd+TzXh9Dc|!>&Cg6fBP7-@|Vyo7}s6H2Sq;U2fEjE
zkDvm0ep{%LSKY)_pu9H|@MIe5iAgYjPT~W35#u0~vye{i^DsWa#1<&+X<|=^;C5lQ
zvC7R3vpc9)xY6LLX${jrkI!8K%G_r?vWb#kb?{IwdLZh)@Jt)k!<`T;XvQ36!|x(V
zi?#Ip6kOet_Q75*--oAbZC)NW6`Yh@Sd?4<hV1Px`**GBol3!)p0kR4#h<?n_BtAq
zNDk&$&&mERb}+)g?kZ`-$dWcTeo5Ia%QkpUwt&}3rpR`#_@z!_j>ao}73o;S*{qpj
zdE1rZ@Zr1()!az|g|P~%@v5CXO^{^wIxodG^0?|%->BW?r@++ABGReRtzteY-tnA{
zqd+k@7@MV1m^)G@97TuKCtcQDW)hApI2*O&|3fM@EF2k?v=R7oyFjHyjE2ZICx8BC
z?*5$vD%<A1cFw~5)=e8xXvGn8UYNjB)T2(B0c!^<ju&0?4H7JJ>_%g2AuT}riLuc<
z#TDg;X0vJ@E_Km@`d`2|0+puvSj8QxKo3Mhz5?&)bGr2ku-sVsc$fL%W%-zkrwSl<
zHeNm$8jpY2H@p-tP+oyKvQkx(#ybswbIwySsZ2k~MU_I6Ni5HdOqI@bAp~`ma%jS*
ztH6w0g7yo-tx|--@k4~tnBoOv<AqOJJXh8I#t7w`mvcq*9q3o2b~%?nt!>qrN16SW
zg<g34T6NtYMu#w~+YA3gmY<)yo}XCD|3{WFEB}AhTCAv&-tg3FuRF_1GrK^qba5oh
zX=T6NG11?6cMlIwXIq#bi~&OmqXhbeV!fa~uKpGzay+ZQT?i_L?2HeJj!p4-8JryM
z5ov>W4D&i&oMCH@wLn4s<b8KmRwyeR(S`Vc?1+M$u;m0TgT21_exF9BVSV{Q9n&LY
zQDcjv(5kBbfuR|?-PG>L>_qU_#o5H|HKzTHwb0SPzB<=lHsSRr_%;GihDqkEyKoD`
zNyxD^)TZOfkwRjILv>ZLWU$1oV|{xSc@Yvw_(_QQ_@3CkI0;TezVVX)6oq#;Ew$m0
z=wiI2DSrUtSfM4bC4hdtR<P+#Rq>R%JpNSTapC<NIbTJxlc6AX?`Ne#=oWG<R^n%o
z;;B26b=bePN-RIh8rQ>qPq(L<I9_gsLl@HR9umyjvCNF_VQ4+mccEgg3#kAX^QJYS
zmEld@Hsep6@cSxvWyhD^6%UT90f1X@(8g1p13O>~#UJK=Y{Zsyo(kuYdH+TQb>O(<
zlqymlin{i7`BlJ$PUA-{ov{8{`3uIqUq8R&tlRl^Uihl<nk%WzEi*$|d1oS*H`DU)
z2Y6D7&XZ=eYEcQa2p7{qAA{lqzK=O$_*chF%3<1c!b{0qA$vxh4g~1LPzcU*nn84V
zM3BZ=SB?}b;~@SXUXwtdVX?D;m&-jwO!!7t$Dsah+I++j>R5|EJ3kg^z+A^@#CYa!
zQj!Ntzarvlw}!R_4x<+Q!1HOj#=QEugnA$Yn--geg{2oX17fHD`T@uwL=hO5vemwv
zJg>L%GEK5UEeB^VZYHSm&{;AO{9#w|p_Nwa8%ufn0T?e{l0KsD{m8u^$PoMRFuGvg
z6TWU7NL!IC%8XH$4Ek7h#N%{^M-Nyur|B`4J52DfD&f4QR9u=b&sS>JR<6HkIi!Kz
zi2hR4$qW71Y*l)k+c|f%QPjA1?@azVYkdItQJ>N@S!yDA0?M~)vk=tW7X*wJ+SWaP
zFHTE(KDs-)c(nXhvs!U|P<_IALv`qAO7q3$wW8oMO_*o|du}T5T|YvpA{SWFxZTmY
z?Jdd7pn=ANeD{7x5FPYjGnwIU(x!T_g81S%{qLIA8R*Bsg3v1$(!^3Qt&p!?N<W4%
z&gv^cgqN7xj9(LXmD8<<cu=wy0mON3tLXH#pL@2KPe06ru$2KQV73P;gxKol3HyqA
zak&e_2TcyL(DRSg31jaGVPAk;yUfq&>{gm}IRq=E{aKwWGg%&?lZQ5u8=5M0ZLcR}
zml9LnJ$$VI$(s4)xf(X<TR7_k1B6Xz*bDy&IgUTJ>i(pkxBJ^acK&NECv1`US2+@K
z!jbFm1H!$Ugs;zF`-Gab#;#&WcaE2pH}SUSP_j411qlldfsuT?ph3a0;kYPrG^<-!
zLVyoLN@{$P&*?08+pvf{EB~-!R7O$^-aUfi?Gj?Ij{6TvTu7|te^AoX!-VXP3x?2`
zMn?OyLt)*cGvh_E(=#Leb45doOP@k*yW#8ojc!A`i&NQ!$hFVV)IruEVXA~|s)~#K
zW|#=0))OED2eeX%PM9Du;|2fYD2#s`MN-vFJ<?zFSX9WfWl@ufMKH|p>YgeoQSM1`
z-njF^horN>V0+ImOX?}2_jzu>o{HU1d|<JimrND!%hgoV|0U_R(qH!X9r1}nJoPU$
z-^D`iN;Gk@mUFYPjmon<8UOw5@EfEef!c&s=z3F-C5NtaX6G`_r&k)Zz~~oAqjj>g
z@gsXTU!(Y5E4HPv-`7phyJOMpBzEqK!^h9ymf{MNLhbC$zx>ZKhm!3~hyhk0k1s}S
zdg)~NTVGDrh^g{`rI4mx_sJi!U+o&iL^CVXD&MSOyl-77Z<%x&8f7-PerpP2JlH7v
zbpJ+_vn!-^>vm?^^d=kx71ajXz_P@Xyh3Ef0mm<RP#VcM`0Q1Ttm3M4lE^+5l`W>d
ze3o=dp2bKK#@)s`Qi16&r8%&GD^>`!)PkD}i6r12dWu}LI_n<l5T!~%n(hlw9Nn~Y
zEpJ%TGvNSZIUzrmsID9XT(GW|^-!>@2;uKNu^1b9`B*AwFL-4nvG<aKcsNg1^0JE2
zk$6VJNLC%eqKQ9Q-}T%pvDuJ}maY`=-#Usb))(Oo;uwbxp4=pd-j&J3n0DRK7)ijn
zVaP<)m}w{rS0dVd$ag}uP}taIs^Ez}UMlI;GitG$UvEHK-V}GixToj3W|~*%oP=s<
z1`(lGIi7rEQ<xl{l8NcKl1hI)v?VcpT$XXvVQ-wLg_nc_c(R5gy#x>GQJ0!6bA#Xq
zK^qYUHL0p@cdyhD^vOm_6_EE6p)J0v2^*=DWBG(d11~rQlYT@~FKq~z>q?1KiGkWT
z_EXg5!b&dpAX{3*HL7Z5ScC`w#)IyPI1W@)RuEZybk(ZiqV{qoCmM@y4=Z|*?jw6&
zXAEEdkgeK=ha<!#A@_!L3QgeWRhLqDn4Y-dwaGxBwevlJ>Xram+vgt!jDlU<%oXf=
zjd?VxL3|vAs)Qk0@Or6x9Y<{?h(R0+fNcFrwGQF#ku92mTo50adK*xj5Z3TZKq)EY
zK2^yuC{jv>?nzt0%}0NftyG?2zoUE5>$rA9$|puKgZgf<2YLVov3$A0VX#>KWBVVD
zJazs1{h##nha(mLO+T4zpnt7S2>`XUNnY<e{m7)v5d%e4i)8p!a^jSyg%nu?J&~Rk
zK0a1{?l>Y0<9(Xq9~MKjgeF7<$9SOvtb;r}VNMCor~N%bb0QN13qnG$C3!*FF;$er
z0!O5}1<J%&njt5R74HdUMVvIRACTR|fj@FGI>rS1^rm}!Y!W|U4;q<e>UYmtTUqT6
zaah`#bPO5(0u3$PU+F*kzTB*uDjGgpi`^Le=7KK317RoatDME=Z9y39{{aeDGM(5F
zAqYGU7qxK~xpx8-v|;e)#Sck*oTWWubg>?@YgQ?nhkGIq(`9`-SnfS;)y_O~Az~5s
zY*|a0H7LhiTWEz=pva8sPY%St2SQ~`bwmG@C!F)Nbo@#xs201T)ulbUZP4W8meIzX
zR8F>obJYG~=6hrcL2z)6d{AtWhcJmMjBF?wEcQAd3f>LV16tP;71XtSyej&J$4(Mf
zc=l}w%<?%KU!`iEsVn!qev;f2vBsT)$Y2}=sNb7+O1_?Hkal(19v;J5a6a92d9iiH
z{aps1^5-v{Ns4Vc#`VT)?}StRXMaxEo|;&4tj*AKbKjrWt4T4hFH$*qGEV{H#}**2
zj!~mXRZE1M(~ScIOHNQi3zSW~MxTTbucYJoAB&&$=5UN6P*CSdIU!DN{i*>dQ+f{(
zPSwy0?^F8H6Ee5eE=*xxR~n_f6y_O+UKH%k4Md=|(QroNEIJV>*PmzDZDO4X)q89`
z7T()cAci)&+rg5=q9S4FY$qS9l6uq*kx;lP4oHNwe@<TZ`mlO+DhwmIJRi=n_$ED*
zGSg{^YY!&(W+NBXP?<c`LyN409Er8;j}L-d2|Cm9X<>!5E)^H{d*TF05y$AXVu6<2
zf}g~IJ}?`oRcly2j+Zd2U^f=AFBT}BD6VQeo4OfXmcl4qO!Eq)9{ap6vQ0MX%&=-H
z4f!Rp4r6o=XfXl-))vh!6eB01jKwV%8%NbB!eO-o8phH5EREBYE8D5L4aYTO>(rWZ
zyUf6=6SR`3m(!zip_})DDzR;F@wq1O26Ed>D#ET6z`=x7f#8-5R-2PALXGls)fxf$
ztrlJY3WK=5OCCq5yO^KV<CRH#^qQeWkCI)D3Zsvgw2i^@lq;`|<;>i-&0Ge06oP}-
zG~e`&j`7ueaPjq;HdRnRVF}+eEERY`{rQXbF<QGJ_166pmb?pTs+{o|^l+=|hD6Lv
zGx$9x%(+XjVaWme(^63U<b<nN#2HjQ{d+O=V9EK#4WWxm6tjlnSw7Rh2!NK-@b^6b
z)4n=h|5Kg(4^aNEnEad7NdU2p&W}Y|U#hRPX;ifQdi4fQbo=1_c+{1H8}3LP5ry)x
z^(S}`y(nfjr`=%0Ff7F{DkcnP8EEDg<4KN64k395`ax4X!;3RZ+(SdXE3;TJAQ-E~
zABMo7=+m!A5LN_&iAF=V#l^z9n1)A~S{poBhen56;~Y-BWIWzsakMqoae;Maw*U3V
zo!yQ3xV4e}P~y?&P0;T<yALK)30`o%s6UN~2?u2^TIKK7KQkO#!(F;cJDBUjNxb>2
zss<AhI}UoU!2x23m5`3G@4hJ39;cw$`~ddKN-LZN?xTFDu<#*UIP`WQ|C5&kS!Z^#
zeDtZ7?eVgSi2EwklUano#UM3&_5=mOIZ&LA?MxxsqCb_VM`f2y+JYAQ-Z1kLh;Lm6
ziBDCMO7)uT80~}%6NKig-NfEngzZ<MVIw@xPou_n7TXBp;@Xu-awb%ljffhG$;I_I
z#TTCz3T1D=L5%L2es&IbAk3V2=1wRpu${`oBYN)qoX74PTJm!ZX=U8kM)QIa$W37{
zlbKibnCE?sl};=3jTb7u|H7g7HWSlX1)9E^p4uL4ljv={>TI7ci6=Nnu?bOc=Sj9@
z9s{y1Dpm0x((Ve_=f-!=Lc4}7CVV-ZzYCGeEe?cDdad!oRwY%8yc7Xfz$9tEJFo@H
zpQV9NV3)$?;CPhy&_w^<;T+26GF>xUZjdG#4(56S4Biu?;zRB9RM;_aTcIVgtr34V
z(V)-brMXy40u{8TCubSlYfl9vCQ6bPOs(Kn5^8(#tK#t=%k;u6Bb*8>vAEl7EDXai
zb@mAVl!N>fQpD8)pTd`cR=Eh7U=YyFa6HLgmXgBb32c2vD4a4{IaT=a?@p?hqa-~;
zU$$8)JxX8<&RSBvoRVk26(F@)l3yiJ0&b<;+l=hgk1DOmXlLYbYinJ9etfyN{+wai
z2jA!6`4X2TxuEn<tHPL34ogQ{5wDuDhRMT1z52_0t7b*(BloidUT!7ngxW_N$ms2A
z0kEL5=vBRzs1_!RW;+2x9)I2uW;vtW-up@5--yk#tr-Nyau|b#5EaPHBm+!&rjKs{
ze%ecTo@3MWbHRjoZIaOYvOCN&k9_a@VtB-x%{?Get42Q2cJD!Qsf@(EX#4itMi%-{
z5)sy!w#G%@^d?o0oXyOWyPe~ozp}KvBaJ6Kro9r>PA}Oa78s3HJU(R(V$|Lh?CMGC
zsG4<=l)!dze4Vz%ve;wm=p1anG36pPyq+Jz88yliqFE7XkTE6{`ucoKi3KitJigp=
z=0@teVqPw2CIj%U`h+KSEC11wKRo&0>g0d5<X`5A_AU#`y1Hdf(tc)Fr1RpV>(EHD
zUnYI16H34#y~)1*1R^UX%+Ji-BNRr7^&>=`Bp!yKM4S&984(3d4uDzN;qCH$66}Is
zdd3DsRE0QsK^V;c!3l_i^>hm61Sm|1-d-d$yBgVj5_6bZQap#pMkcV;(=#n$7}&zt
z(p=XGPCj`Jtc`9Au5Rxv?PY@w7eCz&$YG3}y-H*X;s3)Epb4CduP#fSs0NEgsEl<v
zsS+4?I1S(Ks)%%kGYcN$-}5=&>5fJ6E7xf#wA@dUw=)&B*)yj_$#CwHVJ#y4QFl!8
z!IB(ny|Gtq^dG?8#5+Pb3Z28Go=Ma6U`$F}St`pA7CyGT@N@svB?=E-<<k+A8tg*I
zTb=#X$+wsleS_3pjB!2kZ1Kxb-d%7s;%xq#@6^hfQ%s@;gZ+G!^sdos8}V6n6`)U8
z3AKnqzHi`qj!mK#`mk(@nOjPOt&vD2Ks>lhO5|E@f1c-g)%4-6as`B$nM3B0$`o#9
zb+F`&Vnn)Q({ktR-3z}2cE4=5a%=Sa8F?)?z%P}0uuS{@+>6Mqh(LKZyVZ@gkMe@P
zTvcqr#eDuV6Xvk41Va0!0#!i~O$h+I50y2lIInn~7v@OBx#xfV9KLJ<jR+5#la~m=
z2?zK7#dQ`f;?)@jLb|J%nV#9ZykNpBA8TTX{B30jRc<ZR0iA0eCPZkMu9^k>?N^8=
zO3Eb##*8pg@t!>BYJUImx^FMgr!0BQl9wOiqZP~tmeZUtt^EAPR+MB*a$2&@l#647
zm6etMdi^-w`K(8phTIhrK5<fZf-ZkM;SiPeQ4ef&!_tc<H41?~AxpPz9@TvP+3sR2
zX1EiPQ@nog!eg=0168(jF_E`~r7kcW#I4Q5ThYA7y;*+kyOg12Pg%n{n3lp5t=7l!
zqxjf#=-ChRYFF7iMoxW#tJ0;DWi*EuIT<PdK@N03Z_q=*gd`6{2Xd6O3k%9^Qg7~(
zF;Z)_Fam8SKzEXPmK!H*_;owi!J79PRo|BCcxK``3z8O7ew;2@Fx%d)HE&~mN7?Zf
zmtWiMJUE|P4x|2&6o_<`b;-w*Ik9ICy*s<F!Z}2t<l2QE$^6bWLtt<izxx_kg}F;6
zZ^THy+Vb<^Pl+Lg*H^wJmenBKypXP5MG!MqCP`=fy8WoHV&K+y^#0{PlJZGeHsEdp
z{EQJ~UdFM-&h#%;Kk#gj10;}vC%y4pi3b33_jJb2O!y<}`hxMJ4|UXzZ~EBVT`^D2
zE3H(}6tB+P{Y^7m#^>D30>|ExHJ)F*LH{s)GCcloUGk?r`F~>0e}+8&W_xm?DZA%b
zl_IKzw|2R%>>e!llzR&Xzx9i_a&XLmgCRZ1C|`d+0x5tL=w?qKhr=T6@x-`De=}%k
z7#8N57?K<tA7p2f=@n6wRNxgDjK_dHEs!S-?1`g*PIj8S^CqJ~2pWxv2?-^CA~*I9
z_kQ$B9vbO=mmS*xnwo}^X6F`|W(HtgYwe%HAgpU+pSQm3EX{fzE_~no>14nQKXb#5
zPjnMOB?9Ci%zQ$BCdKWc9D<krneZ?&av1j1REcy(a{P6iUyW1E)r??KF@3wbCq|2h
zaahXO$me%u!VLB{S6xJVvn4)<vFHyjc81*bXeQGYSnp;(G3%>VvbH8c5qNg%b1FcF
z2of7wB}+xM|DUiU^q6qD7DVq$k5Uz#wB_SkoJNlB=r`Ika$cG0DML4TZ<LpPPr|-{
zIi}iZuy~ehoC-opN65_W%+f+H)~bbhZCkv_QuB!L)@vQ(2A`I}%e9O*!Z~HYyffZy
zN)VnUeWCJg#km<+8neX7$oOl&eE?+EZrXKW(J8U>%}kAxBAwhl`K(e;;AnS&v+`X@
zdgZn62e02{+TFOabTrw%GV(`LfDG&^m4suntv6y+7hemV3=$h{lt+Q9Reh3pSoM+$
z<=5>HRuCi>3cp}B&0?`*)wj&H6uVuA_73;un>XgqI~bK0hX&;s^z8DPG75CXFZjgy
zYUnbu6Yrwo(6iR;!8sSRP)<*XBUu0)4oi0L-$jEjBQtIE9)i4r6;&Da$_sm-X3#P5
zB!noH>N@nMJ`9R=ELe^kD|(H`;nsuk^6p2HiE1ehl+`TU`9zD$K^>CMlM%|nL;^EY
zLb46)sfwtNfZT4*<+Fzxc}0EE`nIluet|QEpQo32aJl7hyYSi$HEGv4UkPAzeKXC@
zfQQ{6ue>CHr})+TS2P_`>$wf-<C1J)X;o~$>10^G#G<$^B*<YzC$ij$Z=+tmoCnz`
zAs8(1_9pGRL)ckkrR;D!o_Z6{g3muTqL;4(l~=fGR+@$*57u`gdF9`VN1#AH+fl41
zg%&fz`>#~F5=j1-v#5l53iNE7nvvm)zSL3YcQq`!7K5@OdZe^d>PEMBXgo8Sj2hPG
z6GL8=rq~emG*JoanRhRBKVUEv8@f^wU_L<W4rl@DU^@EYXfpVf8U0j&^uV~ob;EZo
zJ$(5ZTzQFuwyhn#(^IY@9{A}YJzl=)bq%)t3crfl3^}KgLn$bM;Jz_q*SWv%(*-+U
z8}e0Es}Pb8O)$UBrCn<%y|N*^3%Gz5scQf4Rue5XUbUe=E$shj%73r|69xdT|JjoH
H&+q>L_7_0j

literal 0
HcmV?d00001

diff --git a/static/favicon.ico b/static/favicon.ico
new file mode 100644
index 0000000000000000000000000000000000000000..ad4ca66a17637746a5c33e5a1cfc46e35754fac8
GIT binary patch
literal 21792
zcmeHv2UwKH^Z&l}`q2ag8^(eim7pLN>;*+)iBgRs8VhO=>2e36#%@FrrA3LTNz^C?
zMVis5!2-qxh=LspNE9QSl>5!zduQcPN%`ja|Jlb6yKmXq*?DJoXJ_X`h(HX&i9lw^
zR0pBYq1?SYcl~91gciU(Gc)eGgC0V8RtPn1%3U88z{|rC($!VJPa|~L5up{14#Oov
zQz1N+j2tm!9Da(yXCZU--ZcXu>CKTt22SuNN@KlNyG}GYm1E;K!?)^yTPKTIXI70F
z^-UgWI-;%qFFH>@xo^Dm*I#wEMnyGESP^15Y<JO$GTk*H-FpyALRz;S_H_sTH2<Ww
z;l1~-39}RJDLqo^>*rhCJl^uU$&5n}va?G{O1zYr(Iwf}wglz$%P9+ZT$XV*-Ln6V
zJ59|HF@_vyId}UqME4|UyB2nKQHa!a=)Y|+A{;4Q-S%=69x?X5t{u9B=x~7<x_QT-
z53P%=5HXeH+gU5ZrBF@MSglbc|6MKlmJEBUw=4Hi%J>k&z{q>evb`!UXIQN-_%iw8
z9Odkvo%bbmujyp)N5?-motgMJGPpe8uIrlgq?i(GbmX$4m$%Cr;^1(DIYSWfqh93>
zqtux>eqIK)hc2~UoL(I5u>0_$!gZ52Jesv|?!6IL61Et08`Cmr$4uM1?6CAhi7{To
z$0ZabPS1(!*NZoJ3*SuM)6*lvqOj_Rn1UxufAK3lYMI?4bN-=)MFE)$bDv!ZanBkn
zJUXU2Cxt4ru6S6G-EXE>TF)Yf{xPl>oJ+i(4+^%v=q>%iIwr{ZbfToyk=emDEsE~X
zO7tAv*G*O%y23!`n%|s7cMK*iz4ap7>4;Z)`N4o6;+1J*g7Z#1$n^+(eEE|9ow6Q<
z%CaU?nlIY>lLsjk^!(9sx*cja`qJ66`?CyczbL%up8rK^aiQXQO8A5P6@wM@?IAt}
z%Lo5n=v+W=vrd^8?;GHxo9ulm&3JtUJGVks<50Y>N^YN9`t^gv;U2fmb55R2PubJ=
z`mAQR){N7$Lpw&D%F6bi)U5Nds$P2!&dJKx3o86-zRtES^Ib-YTy7Sm>`VQ0k#!1H
zn&q(gme;MTeTuX5OKO(gNRK`caVnzQm}1{<IybL+WdxpJi?bJ>9kRY)=GYq(zV-~>
z;YNFw#LSMLar>8<<~v(mO}bDyywm3EpLNVGxV$I!(6r#2p(n2$ij2xGSn2LkR$~(#
zn|Wuu?%uR(%bOhvU+~L!vDLOyPu2QP`|5b<&{CecYt8+O`=2~&clFjDePFxYs9`^J
zUgKZ6WA}@qj9k;QiXN3uO3&yW4PVGpese26wVQb>UY_HcdC#6YUi0_rlu`MOWAKct
zzKYVL1K6^awksd5D+xYo$r~SdxqWPWf=x5!s1b<R*uA6g)^k^OM5I3I{2;F4vS*87
zll3Ne9ZH|mHSdH#@q!-k=-M;U{wFsw^8BZLzpG_R#;)Kj>8DQ(+s#U-h@Nlp{eZNf
zy&-2ty~s{G-uk@NgX0fad#4d*C+?V@J3|;}6h4~ld?o8}+O4bMvF4&kS4X4J8pH9~
zEfiiJ&mS4*pNiZZerxO8<!R<W**57t<>7Hj)wpW=c|lnx{TGfAL{*xYoo^Nz*?sO(
zof*4#7g^oQn6=N!Gh&LR;5(O<rw=(Pf^Hu%8sA3#^S2?9T`c!KOFkA<aA82L^W45O
zrsmt9yG_fSI`r@VxcW*`+e=Bk#PotIiN4mMclQKG9yR#tv9V(R&l9RHeLK6APT?if
z;{7qSuANP}_pm=Z+26R^wAF!#C6+B(jI|wnc$-Je&US5&jy$U0en*0R@=&*|okW=%
zllS|*@B9925T;z*`{ZJm!Id|v$?6mRgZ(EO4NIWf$Pv5Dd!p%qHFFM1=Ew$nCndW}
zXa1I|RDShDv1e~r<QI4S_fKPXBy9{4n8`!3BvbpB<;KpRRDQj%Y<s7heN&&zw;tSI
zY~B2N?Y--R%2zdCH1%wT^%t=wXS*3q@6d*z9Z&vvwqo}m(cMg%r9X(PP5ttRySf9G
z#d|-wAC_@-Ug-7K)@zZGW5>&UvctqaMt<$D&U};<YktLO?0L_=d91&GF;TMNM%IZI
z2a?V{4@HBWfQth&67%<MH>%DXk?A%%>v6eDEfZ4HEwNv`8}d1=5T>S`Pdn=PIm!R_
z$1VFqPWY7Uxos({nU(4G<HY15*YI<;Rk4}5iV|D0WbKW$zpS;JTRKHiVe0c~*2Q1+
z?a-3DHs`O5M)R9TD=y}~@bWoZ6j;`s`6+8@*Vx7VZr%znHT?00Zeo&E+&-3|e=?oG
zyLxZb+MAQSB?IRVyt9t5;6J{Qol+7+Df4Zz%b&t<xO*mRd&@odg9^$|p}{6kPsxo_
z7c441CjG8*T(Nb|nc<+@7UrvhK0Ua}|4CSoNzwG)wK1&*6)znyOSXFK^9$@nX*{YR
z#qkQKL%*g~$vpY-+3WV)cv?PbTJT}3Y!4g3Pdvx$w3r_02Mqh=bsJUv<*wkA%Mbe2
z&RA{H(tDQdkyXnxBjx?%-uLdVzCUr!-J;UtJCm1JtW}ntj{n0yrYhe=FWlcepVGCE
zhaAgEt$4mU^F`3ShzghfF1r^Gh^G%Gr=?%9j=S)C`g4!gH3!f2J>E`^mYqr6Xn&^j
z!BU~`9wxe*j-qqs!{p?gH9?uB3y1z0CrU5cVnLiut@X{H_T&qX=X*W6wV3U2E_0m0
z{jJZ&Rm5dW!tFA`d(S@?G;8i=okQ0hCu9UJ>d=2yMf2VVhWr?HtTr!i&H$;mU(5KS
z&i8jXCAI(?tNZjDo~|*A{VEyT;L5xQFCr(+Nd4hUpI@uiD3%XQW-@~|Tg)qXc-*Mq
zLhln(%Z!JQ3oOn!d2Le3h0O8ugnir!(lU~1-J@5ZTAa9GA-=gXr|PQ3*xW72D5l`c
z0g~jD88cCdb<voZ>RCTMWQ$iF8XsI9QnhkH)o1H>=DmntJ6+*E9Dhj^v~g}(e`Vav
zIltY0zOwW{LB#V%R>iqq<&O_snXsx=d49SgbGqO2(FHld!&9Hktcfa5$STZlR@^e+
zyB>bI_8n_m7u7}=Ou5G1zS~xgMn!FQKKJ=PLfoc}$L)m63$NNZOue0G;<D(}4{dH2
zFWX)d=sv;ymsClzcX7nhgn(&P0e|eCG%fJq-An$JPGz!%W)o^p<Sg-PGdZKexXD1p
zk)8Po)dq!2no2LXT6`%b_o_=^vAgV;!;RFU+()wD-&2+r6<+iVP0lX1Fpo(t2r^%1
zU2!tiHz8+Waa?l#^K&`Q`z!iHUfwaVup0vdcjc#DN`8&?D@^%gY5!Ac`)aPGp5Eu2
zRIqtT-s7O_`4)=W!y8=3rkW(X6g4@z+Wu6zNk+BR07dkul3%~Ix;xFa()P}tp-(4!
zlZ9)GM->h|GHDR$dm+;%%GkOve&$!h`kTr16TKXlBO~Yjt>?@3Y@1be&q5IsyzkE!
zPg{8{{N_;8#a>qIqIn*QbkEcCV9M(~C`~6cDM}uD$y1K#31CxSK5NjMUX93a#b#!s
z5y3Z)Ki^u8b`gBOfgL)QW$wc_L$eWijMkMecq(W?^5v#-d3S;~iwPdI9ICO6)fz?e
zAJmc?%J9^Atxc-V1jC*ejU4JQWbdFa!a6`1HrMD20N!zHOG>2@HKI`ljXKb%1OE#h
zP$(4Wui%A3K>{cZfEK~w1*K4Y6i9d<psN4DJpC_Z_MSFLcuoOu{@%G=CX=DRf|c@6
z<Mp9o=79F=Lc`jI%Vj*7>}zqTe3Q9czOlVrmE&@Kh-fR9uWK%oFA>UQfxr(&Fp|qd
zNx3|X=J=Bnb@8cfUHgFhBz~tQLZJf@Iz9lQj6Mkc0=GILq(2NHm*WUIWpKGOlqVn4
zj!8!mnwWx+!)}CZ*MZ;K73i1(a3TPl>sxjC<{y@2QA5CESrXTqpwnbexM53Wm|-(z
zph0V;xq!7{`9s|GB|DTllJAuIlATIjNg@E}^<jrnSNxr-j*fU!nMCM+SitW$m1Tu|
zjz2zC7oTtT=EJW*C@T36=S$+eB}P^AB?ixCi;bVQq|m2`w3#Sk*H`h`b>%{K!wUiX
zO_hM%P^}#sl>#<ODd5Edwp0t*$Z8?)Tcv>6@RX(|Za{>{062pt3H&YomZaf-6kn3y
zD=|_olo-62CvK`RqrhuV+B%8ZNF|@$SSbX)SSBEcriKO3)aWHNHA+TP_MrgzD>$xX
zDAzb1voM*@tiC5;p&#t}XHd5mml@hA8dQi6B7<{}zb9$<AIX<&TcqaSOWd@gl}i47
zCX3mP!2dTDLUyx~p`5mGt!itZfNx3h2qZEhiOvozJ$o<Lhlol6i?LNnk%Jd<G$=~l
zgTM4GUgLken*S=`zY_Qd`D6Y!0sk9-|0v+!8RUn*J<Wq0cqKrN1n{8&31ti}5roJH
z`Wz)-W8gb%Pzcy9H9TfTDM6TY<=#`t0q8YcpFWO%mssEosxWH)ar+vcRXJSKaOQ>k
zhjaWgU&^Ds(gkcZ^kE&y0rZG+*~;~hd*|QdAIl#nN~6Efm->>r4}@tq;QdblyRk~h
zZmr=nVRs1Bv?Is2HeIZb?yF}XCx7P{t|q0K$MM{S`=AEa0}WL7;1SnXmiG7o>p#q8
z&+#{)i6M(PS}Z=bY;gLE{A0egCG|7aIH5?Q<8U?qFc&A(GSswPoSwb>mfGmld;cHg
zU)?U|A18q>pIP?|<{?-=wkUZ_@MVMy+i}lc8}l%rpaKJ+KLjvYu=ssE|9`;z^S1uf
zCx4E$mw!o`r52u2t#7J6tg9f%_Jg^{G^`1KEe++1qyItvp`QfFQcls_T)Gx?C?3{=
zo|8DPS)oP`j7ZwDFDqQpn-v7wutK>tD_jf+(SpVBj;uE;40IFep7-I_ud2D+`c>Eb
z-%$Chz7wp|VFES|#_;MgA-l7dBKyu%^Dn|WfXm%k!Q3z%W91^Lp)yEnr1S&$zXt*E
ze38TuYzLM7Q1kcm&y4|^8tN<L`2R!5O9c53TEOwo2ww8f@Mnign<{-IhSh<<j~~GQ
z0|4*;3;d4=!gD9cU(NqeUp4=HJXUeJ1I<pJBQ_}dLZo-zQ>2&gA=0}tU8I+*4e&e<
zaCx4%$<u#M{@hwXQ)5@W;(sT$g}gQLhg_v&LV`4IPB8;bDB9YTqHO_v-h;mI+{RI$
zlcX8Hpg-E|pTD60B#d8|SUi5Q`~_@cElJvXa{RL*E^qkXVgKy>1B_7&OZ)tW=YFsy
zo@2X|B)d;g^Z#-U#(G2(gb*NjA1HW-0V9zl2-co2Nz}-{9{aNa@_)I0>G9dMU;}M}
zy}+g#0lVr6Nw(?7@vpJtK3@Ksd3VGs`@cT>`6Kw(*u*OPfh5U}BRJWE9nFiag+0y*
z2-Y&@I9Bx$S0L4(Ab&5Qu4=8uG+_Vo-G|GcR?XFTO?qXoY3#Pwb4;1D^%#1(%6=2D
zYs!VZ1hAneZNg7MUH;PA3;l$D2z{XZKgNCrx_F;}h1$Xr@1X^-9|jv5_F)^IkVH2J
z{7l0?2!g`8{4v1ege3?Gi~}C%|IYWz-!+btH;ebMU^-#hV*61ATn6C%Er!O%=IgNZ
z{7h_na^p5m$<lL=AjFfvJE}bnN0aMKL;nuriDTZ+zq5MZ^wQ>4eLHoV>hh~w1fl;4
z-fQtyd#?zEkllo3|0hXw8o||h#XrbVSD&Q18hjkOG$E;OP_MHCU%E%bzxMeb%OCFz
z1rTG2=WHxPo>&dI7U&R!PBW4)?M{=nU-D?5OqDN%-3WW%h)N+ZPDxV^Uvs>_w3$^M
zZb!4@W{3^Wd43$u;yTmC2B#N@o0Q@8*GFPd{VxAlcALR}5|YPI6C?0Go}ng3!QOl;
z_DQG#W%unY?Ue%i!yMpOHOC8h>tW6WpAg>n(r()k;zQpx`*zjXQ}N%G5qJbijcWp=
z##I2ESAQr1;awl8;fwhaqZbP#1{Jf!O`m}O!4mvelf>Y&;<M}j6tWTEyV?kIH|AwC
zK$GLL2KZjIQpm<s3wWDhuNzq-WVeC;YHcY^ja!5FFr4hMze1H>DqByXj)&Z!g;Lf)
zENRk0xwJ`3Wq6Zj%Ebm|%8o*|5B47#sQiZsN<EeD5PXAhtsURNvjhO-qU}nlc>P_8
zaNdtXzV&35<*EFXEGwX){En{^dSe3)*T{wfoB@#?5ZVNYXp7JWpw|L|eg`5n_7LD8
zLXMDQsIIl-4#^1F??q@JjPovwVSTa(I-oDAgk`Q?H@G=leP5M@fd4#57Sdn@L)}-9
zAxuvuUnY{v)-`(z&EZ-L)|$#?EA+6>Tqg4Y_yIz&|C|E<IaQzk9L@*`^;rQvFK7sG
z{kQSna|ftX*E^UFt;PqPU#QQH)Mq}Lv!B0|<Fg;2htGmO79V$Zgn8E@hsOJL>qnzp
z8s*Zc1An6qyuOw-mK!DTu@V5g3z-4z0EDUpg*sB>I#;K?^RLfkYJ2H@@hzH|8XOM;
z@2cz|ZSgeq#?1Un-yPeE*lv8UJnM=fdHdd~&`{IJuq8cLhlV!C&qC!J+lI=wb`6zp
z>GCF`I?3hh;hg}mxBbE1*4Wx$!>i+J-sY)}q4CZw2v(S5hfuaLLTW#;T|C61WC4DI
z7?jsA=>$TflMu364SRXDPmqhN&=7sQ{kmc}-o7_PthXwpNps~$ss2X%Oeze!q$}C3
z+TY=rl2_OT_YMH|Dy5<&xdOiBSO`mbV~_WC`x?IL%lojxCEjojF@Pt6enHP@A2|Pt
zsAj0oH&SGu>95dl7ERiR@tD91LSDR*&nzz{2!qzI`-K|PzAY<Ux)9Da?0BNJT>HMK
z!S|{pi1x6rd^eHAC$>EBQQ*Bj_!_=_{f)n~eUj)gk@JtK{AX&v8Fvm&5?viIkKl8t
zB#_uh!^7X(zQt!6x^L#3Pl(4X&IMm1oNx4=qIs^ZeF8e74R8*)tS<SJgtqo^YXkwl
zl2zE(!qD#9-q*h7d0n{;E0BMD``F)VIT?Qg9^;>_p<7q~q2DB&clOi<@JYrtq<w-g
zv*y}gSz2HF;LzZ^3H7qI;Y*Q0af8}NMi73s34B=_Ycyl9uKt7KiUQ&6QyYBY47FkH
z8@A=z-&9*)`{47YyE1%FZTL(eO>R*8M9WWc`+R17WqtD3Jkyr<Vg!K=Y5(OMz=Yk<
z(5_4V_!-Cm$2!yr7=K@XeES4RlOscL|5<7-#6ogOOZzYcUix6)DQla5wU2-G{6qVl
zgZ677#!jwo{vCS&--iZYKkRv@4DD-~f9jlnRX$mQXlIA@9`_&O#5&j4zUG;>9M-?E
zy5tY*&!D>M5JYPmSOd>ve=_*N(_Vk)ZTZ8Yi*O)MyrDig3w3|{N@Dl|*56f_7LQ&8
z=cf_X5K9?Bk=9dR0k6MfmhzZ@^W6Ho`VW$5hJSW~zo{y{-M%i%Gg@ubN?9M4<9Jr^
zOWRBJw{Z4H=tW)ecBRhSP{p(ESKA-UuM7CLE-XvD&;Ag1LnyI6SRk~k2SPtc5mK*X
zgA*VQIQv~-n`{jDj(e?zDQ$?l%PM_Pm*3GpxlBeZlgo8J1WROcK4*VMnumtQ^aS(>
z4UK*U`Bn?L{F_!>ytJRn-z$^JU)r9y?%VSJhps=^{>J+Wb<95AW7G?H7yEV9`;RKv
zf7FHgWA^`{{{CBX{ePw%&3O3#HOGDu_|I%qzsYO#le~YQu5H}br#}=Tc$N%*K|fZq
znol4hN%V4p*uyO}^%=z1k6+7B<5n}&XR9C<-=BcERzh_ijwxzlZM0HXt!E4(bex2e
z%sJwwB{~Gsr>JS$MEIPRje|4t1f`I-9f0%i;k<VT*g+n92qZPpO7+zP4Sn$hfh5IK
zY<yQrARUTwje^(#ID5C3QDiT7ysv__cM44o_2)4@Cxy5Tdg@M&j3#d4B~eUMvkrr)
zhYv9c>E{AT+Dx(WL*QSRqNc>bS+f!m&0slvGhrKsM`N2}6T~}Wy9Xy6L!dnYeepzr
zBz1<^_yO<_^xdN|eXxz-=QR}6#jyuCW{D5+2YA0^K2*ql4}EZo;;6pt1GdRD`$HTX
zgv%rg^2huG{fC@<++#TUX1%!jn(xTjg9MToK}^669P<k?8LhZ?wEtD}f8<^IZTfJv
zxV<)KKH@tx5AXN!zMmw_dTS_yjm6U?$hJBJX$EMmhM56Db#W3(PXPV<YWb-7|HOu?
ztKlDCac$Am@IcTfpx<%0hCal8boCJFUvm=bo`gMIj*C$5w5w3>oU2ejd%jrznTN>e
zmM-Wg3Gx@I<X;zkPSz01Izz-uf<3#1qlUf-Nm~a?jg|8yO)7AFD)?e*aGWRPwZ4)j
z%4s5_8$cgIR@}F~k3LP=dJ2I)#2vk)Ps6Y8bxEq74oS5Je4<8c1Cs9g;qu{Paqw6c
z^7a7zF8It|lQep-xmM-St_Y7Wtp9K7Po3WvXwZCyc81txh#4f>^nHUEH?}nGyc}Pk
z{~G<o`u`sNl$!AAup-dWB7!i+O9W0h$OFfgYvRx;br}W_p$qz-{@VBg`kS#|>aFpG
zV|(!U>M~l$?uPN@7LTtrI>nXW{rj5!KjP$r=Lfu>G41m9+XT_3ACHk2aQ+@kC+<1T
z7ZIe%1c6TKIDt;`c!5p|;IJAg69l?P=8E-8K|gPD`subs1pL#KTO3U~EK`AUTmio^
z_@2)!DT3b{z#QtL=ADam)FY_&GSE%X&zi-Mt5F*QWr*Xc4UjfbdWZ}$eHbQKKcm4X
z76oxk_%~Jf_dIbBXS1zVz-)n7zR8<4bCIThcz@J}V#a(zG4_DbZ-O1&o@U0GQG9#w
zVUPsbb3CjmYjJ!yO^pdx{l1H|52eU{vk8RfRMi*;9l_HXm$a>GjrTd5KqIIBN{$C5
z4!$x2{Fm)EU=Jsio`D_2#~0?b(9J=>+fERztOQKRRhVb4@tLK!0JkBQGKC<F+T-`2
znri;S1$+hbq$)1D2P5&BCgS}Haf>5`Ok_0$YZ0DrX=;c+p9#$sFkcrzY#RP;r6y_W
z3-ApKMzX+F$fiR5;R0sKEugH9+f=R31fTi(HbaeFs;P|UIVj_GUW)JaWF)>*gzQlq
zHz{DSPgBPfOaY)Fg`*L$XQ<KG_kSLj)#;t~-Gyu>*Z%T{FxFLcIU0BXcNm6a+BNZY
z{aMkf86y2Vu%`a*Ce%3xcHW=PLiP|%cD4szp}r8S0wk^<U?X+m{5?7<8?PI~pJ6YM
zBo5<Cq6hH>>s^F~7hHtw5sK_I3S<TKar`At+}cYJ&AVg!3hWeBf8fCz{C8o*bKHb%
z2G{@B>vMJ(*k$AS%&NzlenDI=4?{qZs&8V+N&-0fbq4vZC;=aZ>OTH$Am)Oh++xAE
za{`y4VF->UBqSmrNSADa?}7aNUVXo1_ra_I`;F5TEIWu-1iPV^3x2mH#SHcZpRSk0
zupEBR3%S7`{!&w=yO5Vk6CFn3I9?tde2GVg<nox%>v$f97};1{7vw=p2(ndgMi5}h
z2o_i|LSL}s=UXwNfc6yp-<j~6KWt}#Uw=D8Pfdj1%EnVf*D)L~96$f-`IGBM!~gyt
D$c9dJ

literal 0
HcmV?d00001

diff --git a/utils/remover.py b/utils/remover.py
new file mode 100644
index 00000000..327db984
--- /dev/null
+++ b/utils/remover.py
@@ -0,0 +1,53 @@
+#!/usr/bin/env python
+# encoding: utf-8
+"""
+remover.py
+
+Created by Roman on 2010-06-20.
+Copyright (c) 2010 __MyCompanyName__. All rights reserved.
+"""
+
+import datetime
+import logging
+
+from google.appengine.ext.webapp import util
+from google.appengine.ext import webapp
+from google.appengine.api import users
+
+from ffstorage import *
+
+class Remover(webapp.RequestHandler):
+	def get(self):
+		logging.debug("Starting r3m0v3r")
+		user = users.get_current_user()
+		logging.debug("Working as user %s" % user)
+		theDate = datetime.date.today() - datetime.timedelta(days=2)
+		logging.debug("Will delete stuff older than %s" % theDate)
+
+		fics = DownloadedFanfic.all()
+		fics.order("date")
+		
+		results = fics.fetch(50)
+		
+		
+		logging.debug([x.name for x in results])
+		                        
+		num = 0
+		for d in results:
+#			d.blob = None
+#			d.cleared = True
+			d.delete()
+			num = num + 1
+		logging.info('Deleted instances: %d' % num)
+		self.response.out.write('Deleted instances: %d' % num)
+		
+
+def main():
+	application = webapp.WSGIApplication([('/r3m0v3r', Remover)],
+                                               debug=False)
+	util.run_wsgi_app(application)
+
+
+if __name__ == '__main__':
+	logging.getLogger().setLevel(logging.DEBUG)
+	main()
\ No newline at end of file

From edb4f5a3bd382df1f178c157802c7a90af836ee8 Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Tue, 23 Nov 2010 12:49:57 -0600
Subject: [PATCH 83/94] Change a couple of the example story URLs.

---
 index.html | 4 ++--
 1 file changed, 2 insertions(+), 2 deletions(-)

diff --git a/index.html b/index.html
index f5736129..4ee35c4f 100644
--- a/index.html
+++ b/index.html
@@ -98,7 +98,7 @@
 				    <dt>fanfiction.net
 				    <dd>Use the URL of any story chapter, with or without story title such as
 				      <br /><a href="http://www.fanfiction.net/s/5192986/1/A_Fox_in_Tokyo">http://www.fanfiction.net/s/5192986/1/A_Fox_in_Tokyo</a> or 
-				      <br /><a href="http://www.fanfiction.net/s/5192986/5/">http://www.fanfiction.net/s/5192986/5/</a>.
+				      <br /><a href="http://www.fanfiction.net/s/2345466/3/">http://www.fanfiction.net/s/5192986/5/</a>.
 				    <dt>fictionpress.com
 				    <dd>Use the URL of any story chapter, such as
 				      <br /><a href="http://www.fictionpress.com/s/2851771/1/Untouchable_Love">http://www.fictionpress.com/s/2851771/1/Untouchable_Love</a> or 
@@ -117,7 +117,7 @@
 				      <br /><a href="http://potionsandsnitches.net/fanfiction/viewstory.php?sid=2332">http://potionsandsnitches.net/fanfiction/viewstory.php?sid=2332</a>.
 				    <dt>mediaminer.org
 				    <dd>Use the URL of the story's chapter list, such as
-				      <br /><a href="http://www.mediaminer.org/fanfic/view_st.php/166653">http://www.mediaminer.org/fanfic/view_st.php/166653</a>.
+				      <br /><a href="http://www.mediaminer.org/fanfic/view_st.php/156934">http://www.mediaminer.org/fanfic/view_st.php/166653</a>.
 				      Or the story URL for one-shots, such as
 				      <br /><a href="http://www.mediaminer.org/fanfic/view_st.php/167618">http://www.mediaminer.org/fanfic/view_st.php/167618</a>.
 				  </dl>	

From 708f750bab20ac33885752321e5374cd821fc546 Mon Sep 17 00:00:00 2001
From: sigizmund <sigizmund@gmail.com>
Date: Wed, 24 Nov 2010 09:37:49 +0000
Subject: [PATCH 84/94] Added Mobipocket support to the Web UI

---
 index.html | 1 +
 main.py    | 6 +++++-
 2 files changed, 6 insertions(+), 1 deletion(-)

diff --git a/index.html b/index.html
index 4ee35c4f..ac1c0426 100644
--- a/index.html
+++ b/index.html
@@ -51,6 +51,7 @@
 						<input type='radio' name='format' value='epub' checked>EPub</input>
 						<input type='radio' name='format' value='html'>HTML</input>
 						<input type='radio' name='format' value='text'>Plain Text</input>
+						<input type='radio' name='format' value='mobi'>Mobi (Kindle)</input>
 					</div>
 				</div>
 				
diff --git a/main.py b/main.py
index 9a9cbf31..e124982b 100644
--- a/main.py
+++ b/main.py
@@ -218,6 +218,8 @@ class FanfictionDownloader(webapp.RequestHandler):
 			writerClass = output.EPubFanficWriter
 		elif format == 'html':
 			writerClass = output.HTMLWriter
+		elif format == 'mobi':
+			writerClass = output.MobiWriter
 		else:
 			writerClass = output.TextWriter
 		
@@ -292,7 +294,9 @@ class FanfictionDownloader(webapp.RequestHandler):
 				elif format == 'text':
 					self.response.headers['Content-Type'] = 'application/zip'
 					self.response.headers['Content-disposition'] = 'attachment; filename=' + name + '.txt.zip'
-				
+				elif format == 'mobi':
+					self.response.headers['Content-Type'] = 'application/x-mobipocket-ebook'
+					self.response.headers['Content-disposition'] = 'attachment; filename=' + name + '.mobi'
 				self.response.out.write(data)
 				
 def toPercentDecimal(match): 

From ccef466090d6050681b2efea40d05e4904091b5a Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Wed, 24 Nov 2010 12:36:38 -0600
Subject: [PATCH 85/94] Change no-class div tags to p tags in mediaminer
 stories to get paragraph breaks.

---
 fanficdownloader/mediaminer.py | 6 ++++++
 1 file changed, 6 insertions(+)

diff --git a/fanficdownloader/mediaminer.py b/fanficdownloader/mediaminer.py
index 6a4c03a7..daa48fa6 100644
--- a/fanficdownloader/mediaminer.py
+++ b/fanficdownloader/mediaminer.py
@@ -346,6 +346,12 @@ class MediaMiner(FanfictionSiteAdapter):
 			soup = bs.BeautifulSoup(data)
 		except:
 			raise FailedToDownload("Error downloading Chapter: %s!  Problem decoding page!" % url)
+
+		# convert div's to p's.  mediaminer uses div with a
+		# margin for paragraphs.
+		divlist = soup.findAll('div', {'class' : None})
+		for tag in divlist:
+			tag.name='p';
 		
 		nvs = bs.NavigableString('')
 		sst=''

From 719aed32a98e1c23f7ea56aad36446f646fc4164 Mon Sep 17 00:00:00 2001
From: sigizmund <sigizmund@gmail.com>
Date: Fri, 26 Nov 2010 15:55:04 +0000
Subject: [PATCH 86/94] Tiny static changes - preparing for doing some SEO

---
 index.html | 3 ++-
 1 file changed, 2 insertions(+), 1 deletion(-)

diff --git a/index.html b/index.html
index ac1c0426..c084a399 100644
--- a/index.html
+++ b/index.html
@@ -2,7 +2,7 @@
 <html>
 	<head>
 		<link href="css/index.css" rel="stylesheet" type="text/css">
-		<title>Fanfiction Downloader &mdash; twilighted.net, fanfiction.net, fictionpress.com, fictionalley.org, ficwad.com, potionsandsnitches.net, harrypotterfanfiction.com, mediaminer.org to epub and HTML to Stanza, Kindle, Nook, Sony Reader</title>
+		<title>Fanfiction Downloader - read fanfiction from twilighted.net, fanfiction.net, fictionpress.com, fictionalley.org, ficwad.com, potionsandsnitches.net, harrypotterfanfiction.com, mediaminer.org on Kindle, Nook, Sony Reader, iPad, iPhone, Android, Aldiko, Stanza</title>
 		<meta http-equiv="Content-Type" content="text/html; charset=UTF-8">
 		<meta name="google-site-verification" content="kCFc-G4bka_pJN6Rv8CapPBcwmq0hbAUZPkKWqRsAYU" />
 	</head>
@@ -35,6 +35,7 @@
 					<div id='greeting'>
 					  <p>Hi, {{ nickname }}! This is a fan fiction downloader, which makes reading stories from various websites
 					  much easier. </p>
+					  <p>For Amazon Kindle use Mobi output, for Sony Reader, Nook and iPad use ePub</p>
 					  <p>To support new features, such as including story summaries,
 					    the URL you need to use for some sites has changed.  See below for example URLs for each site.  </p>
 					  <p>Or see your personal list of <a href="/recent">previously downloaded fanfics</a>.</p>

From 2d7f6c2e5c64d9f354d676fdaf2b78bf5a4bfcb5 Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Fri, 26 Nov 2010 19:36:53 -0600
Subject: [PATCH 87/94] Correct story status for ficwad, change story status
 for fictionalley to 'Unknown' (site doesn't tell us status), change mobi file
 output mode to 'wb'(binary) so it works on windows.

---
 fanficdownloader/fictionalley.py |  2 +-
 fanficdownloader/ficwad.py       | 34 +++++++++++---------------------
 fanficdownloader/output.py       |  2 +-
 3 files changed, 14 insertions(+), 24 deletions(-)

diff --git a/fanficdownloader/fictionalley.py b/fanficdownloader/fictionalley.py
index 68cd36e4..b1a32125 100644
--- a/fanficdownloader/fictionalley.py
+++ b/fanficdownloader/fictionalley.py
@@ -69,7 +69,7 @@ class FictionAlley(FanfictionSiteAdapter):
 		self.numWords = 0
 		self.genre = ''
 		self.category = 'Harry Potter'
-		self.storyStatus = 'In-Progress'
+		self.storyStatus = 'Unknown' # fictionalley doesn't give us in-progress/completed anywhere.
 		self.storyRating = 'K'
 		self.storyUserRating = '0'
 		self.storyCharacters = []
diff --git a/fanficdownloader/ficwad.py b/fanficdownloader/ficwad.py
index 058528bc..9cb353ce 100644
--- a/fanficdownloader/ficwad.py
+++ b/fanficdownloader/ficwad.py
@@ -111,26 +111,20 @@ class FicWad(FanfictionSiteAdapter):
 		
 		meta = soup.find('p', {'class' : 'meta'})
 		if meta is not None:
-			s = unicode(meta).replace('\n',' ').replace('\t','').split(' - ')
-			#logging.debug('meta.s=%s' % s)
+			logging.debug('meta.s pre=%s' % meta.__str__('utf8'))
+			s = re.sub('<[^>]+>','',unicode(meta)).replace('\n',' ').replace('\t','').split(' - ')
+			#logging.debug('meta.s post=%s' % s)
 			for ss in s:
 				s1 = ss.replace('&nbsp;','').split(':')
-				#logging.debug('meta.s.s1=%s' % s1)
+				#logging.debug('ss=%s' % ss)
 				if len(s1) > 1:
-					s2 = re.split ('<[^>]+>', s1[0])
-					#logging.debug('meta.s.s1.s2=%s' % s2)
-					if len(s2) > 1:
-						s1[0] = s2[1]
 					skey = s1[0].strip()
 					#logging.debug('Checking = %s' % skey)
 					if skey == 'Category':
-						soup1 = bs.BeautifulStoneSoup(s1[1])
-						allAs = soup1.findAll('a')
-						for a in allAs:
-							if self.category == 'Category':
-								self.category = unicode(a.string)
-								logging.debug('self.category=%s' % self.category)
-							self.addSubject(self.category)
+						# ficwad doesn't allow multiple categories.
+						self.category = unicode(s1[1])
+						logging.debug('self.category=%s' % self.category)
+						self.addSubject(self.category)
 						logging.debug('self.subjects=%s' % self.subjects)
 					elif skey == 'Rating':
 						self.storyRating = s1[1]
@@ -159,14 +153,10 @@ class FicWad(FanfictionSiteAdapter):
 						self.storyUpdated = datetime.datetime.fromtimestamp(time.mktime(time.strptime(s1[1].strip(' '), "%Y/%m/%d")))
 						logging.debug('self.storyUpdated=%s' % self.storyUpdated)
 				else:
-					s3 = re.split ('<[^>]+>', s1[0])
-					#logging.debug('meta.s.s1.s3=%s' % s3)
-					if len(s3) > 1:
-						s1[0] = s3[0]
-					s4 = s1[0].split('w')
-					#logging.debug('meta.s.s1.s4=%s' % s4)
-					if len(s4) > 1 and s4[1] == 'ords':
-						self.numWords = s4[0]
+					if ss == 'Complete' :
+						self.storyStatus = 'Completed'
+					elif ss.endswith('words'):
+						self.numWords=ss.replace('words','').replace('&nbsp;','')
 						logging.debug('self.numWords=%s' % self.numWords)
 					
 		
diff --git a/fanficdownloader/output.py b/fanficdownloader/output.py
index 10fb6198..25487d6f 100644
--- a/fanficdownloader/output.py
+++ b/fanficdownloader/output.py
@@ -109,7 +109,7 @@ class MobiWriter(FanficWriter):
 		if self.inmemory:
 			self.output = StringIO.StringIO()
 		else:
-			self.output = open(self.fileName, 'w')
+			self.output = open(self.fileName, 'wb')
 
 		self.xhtmlTemplate = string.Template(html_constants.XHTML_START)
 		self.chapterStartTemplate = string.Template(html_constants.XHTML_CHAPTER_START)

From 617dc21eb99d44a284cb1d70e89911660a21903b Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Sat, 27 Nov 2010 17:32:31 -0600
Subject: [PATCH 88/94] Kludge fix for unicode in story descs in appengine.

---
 fanficdownloader/output.py | 8 ++++++--
 1 file changed, 6 insertions(+), 2 deletions(-)

diff --git a/fanficdownloader/output.py b/fanficdownloader/output.py
index 25487d6f..b5a1ff8a 100644
--- a/fanficdownloader/output.py
+++ b/fanficdownloader/output.py
@@ -341,9 +341,13 @@ class EPubFanficWriter(FanficWriter):
 		
 		description = self.adapter.getStoryDescription()
 		if hasattr(description, "text"):
-			description = unicode(description.text)
-		else:
+			description = description.text
+		prevalue=description
+		try:
 			description = unicode(description)
+		except:
+			description=prevalue
+			
 		if description is not None and len(description) > 0:
 			description = description.replace ('\\\'', '\'').replace('\\\"', '\"')
 			description =  removeEntities(description)

From cfb218f21e9eea22554d2c6701f208e282520890 Mon Sep 17 00:00:00 2001
From: wsuetholz <wsuetholz@localhost>
Date: Mon, 29 Nov 2010 18:45:47 -0600
Subject: [PATCH 89/94] Moved the check for a completed story higher in the
 code, this makes the continue's that are in that portion of the if statement
 not skip that check.

---
 fanficdownloader/ffnet.py | 8 ++++----
 1 file changed, 4 insertions(+), 4 deletions(-)

diff --git a/fanficdownloader/ffnet.py b/fanficdownloader/ffnet.py
index 4caa13fa..d156f9fa 100644
--- a/fanficdownloader/ffnet.py
+++ b/fanficdownloader/ffnet.py
@@ -186,6 +186,10 @@ class FFNet(FanfictionSiteAdapter):
 				(u1, u2, self.authorId, u3) = s2.a['href'].split('/')
 				logging.debug('self.authorId=%s, self.authorName=%s' % (self.authorId, self.authorName))
 			elif l.find("Rated: <a href=") != -1:
+				if "Complete" in l:
+					self.storyStatus = 'Completed'
+				else:
+					self.storyStatus = 'In-Progress'
 				s2 = bs.BeautifulStoneSoup(l)
 				self.storyRating = unicode(s2.a.string).strip()
 				logging.debug('self.storyRating=%s' % self.storyRating)
@@ -207,10 +211,6 @@ class FFNet(FanfictionSiteAdapter):
 						logging.debug('self.genre=%s' % self.genre)
 						self._splitGenre(self.genre)
 						logging.debug('self.subjects=%s' % self.subjects)
-				if "Complete" in l:
-					self.storyStatus = 'Completed'
-				else:
-					self.storyStatus = 'In-Progress'
 			elif l.find("<SELECT title='chapter navigation'") != -1:
 				if len(urls) > 0:
 					continue

From 30455bfda2207f5681c3f1fb3b7e39249246dd3d Mon Sep 17 00:00:00 2001
From: wsuetholz <wsuetholz@localhost>
Date: Tue, 30 Nov 2010 12:13:00 -0600
Subject: [PATCH 90/94] Updated the processing for fictionpress.com of the
 information line to correctly extract the Updated and Published dates, and
 the Completion status

---
 fanficdownloader/fpcom.py | 66 ++++++++++++++++++++-------------------
 1 file changed, 34 insertions(+), 32 deletions(-)

diff --git a/fanficdownloader/fpcom.py b/fanficdownloader/fpcom.py
index 471c0b85..fcf4a7ac 100644
--- a/fanficdownloader/fpcom.py
+++ b/fanficdownloader/fpcom.py
@@ -136,6 +136,38 @@ class FPCom(FanfictionSiteAdapter):
 				self.addSubject(subj)
 		return True
 	
+	def _processInfoLine(self, line):
+		have_lang = False
+		words = line.split(' - ')
+		if words is not None:
+			for word in words:
+				if word.find(': ') != -1:
+					sds = word.split(': ')
+					if sds is not None and len(sds) > 1:
+						if sds[0] == 'Updated':
+							self.storyUpdated = datetime.datetime.fromtimestamp(time.mktime(time.strptime(sds[1].strip(' '), "%m-%d-%y")))
+							logging.debug('self.storyUpdated=%s' % self.storyUpdated)
+						elif sds[0] == 'Published':
+							self.storyPublished = datetime.datetime.fromtimestamp(time.mktime(time.strptime(sds[1].strip(' '), "%m-%d-%y")))
+							logging.debug('self.storyPublished=%s' % self.storyPublished)
+						elif sds[0] == 'Reviews':
+							reviews = sds[1] 
+							logging.debug('reviews=%s' % reviews)							
+				elif word.find('Complete') != -1:
+					self.storyStatus = 'Completed'
+					logging.debug('self.storyStatus=%s' % self.storyStatus)
+				elif not have_lang:
+					have_lang = True
+					language = word
+					logging.debug('language=%s' % language)
+				else:
+					self.category = word
+					logging.debug('self.category=%s' % self.category)
+					sgs = self.category.split('/')
+					for sg in sgs:
+						self.addSubject(sg)
+					logging.debug('self.subjects=%s' % self.subjects)
+		
 	def extractIndividualUrls(self):
 		data = ''
 		try:
@@ -250,39 +282,9 @@ class FPCom(FanfictionSiteAdapter):
 							self.storyRating = ss[1]
 							logging.debug('self.storyRating=%s' % self.storyRating)
 					if ll > 3:
-						ss = tdas[3].split(' - ')
-						if ss is not None:
-							lls = len(ss)
-							if lls > 1:
-								language = ss[1]
-								logging.debug('language=%s' % language)
-							if lls > 2:
-								self.category = ss[2]
-								logging.debug('self.category=%s' % self.category)
-								sgs = self.category.split('/')
-								for sg in sgs:
-									self.addSubject(sg)
-								logging.debug('self.subjects=%s' % self.subjects)
-							if lls > 3 and ss[3].strip() == 'Reviews:' and ll > 4:
-								reviews = tdas[4] 
-								logging.debug('reviews=%s' % reviews)
+						self._processInfoLine (tdas[3])
 					if ll > 5:
-						ss = tdas[5].split(' - ')
-						if ss is not None:
-							lls = len(ss)
-							if lls > 1:
-								sds = ss[1].split(': ')
-								if sds is not None and len(sds) > 1 and sds[0] == 'Published':
-									self.storyPublished = datetime.datetime.fromtimestamp(time.mktime(time.strptime(sds[1].strip(' '), "%m-%d-%y")))
-									logging.debug('self.storyPublished=%s' % self.storyPublished)
-							lls = len(ss)
-							if lls > 2:
-								sds = ss[2].split(': ')
-								if sds is not None and len(sds) > 1 and sds[0] == 'Updated':
-									self.storyUpdated = datetime.datetime.fromtimestamp(time.mktime(time.strptime(sds[1].strip(' '), "%m-%d-%y")))
-									logging.debug('self.storyUpdated=%s' % self.storyUpdated)
-									
-
+						self._processInfoLine (tdas[5])
 
 		self.authorURL = 'http://' + self.host + '/u/' + self.authorId
 

From 2f0bb31e2487966af862566477d83ad68837e954 Mon Sep 17 00:00:00 2001
From: wsuetholz <wsuetholz@localhost>
Date: Tue, 30 Nov 2010 13:56:18 -0600
Subject: [PATCH 91/94] Take out adding the id: field as a subject.

---
 fanficdownloader/fpcom.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/fanficdownloader/fpcom.py b/fanficdownloader/fpcom.py
index fcf4a7ac..ad89b37e 100644
--- a/fanficdownloader/fpcom.py
+++ b/fanficdownloader/fpcom.py
@@ -141,7 +141,7 @@ class FPCom(FanfictionSiteAdapter):
 		words = line.split(' - ')
 		if words is not None:
 			for word in words:
-				if word.find(': ') != -1:
+				if word.find(':') != -1:
 					sds = word.split(': ')
 					if sds is not None and len(sds) > 1:
 						if sds[0] == 'Updated':

From f114a2438eee22034b89712ff3d088bb63445df8 Mon Sep 17 00:00:00 2001
From: wsuetholz <wsuetholz@localhost>
Date: Tue, 30 Nov 2010 14:06:12 -0600
Subject: [PATCH 92/94] This one might be controversial..

Since none of the ebook readers are really designed for updatable stories, I added tags/subjects for Last Update Year/Month and Last Update. At least in FBReader I can sort by these and see all stories updated in a certain month or on a certain date, which lets you know when to reread a story.
---
 fanficdownloader/output.py | 9 +++++++++
 1 file changed, 9 insertions(+)

diff --git a/fanficdownloader/output.py b/fanficdownloader/output.py
index b5a1ff8a..98c93827 100644
--- a/fanficdownloader/output.py
+++ b/fanficdownloader/output.py
@@ -337,6 +337,9 @@ class EPubFanficWriter(FanficWriter):
 		createda = self.adapter.getStoryCreated().strftime("%Y-%m-%d %H:%M:%S")
 		created = self.adapter.getStoryCreated().strftime("%Y-%m-%d")
 		updated = self.adapter.getStoryUpdated().strftime("%Y-%m-%d")
+		updateyy = self.adapter.getStoryUpdated().strftime("%Y")
+		updatemm = self.adapter.getStoryUpdated().strftime("%m")
+		updatedd = self.adapter.getStoryUpdated().strftime("%d")
 		calibre = self.adapter.getStoryUpdated().strftime("%Y-%m-%dT%H:%M:%S")
 		
 		description = self.adapter.getStoryDescription()
@@ -387,6 +390,12 @@ class EPubFanficWriter(FanficWriter):
 			i = i + 1
 		if (i <= 0):
 			self._writeFile(opfFilePath, CONTENT_SUBJECT % "FanFiction")
+		
+		subj = "Last Update Year/Month: " + updateyy + "/" + updatemm
+		self._writeFile(opfFilePath, CONTENT_SUBJECT % subj)
+
+		subj = "Last Update: " + updateyy + "/" + updatemm + "/" + updatedd
+		self._writeFile(opfFilePath, CONTENT_SUBJECT % subj)
 
 		self._writeFile(opfFilePath, CONTENT_END_METADATA % (self.adapter.getPublisher(), self.adapter.getUUID(), self.adapter.getStoryURL(), self.adapter.getStoryURL(), self.adapter.getStoryUserRating()))
 #		print >> opf, CONTENT_START % (uuid.uuid4().urn, self.storyTitle, self.authorName)

From c6b79cb57bc42ec3a60e40fc8f24179d6592d482 Mon Sep 17 00:00:00 2001
From: wsuetholz <wsuetholz@localhost>
Date: Tue, 30 Nov 2010 15:11:20 -0600
Subject: [PATCH 93/94] Changed the "Title Page" reference in the TOC and
 CONTENT epub files to be title_page instead.

---
 fanficdownloader/output.py | 2 +-
 1 file changed, 1 insertion(+), 1 deletion(-)

diff --git a/fanficdownloader/output.py b/fanficdownloader/output.py
index 98c93827..da7503e1 100644
--- a/fanficdownloader/output.py
+++ b/fanficdownloader/output.py
@@ -406,7 +406,7 @@ class EPubFanficWriter(FanficWriter):
 
 		t = "Title Page"
 		f = "title_page.xhtml"
-		chapterId = "Title Page"		
+		chapterId = "title_page"		
 		self._writeFile(tocFilePath, TOC_ITEM % (chapterId, i, t, f))
 		self._writeFile(opfFilePath, CONTENT_ITEM % (chapterId, f))
 		

From 8f58164ddea94731be7caef9f415838919d11f47 Mon Sep 17 00:00:00 2001
From: retiefjimm <retiefjimm@gmail.com>
Date: Thu, 2 Dec 2010 17:36:52 -0600
Subject: [PATCH 94/94] Added tag fanficdownloader-0.4 for changeset
 f23fd0e4cbc3