diff --git a/.vscode/settings.json b/.vscode/settings.json
new file mode 100644
index 00000000..b2a92142
--- /dev/null
+++ b/.vscode/settings.json
@@ -0,0 +1,10 @@
+{
+ "python.analysis.extraPaths": [
+ ".",
+ "./poster",
+ "./tests",
+ "./wikitools",
+ "/Library/Frameworks/Python.framework/Versions/3.8/lib/python3.8/site-packages"
+ ],
+ "python.pythonPath": "/usr/local/bin/python3.8"
+}
\ No newline at end of file
diff --git a/dumpgenerator.py b/dumpgenerator.py
index 536cd0ed..f13b1a46 100755
--- a/dumpgenerator.py
+++ b/dumpgenerator.py
@@ -1,4 +1,4 @@
-#!/usr/bin/env python2
+#!/usr/bin/env python3
# -*- coding: utf-8 -*-
# dumpgenerator.py A generator of dumps for wikis
@@ -22,44 +22,38 @@
try:
from kitchen.text.converters import getwriter, to_unicode
except ImportError:
- print "Please install the kitchen module."
-import cookielib
-import cPickle
+ print ("Please install the kitchen module.")
+import http.cookiejar
+import pickle
import datetime
import sys
try:
import argparse
except ImportError:
- print "Please install the argparse module."
+ print ("Please install the argparse module.")
sys.exit(1)
import json
-try:
- from hashlib import md5
-except ImportError: # Python 2.4 compatibility
- from md5 import new as md5
+from hashlib import md5
import os
import re
-import subprocess
+# import subprocess
try:
import requests
except ImportError:
- print "Please install or update the Requests module."
+ print ("Please install or update the Requests module.")
sys.exit(1)
try:
import mwclient
except ImportError:
- print "Please install the mwclient module if you want to use --xmlrevisions."
+ print ("Please install the mwclient module if you want to use --xmlrevisions.")
try:
from lxml import etree
from lxml.builder import E
except ImportError:
- print "Please install the lxml module if you want to use --xmlrevisions."
+ print ("Please install the lxml module if you want to use --xmlrevisions.")
import time
import urllib
-try:
- from urlparse import urlparse, urlunparse
-except ImportError:
- from urllib.parse import urlparse, urlunparse
+from urllib.parse import urlparse, urlunparse
UTF8Writer = getwriter('utf8')
sys.stdout = UTF8Writer(sys.stdout)
@@ -83,22 +77,22 @@ def getVersion():
def truncateFilename(other={}, filename=''):
- """ Truncate filenames when downloading images with large filenames """
+ """Truncate filenames when downloading images with large filenames"""
return filename[:other['filenamelimit']] + \
md5(filename.encode('utf-8')).hexdigest() + '.' + filename.split('.')[-1]
def delay(config={}, session=None):
- """ Add a delay if configured for that """
+ """Add a delay if configured for that"""
if config['delay'] > 0:
- print 'Sleeping... %d seconds...' % (config['delay'])
+ print ('Sleeping... %d seconds...' % (config['delay']))
time.sleep(config['delay'])
def cleanHTML(raw=''):
- """ Extract only the real wiki content and remove rubbish """
- """ This function is ONLY used to retrieve page titles and file names when no API is available """
- """ DO NOT use this function to extract page content """
+ """Extract only the real wiki content and remove rubbish"""
+ """This function is ONLY used to retrieve page titles and file names when no API is available"""
+ """DO NOT use this function to extract page content"""
# different "tags" used by different MediaWiki versions to mark where
# starts and ends content
    if re.search('<!-- bodytext -->', raw):
@@ -118,8 +112,8 @@ def cleanHTML(raw=''):
        raw = raw.split('<body class=')[1].split('<div class="printfooter">')[0]
else:
- print raw[:250]
- print 'This wiki doesn\'t use marks to split content'
+ print (raw[:250])
+ print ('This wiki doesn\'t use marks to split content')
sys.exit()
return raw
@@ -129,37 +123,37 @@ def handleStatusCode(response):
if statuscode >= 200 and statuscode < 300:
return
- print "HTTP Error %d." % statuscode
+ print ("HTTP Error %d." % statuscode)
if statuscode >= 300 and statuscode < 400:
- print "Redirect should happen automatically: please report this as a bug."
- print response.url
+ print ("Redirect should happen automatically: please report this as a bug.")
+ print (response.url)
elif statuscode == 400:
- print "Bad Request: The wiki may be malfunctioning."
- print "Please try again later."
- print response.url
+ print ("Bad Request: The wiki may be malfunctioning.")
+ print ("Please try again later.")
+ print (response.url)
sys.exit(1)
elif statuscode == 401 or statuscode == 403:
- print "Authentication required."
- print "Please use --user and --pass."
- print response.url
+ print ("Authentication required.")
+ print ("Please use --user and --pass.")
+ print (response.url)
elif statuscode == 404:
- print "Not found. Is Special:Export enabled for this wiki?"
- print response.url
+ print ("Not found. Is Special:Export enabled for this wiki?")
+ print (response.url)
sys.exit(1)
elif statuscode == 429 or (statuscode >= 500 and statuscode < 600):
- print "Server error, max retries exceeded."
- print "Please resume the dump later."
- print response.url
+ print ("Server error, max retries exceeded.")
+ print ("Please resume the dump later.")
+ print (response.url)
sys.exit(1)
def getNamespacesScraper(config={}, session=None):
- """ Hackishly gets the list of namespaces names and ids from the dropdown in the HTML of Special:AllPages """
- """ Function called if no API is available """
+ """Hackishly gets the list of namespaces names and ids from the dropdown in the HTML of Special:AllPages"""
+ """Function called if no API is available"""
namespaces = config['namespaces']
namespacenames = {0: ''} # main is 0, no prefix
if namespaces:
@@ -190,12 +184,12 @@ def getNamespacesScraper(config={}, session=None):
namespaces = [0]
namespaces = list(set(namespaces)) # uniques
- print '%d namespaces found' % (len(namespaces))
+ print ('%d namespaces found' % (len(namespaces)))
return namespaces, namespacenames
def getNamespacesAPI(config={}, session=None):
- """ Uses the API to get the list of namespaces names and ids """
+ """Uses the API to get the list of namespaces names and ids"""
namespaces = config['namespaces']
namespacenames = {0: ''} # main is 0, no prefix
if namespaces:
@@ -213,9 +207,9 @@ def getNamespacesAPI(config={}, session=None):
try:
nsquery = result['query']['namespaces']
except KeyError:
- print "Error: could not get namespaces from the API request."
- print "HTTP %d" % r.status_code
- print r.text
+ print ("Error: could not get namespaces from the API request.")
+ print ("HTTP %d" % r.status_code)
+ print (r.text)
return None
if 'all' in namespaces:
@@ -241,22 +235,22 @@ def getNamespacesAPI(config={}, session=None):
namespaces = [0]
namespaces = list(set(namespaces)) # uniques
- print '%d namespaces found' % (len(namespaces))
+ print ('%d namespaces found' % (len(namespaces)))
return namespaces, namespacenames
def getPageTitlesAPI(config={}, session=None):
- """ Uses the API to get the list of page titles """
+ """Uses the API to get the list of page titles"""
titles = []
namespaces, namespacenames = getNamespacesAPI(
config=config, session=session)
for namespace in namespaces:
if namespace in config['exnamespaces']:
- print ' Skipping namespace = %d' % (namespace)
+ print (' Skipping namespace = %d' % (namespace))
continue
c = 0
- print ' Retrieving titles in the namespace %d' % (namespace)
+ print (' Retrieving titles in the namespace %d' % (namespace))
apiurl = urlparse(config['api'])
site = mwclient.Site(apiurl.netloc, apiurl.path.replace("api.php", ""), scheme=apiurl.scheme)
for page in site.allpages(namespace=namespace):
@@ -266,19 +260,19 @@ def getPageTitlesAPI(config={}, session=None):
yield title
if len(titles) != len(set(titles)):
- print 'Probably a loop, switching to next namespace'
+ print ('Probably a loop, switching to next namespace')
titles = list(set(titles))
delay(config=config, session=session)
- print ' %d titles retrieved in the namespace %d' % (c, namespace)
+ print (' %d titles retrieved in the namespace %d' % (c, namespace))
def getPageTitlesScraper(config={}, session=None):
- """ Scrape the list of page titles from Special:Allpages """
+ """Scrape the list of page titles from Special:Allpages"""
titles = []
namespaces, namespacenames = getNamespacesScraper(
config=config, session=session)
for namespace in namespaces:
- print ' Retrieving titles in the namespace', namespace
+ print (' Retrieving titles in the namespace', namespace)
url = '%s?title=Special:Allpages&namespace=%s' % (
config['index'], namespace)
r = session.get(url=url, timeout=30)
@@ -342,13 +336,13 @@ def getPageTitlesScraper(config={}, session=None):
checked_suballpages.append(name)
delay(config=config, session=session)
r = session.get(url=url, timeout=10)
- #print 'Fetching URL: ', url
+ #print ('Fetching URL: ', url)
raw = r.text
raw = cleanHTML(raw)
rawacum += raw # merge it after removed junk
- print ' Reading', name, len(raw), 'bytes', \
+ print (' Reading', name, len(raw), 'bytes', \
len(re.findall(r_suballpages, raw)), 'subpages', \
- len(re.findall(r_title, raw)), 'pages'
+ len(re.findall(r_title, raw)), 'pages')
delay(config=config, session=session)
oldfr = currfr
@@ -362,24 +356,24 @@ def getPageTitlesScraper(config={}, session=None):
if t not in titles:
titles.append(t)
c += 1
- print ' %d titles retrieved in the namespace %d' % (c, namespace)
+ print (' %d titles retrieved in the namespace %d' % (c, namespace))
return titles
def getPageTitles(config={}, session=None):
- """ Get list of page titles """
+ """Get list of page titles"""
# http://en.wikipedia.org/wiki/Special:AllPages
# http://archiveteam.org/index.php?title=Special:AllPages
# http://www.wikanda.es/wiki/Especial:Todas
- print 'Loading page titles from namespaces = %s' % (config['namespaces'] and ','.join([str(i) for i in config['namespaces']]) or 'None')
- print 'Excluding titles from namespaces = %s' % (config['exnamespaces'] and ','.join([str(i) for i in config['exnamespaces']]) or 'None')
+ print ('Loading page titles from namespaces = %s' % (config['namespaces'] and ','.join([str(i) for i in config['namespaces']]) or 'None'))
+ print ('Excluding titles from namespaces = %s' % (config['exnamespaces'] and ','.join([str(i) for i in config['exnamespaces']]) or 'None'))
titles = []
if 'api' in config and config['api']:
try:
titles = getPageTitlesAPI(config=config, session=session)
except:
- print "Error: could not get page titles from the API"
+ print ("Error: could not get page titles from the API")
titles = getPageTitlesScraper(config=config, session=session)
elif 'index' in config and config['index']:
titles = getPageTitlesScraper(config=config, session=session)
@@ -396,15 +390,15 @@ def getPageTitles(config={}, session=None):
# We can use sort -u in UNIX, but is it worth it?
titlesfile.write(u'--END--\n')
titlesfile.close()
- print 'Titles saved at...', titlesfilename
+ print ('Titles saved at...', titlesfilename)
- print '%d page titles loaded' % (c)
+ print ('%d page titles loaded' % (c))
return titlesfilename
def getImageNames(config={}, session=None):
- """ Get list of image names """
+ """Get list of image names"""
- print 'Retrieving image filenames'
+ print ('Retrieving image filenames')
images = []
if 'api' in config and config['api']:
images = getImageNamesAPI(config=config, session=session)
@@ -414,21 +408,21 @@ def getImageNames(config={}, session=None):
# images = list(set(images)) # it is a list of lists
images.sort()
- print '%d image names loaded' % (len(images))
+ print ('%d image names loaded' % (len(images)))
return images
def getXMLHeader(config={}, session=None):
- """ Retrieve a random page to extract XML headers (namespace info, etc) """
+ """Retrieve a random page to extract XML headers (namespace info, etc)"""
# get the header of a random page, to attach it in the complete XML backup
# similar to:
# if retrieving params['limit'] revisions fails, returns a current only version
# if all fail, returns the empty string
@@ -538,17 +532,17 @@ def getXMLPageCore(headers={}, params={}, config={}, session=None):
if c > 0 and c < maxretries:
wait = increment * c < maxseconds and increment * \
c or maxseconds # incremental until maxseconds
- print ' In attempt %d, XML for "%s" is wrong. Waiting %d seconds and reloading...' %(c, params['pages'], wait)
+ print (' In attempt %d, XML for "%s" is wrong. Waiting %d seconds and reloading...' %(c, params['pages'], wait))
time.sleep(wait)
# reducing server load requesting smallest chunks (if curonly then
# limit = 1 from mother function)
if params['limit'] > 1:
params['limit'] = params['limit'] / 2 # half
if c >= maxretries:
- print ' We have retried %d times' % (c)
- print ' MediaWiki error for "%s", network error or whatever...' % (params['pages'])
+ print (' We have retried %d times' % (c))
+ print (' MediaWiki error for "%s", network error or whatever...' % (params['pages']))
if config['failfast']:
- print "Exit, it will be for another time"
+ print ("Exit, it will be for another time")
sys.exit()
# If it's not already what we tried: our last chance, preserve only the last revision...
# config['curonly'] means that the whole dump is configured to save only the last,
@@ -556,7 +550,7 @@ def getXMLPageCore(headers={}, params={}, config={}, session=None):
# fallback, because it's set by the following if and passed to
# getXMLPageCore
if not config['curonly'] and not 'curonly' in params:
- print ' Trying to save only the last revision for this page...'
+ print (' Trying to save only the last revision for this page...')
params['curonly'] = 1
logerror(
config=config,
@@ -570,7 +564,7 @@ def getXMLPageCore(headers={}, params={}, config={}, session=None):
session=session
)
else:
- print ' Saving in the errors log, and skipping...'
+ print (' Saving in the errors log, and skipping...')
logerror(
config=config,
text=u'Error while retrieving the last revision of "%s". Skipping.' %
@@ -583,10 +577,10 @@ def getXMLPageCore(headers={}, params={}, config={}, session=None):
handleStatusCode(r)
xml = fixBOM(r)
except requests.exceptions.ConnectionError as e:
- print ' Connection error: %s'%(str(e[0]))
+ print (' Connection error: %s'%(str(e)))
xml = ''
except requests.exceptions.ReadTimeout as e:
- print ' Read timeout: %s'%(str(e[0]))
+ print (' Read timeout: %s'%(str(e)))
xml = ''
c += 1
@@ -594,7 +588,7 @@ def getXMLPageCore(headers={}, params={}, config={}, session=None):
def getXMLPage(config={}, title='', verbose=True, session=None):
- """ Get the full history (or current only) of a page """
+ """Get the full history (or current only) of a page"""
# if server errors occurs while retrieving the full page history, it may return [oldest OK versions] + last version, excluding middle revisions, so it would be partialy truncated
# http://www.mediawiki.org/wiki/Manual_talk:Parameters_to_Special:Export#Parameters_no_longer_in_use.3F
@@ -649,7 +643,7 @@ def getXMLPage(config={}, title='', verbose=True, session=None):
xml2 = getXMLPageCore(
params=params, config=config, session=session)
except MemoryError:
- print "The page's history exceeds our memory, halving limit."
+ print ("The page's history exceeds our memory, halving limit.")
params['limit'] = params['limit'] / 2
continue
@@ -659,11 +653,11 @@ def getXMLPage(config={}, title='', verbose=True, session=None):
# again the same XML, this wiki does not support params in
# Special:Export, offer complete XML up to X edits (usually
# 1000)
- print 'ATTENTION: This wiki does not allow some parameters in Special:Export, therefore pages with large histories may be truncated'
+ print ('ATTENTION: This wiki does not allow some parameters in Special:Export, therefore pages with large histories may be truncated')
truncated = True
break
else:
- """
+ """
Main Page
@@ -673,14 +667,14 @@ def getXMLPage(config={}, title='', verbose=True, session=None):
4180098322011-03-09T19:57:06Z
- """
+ """
# offset is OK in this wiki, merge with the previous chunk
# of this page history and continue
try:
                xml2 = xml2.split("</page>")[0]
                yield '  <revision>' + ('<revision>'.join(xml2.split('<revision>')[1:]))
except MemoryError:
- print "The page's history exceeds our memory, halving limit."
+ "The page's history exceeds our memory, halving limit."
params['limit'] = params['limit'] / 2
continue
xml = xml2
@@ -691,13 +685,13 @@ def getXMLPage(config={}, title='', verbose=True, session=None):
if verbose:
if (numberofedits == 1):
- print ' %s, 1 edit' % (title.strip())
+ print (' %s, 1 edit' % (title.strip()))
else:
- print ' %s, %d edits' % (title.strip(), numberofedits)
+ print (' %s, %d edits' % (title.strip(), numberofedits))
def makeXmlPageFromRaw(xml):
- """ Discard the metadata around a element in string"""
+ """Discard the metadata around a element in string"""
root = etree.XML(xml)
find = etree.XPath("//*[local-name() = 'page']")
# The tag will inherit the namespace, like:
@@ -707,7 +701,7 @@ def makeXmlPageFromRaw(xml):
def cleanXML(xml=''):
- """ Trim redundant info from the XML however it comes """
+ """Trim redundant info from the XML however it comes"""
# do not touch XML codification, leave AS IS
    if re.search(r'</siteinfo>\n', xml):
        xml = xml.split('</siteinfo>\n')[1]
@@ -717,7 +711,7 @@ def cleanXML(xml=''):
def generateXMLDump(config={}, titles=[], start=None, session=None):
- """ Generates a XML dump for a list of titles or from revision IDs """
+ """Generates a XML dump for a list of titles or from revision IDs"""
# TODO: titles is now unused.
header, config = getXMLHeader(config=config, session=session)
@@ -733,7 +727,7 @@ def generateXMLDump(config={}, titles=[], start=None, session=None):
print("WARNING: will try to start the download from title: {}".format(start))
xmlfile = open('%s/%s' % (config['path'], xmlfilename), 'a')
else:
- print 'Retrieving the XML for every page from the beginning'
+ print ('Retrieving the XML for every page from the beginning')
xmlfile = open('%s/%s' % (config['path'], xmlfilename), 'w')
xmlfile.write(header.encode('utf-8'))
try:
@@ -742,17 +736,17 @@ def generateXMLDump(config={}, titles=[], start=None, session=None):
numrevs = len(re.findall(r_timestamp, xml))
# Due to how generators work, it's expected this may be less
# TODO: get the page title and reuse the usual format "X title, y edits"
- print " %d more revisions exported" % numrevs
+ print (" %d more revisions exported" % numrevs)
xml = cleanXML(xml=xml)
xmlfile.write(xml.encode('utf-8'))
except AttributeError as e:
print(e)
- print "This API library version is not working"
+ print ("This API library version is not working")
sys.exit()
else:
- print 'Retrieving the XML for every page from "%s"' % (start and start or 'start')
+ print ('Retrieving the XML for every page from "%s"' % (start and start or 'start'))
if start:
- print "Removing the last chunk of past XML dump: it is probably incomplete."
+ print ("Removing the last chunk of past XML dump: it is probably incomplete.")
for i in reverse_readline('%s/%s' % (config['path'], xmlfilename), truncate=True):
pass
else:
@@ -773,7 +767,7 @@ def generateXMLDump(config={}, titles=[], start=None, session=None):
continue
delay(config=config, session=session)
if c % 10 == 0:
- print 'Downloaded %d pages' % (c)
+ print ('Downloaded %d pages' % (c))
try:
for xml in getXMLPage(config=config, title=title, session=session):
xml = cleanXML(xml=xml)
@@ -791,7 +785,7 @@ def generateXMLDump(config={}, titles=[], start=None, session=None):
xmlfile.write(footer)
xmlfile.close()
- print 'XML dump saved at...', xmlfilename
+ print ('XML dump saved at...', xmlfilename)
def getXMLRevisions(config={}, session=None, allpages=False, start=None):
# FIXME: actually figure out the various strategies for each MediaWiki version
@@ -874,7 +868,7 @@ def getXMLRevisions(config={}, session=None, allpages=False, start=None):
for page in arvrequest['query']['allrevisions']:
for revision in page['revisions']:
revids.append(str(revision['revid']))
- print " %d more revisions listed, until %s" % (len(revids), revids[-1])
+ print (" %d more revisions listed, until %s" % (len(revids), revids[-1]))
# We can now get the XML for one revision at a time
# FIXME: we can actually get them in batches as we used to
@@ -922,7 +916,7 @@ def getXMLRevisions(config={}, session=None, allpages=False, start=None):
except (KeyError, mwclient.errors.InvalidResponse) as e:
print(e)
# TODO: check whether the KeyError was really for a missing arv API
- print "Warning. Could not use allrevisions. Wiki too old?"
+ print ("Warning. Could not use allrevisions. Wiki too old?")
if config['curonly']:
# The raw XML export in the API gets a title and gives the latest revision.
# We could also use the allpages API as generator but let's be consistent.
@@ -1022,7 +1016,7 @@ def getXMLRevisions(config={}, session=None, allpages=False, start=None):
if 'continue' in prequest.keys():
print("Getting more revisions for the page")
for key, value in prequest['continue']:
- params[key] = value
+ pparams[key] = value
elif 'query-continue' in prequest.keys():
rvstartid = prequest['query-continue']['revisions']['rvstartid']
pparams['rvstartid'] = rvstartid
@@ -1047,11 +1041,11 @@ def getXMLRevisions(config={}, session=None, allpages=False, start=None):
except mwclient.errors.MwClientError as e:
print(e)
- print "This mwclient version seems not to work for us. Exiting."
+ print ("This mwclient version seems not to work for us. Exiting.")
sys.exit()
def makeXmlFromPage(page):
- """ Output an XML document as a string from a page as in the API JSON """
+ """Output an XML document as a string from a page as in the API JSON"""
try:
p = E.page(
E.title(to_unicode(page['title'])),
@@ -1098,7 +1092,7 @@ def makeXmlFromPage(page):
return etree.tostring(p, pretty_print=True, encoding='unicode')
def readTitles(config={}, start=None, batch=False):
- """ Read title list from a file, from the title "start" """
+ """Read title list from a file, from the title "start" """
titlesfilename = '%s-%s-titles.txt' % (
domain2prefix(config=config), config['date'])
@@ -1173,7 +1167,7 @@ def reverse_readline(filename, buf_size=8192, truncate=False):
yield segment
def saveImageNames(config={}, images=[], session=None):
- """ Save image list in a file, including filename, url and uploader """
+ """Save image list in a file, including filename, url and uploader"""
imagesfilename = '%s-%s-images.txt' % (
domain2prefix(config=config), config['date'])
@@ -1193,11 +1187,11 @@ def saveImageNames(config={}, images=[], session=None):
imagesfile.write('\n--END--')
imagesfile.close()
- print 'Image filenames and URLs saved at...', imagesfilename
+ print ('Image filenames and URLs saved at...', imagesfilename)
def curateImageURL(config={}, url=''):
- """ Returns an absolute URL for an image, adding the domain if missing """
+ """Returns an absolute URL for an image, adding the domain if missing"""
if 'index' in config and config['index']:
# remove from :// (http or https) until the first / after domain
@@ -1207,7 +1201,7 @@ def curateImageURL(config={}, url=''):
domainalone = config['api'].split(
'://')[0] + '://' + config['api'].split('://')[1].split('/')[0]
else:
- print 'ERROR: no index nor API'
+ print ('ERROR: no index nor API')
sys.exit()
if url.startswith('//'): # Orain wikifarm returns URLs starting with //
@@ -1227,7 +1221,7 @@ def curateImageURL(config={}, url=''):
def getImageNamesScraper(config={}, session=None):
- """ Retrieve file list: filename, url, uploader """
+ """Retrieve file list: filename, url, uploader"""
# (?\d+)&'
@@ -1253,15 +1247,15 @@ def getImageNamesScraper(config={}, session=None):
ur'(?i)(allowed memory size of \d+ bytes exhausted|Call to a member function getURL)',
raw):
if limit > 10:
- print 'Error: listing %d images in a chunk is not possible, trying tiny chunks' % (limit)
+ print ('Error: listing %d images in a chunk is not possible, trying tiny chunks' % (limit))
limit = limit / 10
continue
elif retries > 0: # waste retries, then exit
retries -= 1
- print 'Retrying...'
+ print ('Retrying...')
continue
else:
- print 'No more retries, exit...'
+ print ('No more retries, exit...')
break
raw = cleanHTML(raw)
@@ -1309,7 +1303,7 @@ def getImageNamesScraper(config={}, session=None):
uploader = undoHTMLEntities(text=uploader)
uploader = urllib.unquote(uploader)
images.append([filename, url, uploader])
- # print filename, url
+ # print (filename, url)
if re.search(r_next, raw):
new_offset = re.findall(r_next, raw)[0]
@@ -1323,16 +1317,16 @@ def getImageNamesScraper(config={}, session=None):
offset = ''
if (len(images) == 1):
- print ' Found 1 image'
+ print (' Found 1 image')
else:
- print ' Found %d images' % (len(images))
+ print (' Found %d images' % (len(images)))
images.sort()
return images
def getImageNamesAPI(config={}, session=None):
- """ Retrieve file list: filename, url, uploader """
+ """Retrieve file list: filename, url, uploader"""
oldAPI = False
aifrom = '!'
images = []
@@ -1366,7 +1360,7 @@ def getImageNamesAPI(config={}, session=None):
aifrom = jsonimages['continue']['aicontinue']
elif 'aifrom' in jsonimages['continue']:
aifrom = jsonimages['continue']['aifrom']
- # print aifrom
+ # print (aifrom)
for image in jsonimages['query']['allimages']:
url = image['url']
@@ -1375,9 +1369,9 @@ def getImageNamesAPI(config={}, session=None):
# http://bugs.python.org/issue8136
if 'api' in config and ('.wikia.' in config['api'] or '.fandom.com' in config['api']):
#to avoid latest?cb=20120816112532 in filenames
- filename = unicode(urllib.unquote((re.sub('_', ' ', url.split('/')[-3])).encode('ascii', 'ignore')), 'utf-8')
+ filename = urllib.parse.unquote(re.sub('_', ' ', url.split('/')[-3]).encode('ascii', 'ignore').decode())
else:
- filename = unicode(urllib.unquote((re.sub('_', ' ', url.split('/')[-1])).encode('ascii', 'ignore')), 'utf-8')
+ filename = urllib.parse.unquote(re.sub('_', ' ', url.split('/')[-1]).encode('ascii', 'ignore').decode())
uploader = re.sub('_', ' ', image['user'])
images.append([filename, url, uploader])
else:
@@ -1416,8 +1410,8 @@ def getImageNamesAPI(config={}, session=None):
if 'gapfrom' in jsonimages['query-continue']['allpages']:
gapfrom = jsonimages[
'query-continue']['allpages']['gapfrom']
- # print gapfrom
- # print jsonimages['query']
+ # print (gapfrom)
+ # print (jsonimages['query'])
for image, props in jsonimages['query']['pages'].items():
url = props['imageinfo'][0]['url']
@@ -1433,15 +1427,15 @@ def getImageNamesAPI(config={}, session=None):
break
if (len(images) == 1):
- print ' Found 1 image'
+ print (' Found 1 image')
else:
- print ' Found %d images' % (len(images))
+ print (' Found %d images' % (len(images)))
return images
def undoHTMLEntities(text=''):
- """ Undo some HTML codes """
+ """Undo some HTML codes"""
# i guess only < > & " ' need conversion
# http://www.w3schools.com/html/html_entities.asp
@@ -1455,13 +1449,13 @@ def undoHTMLEntities(text=''):
def generateImageDump(config={}, other={}, images=[], start='', session=None):
- """ Save files and descriptions using a file list """
+ """Save files and descriptions using a file list"""
# fix use subdirectories md5
- print 'Retrieving images from "%s"' % (start and start or 'start')
+ print ('Retrieving images from "%s"' % (start and start or 'start'))
imagepath = '%s/images' % (config['path'])
if not os.path.isdir(imagepath):
- print 'Creating "%s" directory' % (imagepath)
+ print ('Creating "%s" directory' % (imagepath))
os.makedirs(imagepath)
c = 0
@@ -1482,7 +1476,7 @@ def generateImageDump(config={}, other={}, images=[], start='', session=None):
if len(filename2) > other['filenamelimit']:
# split last . (extension) and then merge
filename2 = truncateFilename(other=other, filename=filename2)
- print 'Filename is too long, truncating. Now it is:', filename2
+ print ('Filename is too long, truncating. Now it is:', filename2)
filename3 = u'%s/%s' % (imagepath, filename2)
imagefile = open(filename3, 'wb')
@@ -1543,13 +1537,13 @@ def generateImageDump(config={}, other={}, images=[], start='', session=None):
delay(config=config, session=session)
c += 1
if c % 10 == 0:
- print ' Downloaded %d images' % (c)
+ print (' Downloaded %d images' % (c))
- print 'Downloaded %d images' % (c)
+ print ('Downloaded %d images' % (c))
def saveLogs(config={}, session=None):
- """ Save Special:Log """
+ """Save Special:Log"""
# get all logs from Special:Log
"""parse
- """
+ """
delay(config=config, session=session)
def domain2prefix(config={}, session=None):
- """ Convert domain name to a valid prefix filename. """
+ """Convert domain name to a valid prefix filename."""
# At this point, both api and index are supposed to be defined
domain = ''
@@ -1589,30 +1583,30 @@ def domain2prefix(config={}, session=None):
def loadConfig(config={}, configfilename=''):
- """ Load config file """
+ """Load config file"""
try:
with open('%s/%s' % (config['path'], configfilename), 'r') as infile:
- config = cPickle.load(infile)
+ config = pickle.load(infile)
except:
- print 'There is no config file. we can\'t resume. Start a new dump.'
+ print ('There is no config file. we can\'t resume. Start a new dump.')
sys.exit()
return config
def saveConfig(config={}, configfilename=''):
- """ Save config file """
+ """Save config file"""
with open('%s/%s' % (config['path'], configfilename), 'w') as outfile:
- cPickle.dump(config, outfile)
+ pickle.dump(config, outfile)
def welcome():
message = ''
- """ Opening message """
+ """Opening message"""
message += "#" * 73
- message += """
+ message += """
# Welcome to DumpGenerator %s by WikiTeam (GPL v3) #
# More info at: https://github.com/WikiTeam/wikiteam #""" % (getVersion())
message += "\n"
@@ -1623,7 +1617,7 @@ def welcome():
message += "#" * 73
message += "\n"
message += "# Copyright (C) 2011-%d WikiTeam developers #\n" % (datetime.datetime.now().year)
- message += """
+ message += """
# This program is free software: you can redistribute it and/or modify #
# it under the terms of the GNU General Public License as published by #
# the Free Software Foundation, either version 3 of the License, or #
@@ -1645,11 +1639,11 @@ def welcome():
def bye():
- """ Closing message """
- print "---> Congratulations! Your dump is complete <---"
- print "If you found any bug, report a new issue here: https://github.com/WikiTeam/wikiteam/issues"
- print "If this is a public wiki, please, consider publishing this dump. Do it yourself as explained in https://github.com/WikiTeam/wikiteam/wiki/Tutorial#Publishing_the_dump or contact us at https://github.com/WikiTeam/wikiteam"
- print "Good luck! Bye!"
+ """Closing message"""
+ print ("---> Congratulations! Your dump is complete <---")
+ print ("If you found any bug, report a new issue here: https://github.com/WikiTeam/wikiteam/issues"
+ "If this is a public wiki, please, consider publishing this dump. Do it yourself as explained in https://github.com/WikiTeam/wikiteam/wiki/Tutorial#Publishing_the_dump or contact us at https://github.com/WikiTeam/wikiteam")
+ print ("Good luck! Bye!")
def getParameters(params=[]):
@@ -1738,37 +1732,37 @@ def getParameters(params=[]):
help="Avoid resuming, discard failing wikis quickly. Useful only for mass downloads.")
args = parser.parse_args()
- # print args
+ # print (args)
# Don't mix download params and meta info params
if (args.xml or args.images) and \
(args.get_wiki_engine):
- print 'ERROR: Don\'t mix download params and meta info params'
+ print ('ERROR: Don\'t mix download params and meta info params')
parser.print_help()
sys.exit(1)
# No download params and no meta info params? Exit
if (not args.xml and not args.images) and \
(not args.get_wiki_engine):
- print 'ERROR: Use at least one download param or meta info param'
+ print ('ERROR: Use at least one download param or meta info param')
parser.print_help()
sys.exit(1)
# Execute meta info params
if args.wiki:
if args.get_wiki_engine:
- print getWikiEngine(url=args.wiki)
+ print (getWikiEngine(url=args.wiki))
sys.exit()
# Create session
- cj = cookielib.MozillaCookieJar()
+ cj = http.cookiejar.MozillaCookieJar()
if args.cookies:
cj.load(args.cookies)
- print 'Using cookies from %s' % args.cookies
+ print ('Using cookies from %s' % args.cookies)
session = requests.Session()
try:
- from requests.packages.urllib3.util.retry import Retry
+ from urllib3.util.retry import Retry
from requests.adapters import HTTPAdapter
# Courtesy datashaman https://stackoverflow.com/a/35504626
__retries__ = Retry(total=5,
@@ -1787,8 +1781,8 @@ def getParameters(params=[]):
# check URLs
for url in [args.api, args.index, args.wiki]:
if url and (not url.startswith('http://') and not url.startswith('https://')):
- print url
- print 'ERROR: URLs must start with http:// or https://\n'
+ print (url)
+ print ('ERROR: URLs must start with http:// or https://\n')
parser.print_help()
sys.exit(1)
@@ -1804,7 +1798,7 @@ def getParameters(params=[]):
if not index:
index = index2
else:
- print 'ERROR: Unsupported wiki. Wiki engines supported are: MediaWiki'
+ print ('ERROR: Unsupported wiki. Wiki engines supported are: MediaWiki')
sys.exit(1)
else:
if api == '':
@@ -1812,8 +1806,8 @@ def getParameters(params=[]):
elif index == '':
index = '/'.join(api.split('/')[:-1]) + '/index.php'
- # print api
- # print index
+ # print (api)
+ # print (index)
index2 = None
if api:
@@ -1823,20 +1817,20 @@ def getParameters(params=[]):
# Replace the index URL we got from the API check
index2 = check[1]
api = checkedapi
- print 'API is OK: ' + checkedapi
+ print ('API is OK: ' + checkedapi)
else:
if index and not args.wiki:
- print 'API not available. Trying with index.php only.'
+ print ('API not available. Trying with index.php only.')
args.api = None
else:
- print 'Error in API. Please, provide a correct path to API'
+ print ('Error in API. Please, provide a correct path to API')
sys.exit(1)
if index and checkIndex(
index=index,
cookies=args.cookies,
session=session):
- print 'index.php is OK'
+ print ('index.php is OK')
else:
index = index2
if index and index.startswith('//'):
@@ -1845,7 +1839,7 @@ def getParameters(params=[]):
index=index,
cookies=args.cookies,
session=session):
- print 'index.php is OK'
+ print ('index.php is OK')
else:
try:
index = '/'.join(index.split('/')[:-1])
@@ -1855,16 +1849,16 @@ def getParameters(params=[]):
index=index,
cookies=args.cookies,
session=session):
- print 'index.php is OK'
+ print ('index.php is OK')
else:
- print 'Error in index.php.'
+ print ('Error in index.php.')
if not args.xmlrevisions:
- print 'Please, provide a correct path to index.php or use --xmlrevisions. Terminating.'
+ print ('Please, provide a correct path to index.php or use --xmlrevisions. Terminating.')
sys.exit(1)
# check user and pass (one requires both)
if (args.user and not args.password) or (args.password and not args.user):
- print 'ERROR: Both --user and --pass are required for authentication.'
+ print ('ERROR: Both --user and --pass are required for authentication.')
parser.print_help()
sys.exit(1)
@@ -1876,7 +1870,7 @@ def getParameters(params=[]):
if re.search(
r'[^\d, \-]',
args.namespaces) and args.namespaces.lower() != 'all':
- print "Invalid namespace values.\nValid format is integer(s) separated by commas"
+ print ("Invalid namespace values.\nValid format is integer(s) separated by commas")
sys.exit()
else:
ns = re.sub(' ', '', args.namespaces)
@@ -1888,19 +1882,19 @@ def getParameters(params=[]):
# Process namespace exclusions
if args.exnamespaces:
if re.search(r'[^\d, \-]', args.exnamespaces):
- print "Invalid namespace values.\nValid format is integer(s) separated by commas"
+ print ("Invalid namespace values.\nValid format is integer(s) separated by commas")
sys.exit(1)
else:
ns = re.sub(' ', '', args.exnamespaces)
if ns.lower() == 'all':
- print 'You cannot exclude all namespaces.'
+ print ('You cannot exclude all namespaces.')
sys.exit(1)
else:
exnamespaces = [int(i) for i in ns.split(',')]
# --curonly requires --xml
if args.curonly and not args.xml:
- print "--curonly requires --xml\n"
+ print ("--curonly requires --xml\n")
parser.print_help()
sys.exit(1)
@@ -1938,7 +1932,7 @@ def getParameters(params=[]):
def checkRetryAPI(api=None, retries=5, apiclient=False, session=None):
- """ Call checkAPI and mwclient if necessary """
+ """Call checkAPI and mwclient if necessary"""
retry = 0
retrydelay = 20
check = None
@@ -1947,9 +1941,9 @@ def checkRetryAPI(api=None, retries=5, apiclient=False, session=None):
check = checkAPI(api, session=session)
break
except requests.exceptions.ConnectionError as e:
- print 'Connection error: %s'%(str(e))
+ print ('Connection error: %s'%(str(e)))
retry += 1
- print "Start retry attempt %d in %d seconds."%(retry+1, retrydelay)
+ print ("Start retry attempt %d in %d seconds."%(retry+1, retrydelay))
time.sleep(retrydelay)
if check and apiclient:
@@ -1974,11 +1968,11 @@ def checkRetryAPI(api=None, retries=5, apiclient=False, session=None):
return check, api
def checkAPI(api=None, session=None):
- """ Checking API availability """
+ """Checking API availability"""
global cj
# handle redirects
for i in range(4):
- print 'Checking API...', api
+ print ('Checking API...', api)
r = session.get(
url=api,
params={
@@ -1993,7 +1987,7 @@ def checkAPI(api=None, session=None):
p = r.url
api = urlunparse([p.scheme, p.netloc, p.path, '', '', ''])
elif r.status_code > 400:
- print "MediaWiki API URL not found or giving error: HTTP %d" % r.status_code
+ print ("MediaWiki API URL not found or giving error: HTTP %d" % r.status_code)
return False
if "MediaWiki API is not enabled for this site." in r.text:
return False
@@ -2006,33 +2000,33 @@ def checkAPI(api=None, session=None):
result['query']['general']['script']
return ( True, index, api )
except KeyError:
- print "MediaWiki API seems to work but returned no index URL"
+ print ("MediaWiki API seems to work but returned no index URL")
return (True, None, api)
except ValueError:
- print repr(r.text)
- print "MediaWiki API returned data we could not parse"
+ print (repr(r.text))
+ print ("MediaWiki API returned data we could not parse")
return False
return False
def checkIndex(index=None, cookies=None, session=None):
- """ Checking index.php availability """
+ """Checking index.php availability"""
r = session.post(url=index, data={'title': 'Special:Version'}, timeout=30)
if r.status_code >= 400:
print("ERROR: The wiki returned status code HTTP {}".format(r.status_code))
return False
raw = r.text
- print 'Checking index.php...', index
+ print ('Checking index.php...', index)
# Workaround for issue 71
if re.search(
r'(Special:Badtitle|class="permissions-errors"|"wgCanonicalSpecialPageName":"Badtitle"|Login Required)',
raw) and not cookies:
- print "ERROR: This wiki requires login and we are not authenticated"
+ print ("ERROR: This wiki requires login and we are not authenticated")
return False
if re.search(
r'(page-Index_php|"wgPageName":"Index.php"|"firstHeading">Index.php)',
raw):
- print "Looks like the page called Index.php, not index.php itself"
+ print ("Looks like the page called Index.php, not index.php itself")
return False
if re.search(
r'(This wiki is powered by|
|meta name="generator" content="MediaWiki)',
@@ -2042,7 +2036,7 @@ def checkIndex(index=None, cookies=None, session=None):
def removeIP(raw=''):
- """ Remove IP from HTML comments """
+ """Remove IP from HTML comments """
raw = re.sub(r'\d+\.\d+\.\d+\.\d+', '0.0.0.0', raw)
# http://www.juniper.net/techpubs/software/erx/erx50x/swconfig-routing-vol1/html/ipv6-config5.html
@@ -2074,10 +2068,10 @@ def fixBOM(request):
def checkXMLIntegrity(config={}, titles=[], session=None):
- """ Check XML dump integrity, to detect broken XML chunks """
+ """Check XML dump integrity, to detect broken XML chunks"""
return
- print 'Verifying dump...'
+ print ('Verifying dump...')
checktitles = 0
checkpageopen = 0
checkpageclose = 0
@@ -2107,7 +2101,7 @@ def checkXMLIntegrity(config={}, titles=[], session=None):
if (checktitles == checkpageopen and checktitles == checkpageclose and checkrevisionopen == checkrevisionclose):
pass
else:
- print 'XML dump seems to be corrupted.'
+ print ('XML dump seems to be corrupted.')
reply = ''
if config['failfast']:
reply = 'yes'
@@ -2116,12 +2110,12 @@ def checkXMLIntegrity(config={}, titles=[], session=None):
if reply.lower() in ['yes', 'y']:
generateXMLDump(config=config, titles=titles, session=session)
elif reply.lower() in ['no', 'n']:
- print 'Not generating a new dump.'
+ print ('Not generating a new dump.')
def createNewDump(config={}, other={}):
images = []
- print 'Trying generating a new dump into a new directory...'
+ print ('Trying generating a new dump into a new directory...')
if config['xml']:
getPageTitles(config=config, session=other['session'])
titles=readTitles(config)
@@ -2144,7 +2138,7 @@ def createNewDump(config={}, other={}):
def resumePreviousDump(config={}, other={}):
images = []
- print 'Resuming previous dump process...'
+ print ('Resuming previous dump process...')
if config['xml']:
titles=readTitles(config)
try:
@@ -2160,9 +2154,9 @@ def resumePreviousDump(config={}, other={}):
lasttitle = '' # probably file does not exists
if lasttitle == '--END--':
# titles list is complete
- print 'Title list was completed in the previous session'
+ print ('Title list was completed in the previous session')
else:
- print 'Title list is incomplete. Reloading...'
+ print ('Title list is incomplete. Reloading...')
# do not resume, reload, to avoid inconsistences, deleted pages or
# so
getPageTitles(config=config, session=other['session'])
@@ -2194,10 +2188,10 @@ def resumePreviousDump(config={}, other={}):
pass # probably file does not exists
if xmliscomplete:
- print 'XML dump was completed in the previous session'
+ print ('XML dump was completed in the previous session')
elif lastxmltitle:
# resuming...
- print 'Resuming XML dump from "%s"' % (lastxmltitle)
+ print ('Resuming XML dump from "%s"' % (lastxmltitle))
titles = readTitles(config, start=lastxmltitle)
generateXMLDump(
config=config,
@@ -2206,7 +2200,7 @@ def resumePreviousDump(config={}, other={}):
session=other['session'])
else:
# corrupt? only has XML header?
- print 'XML is corrupt? Regenerating...'
+ print ('XML is corrupt? Regenerating...')
titles = readTitles(config)
generateXMLDump(
config=config, titles=titles, session=other['session'])
@@ -2222,7 +2216,7 @@ def resumePreviousDump(config={}, other={}):
config=config),
config['date']),
'r')
- raw = unicode(f.read(), 'utf-8').strip()
+ raw = f.read().strip()
lines = raw.split('\n')
for l in lines:
if re.search(r'\t', l):
@@ -2232,9 +2226,9 @@ def resumePreviousDump(config={}, other={}):
except:
pass # probably file does not exists
if lastimage == u'--END--':
- print 'Image list was completed in the previous session'
+ print ('Image list was completed in the previous session')
else:
- print 'Image list is incomplete. Reloading...'
+ print ('Image list is incomplete. Reloading...')
# do not resume, reload, to avoid inconsistences, deleted images or
# so
images = getImageNames(config=config, session=other['session'])
@@ -2261,10 +2255,10 @@ def resumePreviousDump(config={}, other={}):
complete = False
break
c += 1
- print '%d images were found in the directory from a previous session' % (c)
+ print ('%d images were found in the directory from a previous session' % (c))
if complete:
# image dump is complete
- print 'Image dump was completed in the previous session'
+ print ('Image dump was completed in the previous session')
else:
# we resume from previous image, which may be corrupted (or missing
# .desc) by the previous session ctrl-c or abort
@@ -2281,12 +2275,12 @@ def resumePreviousDump(config={}, other={}):
def saveSpecialVersion(config={}, session=None):
- """ Save Special:Version as .html, to preserve extensions details """
+ """Save Special:Version as .html, to preserve extensions details"""
if os.path.exists('%s/Special:Version.html' % (config['path'])):
- print 'Special:Version.html exists, do not overwrite'
+ print ('Special:Version.html exists, do not overwrite')
else:
- print 'Downloading Special:Version with extensions and other related info'
+ print ('Downloading Special:Version with extensions and other related info')
r = session.post(
url=config['index'], params={'title': 'Special:Version'}, timeout=10)
raw = r.text
@@ -2297,12 +2291,12 @@ def saveSpecialVersion(config={}, session=None):
def saveIndexPHP(config={}, session=None):
- """ Save index.php as .html, to preserve license details available at the botom of the page """
+ """Save index.php as .html, to preserve license details available at the botom of the page"""
if os.path.exists('%s/index.html' % (config['path'])):
- print 'index.html exists, do not overwrite'
+ print ('index.html exists, do not overwrite')
else:
- print 'Downloading index.php (Main Page) as index.html'
+ print ('Downloading index.php (Main Page) as index.html')
r = session.post(url=config['index'], params={}, timeout=10)
raw = r.text
delay(config=config, session=session)
@@ -2311,13 +2305,13 @@ def saveIndexPHP(config={}, session=None):
outfile.write(raw.encode('utf-8'))
def saveSiteInfo(config={}, session=None):
- """ Save a file with site info """
+ """Save a file with site info"""
if config['api']:
if os.path.exists('%s/siteinfo.json' % (config['path'])):
- print 'siteinfo.json exists, do not overwrite'
+ print ('siteinfo.json exists, do not overwrite')
else:
- print 'Downloading site info as siteinfo.json'
+ print ('Downloading site info as siteinfo.json')
# MediaWiki 1.13+
r = session.get(
@@ -2356,7 +2350,7 @@ def saveSiteInfo(config={}, session=None):
def avoidWikimediaProjects(config={}, other={}):
- """ Skip Wikimedia projects and redirect to the dumps website """
+ """Skip Wikimedia projects and redirect to the dumps website"""
# notice about wikipedia dumps
url = ''
@@ -2367,15 +2361,15 @@ def avoidWikimediaProjects(config={}, other={}):
if re.findall(
r'(?i)(wikipedia|wikisource|wiktionary|wikibooks|wikiversity|wikimedia|wikispecies|wikiquote|wikinews|wikidata|wikivoyage)\.org',
url):
- print 'PLEASE, DO NOT USE THIS SCRIPT TO DOWNLOAD WIKIMEDIA PROJECTS!'
- print 'Download the dumps from http://dumps.wikimedia.org'
+ print ('PLEASE, DO NOT USE THIS SCRIPT TO DOWNLOAD WIKIMEDIA PROJECTS!')
+ print ('Download the dumps from http://dumps.wikimedia.org')
if not other['force']:
- print 'Thanks!'
+ print ('Thanks!')
sys.exit()
def getWikiEngine(url=''):
- """ Returns the wiki engine of a URL, if known """
+ """Returns the wiki engine of a URL, if known"""
session = requests.Session()
session.headers.update({'User-Agent': getUserAgent()})
@@ -2452,13 +2446,13 @@ def getWikiEngine(url=''):
elif re.search(ur'(?im)(