suballpages

git-svn-id: https://wikiteam.googlecode.com/svn/trunk@4 31edc4fc-5e31-b4c4-d58b-c8bc928bcb95
pull/117/head
emijrp 13 years ago
parent 4f8bd2fbf2
commit cc9f064e51

@@ -81,7 +81,7 @@ def getAllPageTitles(domain='', namespaces=[]):
deep = 3 # 3 is the current deep of English Wikipedia for Special:Allpages, 3 levels
c = 0
checked_suballpages = []
-rawacum = ''
+rawacum = raw
while re.search(r_suballpages, raw) and c < deep:
#load sub-Allpages
m = re.compile(r_suballpages).finditer(raw)
@@ -150,8 +150,8 @@ def cleanXML(xml=''):
return xml
if __name__ == '__main__':
-domain = 'http://archiveteam.org/index.php' # 'http://en.wikipedia.org/w'
-#domain = 'http://wikanda.cadizpedia.eu/w/index.php' # 'http://en.wikipedia.org/w'
+#domain = 'http://archiveteam.org/index.php' # 'http://en.wikipedia.org/w'
+domain = 'http://wikanda.cadizpedia.eu/w/index.php' # 'http://en.wikipedia.org/w'
curonly = False
namespaces = [0]

Loading…
Cancel
Save