launcher for batch downloads

git-svn-id: https://wikiteam.googlecode.com/svn/trunk@446 31edc4fc-5e31-b4c4-d58b-c8bc928bcb95
pull/117/head
emijrp 12 years ago
parent 657577cc37
commit 2df1ffa9a0

@ -0,0 +1,48 @@
#!/usr/bin/python
# -*- coding: utf-8 -*-
# Copyright (C) 2011-2012 WikiTeam
# This program is free software: you can redistribute it and/or modify
# it under the terms of the GNU General Public License as published by
# the Free Software Foundation, either version 3 of the License, or
# (at your option) any later version.
#
# This program is distributed in the hope that it will be useful,
# but WITHOUT ANY WARRANTY; without even the implied warranty of
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
# GNU General Public License for more details.
#
# You should have received a copy of the GNU General Public License
# along with this program. If not, see <http://www.gnu.org/licenses/>.
import os
import re
import subprocess
import sys
import time
# Batch launcher: for every wiki listed in the file given as the first
# command-line argument, run ../dumpgenerator.py and then pack the resulting
# dump directory with 7z.


def read_wiki_list(path):
    """Return the wiki base URLs listed in *path*, one per line.

    Surrounding whitespace is stripped and blank lines are dropped, so an
    empty line in the list does not turn into a bogus wiki entry.
    """
    with open(path, 'r') as listfile:
        stripped = [line.strip() for line in listfile.read().splitlines()]
    return [line for line in stripped if line]


def wiki_name_from_url(wiki):
    """Derive the directory-name prefix used to locate the dump of *wiki*.

    The scheme (the part before '://') is dropped when present, a leading
    'www.' and every dot are removed, and dashes become underscores, e.g.
    'http://www.my-wiki.org' -> 'my_wikiorg'.
    """
    parts = wiki.split('://')
    # An entry without a scheme has a single part; indexing [1] blindly
    # would raise IndexError and abort the whole batch.
    host = parts[1] if len(parts) > 1 else parts[0]
    name = re.sub(r'(\.|^www\.)', '', host)
    return name.replace('-', '_')


def find_wiki_dir(wikiname, root='.'):
    """Return the directory directly under *root* whose name starts with *wikiname*.

    Only the immediate children of *root* are listed; the tree below them is
    never traversed.  Returns '' when nothing matches or when *wikiname* is
    empty (an empty prefix would otherwise match every directory).  When
    several directories match, the lexicographically last one is returned so
    the result does not depend on directory listing order.
    """
    if not wikiname:
        return ''
    matches = sorted(
        entry for entry in os.listdir(root)
        if entry.startswith(wikiname)
        and os.path.isdir(os.path.join(root, entry))
    )
    return matches[-1] if matches else ''


def _run(args):
    """Run the command *args* (a list) without a shell and return its exit status.

    Returns -1, after reporting on stderr, when the program cannot be started,
    so one missing tool does not abort the rest of the batch.
    """
    try:
        return subprocess.call(args)
    except OSError as exc:
        sys.stderr.write('Could not run %s: %s\n' % (args[0], exc))
        return -1


def compress_dump(wikidir, prefix):
    """Print tag counts for the dump in *wikidir* and pack it into two 7z archives.

    Both archives are written to the parent of *wikidir*:
    '<prefix>-wikidump.7z' (history, titles, image list, images/ and the
    auxiliary files) and '<prefix>-history.xml.7z' (the same without the
    image list and images/).  The working directory is restored afterwards
    even if a step raises.
    """
    start = os.getcwd()
    os.chdir(wikidir)
    try:
        print('Changed directory to %s' % os.getcwd())
        # Counts of lines holding <title>, <page>, </page>, <revision> and
        # </revision> in each XML file -- presumably a quick integrity
        # check.  The command is a constant string, so the shell (needed for
        # the *.xml glob) sees no external input.
        os.system('grep "<title>" *.xml -c;grep "<page>" *.xml -c;grep "</page>" *.xml -c;grep "<revision>" *.xml -c;grep "</revision>" *.xml -c')
        _run(['7z', 'a', '../%s-wikidump.7z' % prefix,
              '%s-history.xml' % prefix, '%s-titles.txt' % prefix,
              '%s-images.txt' % prefix, 'index.html',
              'Special:Version.html', 'errors.log', 'images/'])
        _run(['7z', 'a', '../%s-history.xml.7z' % prefix,
              '%s-history.xml' % prefix, '%s-titles.txt' % prefix,
              'index.html', 'Special:Version.html', 'errors.log'])
    finally:
        os.chdir(start)
    print('Changed directory to %s' % os.getcwd())


def main(argv=None):
    """Dump and archive every wiki listed in the file named by argv[1].

    For each entry, '../dumpgenerator.py' is run against '<entry>/api.php'
    with --xml --images; then the directory in the current working directory
    whose name starts with the entry's derived name is compressed.  Returns
    0 on completion and 1 when no list file was given.
    """
    if argv is None:
        argv = sys.argv
    if len(argv) < 2:
        prog = argv[0] if argv else 'launcher'
        sys.stderr.write('Usage: %s <file with one wiki URL per line>\n' % prog)
        return 1

    for wiki in read_wiki_list(argv[1]):
        # Argument list instead of a shell string: the URL comes from an
        # external file and must not be interpreted by a shell.
        _run(['python', '../dumpgenerator.py',
              '--api=%s/api.php' % wiki, '--xml', '--images'])
        wikidir = find_wiki_dir(wiki_name_from_url(wiki))
        prefix = wikidir.split('-wikidump')[0]
        if wikidir and prefix:
            compress_dump(wikidir, prefix)
            time.sleep(1)
    return 0


if __name__ == '__main__':
    sys.exit(main())

@ -35,7 +35,6 @@ TODO:
* basic: GUI to download just a wiki
* advanced: batch downloads, upload to Internet Archive or anywhere
"""
wikifarms = {

Loading…
Cancel
Save