Skip to content

Commit

Permalink
working
Browse files (browse the repository at this point in the history)
  • Loading branch information
h4ck3rm1k3 committed Jan 23, 2016
1 parent c2591c3 commit 8adb792
Show file tree
Hide file tree
Showing 4 changed files with 21 additions and 5 deletions.
8 changes: 7 additions & 1 deletion dumpgenerator.py
Original file line number Diff line number Diff line change
Expand Up @@ -135,9 +135,15 @@ def getNamespaces(config={}):

def getSDTitles(site):
titles = []
for x in (
for x in (
'AfD_debates',
'Articles for deletion',
'Miscellaneous_pages_for_deletion',
'Templates_for_deletion',
'All articles proposed for deletion',
'Declined_AfC_submissions',
"Proposed_deletion",
"Proposed deletions needing attention",
"Expired_proposed_deletions",
'Candidates_for_speedy_deletion_as_hoaxes',
'Candidates_for_speedy_deletion_as_importance_or_significance_not_asserted',
Expand Down
11 changes: 11 additions & 0 deletions families/wikipedia_family.py
Original file line number Diff line number Diff line change
Expand Up @@ -950,6 +950,17 @@ def __init__(self):
'en': u'Draft talk',
}

self.namespaces[710] = {
'en': u'TimedText',
'pt': u'TimedText',
}

self.namespaces[711] = {
'en': u'TimedText talk',
'pt': u'TimedText talk',
}


self.category_redirect_templates = {
'_default': (),
'ar': (u'تحويل تصنيف',
Expand Down
2 changes: 1 addition & 1 deletion process.py
Original file line number Diff line number Diff line change
Expand Up @@ -8,7 +8,7 @@
path = './'
for infile in glob.glob( os.path.join(path, '*') ):
print "current file is: " + infile
match = re.search(r'(\d\d\d\d)(\d\d)(\d\d)(\d\d)(\d\d)(\d\d)',infile)
#match = re.search(r'(\d\d\d\d)(\d\d)(\d\d)(\d\d)(\d\d)(\d\d)',infile)
match = re.search(r'w\-(\d+)\-wiki',infile)
# match = re.search(r'.+(dddddddddddddd).+',infile)
# match = re.search(r'.+(\dddddddddddddd).+',infile)
Expand Down
5 changes: 2 additions & 3 deletions runexport.sh
Original file line number Diff line number Diff line change
@@ -1,12 +1,11 @@
# runexport.sh: run dumpgenerator.py and then process.py from the wikiteam
# data directory, then delete the enwikipedia* entries left in that directory.
#
# NOTE(review): this listing comes from a diff rendered without +/- markers
# (reported as 2 additions & 3 deletions), so old and new lines are mixed.
# Presumably the two `cd` lines and `#pwd` are the removed side and
# `pushd`/`popd` the added side -- confirm against the repository.

# Abort-on-error is left disabled: a failing step does not stop the script.
#set -e

# Put the wikiteam directory on Python's module search path for the
# python commands below.
export PYTHONPATH=$HOME/experiments/wikiteam/
# Both commands switch to the data directory; pushd also saves the current
# directory on the directory stack so the later popd can return to it.
cd ${HOME}/experiments/wikiteam/data
pushd ${HOME}/experiments/wikiteam/data
# Step 1: run the dump generator with the data directory as working directory.
python $HOME/experiments/wikiteam/dumpgenerator.py

echo going to run process
cd ${HOME}/experiments/wikiteam/data
#pwd
# Step 2: run process.py, which scans the current directory ('./') for files.
python $HOME/experiments/wikiteam/process.py
# Return to the directory saved by pushd.
popd
# Recursively and unconditionally remove everything matching enwikipedia*
# under the data directory.
rm -rf ${HOME}/experiments/wikiteam/data/enwikipedia*
# Cleanup of Api* entries is currently disabled.
#rm -rf ${HOME}/experiments/wikiteam/data/Api*

0 comments on commit 8adb792

Please sign in to comment.