import urllib2, json, time, locale
from datetime import datetime
from datetime import date
from operator import itemgetter
global NUMYEARS
NUMYEARS = date.today().year-2010 + 1 # 2014 - 2010 + 1 = 5 (years)
locale.setlocale(locale.LC_ALL, '')
wikiAddress = r'http://wiki.teamfortress.com/w/api.php?action=query&list=allusers&auprop=editcount|registration&auwitheditsonly&aulimit=500&format=json'
usernameSubs = {'Ohyeahcrucz': 'Cructo',
'I-ghost': 'i-ghost',
'Darkid': 'darkid'
}
bots = [r'FreemBOT', r'MousseBOT', r'PilkBOT', r'SebBOT', r'WindBOT']
usersList = []
def populate_list(aufrom=None):
global usersList
if aufrom:
result = json.loads(urllib2.urlopen(wikiAddress + r'&aufrom=' + aufrom).read())
else:
result = json.loads(urllib2.urlopen(wikiAddress).read())
list = result['query']['allusers']
usersList += list
print 'User count:', str(len(usersList))
if 'query-continue' in result:
populate_list(aufrom=result['query-continue']['allusers']['aufrom'])
else:
return 1
def userEditCount(nlower, nupper=None):
count = 0
for user in sortedList:
if nupper is None:
if user['editcount'] >= nlower:
count += 1
else:
if nlower <= user['editcount'] and user['editcount'] <= nupper:
count += 1
return count
def addTableRow(nlower, nupper=None):
if nupper is None:
return """\n|-
| {nlower}+
| {{{{Chart bar|{count}|max={max}}}}}
| {percentage}%""".format(nlower = nlower,
count = userEditCount(nlower),
max = len(usersList),
percentage = str('%.2f' % (100 * float(userEditCount(nlower))/float(len(usersList))))
)
else:
return """\n|-
| {nlower} - {nupper}
| {{{{Chart bar|{count}|max={max}}}}}
| {percentage}%""".format(nlower = nlower,
nupper = nupper,
count = userEditCount(nlower, nupper),
max = len(usersList),
percentage = str('%.2f' % (100 * float(userEditCount(nlower, nupper))/float(len(usersList))))
)
def monthName(n):
return {1: "January",
2: "February",
3: "March",
4: "April",
5: "May",
6: "June",
7: "July",
8: "August",
9: "September",
10: "October",
11: "November",
12: "December",
}[n]
def addTimeData(timeSortedList):
timeRange = [[0]*12 for i in range(NUMYEARS)] #[year][month]
for user in timeSortedList:
time = user['registration']
timeRange[int(time[:4])-2010][int(time[5:7])-1] += 1 # 2013-05 -> 3, 4
runningTotal = 0
output = ""
for year in range(NUMYEARS):
for month in range(1,12):
numUsers = timeRange[year][month-1]
if numUsers == 0:
continue # Time segment has no data, just skip.
runningTotal += numUsers
output += """\n|-
| <span style="display:none;">{year}{month}</span>{monthName} {year}
| {{{{Chart bar|{numUsers}|max=3500}}}}
| {total}""".format(numUsers = numUsers,
month = month,
monthName = monthName(month),
year = year+2010,
total = runningTotal)
return output
populate_list()
sortedList = sorted(usersList, key=itemgetter('editcount'), reverse=True)
timeSortedList = sorted(usersList, key=itemgetter('registration'))
outputString = """User edits statistics. Data accurate as of {0} (GMT). Further stats available at [http://stats.wiki.tf/wiki/tf stats.wiki.tf]
;Note: All data excludes registered users with no edits.""".format(time.strftime(r'%H:%M, %d %B %Y', time.gmtime()))
outputString += """\n\n== Edit count distribution ==
{| class="wikitable grid sortable plainlinks" style="text-align: center"
! class="header" width="30%" | Number of edits
! class="header" width="50%" | Users
! class="header" width="20%" | Percentage of users"""
print("""Adding percentage breakdown""")
outputString += addTableRow(1, 10)
outputString += addTableRow(11, 100)
outputString += addTableRow(101, 1000)
outputString += addTableRow(1001, 5000)
outputString += addTableRow(5001)
outputString += """\n|}"""
print("""Adding joins per month""")
outputString += """\n\n== User signups ==
{| class="wikitable grid sortable plainlinks" style="text-align:center"
! class="header" width="30%" | Date
! class="header" width="50%" | Signups
! class="header" width="20%" | Total number of users"""
outputString += addTimeData(timeSortedList)
outputString += "\n|}"
print("""Adding top 100 editors list""")
outputString += """\n\n== Top editors list ==
Limited to the top 100.
{{| class="wikitable grid sortable"
! class="header" | #
! class="header" | User
! class="header" | Edit count
! class="header" | Edits per day
! class="header" | Registration date""".format(time.strftime(r'%H:%M, %d %B %Y', time.gmtime()))
n = 1
timenow = datetime.now()
for user in sortedList[:100]:
username = user['name']
usereditcount = user['editcount']
userregistration = user['registration']
if username in usernameSubs:
username = usernameSubs[username]
userstarttime = datetime.strptime(userregistration, r'%Y-%m-%dT%H:%M:%SZ')
timedelta = timenow - userstarttime
editsperday = ('%.2f' % (float(usereditcount)/float(timedelta.days)))
outputString += """\n|-
| {n} || [[User:{username}|{username}]] || {editcount} || {editday} || <span style="display:none;">{sortabledate}</span>{date}""".format(
n = str(n),
username = username,
editcount = locale.format('%d', usereditcount, grouping=True),
editday = str(editsperday),
sortabledate = time.strftime(r'%Y-%m-%d %H:%M:00', time.strptime(userregistration, r'%Y-%m-%dT%H:%M:%SZ')),
date = time.strftime(r'%H:%M, %d %B %Y', time.strptime(userregistration, r'%Y-%m-%dT%H:%M:%SZ'))
)
n += 1
outputString += "\n|}"
file = open(r'edit_count_table.txt', 'wb')
file.write(outputString)
print 'Article written to edit_count_table.txt'
file.close()