Difference between revisions of "User:Moussekateer/editcount.py"
Moussekateer (talk | contribs) m |
m (<pre/>) |
||
(3 intermediate revisions by 2 users not shown) | |||
Line 1: | Line 1: | ||
<pre>import urllib2, json, time, locale | <pre>import urllib2, json, time, locale | ||
from datetime import datetime | from datetime import datetime | ||
+ | from datetime import date | ||
from operator import itemgetter | from operator import itemgetter | ||
+ | global NUMYEARS | ||
+ | NUMYEARS = date.today().year-2010 + 1 # 2014 - 2010 + 1 = 5 (years) | ||
locale.setlocale(locale.LC_ALL, '') | locale.setlocale(locale.LC_ALL, '') | ||
wikiAddress = r'http://wiki.teamfortress.com/w/api.php?action=query&list=allusers&auprop=editcount|registration&auwitheditsonly&aulimit=500&format=json' | wikiAddress = r'http://wiki.teamfortress.com/w/api.php?action=query&list=allusers&auprop=editcount|registration&auwitheditsonly&aulimit=500&format=json' | ||
+ | usernameSubs = {'Ohyeahcrucz': 'Cructo', | ||
+ | 'I-ghost': 'i-ghost', | ||
+ | 'Darkid': 'darkid' | ||
+ | } | ||
+ | bots = [r'FreemBOT', r'MousseBOT', r'PilkBOT', r'SebBOT', r'WindBOT'] | ||
usersList = [] | usersList = [] | ||
Line 22: | Line 30: | ||
else: | else: | ||
return 1 | return 1 | ||
+ | |||
+ | def userEditCount(nlower, nupper=None): | ||
+ | count = 0 | ||
+ | for user in sortedList: | ||
+ | if nupper is None: | ||
+ | if user['editcount'] >= nlower: | ||
+ | count += 1 | ||
+ | else: | ||
+ | if nlower <= user['editcount'] and user['editcount'] <= nupper: | ||
+ | count += 1 | ||
+ | return count | ||
+ | |||
+ | def addTableRow(nlower, nupper=None): | ||
+ | if nupper is None: | ||
+ | return """\n|- | ||
+ | | {nlower}+ | ||
+ | | {{{{Chart bar|{count}|max={max}}}}} | ||
+ | | {percentage}%""".format(nlower = nlower, | ||
+ | count = userEditCount(nlower), | ||
+ | max = len(usersList), | ||
+ | percentage = str('%.2f' % (100 * float(userEditCount(nlower))/float(len(usersList)))) | ||
+ | ) | ||
+ | else: | ||
+ | return """\n|- | ||
+ | | {nlower} - {nupper} | ||
+ | | {{{{Chart bar|{count}|max={max}}}}} | ||
+ | | {percentage}%""".format(nlower = nlower, | ||
+ | nupper = nupper, | ||
+ | count = userEditCount(nlower, nupper), | ||
+ | max = len(usersList), | ||
+ | percentage = str('%.2f' % (100 * float(userEditCount(nlower, nupper))/float(len(usersList)))) | ||
+ | ) | ||
+ | |||
+ | def monthName(n): | ||
+ | return {1: "January", | ||
+ | 2: "February", | ||
+ | 3: "March", | ||
+ | 4: "April", | ||
+ | 5: "May", | ||
+ | 6: "June", | ||
+ | 7: "July", | ||
+ | 8: "August", | ||
+ | 9: "September", | ||
+ | 10: "October", | ||
+ | 11: "November", | ||
+ | 12: "December", | ||
+ | }[n] | ||
+ | |||
+ | def addTimeData(timeSortedList): | ||
+ | timeRange = [[0]*12 for i in range(NUMYEARS)] #[year][month] | ||
+ | for user in timeSortedList: | ||
+ | time = user['registration'] | ||
+ | timeRange[int(time[:4])-2010][int(time[5:7])-1] += 1 # 2013-05 -> 3, 4 | ||
+ | runningTotal = 0 | ||
+ | output = "" | ||
+ | for year in range(NUMYEARS): | ||
+ | for month in range(1,12): | ||
+ | numUsers = timeRange[year][month-1] | ||
+ | if numUsers == 0: | ||
+ | continue # Time segment has no data, just skip. | ||
+ | runningTotal += numUsers | ||
+ | output += """\n|- | ||
+ | | <span style="display:none;">{year}{month}</span>{monthName} {year} | ||
+ | | {{{{Chart bar|{numUsers}|max=3500}}}} | ||
+ | | {total}""".format(numUsers = numUsers, | ||
+ | month = month, | ||
+ | monthName = monthName(month), | ||
+ | year = year+2010, | ||
+ | total = runningTotal) | ||
+ | return output | ||
populate_list() | populate_list() | ||
sortedList = sorted(usersList, key=itemgetter('editcount'), reverse=True) | sortedList = sorted(usersList, key=itemgetter('editcount'), reverse=True) | ||
+ | timeSortedList = sorted(usersList, key=itemgetter('registration')) | ||
− | outputString = """ | + | outputString = """User edits statistics. Data accurate as of {0} (GMT). Further stats available at [http://stats.wiki.tf/wiki/tf stats.wiki.tf] |
+ | ;Note<nowiki>:</nowiki> All data excludes registered users with no edits.""".format(time.strftime(r'%H:%M, %d %B %Y', time.gmtime())) | ||
− | == | + | outputString += """\n\n== Edit count distribution == |
+ | {| class="wikitable grid sortable plainlinks" style="text-align: center" | ||
+ | ! class="header" width="30%" | Number of edits | ||
+ | ! class="header" width="50%" | Users | ||
+ | ! class="header" width="20%" | Percentage of users""" | ||
+ | print("""Adding percentage breakdown""") | ||
+ | outputString += addTableRow(1, 10) | ||
+ | outputString += addTableRow(11, 100) | ||
+ | outputString += addTableRow(101, 1000) | ||
+ | outputString += addTableRow(1001, 5000) | ||
+ | outputString += addTableRow(5001) | ||
+ | outputString += """\n|}""" | ||
+ | print("""Adding joins per month""") | ||
+ | outputString += """\n\n== User signups == | ||
+ | {| class="wikitable grid sortable plainlinks" style="text-align:center" | ||
+ | ! class="header" width="30%" | Date | ||
+ | ! class="header" width="50%" | Signups | ||
+ | ! class="header" width="20%" | Total number of users""" | ||
+ | outputString += addTimeData(timeSortedList) | ||
+ | outputString += "\n|}" | ||
+ | print("""Adding top 100 editors list""") | ||
+ | outputString += """\n\n== Top editors list == | ||
Limited to the top 100. | Limited to the top 100. | ||
− | {| class="wikitable grid sortable" | + | {{| class="wikitable grid sortable" |
− | |||
! class="header" | # | ! class="header" | # | ||
! class="header" | User | ! class="header" | User | ||
! class="header" | Edit count | ! class="header" | Edit count | ||
! class="header" | Edits per day | ! class="header" | Edits per day | ||
− | ! class="header" | Registration date | + | ! class="header" | Registration date""".format(time.strftime(r'%H:%M, %d %B %Y', time.gmtime())) |
− | |||
n = 1 | n = 1 | ||
timenow = datetime.now() | timenow = datetime.now() | ||
for user in sortedList[:100]: | for user in sortedList[:100]: | ||
− | + | username = user['name'] | |
− | timedelta = timenow-userstarttime | + | usereditcount = user['editcount'] |
− | editsperday = ('%.2f' % (float( | + | userregistration = user['registration'] |
− | + | if username in usernameSubs: | |
− | outputString += | + | username = usernameSubs[username] |
− | + | userstarttime = datetime.strptime(userregistration, r'%Y-%m-%dT%H:%M:%SZ') | |
+ | timedelta = timenow - userstarttime | ||
+ | editsperday = ('%.2f' % (float(usereditcount)/float(timedelta.days))) | ||
+ | outputString += """\n|- | ||
+ | | {n} || [[User:{username}|{username}]] || {editcount} || {editday} || <span style="display:none;">{sortabledate}</span>{date}""".format( | ||
+ | n = str(n), | ||
+ | username = username, | ||
+ | editcount = locale.format('%d', usereditcount, grouping=True), | ||
+ | editday = str(editsperday), | ||
+ | sortabledate = time.strftime(r'%Y-%m-%d %H:%M:00', time.strptime(userregistration, r'%Y-%m-%dT%H:%M:%SZ')), | ||
+ | date = time.strftime(r'%H:%M, %d %B %Y', time.strptime(userregistration, r'%Y-%m-%dT%H:%M:%SZ')) | ||
+ | ) | ||
n += 1 | n += 1 | ||
− | outputString += | + | outputString += "\n|}" |
file = open(r'edit_count_table.txt', 'wb') | file = open(r'edit_count_table.txt', 'wb') | ||
− | file.write(outputString)</pre> | + | file.write(outputString) |
+ | print 'Article written to edit_count_table.txt' | ||
+ | file.close()</pre> |
Latest revision as of 06:41, 2 July 2014
import urllib2, json, time, locale from datetime import datetime from datetime import date from operator import itemgetter global NUMYEARS NUMYEARS = date.today().year-2010 + 1 # 2014 - 2010 + 1 = 5 (years) locale.setlocale(locale.LC_ALL, '') wikiAddress = r'http://wiki.teamfortress.com/w/api.php?action=query&list=allusers&auprop=editcount|registration&auwitheditsonly&aulimit=500&format=json' usernameSubs = {'Ohyeahcrucz': 'Cructo', 'I-ghost': 'i-ghost', 'Darkid': 'darkid' } bots = [r'FreemBOT', r'MousseBOT', r'PilkBOT', r'SebBOT', r'WindBOT'] usersList = [] def populate_list(aufrom=None): global usersList if aufrom: result = json.loads(urllib2.urlopen(wikiAddress + r'&aufrom=' + aufrom).read()) else: result = json.loads(urllib2.urlopen(wikiAddress).read()) list = result['query']['allusers'] usersList += list print 'User count:', str(len(usersList)) if 'query-continue' in result: populate_list(aufrom=result['query-continue']['allusers']['aufrom']) else: return 1 def userEditCount(nlower, nupper=None): count = 0 for user in sortedList: if nupper is None: if user['editcount'] >= nlower: count += 1 else: if nlower <= user['editcount'] and user['editcount'] <= nupper: count += 1 return count def addTableRow(nlower, nupper=None): if nupper is None: return """\n|- | {nlower}+ | {{{{Chart bar|{count}|max={max}}}}} | {percentage}%""".format(nlower = nlower, count = userEditCount(nlower), max = len(usersList), percentage = str('%.2f' % (100 * float(userEditCount(nlower))/float(len(usersList)))) ) else: return """\n|- | {nlower} - {nupper} | {{{{Chart bar|{count}|max={max}}}}} | {percentage}%""".format(nlower = nlower, nupper = nupper, count = userEditCount(nlower, nupper), max = len(usersList), percentage = str('%.2f' % (100 * float(userEditCount(nlower, nupper))/float(len(usersList)))) ) def monthName(n): return {1: "January", 2: "February", 3: "March", 4: "April", 5: "May", 6: "June", 7: "July", 8: "August", 9: "September", 10: "October", 11: "November", 12: "December", }[n] def addTimeData(timeSortedList): timeRange = [[0]*12 for i in range(NUMYEARS)] #[year][month] for user in timeSortedList: time = user['registration'] timeRange[int(time[:4])-2010][int(time[5:7])-1] += 1 # 2013-05 -> 3, 4 runningTotal = 0 output = "" for year in range(NUMYEARS): for month in range(1,12): numUsers = timeRange[year][month-1] if numUsers == 0: continue # Time segment has no data, just skip. runningTotal += numUsers output += """\n|- | <span style="display:none;">{year}{month}</span>{monthName} {year} | {{{{Chart bar|{numUsers}|max=3500}}}} | {total}""".format(numUsers = numUsers, month = month, monthName = monthName(month), year = year+2010, total = runningTotal) return output populate_list() sortedList = sorted(usersList, key=itemgetter('editcount'), reverse=True) timeSortedList = sorted(usersList, key=itemgetter('registration')) outputString = """User edits statistics. Data accurate as of {0} (GMT). Further stats available at [http://stats.wiki.tf/wiki/tf stats.wiki.tf] ;Note: All data excludes registered users with no edits.""".format(time.strftime(r'%H:%M, %d %B %Y', time.gmtime())) outputString += """\n\n== Edit count distribution == {| class="wikitable grid sortable plainlinks" style="text-align: center" ! class="header" width="30%" | Number of edits ! class="header" width="50%" | Users ! class="header" width="20%" | Percentage of users""" print("""Adding percentage breakdown""") outputString += addTableRow(1, 10) outputString += addTableRow(11, 100) outputString += addTableRow(101, 1000) outputString += addTableRow(1001, 5000) outputString += addTableRow(5001) outputString += """\n|}""" print("""Adding joins per month""") outputString += """\n\n== User signups == {| class="wikitable grid sortable plainlinks" style="text-align:center" ! class="header" width="30%" | Date ! class="header" width="50%" | Signups ! class="header" width="20%" | Total number of users""" outputString += addTimeData(timeSortedList) outputString += "\n|}" print("""Adding top 100 editors list""") outputString += """\n\n== Top editors list == Limited to the top 100. {{| class="wikitable grid sortable" ! class="header" | # ! class="header" | User ! class="header" | Edit count ! class="header" | Edits per day ! class="header" | Registration date""".format(time.strftime(r'%H:%M, %d %B %Y', time.gmtime())) n = 1 timenow = datetime.now() for user in sortedList[:100]: username = user['name'] usereditcount = user['editcount'] userregistration = user['registration'] if username in usernameSubs: username = usernameSubs[username] userstarttime = datetime.strptime(userregistration, r'%Y-%m-%dT%H:%M:%SZ') timedelta = timenow - userstarttime editsperday = ('%.2f' % (float(usereditcount)/float(timedelta.days))) outputString += """\n|- | {n} || [[User:{username}|{username}]] || {editcount} || {editday} || <span style="display:none;">{sortabledate}</span>{date}""".format( n = str(n), username = username, editcount = locale.format('%d', usereditcount, grouping=True), editday = str(editsperday), sortabledate = time.strftime(r'%Y-%m-%d %H:%M:00', time.strptime(userregistration, r'%Y-%m-%dT%H:%M:%SZ')), date = time.strftime(r'%H:%M, %d %B %Y', time.strptime(userregistration, r'%Y-%m-%dT%H:%M:%SZ')) ) n += 1 outputString += "\n|}" file = open(r'edit_count_table.txt', 'wb') file.write(outputString) print 'Article written to edit_count_table.txt' file.close()