https://www.mediawiki.org/wiki/Special:Code/MediaWiki/115476
Revision: 115476 Author: ezachte Date: 2012-06-04 12:57:59 +0000 (Mon, 04 Jun 2012) Log Message: ----------- last revision of scripts for old style report card? Modified Paths: -------------- trunk/wikistats/reportcard/ComScoreTop1000.pl trunk/wikistats/reportcard/RT_yyyy_mm.html trunk/wikistats/reportcard/ReportCardExtractWikiCountsOutput.pl trunk/wikistats/reportcard/ReportCardGenerateHtml.pl Modified: trunk/wikistats/reportcard/ComScoreTop1000.pl =================================================================== --- trunk/wikistats/reportcard/ComScoreTop1000.pl 2012-06-04 10:41:35 UTC (rev 115475) +++ trunk/wikistats/reportcard/ComScoreTop1000.pl 2012-06-04 12:57:59 UTC (rev 115476) @@ -15,10 +15,10 @@ my $do_normalize = $true ; my $no_normalize = $false ; - $file_csv_ref = "Reference sites UV_(Oct 09 - Dec 10).csv" ; - $file_csv_top = "Top 1000 poperties, UV trend_(Oct 09 - Dec 10).csv" ; - $file_html_ref = "ComScoreReferenceSites-2010-12.htm" ; - $file_html_top = "ComScoreTop1000Properties-2010-12.htm" ; + $file_csv_ref = "Reference sites UV_(Dec 10 - Feb 12).csv" ; + $file_csv_top = "Top 1000 poperties, UV trend_(Dec 10 - Feb 12).csv" ; + $file_html_ref = "ComScoreReferenceSites-2012-02.htm" ; + $file_html_top = "ComScoreTop1000Properties-2012-02.htm" ; # note normalization needs overhaul: * 30/actual days in month does not work for UV's @@ -59,6 +59,7 @@ while ($line = <CSV>) { chomp $line ; + $line =~ s/"(\d+),(\d+),(\d+)"/$1$2$3/g ; $line =~ s/"(\d+),(\d+)"/$1$2/g ; $line =~ s/"([^"]*)"/$1/g ; @@ -199,8 +200,8 @@ "$out_license" . "</small>\n" ; - $delta_rank_year = "&Delta Year = Rank ${months [$#months-12]} ⇒ ${months [$#months]}" ; - $delta_rank_month = "&Delta Month = Rank ${months [$#months-1]} ⇒ ${months [$#months]}" ; + $delta_rank_year = "Δ Year = Rank ${months [$#months-12]} ⇒ ${months [$#months]}" ; + $delta_rank_month = "Δ Month = Rank ${months [$#months-1]} ⇒ ${months [$#months]}" ; $delta_perc_year = "% Year = Growth ${months [$#months-12]} ⇒ ${months [$#months]}" ; $delta_perc_month = "% Month = Growth ${months [$#months-1]} ⇒ ${months [$#months]}" ; @@ -249,7 +250,7 @@ $html .= "<table border=1>\n" ; $html .= "<tr><td colspan=99 align=left class=l><h2><font color=#C00000>Complete list</font></h2></td></tr>" ; $html .= "<tr><th class=l colspan=2>Property</th><th class=c colspan=3>Rank</th><th class=c colspan=2>Growth</th><th class=c>Rel. pop.</th><th class=c colspan=99>Monthly data: Unique Visitors (count x 1000) <small><small>+ Rank + Rang change + Growth percentage</small></small></th></tr>" ; - $html .= "<tr><th class=l>Site (*)</th><th class=c>Type</th><th class=c>Rank</th><th class=c>&Delta Year</th><th class=c>&Delta Month</th><th class=c>% Year</th><th class=c>% Month</th><th>WM=100</small></th>" ; + $html .= "<tr><th class=l>Site (*)</th><th class=c>Type</th><th class=c>Rank</th><th class=c>Δ Year</th><th class=c>Δ Month</th><th class=c>% Year</th><th class=c>% Month</th><th>WM=100</small></th>" ; for ($i = $#months; $i >= 0 ; $i--) { $html .= "<th class=c>${months[$i]}</th>" ; } $html .= "</tr>" ; @@ -423,7 +424,7 @@ $html .= "</tr><tr><td colspan=99> </td></tr>" ; $html .= "<tr><td colspan=99 align=left class=l><a id='fast' name='fast'></a><h2><font color=#C00000>Fastest risers</font> <small>$threshold_filter+ rise in ranks in a year</small></h2></td></tr>" ; $html .= "<tr><th class=l colspan=2>Property</th><th class=c colspan=3>Rank</th><th class=c colspan=2>Growth</th><th class=c>Rel. pop.</th><th class=c colspan=99>Monthly data: Unique Visitors (count x 1000) <small><small>+ Rank + Rang change + Growth percentage</small></small></th></tr>" ; - $html .= "<tr><th class=l>Site</th><th class=c>Type</th><th class=c>Rank</th><th class=c>&Delta Year</th><th class=c>&Delta Month</th><th class=c>% Year</th><th class=c>% Month</th><th>WM=100</small></th>" ; + $html .= "<tr><th class=l>Site</th><th class=c>Type</th><th class=c>Rank</th><th class=c>Δ Year</th><th class=c>Δ Month</th><th class=c>% Year</th><th class=c>% Month</th><th>WM=100</small></th>" ; for ($i = $#months; $i >= 0 ; $i--) { $html .= "<th class=c>${months[$i]}</th>" ; } $html .= $html_fast_risers ; Modified: trunk/wikistats/reportcard/RT_yyyy_mm.html =================================================================== --- trunk/wikistats/reportcard/RT_yyyy_mm.html 2012-06-04 10:41:35 UTC (rev 115475) +++ trunk/wikistats/reportcard/RT_yyyy_mm.html 2012-06-04 12:57:59 UTC (rev 115476) @@ -402,7 +402,7 @@ <!-- Reach: Page Requests: Tabs --> <td align=left valign=middle> <!== OUT SC ==> - <img src='charts/{{yyyy}}-{{mm}}/Page-Views-Total-Indexed.png'> + <img src='charts/{{yyyy}}-{{mm}}/Page-Views-Total-Indexed-Wikis.png'> <!== OUT D ==> <!== TABS {20|log scale|linear scale|indexed per wiki|indexed per project|Mobile|M&S} ==> <!== TAB {21|<img src='charts/{{yyyy}}-{{mm}}/Page-Views-Total-Absolute-Log.png'><br>} ==> Modified: trunk/wikistats/reportcard/ReportCardExtractWikiCountsOutput.pl =================================================================== --- trunk/wikistats/reportcard/ReportCardExtractWikiCountsOutput.pl 2012-06-04 10:41:35 UTC (rev 115475) +++ trunk/wikistats/reportcard/ReportCardExtractWikiCountsOutput.pl 2012-06-04 12:57:59 UTC (rev 115476) @@ -5,12 +5,11 @@ $trace_on_exit = $true ; ez_lib_version (2) ; - $month_last = "12" ; - $year_last = 2010 ; + $month_last = "4" ; + $year_last = 2012 ; + $month_start = $month_last ; + $year_start = $year_last - 3 ; - $month_start = "1" ; - $year_start = 2008 ; - $m_start = &months_since_2000_01 ($year_start, $month_start) ; $m_last = &months_since_2000_01 ($year_last, $month_last) ; $m_last_12 = $m_last - 12 ; @@ -49,19 +48,19 @@ sub ParseArguments { -# my @options ; -# getopt ("io", \%options) ; + my @options ; + getopt ("io", \%options) ; -# die ("Specify input folder for projectcounts files as: -i path") if (! defined ($options {"i"})) ; -# die ("Specify output folder as: -o path'") if (! defined ($options {"o"})) ; + die ("Specify input folder for projectcounts files as: -i path") if (! defined ($options {"i"})) ; + die ("Specify output folder as: -o path'") if (! defined ($options {"o"})) ; -# $path_in = $options {"i"} ; -# $path_out = $options {"o"} ; + $path_in = $options {"i"} ; + $path_out = $options {"o"} ; -# die "Input folder '$path_in' does not exist" if (! -d $path_in) ; -# die "Output folder '$path_out' does not exist" if (! -d $path_out) ; + die "Input folder '$path_in' does not exist" if (! -d $path_in) ; + die "Output folder '$path_out' does not exist" if (! -d $path_out) ; - $path_in = "w:/# out bayes" ; + $path_in = "w:/# out bayes/csv_report_card" ; $path_out = "w:/@ report card/data" ; print "Input folder: $path_in\n" ; @@ -108,7 +107,7 @@ while ($line = <CSV_IN>) { ($language,$date,$counts) = split (',', $line, 3) ; - + next if $language =~ /^zz/ ; next if $language eq 'commons' and $project ne 'wx' ; next if $language eq 'sr' and $project eq 'wn' ; # ignore insane bot spam on @@ -144,6 +143,7 @@ $totals {"$f,$m"} += $fields [$f] ; $totals_project {"$f,$m"} {$project} += $fields [$f] ; + $totals_project {"$f,$m"} {$all_projects} += $fields [$f] ; # print "TOTALS $f $m = . " . $totals {"$f,$m"} . "\n" ; @@ -199,6 +199,7 @@ { chomp $line ; ($language,$date,$reguser_bot,$group,$counts) = split (',', $line, 5) ; + next if $language =~ /^zz/ ; next if $language eq 'commons' and $project ne 'wx' ; # commons also in wikipedia csv files (bug, hard to cleanup, just skip) # next if $language eq 'commons' ; # ignore editor count on commons alltogether, most are already counted for other project @@ -272,7 +273,6 @@ ($language,$date,$counts) = split (',', $line, 3) ; if ($language ne "commons") { next ; } - if ($date eq "00/0000") { @fields = split (',', $counts) ; @@ -330,6 +330,7 @@ print "Write file '$file_csv_out'\n" ; open CSV_OUT, '>', $file_csv_out ; $output = "" ; + foreach $f (1,2,3,4,6,11) # new editors, editors_gt_5, editors_gt_100, articles, new articles, edits { @@ -338,7 +339,12 @@ $line = ",Total," ; for ($m = $m_start ; $m <= $m_last ; $m++) - { $line .= $totals {"$f,$m"} . "," ; } + { + if ($f <= 3) # new editors, editors_gt_5, editors_gt_100, + { $line .= $totals_project {"$f,$m"} {$all_projects} . "," ; } + else + { $line .= $totals {"$f,$m"} . "," ; } + } # growth in one year if ($totals {"$f,$m_last_12"} != 0) @@ -390,6 +396,7 @@ if ($f <= 3) # 0 = Contributors, 1 = New Wikimedians, 2 = Active Editors (5+ edits), 3 = Very Active Editors (100+ edits), { $output .= ",Note: All projects does not include Commons\n" ; } $output .= "$csv_recent_months,%inc year, %inc month\n" ; + foreach $project (sort {$totals_project {"$f,$m_last"} {$b} <=> $totals_project {"$f,$m_last"} {$a}} @projects) { # next if $project eq 'commons' and ($f ==2 or $f == 3) ; # (very) active editors no longer counted for commons @@ -426,6 +433,8 @@ # print "$index $f: $key -> ${values_f_12 {$key}}\n" ; ($project,$language) = split (",", $key) ; +if ($f == 2) +{ print "project $project $language\n" ; } $language_name = $out_languages {$language} ; if (($project ne "wp") && ($project ne "wx")) { $line = "$index,$language_name " . &GetProjectName ($project) . "," ; } @@ -465,6 +474,7 @@ $output .= "\n,${out_report_descriptions [$f]} - Indexed - Per Project\n" ; $output .= "$csv_recent_months,%inc year, %inc month\n" ; + foreach $project (sort {$totals_project {"$f,$m_last"} {$b} <=> $totals_project {"$f,$m_last"} {$a}} @projects) { # next if $project eq 'commons' and ($f ==2 or $f == 3) ; # (very) active editors no longer counted for commons Modified: trunk/wikistats/reportcard/ReportCardGenerateHtml.pl =================================================================== --- trunk/wikistats/reportcard/ReportCardGenerateHtml.pl 2012-06-04 10:41:35 UTC (rev 115475) +++ trunk/wikistats/reportcard/ReportCardGenerateHtml.pl 2012-06-04 12:57:59 UTC (rev 115476) @@ -9,8 +9,8 @@ use Getopt::Std ; # !! adapt these for every run !! - $p_year = 2011 ; - $p_month = 12 ; + $p_year = 2012 ; + $p_month = 2 ; $debug = $false ; @@ -91,40 +91,40 @@ # !! This is rather crummy if not outright stupid Q&D way to collect variable data, data need to be externalized !! -## if ($2011_12) +## if ($2012_02) ## { # projects @rank = qw ( 5th x 0 0 th) ; # All - Web Properties - Unique Visitors - @reach = qw ( 31.7 x 1.8 -1.3 %) ; # All - Reach Percentage by Region - @visitors = qw ( 457,063,000 m 15.6 -3.7 %) ; # All - Unique Visitors by Region - @page_requests = qw (16,365,306,811 b 17.3 -6.1 %) ; # All - copy/calc manually monthly total and monthly and yearly growth from 1st column (Sigma) of http://stats.wikimedia.org/EN/TablesPageViewsMonthly.htm (Wikipedia only is good enough) - @commons_files = qw ( 11,974,179 m 50.1 1.8 %) ; # Commons - Binaries per month - Absolute - @article_count = qw ( 20,845,401 m 18.6 1.9 %) ; # Wp - Starting Sep-2010 Wikipedia articles only / Article count (official) - Absolute - @new_articles = qw ( 12,759 k 50.0 67.2 %) ; # Wp - New articles per day - Absolute - @edits = qw ( 11,636,349 m 1.0 4.7 %) ; # Wp - Edits per month - Absolute - @new_editors = qw ( 15,181 k -9.1 -6.4 %) ; # All - New editors - Absolute - @active_editors = qw ( 83,293 k 1.6 0.1 %) ; # All - Active editors - Absolute - @very_active_editors = qw ( 11,041 k 2.7 2.8 %) ; # All - Very active editors - Absolute + @reach = qw ( 32.8 x 4.5 -0.4 %) ; # All - Reach Percentage by Region + @visitors = qw ( 475,699,000 m 25.4 -1.3 %) ; # All - Unique Visitors by Region + @page_requests = qw (18,127,912,107 b 16.2 0.4 %) ; # All - copy/calc manually monthly total and monthly and yearly growth from 1st column (Sigma) of http://stats.wikimedia.org/EN/TablesPageViewsMonthly.htm (Wikipedia only is good enough) + @commons_files = qw ( 12,367,426 m 32.1 1.5 %) ; # Commons - Binaries per month - Absolute + @article_count = qw ( 21,158,235 m 18.5 1.3 %) ; # Wp - Starting Sep-2010 Wikipedia articles only / Article count (official) - Absolute + @new_articles = qw ( 8,449 k -6.1 -36.7 %) ; # Wp - New articles per day - Absolute + @edits = qw ( 12,422,452 m -2.5 6.8 %) ; # Wp - Edits per month - Absolute + @new_editors = qw ( 15,333 k -14.7 -8.8 %) ; # All - New editors - Absolute + @active_editors = qw ( 85,163 k -1.7 -3.6 %) ; # All - Active editors - Absolute + @very_active_editors = qw ( 10,913 k 0.0 -6.8 %) ; # All - Very active editors - Absolute # http://stats.wikimedia.org/EN/TablesPageViewsMonthly.htm push @rank, "1|Site Rank<br>#1: 5th position will be stable for long time: differences with those ranked 4th and 6th are considerable." ; - push @reach, "2|Reach<br>#2: Change in reach in 3 years: (avg Oct-Dec 08 -> avg Oct-Dec 11) pp= percentage points: <br>" . - "# Europe +9pp, (38%->47%), North-Am +10pp (35%->45%), Asia +1pp (16%->18%),<br>" . - "# Latin-America +6pp (35%->41%), Middle East-Africa +2pp (30%->32%),<br>" . - "# India +16pp (20%->35%), World +4.8pp (27.8%->32.7%)" ; - push @visitors, "3,4|Unique Visitors<br>#3: 8% higher than average for last 12 months (422M).<br>" . -# " 4.9% higher than previous month (which was also an all time high)<br>" . - "#4: Change in UV's in 3 years: (avg Oct-Dec 08 -> avg Oct-Dec 11): <br>" . - "# Europe +68%, North-Am +46%, Latin-Am: +103%, Asia: +58%, World +69%<br>" . - "# India +164%, Middle East-Africa: +180%" ; - push @page_requests, "5,6,7,8,9|Page Requests<br>" . - "5: <a href='http://stats.wikimedia.org/EN/TablesPageViewsMonthlyCombined.htm'>Fastest and slowest growth in page requests in top 25 Wikipedias in 2011</a>:<br>" . - " Fast: Chinese +323%, Persian +114%, Ukranian +69%, Korean +65%, Arabic +43%,<br>" . - " Indonesian +40%, Hebrew +40%, Russian +38%, Thai +35%, Commons +33%.<br>" . - " Slow: Finnish +2%, Hungarian +5%.<br>" . - "6: <a href='http://stats.wikimedia.org/EN/TablesPageViewsMonthlyAllProjects.htm'>Projects ranked by growth in page requests in 2011</a>:<br>" . - " Wikiquote: +127%, Wiktionary: +57%, Commons: +33%, Wikibooks: +26%, Wikisource: +23%,<br>" . - " Wikipedia: +16%, Wikinews: +12%, Wikiversity: +5%<br>" . - "7: Numbers have been corrected for 88 hours of missing traffic data.<br>" . - "8: Wiktionary traffic back to normal after massive botnet spam in Oct/Nov.<br>" . + push @reach, "2|Reach<br>#2: Change in reach in 3 years: (avg Dec-Feb 08/09 -> avg Dec-Feb 11/12) pp= percentage points: <br>" . + "# Europe +8.3pp, (38%->47%), North-Am +10.6pp (36%->46%), Asia +1.4pp (16%->18%),<br>" . + "# Latin-America +5.7pp (31%->37%), Middle East-Africa +3.1pp (29%->32%),<br>" . + "# India +15.1pp (20%->35%), World +4.8pp (27.8%->32.6%)" ; + push @visitors, "3,4|Unique Visitors<br>3: 9% higher than average for last 12 months (436M), even on the shortest month of the year.<br>" . +# " 1.1% higher than previous record month Oct 2011<br>" . + "#4: Change in UV's in 3 years: (avg Dec-Feb 08/09 -> avg Dec-Feb 11/12): <br>" . + "# Europe +60%, North-Am +48%, Latin-Am: +98%, Asia: +53%, World +64%<br>" . + "# India +165%, Middle East-Africa: +149%" ; + push @page_requests, "5,6,7,8|Page Requests<br>" . +# "5: 58% of page requests to all Wiktionaries combined came from one ip address,<br>" . +# " which spammed Special:Random page on most languages.<br>" . + "#6: Fastest and slowest growth in page requests in top 25 Wikipedias in 2011:<br>" . + "# Fast: Chinese +323%, Persian +114%, Ukranian +69%, Korean +65%, Arabic +43%,<br>" . + "# Indonesian +40%, Hebrew +40%, Russian +38%, Thai +35%, Commons +33%.<br>" . + "# Slow: Finnish +2%, Hungarian +5%, see <a href='http://stats.wikimedia.org/EN/TablesPageViewsMonthlyCombined.htm'>details</a><br>" . + "#7: Projects ranked by growth in page requests in 2011:<br>" . + "# Wikiquote: +127%, Wiktionary: +57%, Commons: +33%, Wikibooks: +26%, Wikisource: +23%,<br>" . + "# Wikipedia: +16%, Wikinews: +12%, Wikiversity: +5%, see <a href='http://stats.wikimedia.org/EN/TablesPageViewsMonthlyAllProjects.htm'>details</a><br>" . # " Reassesment may follow later.<br>" ; # "6: Note that total requests <b>from mobile devices</b> is even much higher, approx half go to regular site" ; # "6: <a href='http://stats.wikimedia.org/wikimedia/squids/SquidReportClients.htm'>Total file requests from mobile devices for all Wikimedia projects</a> in March: 7.2%!<br>" . @@ -135,19 +135,31 @@ # "#8: Page views for Chinese Wikipedia went from 52M in January to 163M in April.<br>" . # " #Unique visitors from China stayed low as usual, even dropped 6% from January to April.<br>" . # " #(Chinese community said year ago they had issues with Google ranking, maybe these were fixed?)<br>" . - "#9: Page requests have been normalized to 30 days (Jan*30/31, Feb*30/28, Mar*30/31, etc)<br>" ; + "#8: Page requests have been normalized to 30 days (Jan*30/31, Feb*30/28, Mar*30/31, etc)<br>" ; # push @commons_files, "7|Commons Files<br>7: Recent growth in " . # "<br> Probably related to Wiki Loves Monuments contest (WLM)</a><br>" ; - push @article_count, "10|Article Count<br>10: Some Wikipedias contain massive amounts of bot created stubs,<br>" . - " (e.g. Dutch Wikipedia 42% of total, Volap\xFCk 92% of total)<br>" . - " which makes article count a questionable metric of community effort.<br>" . - " see also <a href='http://stats.wikimedia.org/EN/BotActivityMatrixCreates.htm'>new report</a> on bot induced article creation activity per wiki." ; + push @article_count, "9|" ; +# push @article_count, "9|Article Count<br>#9: Some Wikipedias contain massive amounts of bot created stubs,<br>" . +# "# (e.g. Dutch Wikipedia 42% of total, Volap\xFCk 92% of total)<br>" . +# "# which makes article count a questionable metric of community effort.<br>" . +# "# see also new report on <a href='http://stats.wikimedia.org/EN/BotActivityMatrixCreates.htm'>bot induced article creation activity per wiki.</a>" ; ## "9: Seven Wiktionaries in top 25 Wikimedia projects" ; -push @new_articles, "10|New Articles Per Day<br>" . - "10: On Dutch Wikipedia <a href='http://nl.wikipedia.org/wiki/Speciaal:Bijdragen/Joopwikibot'>Joopwikibot</a> created roughly 164k of trivial taxonomy stubs in last 3 months." ; +push @new_articles, "9|Article Count, New Articles<br>9: Data for January (February will be added very soon)" ; +push @edits, "10|" ; +push @new_editors, "10|" ; +push @active_editors, "10|" ; +push @very_active_editors, "10|Edits, New Editors, (Very)Active Editors<br>10: Provisionary data, final data will arrive soon (< 1 % change)" ; + +#push @new_articles, "10,11|New Articles Per Day<br>" . +# "10: Sharp drop in overall number of new articles on all Wikipedias combined mostly due to bot inactivity<br>" . +# " on Dutch Wikipedia, which in Dec accounted for 33% of all new articles.<br>" . +# "11: Still this month the number of wikis with exceptionally large numbers of new articles rose sharply:<br>" . +# " New articles per day for Dec->Jan: Slovene 33->312, Bashkir 4->308, Malagasy 3->232,<br>" . +# " Latin 45->215, Armenian 31->123, Fiji Hindi 22->83<br>" . +# " For comparison, two large Wikipedias with normal article creation rate: Russian 348, Spanish 285" ; ## push @edits, "6|Edits<br>#6: Over the last 3 years there is fairly consistent growth in manual, registered edits.<br>" . ## "# Net growth in constructive edits is less clear, as this metric includes most reverting edits." ; ## " Strong one-monthly dip in July due to World Cup Socker?." ; @@ -169,8 +181,169 @@ ## } +### if ($2012_01) +### { # projects +# @rank = qw ( 5th x 0 0 th) ; # All - Web Properties - Unique Visitors +# @reach = qw ( 33.2 x 2.1 1.5 %) ; # All - Reach Percentage by Region +# @visitors = qw ( 482,157,000 m 16.5 5.5 %) ; # All - Unique Visitors by Region +# @page_requests = qw (18,054,255,294 b 16.5 10.3 %) ; # All - copy/calc manually monthly total and monthly and yearly growth from 1st column (Sigma) of http://stats.wikimedia.org/EN/TablesPageViewsMonthly.htm (Wikipedia only is good enough) +# @commons_files = qw ( 12,200,544 m 48.7 1.9 %) ; # Commons - Binaries per month - Absolute +# @article_count = qw ( 21,158,235 m 18.5 1.3 %) ; # Wp - Starting Sep-2010 Wikipedia articles only / Article count (official) - Absolute +# @new_articles = qw ( 8,449 k -6.1 -36.7 %) ; # Wp - New articles per day - Absolute +# @edits = qw ( 12,422,452 m -2.5 6.8 %) ; # Wp - Edits per month - Absolute +# @new_editors = qw ( 16,170 k -16.0 2.1 %) ; # All - New editors - Absolute +# @active_editors = qw ( 88,548 k -3.2 6.7 %) ; # All - Active editors - Absolute +# @very_active_editors = qw ( 11,730 k -0.5 6.3 %) ; # All - Very active editors - Absolute +# # http://stats.wikimedia.org/EN/TablesPageViewsMonthly.htm +# push @rank, "1|Site Rank<br>#1: 5th position will be stable for long time: differences with those ranked 4th and 6th are considerable." ; +# push @reach, "2|Reach<br>#2: Change in reach in 3 years: (avg Nov-Jan 08/09 -> avg Nov-Jan 11/12) pp= percentage points: <br>" . +# "# Europe +9pp, (38%->47%), North-Am +10pp (35%->45%), Asia +1pp (17%->18%),<br>" . +# "# Latin-America +6pp (32%->39%), Middle East-Africa +2pp (31%->32%),<br>" . +# "# India +15pp (20%->36%), World +4.7pp (27.9%->32.6%)" ; +# push @visitors, "3,4|Unique Visitors<br>3: 13% higher than average for last 12 months (428M).<br>" . +# " 1.1% higher than previous record month Oct 2011<br>" . +# "#4: Change in UV's in 3 years: (avg Nov-Jan 11/12 -> avg Nov-Jan 11/12): <br>" . +# "# Europe +66%, North-Am +47%, Latin-Am: +105%, Asia: +54%, World +68%<br>" . +# "# India +157%, Middle East-Africa: +173%" ; +# push @page_requests, "5,6,7,8|Page Requests<br>" . +# "5: 58% of page requests to all Wiktionaries combined came from one ip address,<br>" . +# " which spammed Special:Random page on most languages.<br>" . +# "#6: Fastest and slowest growth in page requests in top 25 Wikipedias in 2011:<br>" . +# "# Fast: Chinese +323%, Persian +114%, Ukranian +69%, Korean +65%, Arabic +43%,<br>" . +# "# Indonesian +40%, Hebrew +40%, Russian +38%, Thai +35%, Commons +33%.<br>" . +# "# Slow: Finnish +2%, Hungarian +5%, see <a href='http://stats.wikimedia.org/EN/TablesPageViewsMonthlyCombined.htm'>details</a><br>" . +# "#7: Projects ranked by growth in page requests in 2011:<br>" . +# "# Wikiquote: +127%, Wiktionary: +57%, Commons: +33%, Wikibooks: +26%, Wikisource: +23%,<br>" . +# "# Wikipedia: +16%, Wikinews: +12%, Wikiversity: +5%, see <a href='http://stats.wikimedia.org/EN/TablesPageViewsMonthlyAllProjects.htm'>details</a><br>" . +## " Reassesment may follow later.<br>" ; +## "6: Note that total requests <b>from mobile devices</b> is even much higher, approx half go to regular site" ; +## "6: <a href='http://stats.wikimedia.org/wikimedia/squids/SquidReportClients.htm'>Total file requests from mobile devices for all Wikimedia projects</a> in March: 7.2%!<br>" . +## " See also <a href='charts/2011-04/RatioMobileTraffic.png'>Plot for both metrics.</a><br>" . +## "7: Note: Requests from mobile devices to the non-mobile site, which are redirected to the mobile site<br>" . +## " are probably counted twice. Follow up requests from the mobile device via internal links<br>" . +## " are not affected. Number of double counts not yet known.<br>" . +## "#8: Page views for Chinese Wikipedia went from 52M in January to 163M in April.<br>" . +## " #Unique visitors from China stayed low as usual, even dropped 6% from January to April.<br>" . +## " #(Chinese community said year ago they had issues with Google ranking, maybe these were fixed?)<br>" . +# "#8: Page requests have been normalized to 30 days (Jan*30/31, Feb*30/28, Mar*30/31, etc)<br>" ; +## push @commons_files, "7|Commons Files<br>7: Recent growth in " . +## "<br> Probably related to Wiki Loves Monuments contest (WLM)</a><br>" ; +# push @article_count, "9|Article Count<br>#9: Some Wikipedias contain massive amounts of bot created stubs,<br>" . +# "# (e.g. Dutch Wikipedia 42% of total, Volap\xFCk 92% of total)<br>" . +# "# which makes article count a questionable metric of community effort.<br>" . +# "# see also new report on <a href='http://stats.wikimedia.org/EN/BotActivityMatrixCreates.htm'>bot induced article creation activity per wiki.</a>" ; + +### "9: Seven Wiktionaries in top 25 Wikimedia projects" ; +#push @new_articles, "10,11|New Articles Per Day<br>" . +# "10: Sharp drop in overall number of new articles on all Wikipedias combined mostly due to bot inactivity<br>" . +# " on Dutch Wikipedia, which in Dec accounted for 33% of all new articles.<br>" . +# "11: Still this month the number of wikis with exceptionally large numbers of new articles rose sharply:<br>" . +# " New articles per day for Dec->Jan: Slovene 33->312, Bashkir 4->308, Malagasy 3->232,<br>" . +# " Latin 45->215, Armenian 31->123, Fiji Hindi 22->83<br>" . +# " For comparison, two large Wikipedias with normal article creation rate: Russian 348, Spanish 285" ; +### push @edits, "6|Edits<br>#6: Over the last 3 years there is fairly consistent growth in manual, registered edits.<br>" . +### "# Net growth in constructive edits is less clear, as this metric includes most reverting edits." ; +### " Strong one-monthly dip in July due to World Cup Socker?." ; +### "#13: Average monthly manual edits by registered users for all Wikipedia's combined, in millions<br>" . +### " #2006 ⇒ 2010: 7.7 ⇒ 9.9 ⇒ 11.5 ⇒ 12.4 ⇒ 12.7" ; +## push @new_editors, "8|New Editors Per Month<br>" . +## "8: Continued decline in new editors at large wikipedias, but sharp rise at Commons (WLM)" ; +### " yet with 8120 best result in last 10 months (average last 12 months: 7805)" ; +### " Arguably slowing influx of editors can partly be attributed to (multi-factorial) <a href='http://en.wikipedia.org/wiki/Market_saturation'>saturation process(es)</a><br>" . +### " But 19% drop for Wikipedias in half year (comparing 3-monthly averages) is not consistent with that.<br>" . +### "#7:WMF recently commissioned in depth study of editor activity trends, which is ongoing." ; +### "#8: Since a few months editors on Commons are no longer included in overall editor total,<br>" . +### "# on the assumption that most of these also edit on one or more other projects.<br>" ; +### " #Detection of double counts between any projects and languages is planned for late 2010." ; +## push @active_editors, "7|(Very) Active Editors<br>" . +## "7: Recent spike in (very) active editors on Commons probably caused by Wiki Loves Monuments project (temporary), but also by improved upload facilities (permanent)." ; +## push @very_active_editors, "7|" ; +## " Rise in many wikipedias outweighed <a href='charts/2011-09/Editors-Active-Indexed-Wikis.png'>slow decline</a> (-10% in 3 years) in English, German, Japanese" ; + +### } + +### if ($2011_12) +### { # projects +# @rank = qw ( 5th x 0 0 th) ; # All - Web Properties - Unique Visitors +# @reach = qw ( 31.7 x 1.8 -1.3 %) ; # All - Reach Percentage by Region +# @visitors = qw ( 457,063,000 m 15.6 -3.7 %) ; # All - Unique Visitors by Region +# @page_requests = qw (16,365,306,811 b 17.3 -6.1 %) ; # All - copy/calc manually monthly total and monthly and yearly growth from 1st column (Sigma) of http://stats.wikimedia.org/EN/TablesPageViewsMonthly.htm (Wikipedia only is good enough) +# @commons_files = qw ( 11,974,179 m 50.1 1.8 %) ; # Commons - Binaries per month - Absolute +# @article_count = qw ( 20,845,401 m 18.6 1.9 %) ; # Wp - Starting Sep-2010 Wikipedia articles only / Article count (official) - Absolute +# @new_articles = qw ( 12,759 k 50.0 67.2 %) ; # Wp - New articles per day - Absolute +# @edits = qw ( 11,636,349 m 1.0 4.7 %) ; # Wp - Edits per month - Absolute +# @new_editors = qw ( 15,181 k -9.1 -6.4 %) ; # All - New editors - Absolute +# @active_editors = qw ( 83,293 k 1.6 0.1 %) ; # All - Active editors - Absolute +# @very_active_editors = qw ( 11,041 k 2.7 2.8 %) ; # All - Very active editors - Absolute +# # http://stats.wikimedia.org/EN/TablesPageViewsMonthly.htm +# push @rank, "1|Site Rank<br>#1: 5th position will be stable for long time: differences with those ranked 4th and 6th are considerable." ; +# push @reach, "2|Reach<br>#2: Change in reach in 3 years: (avg Oct-Dec 08 -> avg Oct-Dec 11) pp= percentage points: <br>" . +# "# Europe +9pp, (38%->47%), North-Am +10pp (35%->45%), Asia +1pp (16%->18%),<br>" . +# "# Latin-America +6pp (35%->41%), Middle East-Africa +2pp (30%->32%),<br>" . +# "# India +16pp (20%->35%), World +4.8pp (27.8%->32.7%)" ; +# push @visitors, "3,4|Unique Visitors<br>#3: 8% higher than average for last 12 months (422M).<br>" . +## " 4.9% higher than previous month (which was also an all time high)<br>" . +# "#4: Change in UV's in 3 years: (avg Oct-Dec 08 -> avg Oct-Dec 11): <br>" . +# "# Europe +68%, North-Am +46%, Latin-Am: +103%, Asia: +58%, World +69%<br>" . +# "# India +164%, Middle East-Africa: +180%" ; +# push @page_requests, "5,6,7,8,9|Page Requests<br>" . +# "5: <a href='http://stats.wikimedia.org/EN/TablesPageViewsMonthlyCombined.htm'>Fastest and slowest growth in page requests in top 25 Wikipedias in 2011</a>:<br>" . +# " Fast: Chinese +323%, Persian +114%, Ukranian +69%, Korean +65%, Arabic +43%,<br>" . +# " Indonesian +40%, Hebrew +40%, Russian +38%, Thai +35%, Commons +33%.<br>" . +# " Slow: Finnish +2%, Hungarian +5%.<br>" . +# "6: <a href='http://stats.wikimedia.org/EN/TablesPageViewsMonthlyAllProjects.htm'>Projects ranked by growth in page requests in 2011</a>:<br>" . +# " Wikiquote: +127%, Wiktionary: +57%, Commons: +33%, Wikibooks: +26%, Wikisource: +23%,<br>" . +# " Wikipedia: +16%, Wikinews: +12%, Wikiversity: +5%<br>" . +# "7: Numbers have been corrected for 88 hours of missing traffic data.<br>" . +# "8: Wiktionary traffic back to normal after massive botnet spam in Oct/Nov.<br>" . +## " Reassesment may follow later.<br>" ; +## "6: Note that total requests <b>from mobile devices</b> is even much higher, approx half go to regular site" ; +## "6: <a href='http://stats.wikimedia.org/wikimedia/squids/SquidReportClients.htm'>Total file requests from mobile devices for all Wikimedia projects</a> in March: 7.2%!<br>" . +## " See also <a href='charts/2011-04/RatioMobileTraffic.png'>Plot for both metrics.</a><br>" . +## "7: Note: Requests from mobile devices to the non-mobile site, which are redirected to the mobile site<br>" . +## " are probably counted twice. Follow up requests from the mobile device via internal links<br>" . +## " are not affected. Number of double counts not yet known.<br>" . +## "#8: Page views for Chinese Wikipedia went from 52M in January to 163M in April.<br>" . +## " #Unique visitors from China stayed low as usual, even dropped 6% from January to April.<br>" . +## " #(Chinese community said year ago they had issues with Google ranking, maybe these were fixed?)<br>" . +# "#9: Page requests have been normalized to 30 days (Jan*30/31, Feb*30/28, Mar*30/31, etc)<br>" ; +## push @commons_files, "7|Commons Files<br>7: Recent growth in " . +## "<br> Probably related to Wiki Loves Monuments contest (WLM)</a><br>" ; + +# push @article_count, "10|Article Count<br>10: Some Wikipedias contain massive amounts of bot created stubs,<br>" . +# " (e.g. Dutch Wikipedia 42% of total, Volap\xFCk 92% of total)<br>" . +# " which makes article count a questionable metric of community effort.<br>" . +# " see also <a href='http://stats.wikimedia.org/EN/BotActivityMatrixCreates.htm'>new report</a> on bot induced article creation activity per wiki." ; + + +### "9: Seven Wiktionaries in top 25 Wikimedia projects" ; +#push @new_articles, "10|New Articles Per Day<br>" . +# "10: On Dutch Wikipedia <a href='http://nl.wikipedia.org/wiki/Speciaal:Bijdragen/Joopwikibot'>Joopwikibot</a> created roughly 164k of trivial taxonomy stubs in last 3 months." ; +### push @edits, "6|Edits<br>#6: Over the last 3 years there is fairly consistent growth in manual, registered edits.<br>" . +### "# Net growth in constructive edits is less clear, as this metric includes most reverting edits." ; +### " Strong one-monthly dip in July due to World Cup Socker?." ; +### "#13: Average monthly manual edits by registered users for all Wikipedia's combined, in millions<br>" . +### " #2006 ⇒ 2010: 7.7 ⇒ 9.9 ⇒ 11.5 ⇒ 12.4 ⇒ 12.7" ; +## push @new_editors, "8|New Editors Per Month<br>" . +## "8: Continued decline in new editors at large wikipedias, but sharp rise at Commons (WLM)" ; +### " yet with 8120 best result in last 10 months (average last 12 months: 7805)" ; +### " Arguably slowing influx of editors can partly be attributed to (multi-factorial) <a href='http://en.wikipedia.org/wiki/Market_saturation'>saturation process(es)</a><br>" . +### " But 19% drop for Wikipedias in half year (comparing 3-monthly averages) is not consistent with that.<br>" . +### "#7:WMF recently commissioned in depth study of editor activity trends, which is ongoing." ; +### "#8: Since a few months editors on Commons are no longer included in overall editor total,<br>" . +### "# on the assumption that most of these also edit on one or more other projects.<br>" ; +### " #Detection of double counts between any projects and languages is planned for late 2010." ; +## push @active_editors, "7|(Very) Active Editors<br>" . +## "7: Recent spike in (very) active editors on Commons probably caused by Wiki Loves Monuments project (temporary), but also by improved upload facilities (permanent)." ; +## push @very_active_editors, "7|" ; +## " Rise in many wikipedias outweighed <a href='charts/2011-09/Editors-Active-Indexed-Wikis.png'>slow decline</a> (-10% in 3 years) in English, German, Japanese" ; + +### } + + + ### if ($2011_11) ### { # @rank = qw ( 5th x 0 0 th) ; # Web Properties - Unique Visitors @@ -1277,7 +1450,8 @@ { $line =~ s/\{\{yyyy\}\}_\{\{mm\+1\}\}/{{yyyy+1}}_{{mm+1}}/ ; } # Q&D temp fix } -# $no_upd = "<font color=#C00000><small>No data yet for English Wikipedia.</small><\/font>" ; + $no_upd_feb = "<font color=#C00000><small>Data for January, February will be added soon.</small><\/font>" ; + $no_upd_feb2 = "<br><font color=#C00000><small>Provisionary data, final adjustment will follow soon. (< 1% change)</small><\/font>" ; if ($true) # test ? { @@ -1286,12 +1460,12 @@ $line =~ s/H2 (PAGE REQUESTS)/A[$1] H2 {${page_requests[0]} billion|Page Requests for All Wikimedia Projects}/ ; $line =~ s/H2 (WEB PROPERTIES)/A[$1] H2 {${rank[0]} in rank|Web Properties - Unique Visitors}/ ; $line =~ s/H2 (COMMONS FILES)/A[$1] H2 {${commons_files[0]} million|Binary Files}/ ; - $line =~ s/H2 (ARTICLE COUNT)/A[$1] H2 {${article_count[0]} million|Wikipedia Articles $no_upd}/ ; - $line =~ s/H2 (ARTICLES PER DAY)/A[$1] H2 {${new_articles[0]}|New Wikipedia Articles Per Day $no_upd}/ ; - $line =~ s/H2 (EDITS PER MONTH)/A[$1] H2 {${edits[0]} million|Wikipedia Edits Per Month $no_upd}/ ; - $line =~ s/H2 (NEW EDITORS PER MONTH)/A[$1] H2 {${new_editors[0]}|New Editors Per Month for All Wikimedia Projects $no_upd}/ ; - $line =~ s/H2 (ACTIVE EDITORS)/A[$1] H2 {${active_editors[0]}|Active Wikimedia Editors for All Wikimedia Projects <small>(5+ edits per month)<\/small> $no_upd}/ ; - $line =~ s/H2 (VERY ACTIVE EDITORS)/A[$1] H2 {${very_active_editors[0]}|Very Active Editors for All Wikimedia Projects <small>(100+ edits per month)<\/small> $no_upd}/ ; + $line =~ s/H2 (ARTICLE COUNT)/A[$1] H2 {${article_count[0]} million|Wikipedia Articles $no_upd_feb}/ ; + $line =~ s/H2 (ARTICLES PER DAY)/A[$1] H2 {${new_articles[0]}|New Wikipedia Articles Per Day $no_upd_feb}/ ; + $line =~ s/H2 (EDITS PER MONTH)/A[$1] H2 {${edits[0]} million|Wikipedia Edits Per Month $no_upd_feb2}/ ; + $line =~ s/H2 (NEW EDITORS PER MONTH)/A[$1] H2 {${new_editors[0]}|New Editors Per Month for All Wikimedia Projects $no_upd_feb2}/ ; + $line =~ s/H2 (ACTIVE EDITORS)/A[$1] H2 {${active_editors[0]}|Active Wikimedia Editors for All Wikimedia Projects <small>(5+ edits per month)<\/small> $no_upd_feb2}/ ; + $line =~ s/H2 (VERY ACTIVE EDITORS)/A[$1] H2 {${very_active_editors[0]}|Very Active Editors for All Wikimedia Projects <small>(100+ edits per month)<\/small> $no_upd_feb2}/ ; $line =~ s/TRENDS UNIQUE VISITORS/TRENDS {$trend_one_year|${visitors[2]}%}{$trend_one_month|${visitors[3]}%}/ ; $line =~ s/TRENDS PAGE REQUESTS/TRENDS {$trend_one_year|${page_requests[2]}%}{$trend_one_month|${page_requests[3]}%}/ ; @@ -1559,7 +1733,8 @@ { my $path_out = shift ; - $notice_synopsis = "<font color=#008000><b>Please keep in mind December has one day more than November, which influences some of the metrics.</b></font><br>" . + $notice_synopsis = "<font color=#008000><b>Please remember subsequent months can have a different number of days, which influences<br>" . + "monthly change percentages. Leap year February still has 7% less days than January</b></font><br>" . "<font color=#008000>Exception: page request counts are always normalized to 30 day months.</font>" ; open SYNOPSIS, '>', "$path_out/RC_${p_year}_${p_month_d2}_synopsis.txt" ; _______________________________________________ MediaWiki-CVS mailing list MediaWiki-CVS@lists.wikimedia.org https://lists.wikimedia.org/mailman/listinfo/mediawiki-cvs