User:Canderous/editcount.js

From EditThis.info

(Difference between revisions)
m
 
(2 intermediate revisions not shown)
Line 2: Line 2:
// To run this tool on other servers:
// To run this tool on other servers:
-
// 1. copy this script to the target server (this is required because of javascript cross-site security restrictions)
+
// 1. copy this script to the target server (this is required because of javascript cross-site security restrictions)
-
// 2. update the following URL
+
// 2. update the following URL
-
// for example: "User:Canderous/editcount.js"
+
//     for example: "User:Interiot/Tool2/code.js"
var tool2_url = "User:Canderous/editcount.js";
var tool2_url = "User:Canderous/editcount.js";
-
// 3. update this namespace list, extracted from something like http://en.wikiquote.org/wiki/Special:Export//
+
// 3. update this namespace list, extracted from something like http://en.wikiquote.org/wiki/Special:Export//
-
// These *should not* have colons after them.
+
var namespaces = [
var namespaces = [
"Talk",
"Talk",
"User",
"User",
"User talk",
"User talk",
-
"Wikiquote",
+
"Editthis",
-
"Wikiquote talk",
+
"Editthis talk",
"Image",
"Image",
"Image talk",
"Image talk",
Line 25: Line 24:
"Help talk",
"Help talk",
"Category",
"Category",
-
"Category talk",
+
"Category talk"
-
// 3b. these two project project entries are not added by Special:Export, and might or might not need to be updated
+
-
"Editthis",
+
-
"Editthis talk"
+
];
];
-
 
-
namespaces[100] = "Portal";
 
-
namespaces[101] = "Portal talk";
 
-
 
-
// 4. update this date-parser to match the format and language of your specific wiki.  Feel free to contact Interiot regarding this, if you can't find another
 
-
// copy of this script that uses the same language.
 
-
// input: a text string from Special:Contributions.    output: a javascript Date object
 
-
// documentation:  http://www.quirksmode.org/js/introdate.html#parse, http://www.elated.com/tutorials/programming/javascript/dates/
 
-
function date_parse(text) {
 
-
var matches = text.match(/^([0-9:]+), +([0-9]+) +([a-z]+) +([0-9]+)$/i);
 
-
if (!matches) {
 
-
//dump_text("XXX"); // for debugging
 
-
return matches;
 
-
}
 
-
 
-
parseme = matches[3] + ", " + matches[2] + " "  + matches[4] + " " + matches[1] + ":00";
 
-
 
-
//dump_text(parseme); // for debugging
 
-
 
-
var dt = new Date();
 
-
dt.setTime( Date.parse(parseme));
 
-
 
-
//dump_text(dt.toLocaleString()); // for debugging
 
-
 
-
return dt;
 
-
}
 
-
 
-
// ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^ end of server-specific configuration ^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^^
 
-
 
// TODO:
// TODO:
-
// - the current document.location method doesn't work when the page is accessed sans-mod_rewrite
+
// - the current document.location method doesn't work when the page is accessed sans-mod_rewrite
-
// - test with non-ASCII characters
+
// - test with non-ASCII characters
-
// - non-ascii usernames
+
//     - non-ascii usernames
-
// - ??
+
//     - ??
Line 94: Line 61:
function generate_input_form(bodyContent) {
function generate_input_form(bodyContent) {
-
  if (navigator.userAgent.toLowerCase().indexOf('msie')+1)
 
-
  {
 
-
  bodyContent.innerHTML = "This counter does not currently work in Internet Explorer.  Please <a href='http://www.getfirefox.com'>get Firefox</a> or use <a href='http://en.wikipedia.org/wiki/Wikipedia:WikiProject_edit_counters/Flcelloguy%27s_Tool'>Flcelloguy's Tool</a> instead.";
 
-
  }
 
-
  else
 
-
  {
 
   bodyContent.innerHTML =
   bodyContent.innerHTML =
-
             "<form><table><tr><td>Username <td><input maxlength=128 name=username value='' id=username title='username'>" +
+
             "<form><table><tr><td>Username <td><input maxlength=128 name=username value='' title='username'>" +
             "            <tr><td>        <td><input type=submit value='Submit'>" +
             "            <tr><td>        <td><input type=submit value='Submit'>" +
             "</table></form>";
             "</table></form>";
Line 108: Line 69:
   form.method = "get";
   form.method = "get";
   form.action = document.location;
   form.action = document.location;
-
 
-
  document.getElementById("username").focus();
 
-
  }
 
}
}
function generate_main_report() {
function generate_main_report() {
-
   fetch_data(params["username"].replace(/\\+/g, " "),
+
   fetch_data(params["username"], "", output_main_report, 0, []);
-
"", output_main_report, 0, []);
+
}
}
-
 
+
function output_main_report(data) {
-
function add_stats_row(left_col, right_col) {
+
-
var row = document.createElement("tr");
+
-
var left = document.createElement("td");
+
-
var right = document.createElement("td");
+
-
+
-
document.getElementById("basic_stats").appendChild(row);
+
-
row.appendChild(left);
+
-
row.appendChild(right);
+
-
//left.innerHTML = left_col;
+
-
left.appendChild( document.createTextNode(left_col) );
+
-
right.appendChild( document.createTextNode(right_col) );
+
-
return row;
+
-
}
+
-
 
+
-
function output_main_report(history) {
+
-
// -- generate summary statistics
+
-
var unique_articles = new Array();
+
-
var namespace_numedits = new Array();
+
-
for (var i=0; i<namespaces.length; i++) {
+
-
namespace_numedits[ namespaces[i] ] = 0;
+
-
}
+
-
namespace_numedits[""] = 0;
+
-
for (var i=0; i<history.length; i++) {
+
-
var h = history[i];
+
-
unique_articles[  h["title"] ]++;
+
-
namespace_numedits[  h["namespace"] ]++;
+
-
}
+
-
var unique_articles_keys = keys(unique_articles);
+
-
 
+
-
// -- output report
+
-
var table = document.createElement("table");
+
-
table.id = "basic_stats";
+
-
document.getElementById("bodyContent").appendChild(table);
+
-
 
+
-
add_stats_row("Username", params["username"].replace(/\\+/g, " "));
+
-
add_stats_row("Total edits", history.length);
+
-
add_stats_row("Distinct pages edited", unique_articles_keys.length);
+
-
add_stats_row("Average edits/page", new Number(history.length / unique_articles_keys.length).toFixed(3));
+
-
add_stats_row("First edit", history[ history.length-1 ]["date_text"] );
+
-
 
+
-
// add a blank row
+
-
add_stats_row("", "").childNodes[0].style.height = "1em";
+
-
 
+
-
add_stats_row("(main)", namespace_numedits[""]);
+
-
for (var i=0; i<namespaces.length; i++) {
+
-
var nmspc = namespaces[i];
+
-
if (namespace_numedits[nmspc]) {
+
-
add_stats_row(nmspc, namespace_numedits[nmspc]);
+
-
}
+
-
}
+
}
}
-
 
-
// ===================================== HTML-scraping backend =========================================
 
-
 
-
function add_loading_notice() {
 
-
if (document.getElementById("loading_notice"))
 
-
return;
 
-
var loading = document.createElement("div");
 
-
loading.id = "loading_notice";
 
-
loading.innerHTML = "<br><br>Retrieving data<blink>...</blink>";
 
-
document.getElementById("bodyContent").appendChild(loading);
 
-
}
 
-
function remove_loading_notice() {
 
-
var loading = document.getElementById("loading_notice");
 
-
if (!loading) return;
 
-
loading.parentNode.removeChild(loading);
 
-
}
 
var offset_regexp = /href="[^"]+:Contributions[^"]+offset=(\\d+)/gi;
var offset_regexp = /href="[^"]+:Contributions[^"]+offset=(\\d+)/gi;
function fetch_data(username, end_date, handler, offset, page_list) {
function fetch_data(username, end_date, handler, offset, page_list) {
-
add_loading_notice();
+
    var url = prefix + "Special:Contributions/" + username + "?offset=" + offset + "&limit=500";
-
var url = prefix + "Special:Contributions/" + username + "?offset=" + offset + "&limit=5000";
+
    loadXMLDoc(url,  
-
loadXMLDoc(url,  
+
        function (request) {
-
function (request) {
+
            var next_offset = 0;
-
var next_offset = 0;
+
            if (request.readyState != 4)  return;
-
if (request.readyState != 4)  return;
+
            if (request.status == 200) {
-
if (request.status == 200) {
+
                page_list.push(request.responseText);
-
page_list.push(request.responseText);
+
                //dump_text(request.responseText);
-
//dump_text(request.responseText);
+
-
// see if there's another pageful to get
+
                // see if there's another pageful to get
-
var matches = map( function(p){
+
                var matches = map( function(p){
-
return p.match( /(\\d+)$/ )[0];
+
                        return p.match( /(\\d+)$/ )[0];
-
}, request.responseText.match( offset_regexp ) );
+
                    }, request.responseText.match( offset_regexp ) );
-
for (var i=0; i<matches.length; i++) {
+
                for (var i=0; i<matches.length; i++) {
-
var v = matches[i] * 1;
+
                    var v = matches[i] * 1;
-
if (v != 0 && (offset == 0 || v < offset)) {
+
                    if (v != 0 && (offset == 0 || v < offset)) {
-
next_offset = v;
+
                        next_offset = v;
-
break;
+
                        break;
-
}
+
                    }
-
}
+
                }
-
}
+
            }
-
//next_offset = 0; // for testing only, retrieve just the first page of results
+
            if (next_offset == 0) {
-
 
+
                parse_data(page_list, handler);
-
if (next_offset == 0) {
+
            } else {
-
parse_data(page_list, handler);
+
                // tail recurse
-
} else {
+
                fetch_data(username, end_date, handler, next_offset, page_list);
-
// tail recurse
+
            }
-
fetch_data(username, end_date, handler, next_offset, page_list);
+
        });
-
}
+
-
});
+
}
}
-
// input: a list of strings, each string containing the HTML from a single page
 
-
// output: a list, where each individual entry is a specific edit from history
 
function parse_data(page_list, handler) {
function parse_data(page_list, handler) {
-
//var total_len = 0;
+
    //var total_len = 0;
-
//for (var i=0; i<page_list.length; i++) total_len += page_list[i].length;
+
    //for (var i=0; i<page_list.length; i++) total_len += page_list[i].length;
-
//alert("parsing " + page_list.length + " pages comprising " + total_len + " total bytes");
+
    //alert("parsing " + page_list.length + " pages comprising " + total_len + " total bytes");
-
 
+
-
var last_history_ent = [];
+
-
last_history_ent["title"] = "";
+
-
last_history_ent["oldid"] = "";
+
-
 
+
-
var edit_history = new Array();
+
-
for (var pagecnt=0; pagecnt<page_list.length; pagecnt++) {
+
-
var matches = page_list[pagecnt].match( /^<li>[^(]+\\(<a href="[^"]+action=history.*/gim );
+
-
//dump_lines(matches);
+
-
for (var matchcnt=0; matchcnt<matches.length; matchcnt++) {
+
-
var history_text = matches[matchcnt];
+
-
 
+
-
var history_entry = new Array();
+
-
history_entry["date_text"] = history_text.match( /^<li>([^(<]+)/i )[1]
+
-
.replace( / +$/, "");
+
-
history_entry["date"] = date_parse( history_entry["date_text"] );
+
-
history_entry["title"] = history_text.match( /title="([^"]+)"/i )[1]
+
-
.replace( /&quot;/g, "\\"")
+
-
.replace( /&amp;/g, "&");
+
-
var find_comment = history_text.replace(/<span class="autocomment">.*?<\\/span> ?/, "");
+
-
history_entry["comment"] = ifmatch(find_comment.match( /<span class='comment'>(.*?)<\\/span>/ ))
+
-
.replace(/^\\((.*)\\)$/, "$1");
+
-
history_entry["minor"] = /<span class="minor"/.test(history_text);
+
-
history_entry["oldid"] = ifmatch(history_text.match(/oldid=([0-9]+)/i));
+
-
 
+
-
history_entry["namespace"] = "";
+
-
for (var nmspc_ctr=0; nmspc_ctr<namespaces.length; nmspc_ctr++) {
+
-
var nmspc = namespaces[nmspc_ctr] + ":";
+
-
if (history_entry["title"].substring(0, nmspc.length) == nmspc) {
+
-
history_entry["namespace"] = namespaces[nmspc_ctr];
+
-
break;
+
-
}
+
-
}
+
-
 
+
-
//dump_object(history_entry);
+
-
 
+
-
if (history_entry["title"] != last_history_ent["title"] || history_entry["oldid"] != last_history_ent["oldid"])
+
-
edit_history.push(history_entry);
+
-
last_history_ent = history_entry;
+
-
}
+
-
}
+
-
 
+
-
remove_loading_notice();
+
-
 
+
-
handler(edit_history);
+
}
}
-
 
Line 300: Line 140:
function dump_lines(ary) {
function dump_lines(ary) {
-
   dump_text("--> " + ary.join("\
+
   dump_text(ary.join("\
-
--> "));
+
"));
-
}
+
-
 
+
-
function dump_object(obj) {
+
-
var toString = "";
+
-
for (var prop in obj) {
+
-
toString += prop + ": " + obj[prop] + "\
+
-
";
+
-
}
+
-
dump_text(toString);
+
}
}
Line 326: Line 157:
   }
   }
}
}
-
 
function parse_params() {
function parse_params() {
Line 337: Line 167:
   return ret;  
   return ret;  
}
}
-
 
function loadXMLDoc(url, handler)
function loadXMLDoc(url, handler)
Line 344: Line 173:
     if (window.XMLHttpRequest) {
     if (window.XMLHttpRequest) {
         req = new XMLHttpRequest();
         req = new XMLHttpRequest();
-
req.onreadystatechange = function () {handler(req)};
+
    req.onreadystatechange = function () {handler(req)};
         req.open("GET", url, true);
         req.open("GET", url, true);
         req.send(null);
         req.send(null);
Line 357: Line 186:
     }
     }
}
}
-
 
// see http://search.cpan.org/dist/perl/pod/perlfunc.pod#map
// see http://search.cpan.org/dist/perl/pod/perlfunc.pod#map
Line 367: Line 195:
   }
   }
   return ret;
   return ret;
-
}
 
-
 
-
// see http://search.cpan.org/dist/perl/pod/perlfunc.pod#keys
 
-
function keys (obj) {
 
-
var ret = new Array();
 
-
for (var key in obj) {
 
-
ret.push(key);
 
-
}
 
-
return ret;
 
-
}
 
-
 
-
 
-
function ifmatch(ary) {
 
-
if (ary && ary.length >= 2) {
 
-
return ary[1];
 
-
} else {
 
-
return "";
 
-
}
 
}
}

Current revision as of 20:11, 8 March 2007

// see http://paperlined.org/apps/wikipedia/Tool2/ for instructions on adding this to your monobook.js

// To run this tool on other servers:
//  1. copy this script to the target server (this is required because of javascript cross-site security restrictions)

//  2. update the following URL
//      for example: "User:Interiot/Tool2/code.js"
var tool2_url = "User:Canderous/editcount.js";

//  3. update this namespace list, extracted from something like http://en.wikiquote.org/wiki/Special:Export//
var namespaces = [
"Talk",
"User",
"User talk",
"Editthis",
"Editthis talk",
"Image",
"Image talk",
"MediaWiki",
"MediaWiki talk",
"Template",
"Template talk",
"Help",
"Help talk",
"Category",
"Category talk"
];


// TODO:
//  - the current document.location method doesn't work when the page is accessed sans-mod_rewrite
//  - test with non-ASCII characters
//      - non-ascii usernames
//      - ??



var prefix = "";
var params = parse_params();

addOnloadFunction(function() {
  var path_len = document.location.pathname.length;
  // trigger once we view the right page
  if (document.location.pathname.substring(path_len - tool2_url.length, path_len) == tool2_url) {
    // get the prefix (needs to be fixed to work sans-mod_rewrite
    prefix = document.location.protocol + "//" + document.location.host + "/"
            + document.location.pathname.substring(1, path_len - tool2_url.length);

    // blank the inner contents of the page
    var bodyContent = document.getElementById("bodyContent");
    while (bodyContent.childNodes.length > 0) bodyContent.removeChild(bodyContent.lastChild);

    if (document.location.search.length == 0) {
      generate_input_form(bodyContent);
    } else {
      generate_main_report(bodyContent);
    }
  }
});


function generate_input_form(bodyContent) {
  bodyContent.innerHTML =
            "<form><table><tr><td>Username <td><input maxlength=128 name=username value='' title='username'>" +
            "             <tr><td>         <td><input type=submit value='Submit'>" +
            "</table></form>";

  var form = bodyContent.getElementsByTagName("form")[0];
  form.method = "get";
  form.action = document.location;
}

function generate_main_report() {
  fetch_data(params["username"], "", output_main_report, 0, []);
}

function output_main_report(data) {
}



var offset_regexp = /href="[^"]+:Contributions[^"]+offset=(\\d+)/gi;
function fetch_data(username, end_date, handler, offset, page_list) {
    var url = prefix + "Special:Contributions/" + username + "?offset=" + offset + "&limit=500";
    loadXMLDoc(url, 
        function (request) {
            var next_offset = 0;
            if (request.readyState != 4)   return;
            if (request.status == 200) {
                page_list.push(request.responseText);
                //dump_text(request.responseText);

                // see if there's another pageful to get
                var matches = map( function(p){
                        return p.match( /(\\d+)$/ )[0];
                    }, request.responseText.match( offset_regexp ) );
                for (var i=0; i<matches.length; i++) {
                    var v = matches[i] * 1;
                    if (v != 0 && (offset == 0 || v < offset)) {
                        next_offset = v;
                        break;
                    }
                }
            }

            if (next_offset == 0) {
                parse_data(page_list, handler);
            } else {
                // tail recurse
                fetch_data(username, end_date, handler, next_offset, page_list);
            }
        });
}


function parse_data(page_list, handler) {
    //var total_len = 0;
    //for (var i=0; i<page_list.length; i++) total_len += page_list[i].length;
    //alert("parsing " + page_list.length + " pages comprising " + total_len + " total bytes");
}



// ===================================== test/debug functions =========================================

function dump_text(text) {
  //alert("dump_text, with text of size " + text.length);

  var pre = document.createElement("pre");

  var div = document.createElement("div");
  div.style.width = "60em";
  div.style.maxHeight = "40em";
  div.style.overflow = "auto";

  pre.appendChild(document.createTextNode(text));
  div.appendChild(pre);
  document.getElementById("bodyContent").appendChild(div);
}

function dump_lines(ary) {
  dump_text(ary.join("\
"));
}


// ===================================== utility functions =========================================

function addOnloadFunction(f) {
  if (window.addEventListener) window.addEventListener("load",f,false);
  else if (window.attachEvent) window.attachEvent("onload",f);
  else {
    var oldOnload='_old_onload_'+addOnloadFunction.uid;
    addOnloadFunction[oldOnload] = window.onload ? window.onload : function () {};
    window.onload = function() { addOnloadFunction[oldOnload]();  f(); }
    ++addOnloadFunction.uid;
  }
}

function parse_params() {
  var pairs = document.location.search.substring(1).split("&");
  var ret = [];
  for (var i=0; i < pairs.length; i++) {
    var values = pairs[i].split("=");
    ret[values[0]] = unescape(values[1]);
  }
  return ret; 
}

function loadXMLDoc(url, handler)
{
    // branch for native XMLHttpRequest object
    if (window.XMLHttpRequest) {
        req = new XMLHttpRequest();
    req.onreadystatechange = function () {handler(req)};
        req.open("GET", url, true);
        req.send(null);
    // branch for IE/Windows ActiveX version
    } else if (window.ActiveXObject) {
        req = new ActiveXObject("Microsoft.XMLHTTP");
        if (req) {
            req.onreadystatechange = function () {handler(req)};
            req.open("GET", url, true);
            req.send();
        }
    }
}

// see http://search.cpan.org/dist/perl/pod/perlfunc.pod#map
function map (handler, list) {
  var ret = new Array();
  for (var i=0; i<list.length; i++) {
    ret[i] = handler( list[i] );
    // ret.push( handler( list[i] ) );
  }
  return ret;
}
Personal tools