Brūcend:PiRSquared17/spellingstyle
/*********************************************************
* Old English Wikipedia transliterator * * Deals with the following orthographies: gw, ȝƿ, runes * * Created by PiRSquared17 * * Please report bugs on talk page or village pump * * Currently supports: "gw", "ȝƿ", and "runes" * *********************************************************/
/**
* Actually clone content, and transliterate * * @param event The event: event.data.outputstyle (see convertStyle args 2,3) * @returns nothing (undefined) */
function doConv(event) {
var $ = jQuery; if ($("#mw-content-text-clone").length) $("#mw-content-text-clone").remove(); //console.log("Entered doConv, (possibly removed old clone)"); // get target style var targetstyle = event.data.outputstyle; var contentClone; $("#mw-content-text").show(); contentClone = $("#mw-content-text").clone(); contentClone.attr("id", "mw-content-text-clone"); convertStyle(contentClone, "gw", targetstyle); convertStyle(contentClone, "ȝƿ", targetstyle); convertStyle(contentClone, "runes", targetstyle); $("#mw-content-text").hide(); if (targetstyle == "ȝƿ") contentClone.addClass("content-yoghwynn"); else contentClone.addClass("content-" + targetstyle); contentClone.insertAfter("#mw-content-text"); $(".click-gw").click({"outputstyle": "gw"}, doConv); $(".click-yoghwynn").click({"outputstyle": "ȝƿ"}, doConv); $(".click-runes").click({"outputstyle": "runes"}, doConv);
}
// any errors? Fix them var runes = { // rune to latin substitutions
"ᚠ": "f", "ᚢ": "u", "ᚦ": "þ", "ᚩ": "o", "ᚱ": "r", "ᚳ": "c", "ᚷ": "ġ", "ᚹ": "w", "ᚻ": "h", "ᚾ": "n", "ᛁ": "i", "ᛄ": "j", "ᛇ": "ēo", "ᛈ": "p", "ᛉ": "x", "ᛋ": "s", "ᛏ": "t", "ᛒ": "b", "ᛖ": "e", "ᛗ": "m", "ᛚ": "l", "ᛝ": "ng", // this is correct "ᛟ": "œ", "ᛞ": "d", "ᚪ": "a", "ᚫ": "æ", "ᚣ": "y", "ᛡ": "io", // not ia "ᛠ": "ea", // this is ok "ᛢ": "cw", "ᛣ": "c", "ᛤ": "cc", "ᛥ": "st", "ᚸ": "g"
};
// again, please report any errors, please include replacement for this var runes2 = { // latin -> runes
"a": "ᚪ", "ā": "ᚪ", "b": "ᛒ", "c": "ᚳ", "ċ": "ᚳ", // this is appropriate "d": "ᛞ", "e": "ᛖ", "ē": "ᛖ", "f": "ᚠ", "g": "ᚷ", "h": "ᚻ", "i": "ᛁ", "ī": "ᛁ", "ġ": "ᛄ", "k": "ᚳ", "l": "ᛚ", "m": "ᛗ", "n": "ᚾ", "o": "ᚩ", "ō": "ᚩ", "p": "ᛈ", "q": "ᛢ", "r": "ᚱ", "s": "ᛋ", "t": "ᛏ", "u": "ᚢ", "ū": "ᚢ", "v": "ᚹ", // maybe should convert to F instead of W? "w": "ᚹ", "x": "ᛉ", "y": "ᚣ", "ȳ": "ᚣ", "z": "ᛋ", "æ": "ᚫ", "œ": "ᛟ", "þ": "ᚦ", "ð": "ᚦ" // no way to distinguish, unless we want to check whether or not it's the last letter, etc. (???)
};
/**
* Two or more characters -> a single rune or a pattern of runes * Put here anything that should be converted from two or more gw characters to one or more rune. */
rune2_exceptions = [
["ea", "ᛠ"], ["eo", "ᛇ"], ["io", "ᛡ"], ["ng", "ᛝ"], ["cc", "ᛤ"], ["cw", "ᛢ"]
];
/**
* Replace occurrences of regex, possibly normalize * * For nodes (not text) input, modifies object * @param input the input text or jQuery object * @param regex the regular expression * @param replacement replacement * @param norm Normalize input? (also converts to lowercase) * @returns the converted version of input (as text/DOM node) */
var myReplace = function(input, regex, replacement, norm) {
var $ = jQuery; if (typeof regex == "string") regex = new RegExp(regex, "g"); if (typeof input == "string") return norm?normalizeString(input).toLowerCase():input.replace(regex,replacement); if (typeof input == "undefined") return; var node = input[0]; if (typeof node == "undefined") node = input; if (!("nodeType" in node)) return node; if (node.nodeType == 3) { if (norm) node.nodeValue = normalizeString(node.nodeValue).toLowerCase(); node.nodeValue = node.nodeValue.replace(regex, replacement); } else { if ($(node).hasClass("nochange")) return node; if (!("childNodes" in node)) return node; for (var i = 0, len = node.childNodes.length; i < len; i++) myReplace($(node.childNodes[i]), regex, replacement, norm); } return node;
}
/**
* Convert style of text/jQuery node from one spelling style to another * * @param inputhtml input text or jQuery node * @param inputstyle possible values: "gw", "ȝƿ", "runes" * @param outputstyle possible values:"gw", "ȝƿ", "runes" * @returns converted version of inputhtml */
function convertStyle(inputhtml, inputstyle, outputstyle) {
var temp = inputhtml; if (inputstyle == outputstyle) return inputhtml; if (inputstyle == "gw" && outputstyle == "ȝƿ") { temp = myReplace(temp, /G/g, 'Ȝ'); temp = myReplace(temp, /g/g, 'ȝ'); temp = myReplace(temp, /W/g, 'Ƿ'); temp = myReplace(temp, /w/g, 'ƿ'); } else if (inputstyle == "ȝƿ" && outputstyle == "gw") { temp = myReplace(temp, /Ȝ/g, "G"); temp = myReplace(temp, /ȝ/g, "g"); temp = myReplace(temp, /Ƿ/g, "W"); temp = myReplace(temp, /ƿ/g, "w"); } else if (inputstyle == "runes") { for (var rune in runes) { temp = myReplace(temp, rune, runes[rune]); } return convertStyle(temp, "gw", outputstyle); } else if (outputstyle == "runes") { temp = convertStyle(myReplace(temp,"","",1), inputstyle, "gw"); for (var i = 0; i < rune2_exceptions.length; i++) { temp = myReplace(temp,rune2_exceptions[i][0],rune2_exceptions[i][1]); } for (var latin in runes2) { temp = myReplace(temp, latin, runes2[latin]); } } return temp;
}
/**
* Remove some accents, in an Anglo-Saxon-centric manner * * @param r the string * @returns normalized version (same case, e.g., É -> E, é -> e) */
function normalizeString(r){
// from http://stackoverflow.com/questions/8186302/javascript-removing-accents , modified // same code is found in another S.O. post r = myReplace(r, /ċ/g , "c"); r = myReplace(r, /Ċ/g , "C"); r = myReplace(r, "Ġ" , "G"); r = myReplace(r, "ġ" , "g"); r = myReplace(r, /[àáâãäåā]/g, "a"); r = myReplace(r, /[ÀÁÂÃÄÅĀ]/g, "A"); r = myReplace(r, /ç/g , "s"); r = myReplace(r, /Ç/g , "S"); r = myReplace(r, /[èéêëē]/g , "e"); r = myReplace(r, /[ÈÉÊËĒ]/g , "E"); r = myReplace(r, /[ìíîïī]/g , "i"); r = myReplace(r, /[ÌÍÎÏĪ]/g , "I"); r = myReplace(r, /ñ/g , "n"); r = myReplace(r, /Ñ/g , "n"); r = myReplace(r, /[òóôõöō]/g , "o"); r = myReplace(r, /[ÒÓÔÕÖŌ]/g , "O"); r = myReplace(r, /[ùúûüū]/g , "u"); r = myReplace(r, /[ÙÚÛÜŪ]/g , "U"); r = myReplace(r, /[ýÿȳ]/g , "y"); r = myReplace(r, /[ŸȲ]/g , "Y"); r = myReplace(r, /ǣ/g , "æ"); r = myReplace(r, /Ǣ/g , "Æ"); r = myReplace(r, /Ḡ/g , "G"); r = myReplace(r, /ḡ/g , "g"); return r;
}
/*
* This is code to be executed when the document is ready * Basically, add [ gw ] [ ȝƿ ] [ ᚱᚢᚾ ]. * Clicking each link converts the document to that style. * (see doConv) */
$(function() {
$ = jQuery;
$("#mw-content-text").prepend($("
"));
$(".click-gw").click({"outputstyle": "gw"}, doConv); $(".click-yoghwynn").click({"outputstyle": "ȝƿ"}, doConv); $(".click-runes").click({"outputstyle": "runes"}, doConv);
});