MediaWiki:Gadget-I18n-js.js: Difference between revisions
From Tardis Wiki, the free Doctor Who reference
(prevent xss via parsed messages by using separate empty document for jquery calls) |
(add msg().exists; don't duplicate escape code) |
||
Line 4: | Line 4: | ||
* | * | ||
* @author Cqm <https://dev.wikia.com/User:Cqm> | * @author Cqm <https://dev.wikia.com/User:Cqm> | ||
* @version 0.4. | * @version 0.4.2 | ||
* | * | ||
* @notes Also used by VSTF wiki for their reporting forms (with a non-dev i18n.json page) | * @notes Also used by VSTF wiki for their reporting forms (with a non-dev i18n.json page) | ||
Line 465: | Line 465: | ||
return { | return { | ||
/* | |||
* Boolean representing whether the message exists. | |||
*/ | |||
exists: msg !== noMsg, | |||
/* | /* | ||
* Parse wikitext links in the message and return the result. | * Parse wikitext links in the message and return the result. | ||
Line 473: | Line 478: | ||
// skip parsing if the message wasn't found otherwise | // skip parsing if the message wasn't found otherwise | ||
// the sanitisation will mess with it | // the sanitisation will mess with it | ||
if ( | if (!this.exists) { | ||
return | return this.escape(); | ||
} | } | ||
Line 488: | Line 493: | ||
// skip parsing if the message wasn't found otherwise | // skip parsing if the message wasn't found otherwise | ||
// the sanitisation will mess with it | // the sanitisation will mess with it | ||
if ( | if (!this.exists) { | ||
return | return this.escape(); | ||
} | } | ||
Revision as of 18:28, 16 August 2018
/* <nowiki>
* Library for accessing i18n messages for use in Dev Wiki scripts.
* See [[I18n-js]] for documentation.
*
* @author Cqm <https://dev.wikia.com/User:Cqm>
* @version 0.4.2
*
* @notes Also used by VSTF wiki for their reporting forms (with a non-dev i18n.json page)
* @notes This is apparently a commonly used library for a number of scripts and also includes
* a check to prevent double loading. This can make it painful to test from your JS
* console. To get around this, add ?usesitejs=0&useuserjs=0 to your URL.
*/
/*global mediaWiki */
/*jshint bitwise:true, camelcase:true, curly:true, eqeqeq:true, es3:false,
forin:true, immed:true, indent:4, latedef:true, newcap:true,
noarg:true, noempty:true, nonew:true, plusplus:true, quotmark:single,
undef:true, unused:true, strict:true, trailing:true,
browser:true, devel:false, jquery:true,
onevar:true
*/
;(function (window, $, mw, undefined) {
'use strict';
window.dev = window.dev || {};
// prevent double loading and loss of cache
if (window.dev.i18n !== undefined) {
return;
}
/*
* Snapshot of the MediaWiki config values this file reads: the wiki content
* language (wgContentLanguage) and the current user's language (wgUserLanguage).
*/
var conf = mw.config.get([
'wgContentLanguage',
'wgUserLanguage'
]),
/*
* Cache of i18n objects that have already been built, keyed by the name passed to
* loadMessages(). Written by parseMessagesToObject() and read by loadMessages().
*/
cache = {},
/*
* Message overrides supplied by end-users. Starts as null and is pointed at
* window.dev.i18n.overrides at the bottom of this file. getMsg() reads it as
* overrides[messageKey][name]. See documentation for how to use.
*/
overrides = null,
/*
* Language fallbacks for those that don't fallback to English.
* Maps a language code to the language code getMsg() tries next when a message is
* missing; any code not listed here falls back straight to 'en'.
* Shouldn't need updating unless Wikia change theirs.
*
* To generate this, use `$ grep -R "fallback =" /path/to/messages/`,
* pipe the result to a text file and format the result.
*/
fallbacks = {
'ab': 'ru',
'ace': 'id',
'aln': 'sq',
'als': 'gsw',
'an': 'es',
'anp': 'hi',
'arn': 'es',
'arz': 'ar',
'av': 'ru',
'ay': 'es',
'ba': 'ru',
'bar': 'de',
'bat-smg': 'sgs',
'bcc': 'fa',
'be-x-old': 'be-tarask',
'bh': 'bho',
'bjn': 'id',
'bm': 'fr',
'bpy': 'bn',
'bqi': 'fa',
'bug': 'id',
'cbk-zam': 'es',
'ce': 'ru',
'ckb': 'ckb-arab',
'crh': 'crh-latn',
'crh-cyrl': 'ru',
'csb': 'pl',
'cv': 'ru',
'de-at': 'de',
'de-ch': 'de',
'de-formal': 'de',
'dsb': 'de',
'dtp': 'ms',
'eml': 'it',
'ff': 'fr',
'fiu-vro': 'vro',
'frc': 'fr',
'frp': 'fr',
'frr': 'de',
'fur': 'it',
'gag': 'tr',
'gan': 'gan-hant',
'gan-hans': 'zh-hans',
'gan-hant': 'zh-hant',
'gl': 'pt',
'glk': 'fa',
'gn': 'es',
'gsw': 'de',
'hif': 'hif-latn',
'hsb': 'de',
'ht': 'fr',
'ii': 'zh-cn',
'inh': 'ru',
'iu': 'ike-cans',
'jut': 'da',
'jv': 'id',
'kaa': 'kk-latn',
'kbd': 'kbd-cyrl',
'kbd-cyrl': 'ru',
'khw': 'ur',
'kiu': 'tr',
'kk': 'kk-cyrl',
'kk-arab': 'kk-cyrl',
'kk-cn': 'kk-arab',
'kk-kz': 'kk-cyrl',
'kk-latn': 'kk-cyrl',
'kk-tr': 'kk-latn',
'kl': 'da',
'koi': 'ru',
'ko-kp': 'ko',
'krc': 'ru',
'ks': 'ks-arab',
'ksh': 'de',
'ku': 'ku-latn',
'ku-arab': 'ckb',
'kv': 'ru',
'lad': 'es',
'lb': 'de',
'lbe': 'ru',
'lez': 'ru',
'li': 'nl',
'lij': 'it',
'liv': 'et',
'lmo': 'it',
'ln': 'fr',
'ltg': 'lv',
'lzz': 'tr',
'mai': 'hi',
'map-bms': 'jv',
'mg': 'fr',
'mhr': 'ru',
'min': 'id',
'mo': 'ro',
'mrj': 'ru',
'mwl': 'pt',
'myv': 'ru',
'mzn': 'fa',
'nah': 'es',
'nap': 'it',
'nds': 'de',
'nds-nl': 'nl',
'nl-informal': 'nl',
'no': 'nb',
'os': 'ru',
'pcd': 'fr',
'pdc': 'de',
'pdt': 'de',
'pfl': 'de',
'pms': 'it',
// NOTE(review): presumably disabled because 'pt-br' falls back to 'pt' on the next
// line, so enabling this entry would make the fallback chain circular - confirm.
// 'pt': 'pt-br',
'pt-br': 'pt',
'qu': 'es',
'qug': 'qu',
'rgn': 'it',
'rmy': 'ro',
'rue': 'uk',
'ruq': 'ruq-latn',
'ruq-cyrl': 'mk',
'ruq-latn': 'ro',
'sa': 'hi',
'sah': 'ru',
'scn': 'it',
'sg': 'fr',
'sgs': 'lt',
'shi': 'ar',
'simple': 'en',
'sli': 'de',
'sr': 'sr-ec',
'srn': 'nl',
'stq': 'de',
'su': 'id',
'szl': 'pl',
'tcy': 'kn',
'tg': 'tg-cyrl',
'tt': 'tt-cyrl',
'tt-cyrl': 'ru',
'ty': 'fr',
'udm': 'ru',
'ug': 'ug-arab',
'uk': 'ru',
'vec': 'it',
'vep': 'et',
'vls': 'nl',
'vmf': 'de',
'vot': 'fi',
'vro': 'et',
'wa': 'fr',
'wo': 'fr',
'wuu': 'zh-hans',
'xal': 'ru',
'xmf': 'ka',
'yi': 'he',
'za': 'zh-hans',
'zea': 'nl',
'zh': 'zh-hans',
'zh-classical': 'lzh',
'zh-cn': 'zh-hans',
'zh-hant': 'zh-hans',
'zh-hk': 'zh-hant',
'zh-min-nan': 'nan',
'zh-mo': 'zh-hk',
'zh-my': 'zh-sg',
'zh-sg': 'zh-hans',
'zh-tw': 'zh-hant',
'zh-yue': 'yue'
};
/*
 * Read an own (non-inherited) property of an object.
 *
 * @param obj The object to read from; may be null or undefined.
 * @param key The property name.
 *
 * @return The property value, or undefined when obj is falsy or the property
 *     only exists on the prototype chain (e.g. 'constructor', 'toString').
 */
function getOwn(obj, key) {
    if (obj && Object.prototype.hasOwnProperty.call(obj, key)) {
        return obj[key];
    }
    return undefined;
}
/*
 * Get a translation of a message from the messages object in the
 * requested language.
 *
 * Lookup order:
 * 1. a user override for this script (overrides[messageKey][name]), regardless
 *    of language;
 * 2. the message in the requested language;
 * 3. the same lookup in the fallback language from `fallbacks`, or 'en' when the
 *    language has no entry there.
 *
 * Empty-string messages are treated as missing, so they fall through to the
 * next step. Only own properties are consulted, so names that exist on
 * Object.prototype are never mistaken for messages.
 *
 * @param messages The message object to look the message up in, keyed by
 *     language code and then by message name.
 * @param name The name of the message to get.
 * @param lang The language to get the message in.
 * @param messageKey The key under which overrides for this script are stored.
 *
 * @return The requested translation or the name wrapped in < ... > if no
 *     message could be found.
 */
function getMsg(messages, name, lang, messageKey) {
    // if the message has been overridden, use that without checking the language
    var override = getOwn(getOwn(overrides, messageKey), name),
        translation;
    if (override) {
        return override;
    }
    translation = getOwn(getOwn(messages, lang), name);
    if (translation) {
        return translation;
    }
    // English is the end of every fallback chain
    if (lang === 'en') {
        return '<' + name + '>';
    }
    return getMsg(messages, name, getOwn(fallbacks, lang) || 'en', messageKey);
}
/*
 * Substitute arguments into the string, where arguments are represented
 * as $n where n > 0.
 *
 * The message is scanned once, so:
 * - $10 refers to the tenth argument rather than the first followed by '0';
 * - text inserted for one placeholder is never re-scanned for later ones;
 * - '$' sequences inside an argument value (e.g. '$&') are inserted literally.
 * Placeholders with no matching argument (including $0) are left as they are.
 *
 * @param message The message to substitute arguments into.
 * @param args Array of arguments; args[0] replaces $1, args[1] replaces $2, ...
 *
 * @return The resulting message.
 */
function handleArgs(message, args) {
    return message.replace(/\$(\d+)/g, function (placeholder, digits) {
        var index = parseInt(digits, 10) - 1;
        if (index < 0 || index >= args.length) {
            return placeholder;
        }
        return String(args[index]);
    });
}
/*
 * Generate a HTML link using the supplied parameters.
 *
 * @param href The link target. A target starting with 'http://', 'https://' or
 *     '//' is used as-is; anything else is treated as a page name and converted
 *     to a local URL with mw.util.getUrl.
 * @param text The text and title of the link. If this is not supplied, it
 *     will default to href.
 *
 * @return The generated link. Both href and text are HTML-escaped.
 */
function makeLink(href, text) {
    // require the '//' part so that page titles which merely begin with
    // 'http' (e.g. 'http cookie') are still treated as wiki pages
    var hasProtocol = /^(?:https?:)?\/\//.test(href);
    text = text || href;
    href = hasProtocol ? href : mw.util.getUrl(href);
    text = mw.html.escape(text);
    href = mw.html.escape(href);
    return '<a href="' + href + '" title="' + text + '">' + text + '</a>';
}
/*
 * Allow basic inline HTML tags in wikitext. Does not support <a> as that's
 * handled by the wikitext links instead.
 *
 * Supports the following tags:
 * - <i>
 * - <b>
 * - <em>
 * - <strong>
 * - <span>
 *
 * Supports the following tag attributes:
 * - title
 * - style
 * - class
 *
 * Elements with any other tag are removed together with their content, and any
 * other attribute is stripped. A style attribute is dropped entirely when it
 * contains url( in any letter case, or a backslash (CSS escape sequences can
 * spell url( without the literal characters).
 *
 * The HTML is parsed into a separate, empty document so that nothing in the
 * message can run or load while it is being inspected.
 *
 * @param html The HTML string to sanitise.
 *
 * @return The sanitised HTML string.
 */
function sanitiseHtml(html) {
    var context = document.implementation.createHTMLDocument(''),
        $html = $.parseHTML(html, /* document */ context, /* keepscripts */ false),
        $div = $('<div>', context).append($html),
        whitelistAttrs = [
            'title',
            'style',
            'class'
        ],
        whitelistTags = [
            'i',
            'b',
            'em',
            'strong',
            'span'
        ];
    $div.find('*').each(function () {
        var $this = $(this),
            tagname = $this.prop('tagName').toLowerCase(),
            attrs,
            array,
            style;
        if (whitelistTags.indexOf(tagname) === -1) {
            mw.log('[I18n-js] Disallowed tag in message: ' + tagname);
            $this.remove();
            return;
        }
        attrs = $this.prop('attributes');
        // copy first: the live attribute list changes as attributes are removed
        array = Array.prototype.slice.call(attrs);
        array.forEach(function (attr) {
            if (whitelistAttrs.indexOf(attr.name) === -1) {
                mw.log('[I18n-js] Disallowed attribute in message: ' + attr.name + ', tag: ' + tagname);
                $this.removeAttr(attr.name);
                return;
            }
            // make sure there's nothing nasty in style attributes
            if (attr.name === 'style') {
                // CSS function names are case-insensitive, so compare in lower case
                style = $this.attr('style').toLowerCase();
                if (style.indexOf('url(') > -1) {
                    mw.log('[I18n-js] Disallowed url() in style attribute');
                    $this.removeAttr('style');
                } else if (style.indexOf('\\') > -1) {
                    mw.log('[I18n-js] Disallowed escape sequence in style attribute');
                    $this.removeAttr('style');
                }
            }
        });
    });
    return $div.prop('innerHTML');
}
/*
 * Turn basic wikitext links in a message into HTML anchors. Basic inline HTML
 * tags are also supported: a message containing '<' is passed through
 * sanitiseHtml before any links are converted.
 *
 * Recognised link forms:
 * - [url text]
 * - [[pagename]]
 * - [[pagename|text]]
 *
 * @param message The message to process.
 *
 * @return The resulting string.
 */
function parse(message) {
    var externalLinkRgx = /\[((?:https?:)?\/\/.+?) (.+?)\]/g,
        barePageRgx = /\[\[([^|]*?)\]\]/g,
        pipedPageRgx = /\[\[(.+?)\|(.+?)\]\]/g,
        result = message;
    if (result.indexOf('<') !== -1) {
        result = sanitiseHtml(result);
    }
    // external links: [url text]
    result = result.replace(externalLinkRgx, function (_all, target, label) {
        return makeLink(target, label);
    });
    // internal links without a label: [[pagename]]
    result = result.replace(barePageRgx, function (_all, page) {
        return makeLink(page);
    });
    // internal links with a label: [[pagename|text]]
    result = result.replace(pipedPageRgx, function (_all, page, label) {
        return makeLink(page, label);
    });
    return result;
}
/*
 * Parse markdown links into HTML. Also supports basic inline HTML tags: a
 * message containing '<' is passed through sanitiseHtml first.
 *
 * Will process:
 * - [text](url)
 * - [page]
 * - [text](page)
 *
 * All three forms are handled in a single pass. Converting [page] in a separate
 * earlier pass would consume the '[text]' half of '[text](page)' and leave
 * '(page)' behind as plain text. A single pass also means generated anchor
 * HTML is never re-scanned for further links.
 *
 * makeLink decides whether the target is an external URL or a page name.
 *
 * @param message The message to process.
 *
 * @return The resulting string.
 */
function markdown(message) {
    // [text] optionally followed by (target)
    var linkRgx = /\[([^\]]+)\](?:\(([^)]+)\))?/g;
    if (message.indexOf('<') > -1) {
        message = sanitiseHtml(message);
    }
    return message.replace(linkRgx, function (_match, text, target) {
        if (target === undefined) {
            // [page]: the bracket content is both the target and the label
            return makeLink(text);
        }
        return makeLink(target, text);
    });
}
/*
 * Create a new Message instance.
 *
 * The returned methods read their state from this closure rather than from
 * `this`, so they keep working when detached from the object (for example when
 * passed as a callback).
 *
 * @param messages The message object to look translations up in.
 * @param defaultLang The language code to look the message up in.
 * @param args Array whose first element is the message name; any remaining
 *     elements are substituted into the message as $1, $2, ... The array is
 *     modified (the name is shifted off).
 * @param messageKey The key under which overrides for this script are stored.
 *
 * @return The Message object, or undefined if args is empty.
 */
function message(messages, defaultLang, args, messageKey) {
    if (!args.length) {
        return;
    }
    var msgName = args.shift(),
        noMsg = '<' + msgName + '>',
        msg = getMsg(messages, msgName, defaultLang, messageKey),
        // decided before substitution so that argument values cannot change the answer
        exists = msg !== noMsg;
    if (args.length) {
        msg = handleArgs(msg, args);
    }
    function escapeMsg() {
        return mw.html.escape(msg);
    }
    return {
        /*
         * Boolean representing whether the message exists.
         */
        exists: exists,
        /*
         * Parse wikitext links in the message and return the result.
         *
         * @return The resulting string.
         */
        parse: function () {
            // skip parsing if the message wasn't found otherwise
            // the sanitisation will mess with it
            if (!exists) {
                return escapeMsg();
            }
            return parse(msg);
        },
        /*
         * Parse markdown links in the message and return the result.
         *
         * @return The resulting string.
         */
        markdown: function () {
            // skip parsing if the message wasn't found otherwise
            // the sanitisation will mess with it
            if (!exists) {
                return escapeMsg();
            }
            return markdown(msg);
        },
        /*
         * Escape any HTML in the message and return the result.
         *
         * @return The resulting string.
         */
        escape: escapeMsg,
        /*
         * Return the message as is.
         *
         * @return The resulting string.
         */
        plain: function () {
            return msg;
        }
    };
}
/*
 * Build the i18n object for one set of messages.
 *
 * The object keeps two pieces of state: a default language (initially the
 * user's language) used by every msg() call, and a one-shot language set by the
 * in*Lang() methods that applies to the next msg() call only.
 *
 * @param messages The message object to look translations up in.
 * @param name The name the messages were loaded under. It doubles as the key
 *     for message overrides, unless it starts with 'u:', in which case no
 *     override key is used.
 *
 * @return The i18n object.
 */
function i18n(messages, name) {
    var messageKey = name.indexOf('u:') === 0 ? null : name,
        defaultLang = conf.wgUserLanguage,
        tempLang = null;
    return {
        /*
         * Set the default language.
         *
         * @param lang The language code to use by default.
         */
        useLang: function (lang) {
            defaultLang = lang;
        },
        /*
         * Set the language for the next msg call.
         *
         * @param lang The language code to use for the next `msg` call.
         *
         * @return The current object for use in chaining.
         */
        inLang: function (lang) {
            tempLang = lang;
            return this;
        },
        /*
         * Set the default language to the content language.
         */
        useContentLang: function () {
            defaultLang = conf.wgContentLanguage;
        },
        /*
         * Set the language for the next `msg` call to the content language.
         *
         * @return The current object for use in chaining.
         */
        inContentLang: function () {
            tempLang = conf.wgContentLanguage;
            return this;
        },
        /*
         * Set the default language to the user's language.
         */
        useUserLang: function () {
            defaultLang = conf.wgUserLanguage;
        },
        /*
         * Set the language for the next msg call to the user's language.
         *
         * @return The current object for use in chaining.
         */
        inUserLang: function () {
            tempLang = conf.wgUserLanguage;
            return this;
        },
        /*
         * Create a new instance of Message. The first argument is the message
         * name; the rest are substituted into the message.
         */
        msg: function () {
            var args = Array.prototype.slice.call(arguments),
                lang = defaultLang;
            // a one-shot language wins over the default and is then cleared
            if (tempLang !== null) {
                lang = tempLang;
                tempLang = null;
            }
            return message(messages, lang, args, messageKey);
        },
        /*
         * For accessing the raw messages.
         */
        _messages: messages
    };
}
/*
 * Strip comments from a JSON string which are illegal under the JSON spec.
 *
 * Removes '//' line comments (up to, but not including, the line break) and
 * block comments. Double-quoted string literals are copied through untouched,
 * so values such as "https://example.com" or "a /* b" are preserved. A single
 * trailing semi-colon is also removed.
 *
 * @param json The JSON string.
 *
 * @return The JSON string after any comments have been removed.
 */
function stripComments(json) {
    var out = '',
        pos = 0,
        len,
        ch,
        next,
        end;
    mw.log('[I18n-js] Raw i18n.json:', json);
    json = json.trim();
    len = json.length;
    while (pos < len) {
        ch = json.charAt(pos);
        next = json.charAt(pos + 1);
        if (ch === '"') {
            // string literal: find the closing quote, stepping over escaped characters
            end = pos + 1;
            while (end < len && json.charAt(end) !== '"') {
                if (json.charAt(end) === '\\') {
                    end += 1;
                }
                end += 1;
            }
            out += json.slice(pos, end + 1);
            pos = end + 1;
        } else if (ch === '/' && next === '/') {
            // inline comment: skip to the end of the line, keeping the line break
            end = json.indexOf('\n', pos);
            pos = end === -1 ? len : end;
        } else if (ch === '/' && next === '*' && json.indexOf('*/', pos + 2) !== -1) {
            // block comment: skip past the closing marker
            pos = json.indexOf('*/', pos + 2) + 2;
        } else {
            out += ch;
            pos += 1;
        }
    }
    // for some reason a semi-colon can be appended to the JSON
    json = out.replace(/;\s*$/, '');
    mw.log('[I18n-js] Comment-stripped i18n.json:', json);
    return json;
}
/*
 * Turn the JSON text loaded from a page into an i18n object and cache it.
 *
 * Comments are stripped before parsing. If the text cannot be parsed, the
 * problem is reported with console.log and an i18n object with no messages is
 * created (and cached) instead.
 *
 * @param name The name the messages are loaded under; also the cache key.
 * @param res The JSON string.
 *
 * @return The resulting i18n object.
 */
function parseMessagesToObject(name, res) {
    var parsed = {},
        reason,
        instance;
    // handle parse errors gracefully
    try {
        parsed = JSON.parse(stripComments(res));
    } catch (err) {
        reason = err.message;
        if (reason === 'Unexpected end of JSON input') {
            reason += '. This may be caused by a non-existent i18n.json page.';
        }
        console.log('[I18n-js] SyntaxError in messages: ' + reason);
    }
    instance = i18n(parsed, name);
    // cache the result in case it's used multiple times
    cache[name] = instance;
    return instance;
}
/*
 * Load messages stored as JSON on a page.
 *
 * @param name The name of the script the messages are for. This will be
 *     used to get messages from
 *     https://dev.wikia.com/wiki/MediaWiki:Custom-name/i18n.json.
 *     A name starting with 'u:' is used as the full page name instead, which
 *     lets other wikis keep their own JSON page.
 *
 * @return A jQuery.Deferred instance. It is resolved with the i18n object, or
 *     rejected if the 'mediawiki.util' module or the messages page could not be
 *     loaded (previously it stayed pending forever in that case).
 */
function loadMessages(name) {
    var deferred = $.Deferred(),
        page,
        params;
    if (cache[name]) {
        deferred.resolve(cache[name]);
        return deferred;
    }
    // allow custom i18n pages to be specified on other wikis
    // mainly for VSTF wiki to keep their own JSON file
    page = 'u:dev:MediaWiki:Custom-' + name + '/i18n.json';
    if (name.indexOf('u:') === 0) {
        page = name;
    }
    params = {
        mode: 'articles',
        articles: page,
        only: 'styles',
        // keep the json unminified as vstf wiki use comments in their json file
        debug: '1'
    };
    // NOTE(review): 'site' and 'user' used to be listed as dependencies so that
    // end-users could set overrides in their local JS before the messages are
    // loaded. They are not requested here; the library presumably relies on
    // being loaded after them anyway - confirm.
    mw.loader.using(['mediawiki.util'], function () {
        $.get(mw.util.wikiScript('load'), params)
            .done(function (res) {
                deferred.resolve(parseMessagesToObject(name, res));
            })
            .fail(function (_xhr, status, error) {
                mw.log('[I18n-js] Failed to load messages for ' + name + ': ' + status);
                deferred.reject(status, error);
            });
    }, function (err) {
        mw.log('[I18n-js] Failed to load mediawiki.util for ' + name);
        deferred.reject(err);
    });
    return deferred;
}
// Publish the API as window.dev.i18n, merging into any object that is already
// there so that existing properties (such as user overrides) are kept.
window.dev.i18n = $.extend(window.dev.i18n || {}, {
    loadMessages: loadMessages,
    // 'hidden' functions to allow testing
    _stripComments: stripComments,
    _getMsg: getMsg,
    _handleArgs: handleArgs,
    _parse: parse,
    _markdown: markdown,
    _fallbacks: fallbacks
});
// Make sure an overrides object exists on the API and keep a local reference
// to that same object for getMsg to read.
overrides = window.dev.i18n.overrides = window.dev.i18n.overrides || {};
// Let waiting scripts know the library is ready.
mw.hook('dev.i18n').fire(window.dev.i18n);
// alternatively, use $.getScript (or mw.loader)
// and use the returned promise
}(this, jQuery, mediaWiki));