mirror of
https://github.com/laurent22/joplin.git
synced 2024-12-12 08:54:00 +02:00
61 lines
1.8 KiB
JavaScript
(function() {
|
|
var L = require('./L').L,
|
|
N = require('./N').N,
|
|
Z = require('./Z').Z,
|
|
M = require('./M').M,
|
|
unorm = require('unorm');
|
|
|
|
var nodeEmoji = require('node-emoji')
|
|
|
|
/**
 * Classify a character code against the L, N, Z and M lookup tables.
 *
 * The tables are consulted in the fixed order L, N, Z, M and the name of the
 * first table that contains `code` is returned, so a code present in more
 * than one table is reported under the earliest one.
 * (Presumably the tables hold the code points of the Unicode general
 * categories Letter, Number, Separator and Mark - confirm against ./L, ./N,
 * ./Z and ./M.)
 *
 * @param {number} code - Character code to look up; the slug function in
 *     this file passes the result of `charCodeAt(0)`.
 * @returns {string|undefined} 'L', 'N', 'Z' or 'M', or undefined when the
 *     code is found in none of the tables.
 */
var _unicodeCategory = function(code) {
    if (L.indexOf(code) !== -1) return 'L';
    if (N.indexOf(code) !== -1) return 'N';
    if (Z.indexOf(code) !== -1) return 'Z';
    if (M.indexOf(code) !== -1) return 'M';
    return undefined;
};
|
|
|
|
module.exports = function(string, options) {
|
|
string = string || '';
|
|
options = options || {};
|
|
var allowedChars = options.allowedChars || '-_~';
|
|
var lower = typeof options.lower === 'boolean' ? options.lower : true;
|
|
var spaces = typeof options.spaces === 'boolean' ? options.spaces : false;
|
|
var rv = [];
|
|
var noEmojiString = nodeEmoji.unemojify(string);
|
|
var chars = unorm.nfkc(noEmojiString);
|
|
for(var i = 0; i < chars.length; i++) {
|
|
var c = chars[i];
|
|
var code = c.charCodeAt(0);
|
|
// Allow Common CJK Unified Ideographs
|
|
// See: http://www.unicode.org/versions/Unicode6.0.0/ch12.pdf - Table 12-2
|
|
if (0x4E00 <= code && code <= 0x9FFF) {
|
|
rv.push(c);
|
|
continue;
|
|
}
|
|
|
|
// Allow Hangul
|
|
if (0xAC00 <= code && code <= 0xD7A3) {
|
|
rv.push(c);
|
|
continue;
|
|
}
|
|
|
|
// Japanese ideographic punctuation
|
|
if ((0x3000 <= code && code <= 0x3002) || (0xFF01 <= code && code <= 0xFF02)) {
|
|
rv.push(' ');
|
|
}
|
|
|
|
if (allowedChars.indexOf(c) != -1) {
|
|
rv.push(c);
|
|
continue;
|
|
}
|
|
var val = _unicodeCategory(code);
|
|
if (val && ~'LNM'.indexOf(val)) rv.push(c);
|
|
if (val && ~'Z'.indexOf(val)) rv.push(' ');
|
|
}
|
|
var slug = rv.join('').replace(/^\s+|\s+$/g, '').replace(/\s+/g,' ');
|
|
if (!spaces) slug = slug.replace(/[\s\-]+/g,'-');
|
|
if (lower) slug = slug.toLowerCase();
|
|
return slug;
|
|
};
|
|
}()); |