// Note: run `npm install unicode-7.0.0` first. // Which Unicode version should be used? var version = '7.0.0'; var start = require('unicode-' + version + '/properties/ID_Start/code-points') .filter(function(ch) { return ch > 127; }); var cont = [0x200c, 0x200d].concat(require('unicode-' + version + '/properties/ID_Continue/code-points') .filter(function(ch) { return ch > 127 && start.indexOf(ch) == -1; })); function pad(str, width) { while (str.length < width) str = "0" + str; return str; } function esc(code) { var hex = code.toString(16); if (hex.length <= 2) return "\\x" + pad(hex, 2); else return "\\u" + pad(hex, 4); } function generate(chars) { var astral = [], re = ""; for (var i = 0, at = 0x10000; i < chars.length; i++) { var from = chars[i], to = from; while (i < chars.length - 1 && chars[i + 1] == to + 1) { i++; to++; } if (to <= 0xffff) { if (from == to) re += esc(from); else if (from + 1 == to) re += esc(from) + esc(to); else re += esc(from) + "-" + esc(to); } else { astral.push(from - at, to - from); at = to; } } return {nonASCII: re, astral: astral}; } var startData = generate(start), contData = generate(cont); console.log(" var nonASCIIidentifierStartChars = \"" + startData.nonASCII + "\";"); console.log(" var nonASCIIidentifierChars = \"" + contData.nonASCII + "\";"); console.log(" var astralIdentifierStartCodes = " + JSON.stringify(startData.astral) + ";"); console.log(" var astralIdentifierCodes = " + JSON.stringify(contData.astral) + ";");