123456789101112131415161718192021222324252627282930313233343536373839404142434445464748 |
- // Note: run `npm install unicode-7.0.0` first.
-
- // Which Unicode version should be used?
- var version = '7.0.0';
-
- var start = require('unicode-' + version + '/properties/ID_Start/code-points')
- .filter(function(ch) { return ch > 127; });
- var cont = [0x200c, 0x200d].concat(require('unicode-' + version + '/properties/ID_Continue/code-points')
- .filter(function(ch) { return ch > 127 && start.indexOf(ch) == -1; }));
-
- function pad(str, width) {
- while (str.length < width) str = "0" + str;
- return str;
- }
-
- function esc(code) {
- var hex = code.toString(16);
- if (hex.length <= 2) return "\\x" + pad(hex, 2);
- else return "\\u" + pad(hex, 4);
- }
-
- function generate(chars) {
- var astral = [], re = "";
- for (var i = 0, at = 0x10000; i < chars.length; i++) {
- var from = chars[i], to = from;
- while (i < chars.length - 1 && chars[i + 1] == to + 1) {
- i++;
- to++;
- }
- if (to <= 0xffff) {
- if (from == to) re += esc(from);
- else if (from + 1 == to) re += esc(from) + esc(to);
- else re += esc(from) + "-" + esc(to);
- } else {
- astral.push(from - at, to - from);
- at = to;
- }
- }
- return {nonASCII: re, astral: astral};
- }
-
- var startData = generate(start), contData = generate(cont);
-
- console.log(" var nonASCIIidentifierStartChars = \"" + startData.nonASCII + "\";");
- console.log(" var nonASCIIidentifierChars = \"" + contData.nonASCII + "\";");
- console.log(" var astralIdentifierStartCodes = " + JSON.stringify(startData.astral) + ";");
- console.log(" var astralIdentifierCodes = " + JSON.stringify(contData.astral) + ";");
|