0% found this document useful (0 votes)

60 views8 pages

Punycode Es6

The document defines constants and functions for encoding and decoding Punycode strings. It includes constants for the Punycode parameters like the base and minimum/maximum values. It also defines error messages and regular expressions. The main functions are decode() and encode() which convert between Unicode symbols and Punycode ASCII strings. Additional functions map domains and convert between code points and digits.

Uploaded by

TodDynHØ UtKz

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT, PDF, TXT or read online on Scribd

0% found this document useful (0 votes)

60 views8 pages

Punycode Es6

Uploaded by

TodDynHØ UtKz

We take content rights seriously. If you suspect this is your content, claim it here.

Available Formats

Download as TXT, PDF, TXT or read online on Scribd

You are on page 1/ 8

'use strict';

/** Highest positive signed 32-bit float value */

const maxInt = 2147483647; // aka. 0x7FFFFFFF or 2^31-1

/** Bootstring parameters */

const base = 36;
const tMin = 1;
const tMax = 26;
const skew = 38;
const damp = 700;
const initialBias = 72;
const initialN = 128; // 0x80
const delimiter = '-'; // '\x2D'

/** Regular expressions */

const regexPunycode = /^xn--/;
const regexNonASCII = /[^\0-\x7F]/; // Note: U+007F DEL is excluded too.
const regexSeparators = /[\x2E\u3002\uFF0E\uFF61]/g; // RFC 3490 separators

/** Error messages */

const errors = {
'overflow': 'Overflow: input needs wider integers to process',
'not-basic': 'Illegal input >= 0x80 (not a basic code point)',
'invalid-input': 'Invalid input'
};

/** Convenience shortcuts */

const baseMinusTMin = base - tMin;
const floor = Math.floor;
const stringFromCharCode = String.fromCharCode;

/*--------------------------------------------------------------------------*/

/**
 * Raises the error registered under `type` in the `errors` table.
 * This function never returns normally.
 * @private
 * @param {String} type Key into `errors` that selects the message.
 * @throws {RangeError} Always; its message is `errors[type]`.
 */
function error(type) {
	const message = errors[type];
	throw new RangeError(message);
}

/**
 * Minimal stand-in for `Array#map`.
 * The callback receives only the item (no index, no array), and items are
 * visited from the last index down to the first.
 * @private
 * @param {Array} array The array to iterate over.
 * @param {Function} callback Invoked once per item with that item.
 * @returns {Array} A new array holding the callback results at the same
 * indices as their inputs.
 */
function map(array, callback) {
	const mapped = [];
	for (let index = array.length - 1; index >= 0; index--) {
		mapped[index] = callback(array[index]);
	}
	return mapped;
}

/**
 * A simple `Array#map`-like wrapper to work with domain name strings or email
 * addresses. The callback is applied to each label of the domain; the labels
 * are then re-joined with `.`.
 * @private
 * @param {String} domain The domain name or email address.
 * @param {Function} callback The function that gets called for every label
 * of the domain name.
 * @returns {String} The local part (if any, including its trailing `@`)
 * followed by the mapped labels joined with `.`.
 */
function mapDomain(domain, callback) {
	let localPart = '';
	let host = domain;
	// In email addresses, only the domain name should be punycoded. Leave the
	// local part (i.e. everything up to and including the last `@`) intact.
	// Splitting on the *last* `@` keeps inputs with several `@` characters
	// (e.g. a quoted local part) from silently losing their tail.
	const atIndex = domain.lastIndexOf('@');
	if (atIndex !== -1) {
		localPart = domain.slice(0, atIndex + 1);
		host = domain.slice(atIndex + 1);
	}
	// Normalise every separator matched by `regexSeparators` to a plain dot
	// first, then split on the literal dot.
	// Avoid `split(regex)` for IE8 compatibility. See #17.
	const labels = host.replace(regexSeparators, '\x2E').split('.');
	return localPart + map(labels, callback).join('.');
}

/**
 * Creates an array containing the numeric code points of each Unicode
 * character in the string. While JavaScript uses UCS-2 internally,
 * this function will convert a pair of surrogate halves (each of which
 * UCS-2 exposes as separate characters) into a single code point,
 * matching UTF-16. Unpaired surrogates are passed through as-is.
 * @see `punycode.ucs2.encode`
 * @see <https://mathiasbynens.be/notes/javascript-encoding>
 * @memberOf punycode.ucs2
 * @name decode
 * @param {String} string The Unicode input string (UCS-2).
 * @returns {Array} The new array of code points.
 */
function ucs2decode(string) {
	const output = [];
	const length = string.length;
	let counter = 0;
	while (counter < length) {
		const value = string.charCodeAt(counter++);
		if (value >= 0xD800 && value <= 0xDBFF && counter < length) {
			// It's a high surrogate, and there is a next character.
			const extra = string.charCodeAt(counter++);
			if ((extra & 0xFC00) === 0xDC00) { // Low surrogate.
				output.push(((value & 0x3FF) << 10) + (extra & 0x3FF) + 0x10000);
			} else {
				// It's an unmatched surrogate; only append this code unit, in case
				// the next code unit is the high surrogate of a surrogate pair.
				output.push(value);
				// Step back so `extra` is examined again on the next iteration.
				counter--;
			}
		} else {
			output.push(value);
		}
	}
	return output;
}

/**
 * Builds a string from a list of numeric code points.
 * @see `punycode.ucs2.decode`
 * @memberOf punycode.ucs2
 * @name encode
 * @param {Array} codePoints The numeric code points, in output order.
 * @returns {String} The resulting Unicode string (UCS-2).
 */
const ucs2encode = (codePoints) => {
	return String.fromCodePoint(...codePoints);
};

/**
 * Maps a basic code point to the digit value it stands for.
 * @see `digitToBasic()`
 * @private
 * @param {Number} codePoint The basic numeric code point value.
 * @returns {Number} The digit in the range `0` to `base - 1`
 * (`a`-`z` and `A`-`Z` give 0..25, `0`-`9` give 26..35), or `base` when the
 * code point does not represent a digit.
 */
const basicToDigit = function(codePoint) {
	const within = (low, highExclusive) => codePoint >= low && codePoint < highExclusive;

	// ASCII 0..9 -> 26..35
	if (within(0x30, 0x3A)) {
		return 26 + (codePoint - 0x30);
	}
	// ASCII A..Z -> 0..25
	if (within(0x41, 0x5B)) {
		return codePoint - 0x41;
	}
	// ASCII a..z -> 0..25
	if (within(0x61, 0x7B)) {
		return codePoint - 0x61;
	}
	// Anything else is not a digit.
	return base;
};

/**
 * Maps a digit value to the basic code point that represents it.
 * @see `basicToDigit()`
 * @private
 * @param {Number} digit The digit value, expected in the range `0` to
 * `base - 1`.
 * @param {Number} flag Case selector. When it is loosely equal to `0` the
 * lowercase form is used; any other value (including an omitted argument)
 * selects the uppercase form. The behavior is undefined if the uppercase
 * form is requested for a `digit` that has none.
 * @returns {Number} The basic code point whose digit value is `digit`.
 */
const digitToBasic = function(digit, flag) {
	// 0..25 map to ASCII a..z or A..Z
	// 26..35 map to ASCII 0..9
	const letterOffset = digit < 26 ? 75 : 0;
	// Loose comparison on purpose: `undefined != 0` must stay true.
	const upperCaseShift = flag != 0 ? 32 : 0;
	return digit + 22 + letterOffset - upperCaseShift;
};

/**
 * Bias adaptation function as per section 3.4 of RFC 3492.
 * https://tools.ietf.org/html/rfc3492#section-3.4
 * @private
 * @param {Number} delta The delta that was just encoded or decoded.
 * @param {Number} numPoints Divisor for the proportional increase of the
 * scaled delta.
 * @param {Boolean} firstTime Truthy on the first adaptation: the delta is
 * then divided by `damp` instead of being halved.
 * @returns {Number} The new bias.
 */
const adapt = function(delta, numPoints, firstTime) {
	const threshold = baseMinusTMin * tMax >> 1;
	let scaled = firstTime ? floor(delta / damp) : delta >> 1;
	scaled += floor(scaled / numPoints);

	// Each reduction of the scaled delta raises the bias by one `base`.
	let k = 0;
	while (scaled > threshold) {
		scaled = floor(scaled / baseMinusTMin);
		k += base;
	}
	return floor(k + (baseMinusTMin + 1) * scaled / (scaled + skew));
};

/**
 * Converts a Punycode string of ASCII-only symbols to a string of Unicode
 * symbols.
 * @memberOf punycode
 * @param {String} input The Punycode string of ASCII-only symbols.
 * @returns {String} The resulting string of Unicode symbols.
 * @throws {RangeError} Via `error()`: `not-basic` when a character before the
 * last delimiter is >= 0x80, `invalid-input` when a digit is missing or is
 * not a valid basic digit, `overflow` when a value would exceed `maxInt`.
 */
const decode = function(input) {
	// Don't use UCS-2.
	const output = [];
	const inputLength = input.length;
	let i = 0;
	let n = initialN;
	let bias = initialBias;

	// Handle the basic code points: let `basic` be the number of input code
	// points before the last delimiter, or `0` if there is none, then copy
	// the first basic code points to the output.
	let basic = input.lastIndexOf(delimiter);
	if (basic < 0) {
		basic = 0;
	}

	for (let j = 0; j < basic; ++j) {
		// if it's not a basic code point
		if (input.charCodeAt(j) >= 0x80) {
			error('not-basic');
		}
		output.push(input.charCodeAt(j));
	}

	// Main decoding loop: start just after the last delimiter if any basic code
	// points were copied; start at the beginning otherwise.
	for (let index = basic > 0 ? basic + 1 : 0; index < inputLength; /* no final expression */) {

		// `index` is the index of the next character to be consumed.
		// Decode a generalized variable-length integer into `delta`,
		// which gets added to `i`. The overflow checking is easier
		// if we increase `i` as we go, then subtract off its starting
		// value at the end to obtain `delta`.
		const oldi = i;
		for (let w = 1, k = base; /* no condition */; k += base) {

			if (index >= inputLength) {
				error('invalid-input');
			}

			const digit = basicToDigit(input.charCodeAt(index++));

			if (digit >= base) {
				error('invalid-input');
			}
			if (digit > floor((maxInt - i) / w)) {
				error('overflow');
			}

			i += digit * w;
			const t = k <= bias ? tMin : (k >= bias + tMax ? tMax : k - bias);

			// A digit below the threshold terminates the integer.
			if (digit < t) {
				break;
			}

			const baseMinusT = base - t;
			if (w > floor(maxInt / baseMinusT)) {
				error('overflow');
			}

			w *= baseMinusT;

		}

		const out = output.length + 1;
		bias = adapt(i - oldi, out, oldi === 0);

		// `i` was supposed to wrap around from `out` to `0`,
		// incrementing `n` each time, so we'll fix that now:
		if (floor(i / out) > maxInt - n) {
			error('overflow');
		}

		n += floor(i / out);
		i %= out;

		// Insert `n` at position `i` of the output.
		output.splice(i++, 0, n);

	}

	return String.fromCodePoint(...output);
};

/**
 * Converts a string of Unicode symbols (e.g. a domain name label) to a
 * Punycode string of ASCII-only symbols.
 * @memberOf punycode
 * @param {String} input The string of Unicode symbols.
 * @returns {String} The resulting Punycode string of ASCII-only symbols.
 * @throws {RangeError} Via `error('overflow')` when `delta` would exceed
 * `maxInt`.
 */
const encode = function(input) {
	const output = [];

	// Convert the input in UCS-2 to an array of Unicode code points.
	const codePoints = ucs2decode(input);

	// Cache the length.
	const inputLength = codePoints.length;

	// Initialize the state.
	let n = initialN;
	let delta = 0;
	let bias = initialBias;

	// Handle the basic code points.
	for (const currentValue of codePoints) {
		if (currentValue < 0x80) {
			output.push(stringFromCharCode(currentValue));
		}
	}

	const basicLength = output.length;
	let handledCPCount = basicLength;

	// `handledCPCount` is the number of code points that have been handled;
	// `basicLength` is the number of basic code points.

	// Finish the basic string with a delimiter unless it's empty.
	if (basicLength) {
		output.push(delimiter);
	}

	// Main encoding loop:
	while (handledCPCount < inputLength) {

		// All non-basic code points < n have been handled already. Find the next
		// larger one:
		let m = maxInt;
		for (const currentValue of codePoints) {
			if (currentValue >= n && currentValue < m) {
				m = currentValue;
			}
		}

		// Increase `delta` enough to advance the decoder's <n,i> state to <m,0>,
		// but guard against overflow.
		const handledCPCountPlusOne = handledCPCount + 1;
		if (m - n > floor((maxInt - delta) / handledCPCountPlusOne)) {
			error('overflow');
		}

		delta += (m - n) * handledCPCountPlusOne;
		n = m;

		for (const currentValue of codePoints) {
			if (currentValue < n && ++delta > maxInt) {
				error('overflow');
			}
			if (currentValue === n) {
				// Represent delta as a generalized variable-length integer.
				let q = delta;
				for (let k = base; /* no condition */; k += base) {
					const t = k <= bias ? tMin : (k >= bias + tMax ? tMax : k - bias);
					if (q < t) {
						break;
					}
					const qMinusT = q - t;
					const baseMinusT = base - t;
					output.push(
						stringFromCharCode(digitToBasic(t + qMinusT % baseMinusT, 0))
					);
					q = floor(qMinusT / baseMinusT);
				}

				// The final digit is below the threshold and ends the integer.
				output.push(stringFromCharCode(digitToBasic(q, 0)));
				bias = adapt(delta, handledCPCountPlusOne, handledCPCount === basicLength);
				delta = 0;
				++handledCPCount;
			}
		}

		++delta;
		++n;

	}
	return output.join('');
};

/**
 * Converts a Punycode string representing a domain name or an email address
 * to Unicode. Only labels that start with `xn--` are converted, so it doesn't
 * matter if you call it on a string that has already been converted to
 * Unicode.
 * @memberOf punycode
 * @param {String} input The Punycoded domain name or email address to
 * convert to Unicode.
 * @returns {String} The Unicode representation of the given Punycode
 * string.
 */
const toUnicode = function(input) {
	const decodeLabel = (label) => {
		if (!regexPunycode.test(label)) {
			return label;
		}
		// Drop the 4-character `xn--` prefix and lowercase the rest before decoding.
		return decode(label.slice(4).toLowerCase());
	};
	return mapDomain(input, decodeLabel);
};

/**
 * Converts a Unicode string representing a domain name or an email address to
 * Punycode. Only labels containing non-ASCII characters are converted, so it
 * doesn't matter if you call it with a domain that's already in ASCII.
 * @memberOf punycode
 * @param {String} input The domain name or email address to convert, as a
 * Unicode string.
 * @returns {String} The Punycode representation of the given domain name or
 * email address.
 */
const toASCII = function(input) {
	const encodeLabel = (label) => {
		if (!regexNonASCII.test(label)) {
			return label;
		}
		return 'xn--' + encode(label);
	};
	return mapDomain(input, encodeLabel);
};

/*--------------------------------------------------------------------------*/

/** Define the public API */

const punycode = {
	/**
	 * A string representing the current Punycode.js version number.
	 * @memberOf punycode
	 * @type String
	 */
	version: '2.1.0',
	/**
	 * An object of methods to convert from JavaScript's internal character
	 * representation (UCS-2) to Unicode code points, and back.
	 * @see <https://mathiasbynens.be/notes/javascript-encoding>
	 * @memberOf punycode
	 * @type Object
	 */
	ucs2: {
		decode: ucs2decode,
		encode: ucs2encode
	},
	decode,
	encode,
	toASCII,
	toUnicode
};

export { ucs2decode, ucs2encode, decode, encode, toASCII, toUnicode };

export default punycode;

Base64
No ratings yet
Base64
8 pages
IoT Identification Technology - L2 (1)
No ratings yet
IoT Identification Technology - L2 (1)
20 pages
jszip.js
No ratings yet
jszip.js
197 pages
New Userscript 1.User
No ratings yet
New Userscript 1.User
190 pages
Unicodebook PDF
No ratings yet
Unicodebook PDF
73 pages
Unicode in C++ - McNellis - CppCon 2014
No ratings yet
Unicode in C++ - McNellis - CppCon 2014
125 pages
Message 26
No ratings yet
Message 26
223 pages
decode-encode
No ratings yet
decode-encode
15 pages
MicroSCADA X SYS600 Process Picture Design Manual
No ratings yet
MicroSCADA X SYS600 Process Picture Design Manual
218 pages
Quickstart Guide to Meta
No ratings yet
Quickstart Guide to Meta
1 page
Project Documentation by Divyanshi Verma (719057)
No ratings yet
Project Documentation by Divyanshi Verma (719057)
298 pages
Accelaterm WI1989.55 INST
No ratings yet
Accelaterm WI1989.55 INST
44 pages
auto5
No ratings yet
auto5
40 pages
Module 4_ Network Forensics
No ratings yet
Module 4_ Network Forensics
40 pages
nafess boa
No ratings yet
nafess boa
1 page
AIDA Article Template
No ratings yet
AIDA Article Template
23 pages
1
No ratings yet
1
4 pages
lec05 arithmetic coding II
No ratings yet
lec05 arithmetic coding II
44 pages
JS CheatSheet
No ratings yet
JS CheatSheet
4 pages
AKM BHAI CSS(U-2) 5Star Notes
No ratings yet
AKM BHAI CSS(U-2) 5Star Notes
40 pages
f5868240
No ratings yet
f5868240
5 pages
JavaScript_CheatSheet__1746934285
No ratings yet
JavaScript_CheatSheet__1746934285
4 pages
STRINGS
No ratings yet
STRINGS
5 pages
Installation Procedures For ECR Setting Tool
0% (1)
Installation Procedures For ECR Setting Tool
5 pages
2018 Assigment 2
No ratings yet
2018 Assigment 2
11 pages
JSPDF
No ratings yet
JSPDF
471 pages
Unicode CPP PDF
No ratings yet
Unicode CPP PDF
139 pages
CSE220 Homework 3
No ratings yet
CSE220 Homework 3
8 pages
Divert Btc266778
No ratings yet
Divert Btc266778
6 pages
832451202-810254541-DivertJJKIHZ77897Cs-Hussy – kopija
No ratings yet
832451202-810254541-DivertJJKIHZ77897Cs-Hussy – kopija
6 pages
810254541 Divert Btc Cs Hussy
No ratings yet
810254541 Divert Btc Cs Hussy
5 pages
Lec4 Arith Compression
No ratings yet
Lec4 Arith Compression
36 pages
810254541 Divert Btc Cs Hussy
No ratings yet
810254541 Divert Btc Cs Hussy
6 pages
Recover Shell
No ratings yet
Recover Shell
238 pages
Section 4
No ratings yet
Section 4
5 pages
JavaScript Cheatsheet
No ratings yet
JavaScript Cheatsheet
28 pages
Pre-Test - Mathematics 6
No ratings yet
Pre-Test - Mathematics 6
8 pages
Assignment 4
No ratings yet
Assignment 4
15 pages
Sri Paramakalyani College: Alwarkurichi
No ratings yet
Sri Paramakalyani College: Alwarkurichi
18 pages
Lab - 01 DFA Simulation
No ratings yet
Lab - 01 DFA Simulation
4 pages
Новый документ
No ratings yet
Новый документ
3 pages
Новый документ
No ratings yet
Новый документ
3 pages
Script Error
No ratings yet
Script Error
82 pages
Chapter 12 - Javascript: Objects: Math String
No ratings yet
Chapter 12 - Javascript: Objects: Math String
68 pages
Project Infinite v.P.1.1
No ratings yet
Project Infinite v.P.1.1
197 pages
Running SAS in Batch Mode in Windows OS
No ratings yet
Running SAS in Batch Mode in Windows OS
9 pages
Divert Btc2
No ratings yet
Divert Btc2
6 pages
Design of IIR Elliptical Band Pass Filter: Expt. No.: 3A
No ratings yet
Design of IIR Elliptical Band Pass Filter: Expt. No.: 3A
12 pages
WEBshortnote
No ratings yet
WEBshortnote
16 pages
Lec 05 - Arithmetic Coding
No ratings yet
Lec 05 - Arithmetic Coding
44 pages
Asdad
No ratings yet
Asdad
14 pages
810254541 Divert Btc Cs Hussy
No ratings yet
810254541 Divert Btc Cs Hussy
5 pages
Chapter 5 of PHP (WBP)
No ratings yet
Chapter 5 of PHP (WBP)
25 pages
Message 6 1
No ratings yet
Message 6 1
135 pages
1 - Primitive Data Types (2019) - 2
No ratings yet
1 - Primitive Data Types (2019) - 2
50 pages
DIVERT BTC CS HUSSY
100% (1)
DIVERT BTC CS HUSSY
5 pages
Tabela 1 DNP3 Device Profile - r01
No ratings yet
Tabela 1 DNP3 Device Profile - r01
3 pages
Range Coding
No ratings yet
Range Coding
6 pages
810254541 Divert Btc Cs Hussy
100% (1)
810254541 Divert Btc Cs Hussy
5 pages
ABAP Proxy To File On SAP PI 731
No ratings yet
ABAP Proxy To File On SAP PI 731
40 pages
Robtics: Lunatico Astronomia Seletek ARMADILLO 2 Controller
No ratings yet
Robtics: Lunatico Astronomia Seletek ARMADILLO 2 Controller
3 pages
Notes From Session
No ratings yet
Notes From Session
6 pages
Spectrum Archive VM
No ratings yet
Spectrum Archive VM
83 pages
15A05806 Cyber Security
No ratings yet
15A05806 Cyber Security
1 page
Entropy & Run Length Coding
No ratings yet
Entropy & Run Length Coding
45 pages
Arithmetic Coding Algorithm and Implementation Issues
No ratings yet
Arithmetic Coding Algorithm and Implementation Issues
7 pages
Fontes WimpplA
No ratings yet
Fontes WimpplA
1 page
Arini, MT, MSC: Basic Compression Entropy Coding Statistical
No ratings yet
Arini, MT, MSC: Basic Compression Entropy Coding Statistical
34 pages
Js Cheatsheet: Basics Loops
No ratings yet
Js Cheatsheet: Basics Loops
23 pages
Datasheet VSOL EPON OLT V1.1
No ratings yet
Datasheet VSOL EPON OLT V1.1
15 pages
Programming Methodology: Student Name: Kennan Philip Course: CIT102 Lecturer Name: Kem Emmanuel Due Date: 14
No ratings yet
Programming Methodology: Student Name: Kennan Philip Course: CIT102 Lecturer Name: Kem Emmanuel Due Date: 14
13 pages
Data Communication Note 1
No ratings yet
Data Communication Note 1
11 pages
Introduction To Computer Science
No ratings yet
Introduction To Computer Science
5 pages
Expert System: Made By: Rohit Khare B.Tech 2nd Year College:Srmcem, Lko
No ratings yet
Expert System: Made By: Rohit Khare B.Tech 2nd Year College:Srmcem, Lko
18 pages
Unit 3 - Week 2 Lectures: Building Your Webapp: Assignment 2
No ratings yet
Unit 3 - Week 2 Lectures: Building Your Webapp: Assignment 2
5 pages
(Eduwaves360) MOD - 12th (2019C) - E
100% (1)
(Eduwaves360) MOD - 12th (2019C) - E
32 pages
Operator: A Set of Symbol Which Deals With Some Operand To Perform Some Task
No ratings yet
Operator: A Set of Symbol Which Deals With Some Operand To Perform Some Task
15 pages
Digital Systems I EC 381: Mohamed Elgalhud
No ratings yet
Digital Systems I EC 381: Mohamed Elgalhud
22 pages
Javascript (Object) : Erick Kurniawan, S.Kom
No ratings yet
Javascript (Object) : Erick Kurniawan, S.Kom
27 pages
ID Automation
No ratings yet
ID Automation
28 pages
Arithmetic Coding
No ratings yet
Arithmetic Coding
12 pages
How To Find Correct Firmware For Samsung Device
No ratings yet
How To Find Correct Firmware For Samsung Device
11 pages
Base 58
No ratings yet
Base 58
3 pages
Apna College JavaScript CheatSheet
100% (1)
Apna College JavaScript CheatSheet
28 pages
Image Compression
No ratings yet
Image Compression
10 pages
Report For Review1 A) Title, Abstract and Keywords
No ratings yet
Report For Review1 A) Title, Abstract and Keywords
9 pages
Wireless Sensor Networks: (Professional Elective - IV)
No ratings yet
Wireless Sensor Networks: (Professional Elective - IV)
5 pages
C++ Functions and tutorial
From Everand
C++ Functions and tutorial
Nino Paiotta
No ratings yet
150+ C Pattern Programs
From Everand
150+ C Pattern Programs
Hernando Abella
No ratings yet
Computer Engineering Laboratory Solution Primer
From Everand
Computer Engineering Laboratory Solution Primer
Karan Bhandari
No ratings yet

Punycode Es6

Uploaded by

Punycode Es6

Uploaded by

'use strict';

/** Highest positive signed 32-bit float value */

/** Bootstring parameters */

/** Regular expressions */

/** Error messages */

/** Convenience shortcuts */

let basic = input.lastIndexOf(delimiter);

for (let j = 0; j < basic; ++j) {

// `index` is the index of the next character to be consumed.

const digit = basicToDigit(input.charCodeAt(index++));

if (digit >= base) {

const baseMinusT = base - t;

const out = output.length + 1;

// `i` was supposed to wrap around from `out` to `0`,

// Insert `n` at position `i` of the output.

// Convert the input in UCS-2 to an array of Unicode code points.

// Cache the length.

// Initialize the state.

// Handle the basic code points.

const basicLength = output.length;

// `handledCPCount` is the number of code points that have been handled;

// Finish the basic string with a delimiter unless it's empty.

// Main encoding loop:

// Increase `delta` enough to advance the decoder's <n,i> state to

for (const currentValue of input) {

/** Define the public API */

export { ucs2decode, ucs2encode, decode, encode, toASCII, toUnicode };

You might also like