diff options
author | Daniel Baumann <daniel.baumann@progress-linux.org> | 2024-04-21 11:44:51 +0000 |
---|---|---|
committer | Daniel Baumann <daniel.baumann@progress-linux.org> | 2024-04-21 11:44:51 +0000 |
commit | 9e3c08db40b8916968b9f30096c7be3f00ce9647 (patch) | |
tree | a68f146d7fa01f0134297619fbe7e33db084e0aa /devtools/client/shared/unicode-url.js | |
parent | Initial commit. (diff) | |
download | thunderbird-9e3c08db40b8916968b9f30096c7be3f00ce9647.tar.xz thunderbird-9e3c08db40b8916968b9f30096c7be3f00ce9647.zip |
Adding upstream version 1:115.7.0. (refs: upstream/1%115.7.0, upstream)
Signed-off-by: Daniel Baumann <daniel.baumann@progress-linux.org>
Diffstat (limited to 'devtools/client/shared/unicode-url.js')
-rw-r--r-- | devtools/client/shared/unicode-url.js | 106 |
1 files changed, 106 insertions, 0 deletions
diff --git a/devtools/client/shared/unicode-url.js b/devtools/client/shared/unicode-url.js new file mode 100644 index 0000000000..36fae098eb --- /dev/null +++ b/devtools/client/shared/unicode-url.js @@ -0,0 +1,106 @@ +/* This Source Code Form is subject to the terms of the Mozilla Public + * License, v. 2.0. If a copy of the MPL was not distributed with this + * file, You can obtain one at http://mozilla.org/MPL/2.0/. */ +"use strict"; + +const idnService = Cc["@mozilla.org/network/idn-service;1"].getService( + Ci.nsIIDNService +); + +/** + * Gets a readble Unicode hostname from a hostname. + * + * If the `hostname` is a readable ASCII hostname, such as example.org, then + * this function will simply return the original `hostname`. + * + * If the `hostname` is a Punycode hostname representing a Unicode domain name, + * such as xn--g6w.xn--8pv, then this function will return the readable Unicode + * domain name by decoding the Punycode hostname. + * + * @param {string} hostname + * the hostname from which the Unicode hostname will be + * parsed, such as example.org, xn--g6w.xn--8pv. + * @return {string} The Unicode hostname. It may be the same as the `hostname` + * passed to this function if the `hostname` itself is + * a readable ASCII hostname or a Unicode hostname. + */ +function getUnicodeHostname(hostname) { + return idnService.convertToDisplayIDN(hostname, {}); +} + +/** + * Gets a readble Unicode URL pathname from a URL pathname. + * + * If the `urlPath` is a readable ASCII URL pathname, such as /a/b/c.js, then + * this function will simply return the original `urlPath`. + * + * If the `urlPath` is a URI-encoded pathname, such as %E8%A9%A6/%E6%B8%AC.js, + * then this function will return the readable Unicode pathname. + * + * If the `urlPath` is a malformed URL pathname, then this function will simply + * return the original `urlPath`. 
+ * + * @param {string} urlPath + * the URL path from which the Unicode URL path will be parsed, + * such as /a/b/c.js, %E8%A9%A6/%E6%B8%AC.js. + * @return {string} The Unicode URL Path. It may be the same as the `urlPath` + * passed to this function if the `urlPath` itself is a readable + * ASCII url or a Unicode url. + */ +function getUnicodeUrlPath(urlPath) { + try { + return decodeURIComponent(urlPath); + } catch (err) {} + return urlPath; +} + +/** + * Gets a readable Unicode URL from a URL. + * + * If the `url` is a readable ASCII URL, such as http://example.org/a/b/c.js, + * then this function will simply return the original `url`. + * + * If the `url` includes either an unreadable Punycode domain name or an + * unreadable URI-encoded pathname, such as + * http://xn--g6w.xn--8pv/%E8%A9%A6/%E6%B8%AC.js, then this function will return + * the readable URL by decoding all its unreadable URL components to Unicode + * characters. The character `#` is not decoded from escape sequences. + * + * If the `url` is a malformed URL, then this function will return the original + * `url`. + * + * If the `url` is a data: URI, then this function will return the original + * `url`. + * + * @param {string} url + * the full URL, or a data: URI. from which the readable URL + * will be parsed, such as, http://example.org/a/b/c.js, + * http://xn--g6w.xn--8pv/%E8%A9%A6/%E6%B8%AC.js + * @return {string} The readable URL. It may be the same as the `url` passed to + * this function if the `url` itself is readable. + */ +function getUnicodeUrl(url) { + try { + const { protocol, hostname } = new URL(url); + if (protocol === "data:") { + // Never convert a data: URI. + return url; + } + const readableHostname = getUnicodeHostname(hostname); + + /* We use `decodeURIComponent` instead of decodeURI as the + * later does not decode some characters, it only can decode characters + * previously encoded by the encodeURI. 
See + * https://developer.mozilla.org/en-US/docs/Web/JavaScript/Reference/Global_Objects/encodeURI#Description + */ + url = decodeURIComponent(url); + return url.replace(hostname, readableHostname); + } catch (err) {} + return url; +} + +module.exports = { + getUnicodeHostname, + getUnicodeUrlPath, + getUnicodeUrl, +}; |