feat: add suffix lookup functionality with trie structure
- Implemented a new suffix-trie.ts file for efficient domain suffix lookups. - Introduced a lookupInTrie function to search for public suffixes in a trie. - Added suffixLookup function to check if a hostname has a valid public suffix. - Created package.json and package-lock.json to manage dependencies, including tldts and tldts-core.
This commit is contained in:
+1
@@ -0,0 +1 @@
|
||||
../tldts/bin/cli.js
|
||||
+23
@@ -0,0 +1,23 @@
|
||||
{
|
||||
"name": "cpmp",
|
||||
"lockfileVersion": 3,
|
||||
"requires": true,
|
||||
"packages": {
|
||||
"node_modules/tldts": {
|
||||
"version": "7.0.18",
|
||||
"resolved": "https://registry.npmjs.org/tldts/-/tldts-7.0.18.tgz",
|
||||
"integrity": "sha512-lCcgTAgMxQ1JKOWrVGo6E69Ukbnx4Gc1wiYLRf6J5NN4HRYJtCby1rPF8rkQ4a6qqoFBK5dvjJ1zJ0F7VfDSvw==",
|
||||
"dependencies": {
|
||||
"tldts-core": "^7.0.18"
|
||||
},
|
||||
"bin": {
|
||||
"tldts": "bin/cli.js"
|
||||
}
|
||||
},
|
||||
"node_modules/tldts-core": {
|
||||
"version": "7.0.18",
|
||||
"resolved": "https://registry.npmjs.org/tldts-core/-/tldts-core-7.0.18.tgz",
|
||||
"integrity": "sha512-jqJC13oP4FFAahv4JT/0WTDrCF9Okv7lpKtOZUGPLiAnNbACcSg8Y8T+Z9xthOmRBqi/Sob4yi0TE0miRCvF7Q=="
|
||||
}
|
||||
}
|
||||
}
|
||||
+13
@@ -0,0 +1,13 @@
|
||||
Copyright (c) 2017 Thomas Parisot, 2018 Rémi Berson
|
||||
|
||||
Permission is hereby granted, free of charge, to any person obtaining a copy of this software and
|
||||
associated documentation files (the "Software"), to deal in the Software without restriction,
|
||||
including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
||||
and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so,
|
||||
subject to the following conditions:
|
||||
|
||||
The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software.
|
||||
|
||||
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
||||
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
|
||||
WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
|
||||
+3
@@ -0,0 +1,3 @@
|
||||
# `tldts-core`
|
||||
|
||||
> core building blocks of tldts, used by both `tldts` and `tldts-experimental` packages.
|
||||
+564
@@ -0,0 +1,564 @@
|
||||
'use strict';
|
||||
|
||||
/**
|
||||
* Check if `vhost` is a valid suffix of `hostname` (top-domain)
|
||||
*
|
||||
* It means that `vhost` needs to be a suffix of `hostname` and we then need to
|
||||
* make sure that: either they are equal, or the character preceding `vhost` in
|
||||
* `hostname` is a '.' (it should not be a partial label).
|
||||
*
|
||||
* * hostname = 'not.evil.com' and vhost = 'vil.com' => not ok
|
||||
* * hostname = 'not.evil.com' and vhost = 'evil.com' => ok
|
||||
* * hostname = 'not.evil.com' and vhost = 'not.evil.com' => ok
|
||||
*/
|
||||
function shareSameDomainSuffix(hostname, vhost) {
|
||||
if (hostname.endsWith(vhost)) {
|
||||
return (hostname.length === vhost.length ||
|
||||
hostname[hostname.length - vhost.length - 1] === '.');
|
||||
}
|
||||
return false;
|
||||
}
|
||||
/**
|
||||
* Given a hostname and its public suffix, extract the general domain.
|
||||
*/
|
||||
function extractDomainWithSuffix(hostname, publicSuffix) {
|
||||
// Locate the index of the last '.' in the part of the `hostname` preceding
|
||||
// the public suffix.
|
||||
//
|
||||
// examples:
|
||||
// 1. not.evil.co.uk => evil.co.uk
|
||||
// ^ ^
|
||||
// | | start of public suffix
|
||||
// | index of the last dot
|
||||
//
|
||||
// 2. example.co.uk => example.co.uk
|
||||
// ^ ^
|
||||
// | | start of public suffix
|
||||
// |
|
||||
// | (-1) no dot found before the public suffix
|
||||
const publicSuffixIndex = hostname.length - publicSuffix.length - 2;
|
||||
const lastDotBeforeSuffixIndex = hostname.lastIndexOf('.', publicSuffixIndex);
|
||||
// No '.' found, then `hostname` is the general domain (no sub-domain)
|
||||
if (lastDotBeforeSuffixIndex === -1) {
|
||||
return hostname;
|
||||
}
|
||||
// Extract the part between the last '.'
|
||||
return hostname.slice(lastDotBeforeSuffixIndex + 1);
|
||||
}
|
||||
/**
|
||||
* Detects the domain based on rules and upon and a host string
|
||||
*/
|
||||
function getDomain(suffix, hostname, options) {
|
||||
// Check if `hostname` ends with a member of `validHosts`.
|
||||
if (options.validHosts !== null) {
|
||||
const validHosts = options.validHosts;
|
||||
for (const vhost of validHosts) {
|
||||
if ( /*@__INLINE__*/shareSameDomainSuffix(hostname, vhost)) {
|
||||
return vhost;
|
||||
}
|
||||
}
|
||||
}
|
||||
let numberOfLeadingDots = 0;
|
||||
if (hostname.startsWith('.')) {
|
||||
while (numberOfLeadingDots < hostname.length &&
|
||||
hostname[numberOfLeadingDots] === '.') {
|
||||
numberOfLeadingDots += 1;
|
||||
}
|
||||
}
|
||||
// If `hostname` is a valid public suffix, then there is no domain to return.
|
||||
// Since we already know that `getPublicSuffix` returns a suffix of `hostname`
|
||||
// there is no need to perform a string comparison and we only compare the
|
||||
// size.
|
||||
if (suffix.length === hostname.length - numberOfLeadingDots) {
|
||||
return null;
|
||||
}
|
||||
// To extract the general domain, we start by identifying the public suffix
|
||||
// (if any), then consider the domain to be the public suffix with one added
|
||||
// level of depth. (e.g.: if hostname is `not.evil.co.uk` and public suffix:
|
||||
// `co.uk`, then we take one more level: `evil`, giving the final result:
|
||||
// `evil.co.uk`).
|
||||
return /*@__INLINE__*/ extractDomainWithSuffix(hostname, suffix);
|
||||
}
|
||||
|
||||
/**
|
||||
* Return the part of domain without suffix.
|
||||
*
|
||||
* Example: for domain 'foo.com', the result would be 'foo'.
|
||||
*/
|
||||
function getDomainWithoutSuffix(domain, suffix) {
|
||||
// Note: here `domain` and `suffix` cannot have the same length because in
|
||||
// this case we set `domain` to `null` instead. It is thus safe to assume
|
||||
// that `suffix` is shorter than `domain`.
|
||||
return domain.slice(0, -suffix.length - 1);
|
||||
}
|
||||
|
||||
/**
|
||||
* @param url - URL we want to extract a hostname from.
|
||||
* @param urlIsValidHostname - hint from caller; true if `url` is already a valid hostname.
|
||||
*/
|
||||
function extractHostname(url, urlIsValidHostname) {
|
||||
let start = 0;
|
||||
let end = url.length;
|
||||
let hasUpper = false;
|
||||
// If url is not already a valid hostname, then try to extract hostname.
|
||||
if (!urlIsValidHostname) {
|
||||
// Special handling of data URLs
|
||||
if (url.startsWith('data:')) {
|
||||
return null;
|
||||
}
|
||||
// Trim leading spaces
|
||||
while (start < url.length && url.charCodeAt(start) <= 32) {
|
||||
start += 1;
|
||||
}
|
||||
// Trim trailing spaces
|
||||
while (end > start + 1 && url.charCodeAt(end - 1) <= 32) {
|
||||
end -= 1;
|
||||
}
|
||||
// Skip scheme.
|
||||
if (url.charCodeAt(start) === 47 /* '/' */ &&
|
||||
url.charCodeAt(start + 1) === 47 /* '/' */) {
|
||||
start += 2;
|
||||
}
|
||||
else {
|
||||
const indexOfProtocol = url.indexOf(':/', start);
|
||||
if (indexOfProtocol !== -1) {
|
||||
// Implement fast-path for common protocols. We expect most protocols
|
||||
// should be one of these 4 and thus we will not need to perform the
|
||||
// more expansive validity check most of the time.
|
||||
const protocolSize = indexOfProtocol - start;
|
||||
const c0 = url.charCodeAt(start);
|
||||
const c1 = url.charCodeAt(start + 1);
|
||||
const c2 = url.charCodeAt(start + 2);
|
||||
const c3 = url.charCodeAt(start + 3);
|
||||
const c4 = url.charCodeAt(start + 4);
|
||||
if (protocolSize === 5 &&
|
||||
c0 === 104 /* 'h' */ &&
|
||||
c1 === 116 /* 't' */ &&
|
||||
c2 === 116 /* 't' */ &&
|
||||
c3 === 112 /* 'p' */ &&
|
||||
c4 === 115 /* 's' */) ;
|
||||
else if (protocolSize === 4 &&
|
||||
c0 === 104 /* 'h' */ &&
|
||||
c1 === 116 /* 't' */ &&
|
||||
c2 === 116 /* 't' */ &&
|
||||
c3 === 112 /* 'p' */) ;
|
||||
else if (protocolSize === 3 &&
|
||||
c0 === 119 /* 'w' */ &&
|
||||
c1 === 115 /* 's' */ &&
|
||||
c2 === 115 /* 's' */) ;
|
||||
else if (protocolSize === 2 &&
|
||||
c0 === 119 /* 'w' */ &&
|
||||
c1 === 115 /* 's' */) ;
|
||||
else {
|
||||
// Check that scheme is valid
|
||||
for (let i = start; i < indexOfProtocol; i += 1) {
|
||||
const lowerCaseCode = url.charCodeAt(i) | 32;
|
||||
if (!(((lowerCaseCode >= 97 && lowerCaseCode <= 122) || // [a, z]
|
||||
(lowerCaseCode >= 48 && lowerCaseCode <= 57) || // [0, 9]
|
||||
lowerCaseCode === 46 || // '.'
|
||||
lowerCaseCode === 45 || // '-'
|
||||
lowerCaseCode === 43) // '+'
|
||||
)) {
|
||||
return null;
|
||||
}
|
||||
}
|
||||
}
|
||||
// Skip 0, 1 or more '/' after ':/'
|
||||
start = indexOfProtocol + 2;
|
||||
while (url.charCodeAt(start) === 47 /* '/' */) {
|
||||
start += 1;
|
||||
}
|
||||
}
|
||||
}
|
||||
// Detect first occurrence of '/', '?' or '#'. We also keep track of the
|
||||
// last occurrence of '@', ']' or ':' to speed-up subsequent parsing of
|
||||
// (respectively), identifier, ipv6 or port.
|
||||
let indexOfIdentifier = -1;
|
||||
let indexOfClosingBracket = -1;
|
||||
let indexOfPort = -1;
|
||||
for (let i = start; i < end; i += 1) {
|
||||
const code = url.charCodeAt(i);
|
||||
if (code === 35 || // '#'
|
||||
code === 47 || // '/'
|
||||
code === 63 // '?'
|
||||
) {
|
||||
end = i;
|
||||
break;
|
||||
}
|
||||
else if (code === 64) {
|
||||
// '@'
|
||||
indexOfIdentifier = i;
|
||||
}
|
||||
else if (code === 93) {
|
||||
// ']'
|
||||
indexOfClosingBracket = i;
|
||||
}
|
||||
else if (code === 58) {
|
||||
// ':'
|
||||
indexOfPort = i;
|
||||
}
|
||||
else if (code >= 65 && code <= 90) {
|
||||
hasUpper = true;
|
||||
}
|
||||
}
|
||||
// Detect identifier: '@'
|
||||
if (indexOfIdentifier !== -1 &&
|
||||
indexOfIdentifier > start &&
|
||||
indexOfIdentifier < end) {
|
||||
start = indexOfIdentifier + 1;
|
||||
}
|
||||
// Handle ipv6 addresses
|
||||
if (url.charCodeAt(start) === 91 /* '[' */) {
|
||||
if (indexOfClosingBracket !== -1) {
|
||||
return url.slice(start + 1, indexOfClosingBracket).toLowerCase();
|
||||
}
|
||||
return null;
|
||||
}
|
||||
else if (indexOfPort !== -1 && indexOfPort > start && indexOfPort < end) {
|
||||
// Detect port: ':'
|
||||
end = indexOfPort;
|
||||
}
|
||||
}
|
||||
// Trim trailing dots
|
||||
while (end > start + 1 && url.charCodeAt(end - 1) === 46 /* '.' */) {
|
||||
end -= 1;
|
||||
}
|
||||
const hostname = start !== 0 || end !== url.length ? url.slice(start, end) : url;
|
||||
if (hasUpper) {
|
||||
return hostname.toLowerCase();
|
||||
}
|
||||
return hostname;
|
||||
}
|
||||
|
||||
/**
|
||||
* Check if a hostname is an IP. You should be aware that this only works
|
||||
* because `hostname` is already garanteed to be a valid hostname!
|
||||
*/
|
||||
function isProbablyIpv4(hostname) {
|
||||
// Cannot be shorted than 1.1.1.1
|
||||
if (hostname.length < 7) {
|
||||
return false;
|
||||
}
|
||||
// Cannot be longer than: 255.255.255.255
|
||||
if (hostname.length > 15) {
|
||||
return false;
|
||||
}
|
||||
let numberOfDots = 0;
|
||||
for (let i = 0; i < hostname.length; i += 1) {
|
||||
const code = hostname.charCodeAt(i);
|
||||
if (code === 46 /* '.' */) {
|
||||
numberOfDots += 1;
|
||||
}
|
||||
else if (code < 48 /* '0' */ || code > 57 /* '9' */) {
|
||||
return false;
|
||||
}
|
||||
}
|
||||
return (numberOfDots === 3 &&
|
||||
hostname.charCodeAt(0) !== 46 /* '.' */ &&
|
||||
hostname.charCodeAt(hostname.length - 1) !== 46 /* '.' */);
|
||||
}
|
||||
/**
|
||||
* Similar to isProbablyIpv4.
|
||||
*/
|
||||
function isProbablyIpv6(hostname) {
|
||||
if (hostname.length < 3) {
|
||||
return false;
|
||||
}
|
||||
let start = hostname.startsWith('[') ? 1 : 0;
|
||||
let end = hostname.length;
|
||||
if (hostname[end - 1] === ']') {
|
||||
end -= 1;
|
||||
}
|
||||
// We only consider the maximum size of a normal IPV6. Note that this will
|
||||
// fail on so-called "IPv4 mapped IPv6 addresses" but this is a corner-case
|
||||
// and a proper validation library should be used for these.
|
||||
if (end - start > 39) {
|
||||
return false;
|
||||
}
|
||||
let hasColon = false;
|
||||
for (; start < end; start += 1) {
|
||||
const code = hostname.charCodeAt(start);
|
||||
if (code === 58 /* ':' */) {
|
||||
hasColon = true;
|
||||
}
|
||||
else if (!(((code >= 48 && code <= 57) || // 0-9
|
||||
(code >= 97 && code <= 102) || // a-f
|
||||
(code >= 65 && code <= 90)) // A-F
|
||||
)) {
|
||||
return false;
|
||||
}
|
||||
}
|
||||
return hasColon;
|
||||
}
|
||||
/**
|
||||
* Check if `hostname` is *probably* a valid ip addr (either ipv6 or ipv4).
|
||||
* This *will not* work on any string. We need `hostname` to be a valid
|
||||
* hostname.
|
||||
*/
|
||||
function isIp(hostname) {
|
||||
return isProbablyIpv6(hostname) || isProbablyIpv4(hostname);
|
||||
}
|
||||
|
||||
/**
|
||||
* Implements fast shallow verification of hostnames. This does not perform a
|
||||
* struct check on the content of labels (classes of Unicode characters, etc.)
|
||||
* but instead check that the structure is valid (number of labels, length of
|
||||
* labels, etc.).
|
||||
*
|
||||
* If you need stricter validation, consider using an external library.
|
||||
*/
|
||||
function isValidAscii(code) {
|
||||
return ((code >= 97 && code <= 122) || (code >= 48 && code <= 57) || code > 127);
|
||||
}
|
||||
/**
|
||||
* Check if a hostname string is valid. It's usually a preliminary check before
|
||||
* trying to use getDomain or anything else.
|
||||
*
|
||||
* Beware: it does not check if the TLD exists.
|
||||
*/
|
||||
function isValidHostname (hostname) {
|
||||
if (hostname.length > 255) {
|
||||
return false;
|
||||
}
|
||||
if (hostname.length === 0) {
|
||||
return false;
|
||||
}
|
||||
if (
|
||||
/*@__INLINE__*/ !isValidAscii(hostname.charCodeAt(0)) &&
|
||||
hostname.charCodeAt(0) !== 46 && // '.' (dot)
|
||||
hostname.charCodeAt(0) !== 95 // '_' (underscore)
|
||||
) {
|
||||
return false;
|
||||
}
|
||||
// Validate hostname according to RFC
|
||||
let lastDotIndex = -1;
|
||||
let lastCharCode = -1;
|
||||
const len = hostname.length;
|
||||
for (let i = 0; i < len; i += 1) {
|
||||
const code = hostname.charCodeAt(i);
|
||||
if (code === 46 /* '.' */) {
|
||||
if (
|
||||
// Check that previous label is < 63 bytes long (64 = 63 + '.')
|
||||
i - lastDotIndex > 64 ||
|
||||
// Check that previous character was not already a '.'
|
||||
lastCharCode === 46 ||
|
||||
// Check that the previous label does not end with a '-' (dash)
|
||||
lastCharCode === 45 ||
|
||||
// Check that the previous label does not end with a '_' (underscore)
|
||||
lastCharCode === 95) {
|
||||
return false;
|
||||
}
|
||||
lastDotIndex = i;
|
||||
}
|
||||
else if (!( /*@__INLINE__*/(isValidAscii(code) || code === 45 || code === 95))) {
|
||||
// Check if there is a forbidden character in the label
|
||||
return false;
|
||||
}
|
||||
lastCharCode = code;
|
||||
}
|
||||
return (
|
||||
// Check that last label is shorter than 63 chars
|
||||
len - lastDotIndex - 1 <= 63 &&
|
||||
// Check that the last character is an allowed trailing label character.
|
||||
// Since we already checked that the char is a valid hostname character,
|
||||
// we only need to check that it's different from '-'.
|
||||
lastCharCode !== 45);
|
||||
}
|
||||
|
||||
function setDefaultsImpl({ allowIcannDomains = true, allowPrivateDomains = false, detectIp = true, extractHostname = true, mixedInputs = true, validHosts = null, validateHostname = true, }) {
|
||||
return {
|
||||
allowIcannDomains,
|
||||
allowPrivateDomains,
|
||||
detectIp,
|
||||
extractHostname,
|
||||
mixedInputs,
|
||||
validHosts,
|
||||
validateHostname,
|
||||
};
|
||||
}
|
||||
const DEFAULT_OPTIONS = /*@__INLINE__*/ setDefaultsImpl({});
|
||||
function setDefaults(options) {
|
||||
if (options === undefined) {
|
||||
return DEFAULT_OPTIONS;
|
||||
}
|
||||
return /*@__INLINE__*/ setDefaultsImpl(options);
|
||||
}
|
||||
|
||||
/**
|
||||
* Returns the subdomain of a hostname string
|
||||
*/
|
||||
function getSubdomain(hostname, domain) {
|
||||
// If `hostname` and `domain` are the same, then there is no sub-domain
|
||||
if (domain.length === hostname.length) {
|
||||
return '';
|
||||
}
|
||||
return hostname.slice(0, -domain.length - 1);
|
||||
}
|
||||
|
||||
/**
|
||||
* Implement a factory allowing to plug different implementations of suffix
|
||||
* lookup (e.g.: using a trie or the packed hashes datastructures). This is used
|
||||
* and exposed in `tldts.ts` and `tldts-experimental.ts` bundle entrypoints.
|
||||
*/
|
||||
function getEmptyResult() {
|
||||
return {
|
||||
domain: null,
|
||||
domainWithoutSuffix: null,
|
||||
hostname: null,
|
||||
isIcann: null,
|
||||
isIp: null,
|
||||
isPrivate: null,
|
||||
publicSuffix: null,
|
||||
subdomain: null,
|
||||
};
|
||||
}
|
||||
function resetResult(result) {
|
||||
result.domain = null;
|
||||
result.domainWithoutSuffix = null;
|
||||
result.hostname = null;
|
||||
result.isIcann = null;
|
||||
result.isIp = null;
|
||||
result.isPrivate = null;
|
||||
result.publicSuffix = null;
|
||||
result.subdomain = null;
|
||||
}
|
||||
function parseImpl(url, step, suffixLookup, partialOptions, result) {
|
||||
const options = /*@__INLINE__*/ setDefaults(partialOptions);
|
||||
// Very fast approximate check to make sure `url` is a string. This is needed
|
||||
// because the library will not necessarily be used in a typed setup and
|
||||
// values of arbitrary types might be given as argument.
|
||||
if (typeof url !== 'string') {
|
||||
return result;
|
||||
}
|
||||
// Extract hostname from `url` only if needed. This can be made optional
|
||||
// using `options.extractHostname`. This option will typically be used
|
||||
// whenever we are sure the inputs to `parse` are already hostnames and not
|
||||
// arbitrary URLs.
|
||||
//
|
||||
// `mixedInput` allows to specify if we expect a mix of URLs and hostnames
|
||||
// as input. If only hostnames are expected then `extractHostname` can be
|
||||
// set to `false` to speed-up parsing. If only URLs are expected then
|
||||
// `mixedInputs` can be set to `false`. The `mixedInputs` is only a hint
|
||||
// and will not change the behavior of the library.
|
||||
if (!options.extractHostname) {
|
||||
result.hostname = url;
|
||||
}
|
||||
else if (options.mixedInputs) {
|
||||
result.hostname = extractHostname(url, isValidHostname(url));
|
||||
}
|
||||
else {
|
||||
result.hostname = extractHostname(url, false);
|
||||
}
|
||||
// Check if `hostname` is a valid ip address
|
||||
if (options.detectIp && result.hostname !== null) {
|
||||
result.isIp = isIp(result.hostname);
|
||||
if (result.isIp) {
|
||||
return result;
|
||||
}
|
||||
}
|
||||
// Perform hostname validation if enabled. If hostname is not valid, no need to
|
||||
// go further as there will be no valid domain or sub-domain. This validation
|
||||
// is applied before any early returns to ensure consistent behavior across
|
||||
// all API methods including getHostname().
|
||||
if (options.validateHostname &&
|
||||
options.extractHostname &&
|
||||
result.hostname !== null &&
|
||||
!isValidHostname(result.hostname)) {
|
||||
result.hostname = null;
|
||||
return result;
|
||||
}
|
||||
if (step === 0 /* FLAG.HOSTNAME */ || result.hostname === null) {
|
||||
return result;
|
||||
}
|
||||
// Extract public suffix
|
||||
suffixLookup(result.hostname, options, result);
|
||||
if (step === 2 /* FLAG.PUBLIC_SUFFIX */ || result.publicSuffix === null) {
|
||||
return result;
|
||||
}
|
||||
// Extract domain
|
||||
result.domain = getDomain(result.publicSuffix, result.hostname, options);
|
||||
if (step === 3 /* FLAG.DOMAIN */ || result.domain === null) {
|
||||
return result;
|
||||
}
|
||||
// Extract subdomain
|
||||
result.subdomain = getSubdomain(result.hostname, result.domain);
|
||||
if (step === 4 /* FLAG.SUB_DOMAIN */) {
|
||||
return result;
|
||||
}
|
||||
// Extract domain without suffix
|
||||
result.domainWithoutSuffix = getDomainWithoutSuffix(result.domain, result.publicSuffix);
|
||||
return result;
|
||||
}
|
||||
|
||||
function fastPath (hostname, options, out) {
|
||||
// Fast path for very popular suffixes; this allows to by-pass lookup
|
||||
// completely as well as any extra allocation or string manipulation.
|
||||
if (!options.allowPrivateDomains && hostname.length > 3) {
|
||||
const last = hostname.length - 1;
|
||||
const c3 = hostname.charCodeAt(last);
|
||||
const c2 = hostname.charCodeAt(last - 1);
|
||||
const c1 = hostname.charCodeAt(last - 2);
|
||||
const c0 = hostname.charCodeAt(last - 3);
|
||||
if (c3 === 109 /* 'm' */ &&
|
||||
c2 === 111 /* 'o' */ &&
|
||||
c1 === 99 /* 'c' */ &&
|
||||
c0 === 46 /* '.' */) {
|
||||
out.isIcann = true;
|
||||
out.isPrivate = false;
|
||||
out.publicSuffix = 'com';
|
||||
return true;
|
||||
}
|
||||
else if (c3 === 103 /* 'g' */ &&
|
||||
c2 === 114 /* 'r' */ &&
|
||||
c1 === 111 /* 'o' */ &&
|
||||
c0 === 46 /* '.' */) {
|
||||
out.isIcann = true;
|
||||
out.isPrivate = false;
|
||||
out.publicSuffix = 'org';
|
||||
return true;
|
||||
}
|
||||
else if (c3 === 117 /* 'u' */ &&
|
||||
c2 === 100 /* 'd' */ &&
|
||||
c1 === 101 /* 'e' */ &&
|
||||
c0 === 46 /* '.' */) {
|
||||
out.isIcann = true;
|
||||
out.isPrivate = false;
|
||||
out.publicSuffix = 'edu';
|
||||
return true;
|
||||
}
|
||||
else if (c3 === 118 /* 'v' */ &&
|
||||
c2 === 111 /* 'o' */ &&
|
||||
c1 === 103 /* 'g' */ &&
|
||||
c0 === 46 /* '.' */) {
|
||||
out.isIcann = true;
|
||||
out.isPrivate = false;
|
||||
out.publicSuffix = 'gov';
|
||||
return true;
|
||||
}
|
||||
else if (c3 === 116 /* 't' */ &&
|
||||
c2 === 101 /* 'e' */ &&
|
||||
c1 === 110 /* 'n' */ &&
|
||||
c0 === 46 /* '.' */) {
|
||||
out.isIcann = true;
|
||||
out.isPrivate = false;
|
||||
out.publicSuffix = 'net';
|
||||
return true;
|
||||
}
|
||||
else if (c3 === 101 /* 'e' */ &&
|
||||
c2 === 100 /* 'd' */ &&
|
||||
c1 === 46 /* '.' */) {
|
||||
out.isIcann = true;
|
||||
out.isPrivate = false;
|
||||
out.publicSuffix = 'de';
|
||||
return true;
|
||||
}
|
||||
}
|
||||
return false;
|
||||
}
|
||||
|
||||
exports.fastPathLookup = fastPath;
|
||||
exports.getEmptyResult = getEmptyResult;
|
||||
exports.parseImpl = parseImpl;
|
||||
exports.resetResult = resetResult;
|
||||
exports.setDefaults = setDefaults;
|
||||
//# sourceMappingURL=index.js.map
|
||||
+1
File diff suppressed because one or more lines are too long
+15
@@ -0,0 +1,15 @@
|
||||
"use strict";
|
||||
Object.defineProperty(exports, "__esModule", { value: true });
|
||||
exports.default = getDomainWithoutSuffix;
|
||||
/**
|
||||
* Return the part of domain without suffix.
|
||||
*
|
||||
* Example: for domain 'foo.com', the result would be 'foo'.
|
||||
*/
|
||||
function getDomainWithoutSuffix(domain, suffix) {
|
||||
// Note: here `domain` and `suffix` cannot have the same length because in
|
||||
// this case we set `domain` to `null` instead. It is thus safe to assume
|
||||
// that `suffix` is shorter than `domain`.
|
||||
return domain.slice(0, -suffix.length - 1);
|
||||
}
|
||||
//# sourceMappingURL=domain-without-suffix.js.map
|
||||
+1
@@ -0,0 +1 @@
|
||||
{"version":3,"file":"domain-without-suffix.js","sourceRoot":"","sources":["../../../src/domain-without-suffix.ts"],"names":[],"mappings":";;AAKA,yCAQC;AAbD;;;;GAIG;AACH,SAAwB,sBAAsB,CAC5C,MAAc,EACd,MAAc;IAEd,0EAA0E;IAC1E,yEAAyE;IACzE,0CAA0C;IAC1C,OAAO,MAAM,CAAC,KAAK,CAAC,CAAC,EAAE,CAAC,MAAM,CAAC,MAAM,GAAG,CAAC,CAAC,CAAC;AAC7C,CAAC"}
|
||||
+83
@@ -0,0 +1,83 @@
|
||||
"use strict";
|
||||
Object.defineProperty(exports, "__esModule", { value: true });
|
||||
exports.default = getDomain;
|
||||
/**
|
||||
* Check if `vhost` is a valid suffix of `hostname` (top-domain)
|
||||
*
|
||||
* It means that `vhost` needs to be a suffix of `hostname` and we then need to
|
||||
* make sure that: either they are equal, or the character preceding `vhost` in
|
||||
* `hostname` is a '.' (it should not be a partial label).
|
||||
*
|
||||
* * hostname = 'not.evil.com' and vhost = 'vil.com' => not ok
|
||||
* * hostname = 'not.evil.com' and vhost = 'evil.com' => ok
|
||||
* * hostname = 'not.evil.com' and vhost = 'not.evil.com' => ok
|
||||
*/
|
||||
function shareSameDomainSuffix(hostname, vhost) {
|
||||
if (hostname.endsWith(vhost)) {
|
||||
return (hostname.length === vhost.length ||
|
||||
hostname[hostname.length - vhost.length - 1] === '.');
|
||||
}
|
||||
return false;
|
||||
}
|
||||
/**
|
||||
* Given a hostname and its public suffix, extract the general domain.
|
||||
*/
|
||||
function extractDomainWithSuffix(hostname, publicSuffix) {
|
||||
// Locate the index of the last '.' in the part of the `hostname` preceding
|
||||
// the public suffix.
|
||||
//
|
||||
// examples:
|
||||
// 1. not.evil.co.uk => evil.co.uk
|
||||
// ^ ^
|
||||
// | | start of public suffix
|
||||
// | index of the last dot
|
||||
//
|
||||
// 2. example.co.uk => example.co.uk
|
||||
// ^ ^
|
||||
// | | start of public suffix
|
||||
// |
|
||||
// | (-1) no dot found before the public suffix
|
||||
const publicSuffixIndex = hostname.length - publicSuffix.length - 2;
|
||||
const lastDotBeforeSuffixIndex = hostname.lastIndexOf('.', publicSuffixIndex);
|
||||
// No '.' found, then `hostname` is the general domain (no sub-domain)
|
||||
if (lastDotBeforeSuffixIndex === -1) {
|
||||
return hostname;
|
||||
}
|
||||
// Extract the part between the last '.'
|
||||
return hostname.slice(lastDotBeforeSuffixIndex + 1);
|
||||
}
|
||||
/**
|
||||
* Detects the domain based on rules and upon and a host string
|
||||
*/
|
||||
function getDomain(suffix, hostname, options) {
|
||||
// Check if `hostname` ends with a member of `validHosts`.
|
||||
if (options.validHosts !== null) {
|
||||
const validHosts = options.validHosts;
|
||||
for (const vhost of validHosts) {
|
||||
if ( /*@__INLINE__*/shareSameDomainSuffix(hostname, vhost)) {
|
||||
return vhost;
|
||||
}
|
||||
}
|
||||
}
|
||||
let numberOfLeadingDots = 0;
|
||||
if (hostname.startsWith('.')) {
|
||||
while (numberOfLeadingDots < hostname.length &&
|
||||
hostname[numberOfLeadingDots] === '.') {
|
||||
numberOfLeadingDots += 1;
|
||||
}
|
||||
}
|
||||
// If `hostname` is a valid public suffix, then there is no domain to return.
|
||||
// Since we already know that `getPublicSuffix` returns a suffix of `hostname`
|
||||
// there is no need to perform a string comparison and we only compare the
|
||||
// size.
|
||||
if (suffix.length === hostname.length - numberOfLeadingDots) {
|
||||
return null;
|
||||
}
|
||||
// To extract the general domain, we start by identifying the public suffix
|
||||
// (if any), then consider the domain to be the public suffix with one added
|
||||
// level of depth. (e.g.: if hostname is `not.evil.co.uk` and public suffix:
|
||||
// `co.uk`, then we take one more level: `evil`, giving the final result:
|
||||
// `evil.co.uk`).
|
||||
return /*@__INLINE__*/ extractDomainWithSuffix(hostname, suffix);
|
||||
}
|
||||
//# sourceMappingURL=domain.js.map
|
||||
+1
@@ -0,0 +1 @@
|
||||
{"version":3,"file":"domain.js","sourceRoot":"","sources":["../../../src/domain.ts"],"names":[],"mappings":";;AA4DA,4BAuCC;AAjGD;;;;;;;;;;GAUG;AACH,SAAS,qBAAqB,CAAC,QAAgB,EAAE,KAAa;IAC5D,IAAI,QAAQ,CAAC,QAAQ,CAAC,KAAK,CAAC,EAAE,CAAC;QAC7B,OAAO,CACL,QAAQ,CAAC,MAAM,KAAK,KAAK,CAAC,MAAM;YAChC,QAAQ,CAAC,QAAQ,CAAC,MAAM,GAAG,KAAK,CAAC,MAAM,GAAG,CAAC,CAAC,KAAK,GAAG,CACrD,CAAC;IACJ,CAAC;IAED,OAAO,KAAK,CAAC;AACf,CAAC;AAED;;GAEG;AACH,SAAS,uBAAuB,CAC9B,QAAgB,EAChB,YAAoB;IAEpB,2EAA2E;IAC3E,qBAAqB;IACrB,EAAE;IACF,YAAY;IACZ,qCAAqC;IACrC,iBAAiB;IACjB,wCAAwC;IACxC,kCAAkC;IAClC,EAAE;IACF,wCAAwC;IACxC,gBAAgB;IAChB,uCAAuC;IACvC,QAAQ;IACR,mDAAmD;IACnD,MAAM,iBAAiB,GAAG,QAAQ,CAAC,MAAM,GAAG,YAAY,CAAC,MAAM,GAAG,CAAC,CAAC;IACpE,MAAM,wBAAwB,GAAG,QAAQ,CAAC,WAAW,CAAC,GAAG,EAAE,iBAAiB,CAAC,CAAC;IAE9E,sEAAsE;IACtE,IAAI,wBAAwB,KAAK,CAAC,CAAC,EAAE,CAAC;QACpC,OAAO,QAAQ,CAAC;IAClB,CAAC;IAED,wCAAwC;IACxC,OAAO,QAAQ,CAAC,KAAK,CAAC,wBAAwB,GAAG,CAAC,CAAC,CAAC;AACtD,CAAC;AAED;;GAEG;AACH,SAAwB,SAAS,CAC/B,MAAc,EACd,QAAgB,EAChB,OAAiB;IAEjB,0DAA0D;IAC1D,IAAI,OAAO,CAAC,UAAU,KAAK,IAAI,EAAE,CAAC;QAChC,MAAM,UAAU,GAAG,OAAO,CAAC,UAAU,CAAC;QACtC,KAAK,MAAM,KAAK,IAAI,UAAU,EAAE,CAAC;YAC/B,KAAI,eAAgB,qBAAqB,CAAC,QAAQ,EAAE,KAAK,CAAC,EAAE,CAAC;gBAC3D,OAAO,KAAK,CAAC;YACf,CAAC;QACH,CAAC;IACH,CAAC;IAED,IAAI,mBAAmB,GAAG,CAAC,CAAC;IAC5B,IAAI,QAAQ,CAAC,UAAU,CAAC,GAAG,CAAC,EAAE,CAAC;QAC7B,OACE,mBAAmB,GAAG,QAAQ,CAAC,MAAM;YACrC,QAAQ,CAAC,mBAAmB,CAAC,KAAK,GAAG,EACrC,CAAC;YACD,mBAAmB,IAAI,CAAC,CAAC;QAC3B,CAAC;IACH,CAAC;IAED,6EAA6E;IAC7E,8EAA8E;IAC9E,0EAA0E;IAC1E,QAAQ;IACR,IAAI,MAAM,CAAC,MAAM,KAAK,QAAQ,CAAC,MAAM,GAAG,mBAAmB,EAAE,CAAC;QAC5D,OAAO,IAAI,CAAC;IACd,CAAC;IAED,2EAA2E;IAC3E,4EAA4E;IAC5E,4EAA4E;IAC5E,yEAAyE;IACzE,iBAAiB;IACjB,OAAO,eAAe,CAAC,uBAAuB,CAAC,QAAQ,EAAE,MAAM,CAAC,CAAC;AACnE,CAAC"}
|
||||
+149
@@ -0,0 +1,149 @@
|
||||
"use strict";
|
||||
Object.defineProperty(exports, "__esModule", { value: true });
|
||||
exports.default = extractHostname;
|
||||
/**
|
||||
* @param url - URL we want to extract a hostname from.
|
||||
* @param urlIsValidHostname - hint from caller; true if `url` is already a valid hostname.
|
||||
*/
|
||||
function extractHostname(url, urlIsValidHostname) {
|
||||
let start = 0;
|
||||
let end = url.length;
|
||||
let hasUpper = false;
|
||||
// If url is not already a valid hostname, then try to extract hostname.
|
||||
if (!urlIsValidHostname) {
|
||||
// Special handling of data URLs
|
||||
if (url.startsWith('data:')) {
|
||||
return null;
|
||||
}
|
||||
// Trim leading spaces
|
||||
while (start < url.length && url.charCodeAt(start) <= 32) {
|
||||
start += 1;
|
||||
}
|
||||
// Trim trailing spaces
|
||||
while (end > start + 1 && url.charCodeAt(end - 1) <= 32) {
|
||||
end -= 1;
|
||||
}
|
||||
// Skip scheme.
|
||||
if (url.charCodeAt(start) === 47 /* '/' */ &&
|
||||
url.charCodeAt(start + 1) === 47 /* '/' */) {
|
||||
start += 2;
|
||||
}
|
||||
else {
|
||||
const indexOfProtocol = url.indexOf(':/', start);
|
||||
if (indexOfProtocol !== -1) {
|
||||
// Implement fast-path for common protocols. We expect most protocols
|
||||
// should be one of these 4 and thus we will not need to perform the
|
||||
// more expansive validity check most of the time.
|
||||
const protocolSize = indexOfProtocol - start;
|
||||
const c0 = url.charCodeAt(start);
|
||||
const c1 = url.charCodeAt(start + 1);
|
||||
const c2 = url.charCodeAt(start + 2);
|
||||
const c3 = url.charCodeAt(start + 3);
|
||||
const c4 = url.charCodeAt(start + 4);
|
||||
if (protocolSize === 5 &&
|
||||
c0 === 104 /* 'h' */ &&
|
||||
c1 === 116 /* 't' */ &&
|
||||
c2 === 116 /* 't' */ &&
|
||||
c3 === 112 /* 'p' */ &&
|
||||
c4 === 115 /* 's' */) {
|
||||
// https
|
||||
}
|
||||
else if (protocolSize === 4 &&
|
||||
c0 === 104 /* 'h' */ &&
|
||||
c1 === 116 /* 't' */ &&
|
||||
c2 === 116 /* 't' */ &&
|
||||
c3 === 112 /* 'p' */) {
|
||||
// http
|
||||
}
|
||||
else if (protocolSize === 3 &&
|
||||
c0 === 119 /* 'w' */ &&
|
||||
c1 === 115 /* 's' */ &&
|
||||
c2 === 115 /* 's' */) {
|
||||
// wss
|
||||
}
|
||||
else if (protocolSize === 2 &&
|
||||
c0 === 119 /* 'w' */ &&
|
||||
c1 === 115 /* 's' */) {
|
||||
// ws
|
||||
}
|
||||
else {
|
||||
// Check that scheme is valid
|
||||
for (let i = start; i < indexOfProtocol; i += 1) {
|
||||
const lowerCaseCode = url.charCodeAt(i) | 32;
|
||||
if (!(((lowerCaseCode >= 97 && lowerCaseCode <= 122) || // [a, z]
|
||||
(lowerCaseCode >= 48 && lowerCaseCode <= 57) || // [0, 9]
|
||||
lowerCaseCode === 46 || // '.'
|
||||
lowerCaseCode === 45 || // '-'
|
||||
lowerCaseCode === 43) // '+'
|
||||
)) {
|
||||
return null;
|
||||
}
|
||||
}
|
||||
}
|
||||
// Skip 0, 1 or more '/' after ':/'
|
||||
start = indexOfProtocol + 2;
|
||||
while (url.charCodeAt(start) === 47 /* '/' */) {
|
||||
start += 1;
|
||||
}
|
||||
}
|
||||
}
|
||||
// Detect first occurrence of '/', '?' or '#'. We also keep track of the
|
||||
// last occurrence of '@', ']' or ':' to speed-up subsequent parsing of
|
||||
// (respectively), identifier, ipv6 or port.
|
||||
let indexOfIdentifier = -1;
|
||||
let indexOfClosingBracket = -1;
|
||||
let indexOfPort = -1;
|
||||
for (let i = start; i < end; i += 1) {
|
||||
const code = url.charCodeAt(i);
|
||||
if (code === 35 || // '#'
|
||||
code === 47 || // '/'
|
||||
code === 63 // '?'
|
||||
) {
|
||||
end = i;
|
||||
break;
|
||||
}
|
||||
else if (code === 64) {
|
||||
// '@'
|
||||
indexOfIdentifier = i;
|
||||
}
|
||||
else if (code === 93) {
|
||||
// ']'
|
||||
indexOfClosingBracket = i;
|
||||
}
|
||||
else if (code === 58) {
|
||||
// ':'
|
||||
indexOfPort = i;
|
||||
}
|
||||
else if (code >= 65 && code <= 90) {
|
||||
hasUpper = true;
|
||||
}
|
||||
}
|
||||
// Detect identifier: '@'
|
||||
if (indexOfIdentifier !== -1 &&
|
||||
indexOfIdentifier > start &&
|
||||
indexOfIdentifier < end) {
|
||||
start = indexOfIdentifier + 1;
|
||||
}
|
||||
// Handle ipv6 addresses
|
||||
if (url.charCodeAt(start) === 91 /* '[' */) {
|
||||
if (indexOfClosingBracket !== -1) {
|
||||
return url.slice(start + 1, indexOfClosingBracket).toLowerCase();
|
||||
}
|
||||
return null;
|
||||
}
|
||||
else if (indexOfPort !== -1 && indexOfPort > start && indexOfPort < end) {
|
||||
// Detect port: ':'
|
||||
end = indexOfPort;
|
||||
}
|
||||
}
|
||||
// Trim trailing dots
|
||||
while (end > start + 1 && url.charCodeAt(end - 1) === 46 /* '.' */) {
|
||||
end -= 1;
|
||||
}
|
||||
const hostname = start !== 0 || end !== url.length ? url.slice(start, end) : url;
|
||||
if (hasUpper) {
|
||||
return hostname.toLowerCase();
|
||||
}
|
||||
return hostname;
|
||||
}
|
||||
//# sourceMappingURL=extract-hostname.js.map
|
||||
+1
@@ -0,0 +1 @@
|
||||
{"version":3,"file":"extract-hostname.js","sourceRoot":"","sources":["../../../src/extract-hostname.ts"],"names":[],"mappings":";;AAIA,kCAqKC;AAzKD;;;GAGG;AACH,SAAwB,eAAe,CACrC,GAAW,EACX,kBAA2B;IAE3B,IAAI,KAAK,GAAG,CAAC,CAAC;IACd,IAAI,GAAG,GAAW,GAAG,CAAC,MAAM,CAAC;IAC7B,IAAI,QAAQ,GAAG,KAAK,CAAC;IAErB,wEAAwE;IACxE,IAAI,CAAC,kBAAkB,EAAE,CAAC;QACxB,gCAAgC;QAChC,IAAI,GAAG,CAAC,UAAU,CAAC,OAAO,CAAC,EAAE,CAAC;YAC5B,OAAO,IAAI,CAAC;QACd,CAAC;QAED,sBAAsB;QACtB,OAAO,KAAK,GAAG,GAAG,CAAC,MAAM,IAAI,GAAG,CAAC,UAAU,CAAC,KAAK,CAAC,IAAI,EAAE,EAAE,CAAC;YACzD,KAAK,IAAI,CAAC,CAAC;QACb,CAAC;QAED,uBAAuB;QACvB,OAAO,GAAG,GAAG,KAAK,GAAG,CAAC,IAAI,GAAG,CAAC,UAAU,CAAC,GAAG,GAAG,CAAC,CAAC,IAAI,EAAE,EAAE,CAAC;YACxD,GAAG,IAAI,CAAC,CAAC;QACX,CAAC;QAED,eAAe;QACf,IACE,GAAG,CAAC,UAAU,CAAC,KAAK,CAAC,KAAK,EAAE,CAAC,SAAS;YACtC,GAAG,CAAC,UAAU,CAAC,KAAK,GAAG,CAAC,CAAC,KAAK,EAAE,CAAC,SAAS,EAC1C,CAAC;YACD,KAAK,IAAI,CAAC,CAAC;QACb,CAAC;aAAM,CAAC;YACN,MAAM,eAAe,GAAG,GAAG,CAAC,OAAO,CAAC,IAAI,EAAE,KAAK,CAAC,CAAC;YACjD,IAAI,eAAe,KAAK,CAAC,CAAC,EAAE,CAAC;gBAC3B,qEAAqE;gBACrE,oEAAoE;gBACpE,kDAAkD;gBAClD,MAAM,YAAY,GAAG,eAAe,GAAG,KAAK,CAAC;gBAC7C,MAAM,EAAE,GAAG,GAAG,CAAC,UAAU,CAAC,KAAK,CAAC,CAAC;gBACjC,MAAM,EAAE,GAAG,GAAG,CAAC,UAAU,CAAC,KAAK,GAAG,CAAC,CAAC,CAAC;gBACrC,MAAM,EAAE,GAAG,GAAG,CAAC,UAAU,CAAC,KAAK,GAAG,CAAC,CAAC,CAAC;gBACrC,MAAM,EAAE,GAAG,GAAG,CAAC,UAAU,CAAC,KAAK,GAAG,CAAC,CAAC,CAAC;gBACrC,MAAM,EAAE,GAAG,GAAG,CAAC,UAAU,CAAC,KAAK,GAAG,CAAC,CAAC,CAAC;gBAErC,IACE,YAAY,KAAK,CAAC;oBAClB,EAAE,KAAK,GAAG,CAAC,SAAS;oBACpB,EAAE,KAAK,GAAG,CAAC,SAAS;oBACpB,EAAE,KAAK,GAAG,CAAC,SAAS;oBACpB,EAAE,KAAK,GAAG,CAAC,SAAS;oBACpB,EAAE,KAAK,GAAG,CAAC,SAAS,EACpB,CAAC;oBACD,QAAQ;gBACV,CAAC;qBAAM,IACL,YAAY,KAAK,CAAC;oBAClB,EAAE,KAAK,GAAG,CAAC,SAAS;oBACpB,EAAE,KAAK,GAAG,CAAC,SAAS;oBACpB,EAAE,KAAK,GAAG,CAAC,SAAS;oBACpB,EAAE,KAAK,GAAG,CAAC,SAAS,EACpB,CAAC;oBACD,OAAO;gBACT,CAAC;qBAAM,IACL,YAAY,KAAK,CAAC;oBAClB,EAAE,KAAK,GAAG,CAAC,SAAS;oBACpB,EAAE,KAAK,GAAG,CAAC,SAAS;oBACpB,EAAE,KAAK,GAAG,CAAC,SAAS,EACpB,CAAC;oBACD,MAAM;gBACR,CAAC;qBAAM,IACL,YAAY,KAAK,CAAC;oBAClB,EAAE,KAAK,GAAG,CAAC,SAAS;oBACpB,EAAE,KAAK,GAAG,CAAC,SAAS,EACpB,CAAC;oBACD,KAAK;gBACP,CAAC;qBAAM,CAAC;oBACN,6BAA6B;oBAC7B,KAAK,IAAI,CAAC,GAAG,KAAK,EAAE,CAAC,GAAG,eAAe,EAAE,CAAC,IAAI,CAAC,EAAE,CAAC;wBAChD,MAAM,aAAa,GAAG,GAAG,CAAC,UAAU,CAAC,CAAC,CAAC,GAAG,EAAE,CAAC;wBAC7C,IACE,CAAC,CACC,CACE,CAAC,aAAa,IAAI,EAAE,IAAI,aAAa,IAAI,GAAG,CAAC,IAAI,SAAS;4BAC1D,CAAC,aAAa,IAAI,EAAE,IAAI,aAAa,IAAI,EAAE,CAAC,IAAI,SAAS;4BACzD,aAAa,KAAK,EAAE,IAAI,MAAM;4BAC9B,aAAa,KAAK,EAAE,IAAI,MAAM;4BAC9B,aAAa,KAAK,EAAE,CACrB,CAAC,MAAM;yBACT,EACD,CAAC;4BACD,OAAO,IAAI,CAAC;wBACd,CAAC;oBACH,CAAC;gBACH,CAAC;gBAED,mCAAmC;gBACnC,KAAK,GAAG,eAAe,GAAG,CAAC,CAAC;gBAC5B,OAAO,GAAG,CAAC,UAAU,CAAC,KAAK,CAAC,KAAK,EAAE,CAAC,SAAS,EAAE,CAAC;oBAC9C,KAAK,IAAI,CAAC,CAAC;gBACb,CAAC;YACH,CAAC;QACH,CAAC;QAED,wEAAwE;QACxE,uEAAuE;QACvE,4CAA4C;QAC5C,IAAI,iBAAiB,GAAG,CAAC,CAAC,CAAC;QAC3B,IAAI,qBAAqB,GAAG,CAAC,CAAC,CAAC;QAC/B,IAAI,WAAW,GAAG,CAAC,CAAC,CAAC;QACrB,KAAK,IAAI,CAAC,GAAG,KAAK,EAAE,CAAC,GAAG,GAAG,EAAE,CAAC,IAAI,CAAC,EAAE,CAAC;YACpC,MAAM,IAAI,GAAW,GAAG,CAAC,UAAU,CAAC,CAAC,CAAC,CAAC;YACvC,IACE,IAAI,KAAK,EAAE,IAAI,MAAM;gBACrB,IAAI,KAAK,EAAE,IAAI,MAAM;gBACrB,IAAI,KAAK,EAAE,CAAC,MAAM;cAClB,CAAC;gBACD,GAAG,GAAG,CAAC,CAAC;gBACR,MAAM;YACR,CAAC;iBAAM,IAAI,IAAI,KAAK,EAAE,EAAE,CAAC;gBACvB,MAAM;gBACN,iBAAiB,GAAG,CAAC,CAAC;YACxB,CAAC;iBAAM,IAAI,IAAI,KAAK,EAAE,EAAE,CAAC;gBACvB,MAAM;gBACN,qBAAqB,GAAG,CAAC,CAAC;YAC5B,CAAC;iBAAM,IAAI,IAAI,KAAK,EAAE,EAAE,CAAC;gBACvB,MAAM;gBACN,WAAW,GAAG,CAAC,CAAC;YAClB,CAAC;iBAAM,IAAI,IAAI,IAAI,EAAE,IAAI,IAAI,IAAI,EAAE,EAAE,CAAC;gBACpC,QAAQ,GAAG,IAAI,CAAC;YAClB,CAAC;QACH,CAAC;QAED,yBAAyB;QACzB,IACE,iBAAiB,KAAK,CAAC,CAAC;YACxB,iBAAiB,GAAG,KAAK;YACzB,iBAAiB,GAAG,GAAG,EACvB,CAAC;YACD,KAAK,GAAG,iBAAiB,GAAG,CAAC,CAAC;QAChC,CAAC;QAED,wBAAwB;QACxB,IAAI,GAAG,CAAC,UAAU,CAAC,KAAK,CAAC,KAAK,EAAE,CAAC,SAAS,EAAE,CAAC;YAC3C,IAAI,qBAAqB,KAAK,CAAC,CAAC,EAAE,CAAC;gBACjC,OAAO,GAAG,CAAC,KAAK,CAAC,KAAK,GAAG,CAAC,EAAE,qBAAqB,CAAC,CAAC,WAAW,EAAE,CAAC;YACnE,CAAC;YACD,OAAO,IAAI,CAAC;QACd,CAAC;aAAM,IAAI,WAAW,KAAK,CAAC,CAAC,IAAI,WAAW,GAAG,KAAK,IAAI,WAAW,GAAG,GAAG,EAAE,CAAC;YAC1E,mBAAmB;YACnB,GAAG,GAAG,WAAW,CAAC;QACpB,CAAC;IACH,CAAC;IAED,qBAAqB;IACrB,OAAO,GAAG,GAAG,KAAK,GAAG,CAAC,IAAI,GAAG,CAAC,UAAU,CAAC,GAAG,GAAG,CAAC,CAAC,KAAK,EAAE,CAAC,SAAS,EAAE,CAAC;QACnE,GAAG,IAAI,CAAC,CAAC;IACX,CAAC;IAED,MAAM,QAAQ,GACZ,KAAK,KAAK,CAAC,IAAI,GAAG,KAAK,GAAG,CAAC,MAAM,CAAC,CAAC,CAAC,GAAG,CAAC,KAAK,CAAC,KAAK,EAAE,GAAG,CAAC,CAAC,CAAC,CAAC,GAAG,CAAC;IAElE,IAAI,QAAQ,EAAE,CAAC;QACb,OAAO,QAAQ,CAAC,WAAW,EAAE,CAAC;IAChC,CAAC;IAED,OAAO,QAAQ,CAAC;AAClB,CAAC"}
|
||||
+107
@@ -0,0 +1,107 @@
|
||||
"use strict";
|
||||
/**
|
||||
* Implement a factory allowing to plug different implementations of suffix
|
||||
* lookup (e.g.: using a trie or the packed hashes datastructures). This is used
|
||||
* and exposed in `tldts.ts` and `tldts-experimental.ts` bundle entrypoints.
|
||||
*/
|
||||
Object.defineProperty(exports, "__esModule", { value: true });
|
||||
exports.getEmptyResult = getEmptyResult;
|
||||
exports.resetResult = resetResult;
|
||||
exports.parseImpl = parseImpl;
|
||||
const domain_1 = require("./domain");
|
||||
const domain_without_suffix_1 = require("./domain-without-suffix");
|
||||
const extract_hostname_1 = require("./extract-hostname");
|
||||
const is_ip_1 = require("./is-ip");
|
||||
const is_valid_1 = require("./is-valid");
|
||||
const options_1 = require("./options");
|
||||
const subdomain_1 = require("./subdomain");
|
||||
function getEmptyResult() {
|
||||
return {
|
||||
domain: null,
|
||||
domainWithoutSuffix: null,
|
||||
hostname: null,
|
||||
isIcann: null,
|
||||
isIp: null,
|
||||
isPrivate: null,
|
||||
publicSuffix: null,
|
||||
subdomain: null,
|
||||
};
|
||||
}
|
||||
function resetResult(result) {
|
||||
result.domain = null;
|
||||
result.domainWithoutSuffix = null;
|
||||
result.hostname = null;
|
||||
result.isIcann = null;
|
||||
result.isIp = null;
|
||||
result.isPrivate = null;
|
||||
result.publicSuffix = null;
|
||||
result.subdomain = null;
|
||||
}
|
||||
function parseImpl(url, step, suffixLookup, partialOptions, result) {
|
||||
const options = /*@__INLINE__*/ (0, options_1.setDefaults)(partialOptions);
|
||||
// Very fast approximate check to make sure `url` is a string. This is needed
|
||||
// because the library will not necessarily be used in a typed setup and
|
||||
// values of arbitrary types might be given as argument.
|
||||
if (typeof url !== 'string') {
|
||||
return result;
|
||||
}
|
||||
// Extract hostname from `url` only if needed. This can be made optional
|
||||
// using `options.extractHostname`. This option will typically be used
|
||||
// whenever we are sure the inputs to `parse` are already hostnames and not
|
||||
// arbitrary URLs.
|
||||
//
|
||||
// `mixedInput` allows to specify if we expect a mix of URLs and hostnames
|
||||
// as input. If only hostnames are expected then `extractHostname` can be
|
||||
// set to `false` to speed-up parsing. If only URLs are expected then
|
||||
// `mixedInputs` can be set to `false`. The `mixedInputs` is only a hint
|
||||
// and will not change the behavior of the library.
|
||||
if (!options.extractHostname) {
|
||||
result.hostname = url;
|
||||
}
|
||||
else if (options.mixedInputs) {
|
||||
result.hostname = (0, extract_hostname_1.default)(url, (0, is_valid_1.default)(url));
|
||||
}
|
||||
else {
|
||||
result.hostname = (0, extract_hostname_1.default)(url, false);
|
||||
}
|
||||
// Check if `hostname` is a valid ip address
|
||||
if (options.detectIp && result.hostname !== null) {
|
||||
result.isIp = (0, is_ip_1.default)(result.hostname);
|
||||
if (result.isIp) {
|
||||
return result;
|
||||
}
|
||||
}
|
||||
// Perform hostname validation if enabled. If hostname is not valid, no need to
|
||||
// go further as there will be no valid domain or sub-domain. This validation
|
||||
// is applied before any early returns to ensure consistent behavior across
|
||||
// all API methods including getHostname().
|
||||
if (options.validateHostname &&
|
||||
options.extractHostname &&
|
||||
result.hostname !== null &&
|
||||
!(0, is_valid_1.default)(result.hostname)) {
|
||||
result.hostname = null;
|
||||
return result;
|
||||
}
|
||||
if (step === 0 /* FLAG.HOSTNAME */ || result.hostname === null) {
|
||||
return result;
|
||||
}
|
||||
// Extract public suffix
|
||||
suffixLookup(result.hostname, options, result);
|
||||
if (step === 2 /* FLAG.PUBLIC_SUFFIX */ || result.publicSuffix === null) {
|
||||
return result;
|
||||
}
|
||||
// Extract domain
|
||||
result.domain = (0, domain_1.default)(result.publicSuffix, result.hostname, options);
|
||||
if (step === 3 /* FLAG.DOMAIN */ || result.domain === null) {
|
||||
return result;
|
||||
}
|
||||
// Extract subdomain
|
||||
result.subdomain = (0, subdomain_1.default)(result.hostname, result.domain);
|
||||
if (step === 4 /* FLAG.SUB_DOMAIN */) {
|
||||
return result;
|
||||
}
|
||||
// Extract domain without suffix
|
||||
result.domainWithoutSuffix = (0, domain_without_suffix_1.default)(result.domain, result.publicSuffix);
|
||||
return result;
|
||||
}
|
||||
//# sourceMappingURL=factory.js.map
|
||||
+1
@@ -0,0 +1 @@
|
||||
{"version":3,"file":"factory.js","sourceRoot":"","sources":["../../../src/factory.ts"],"names":[],"mappings":";AAAA;;;;GAIG;;AAgCH,wCAWC;AAED,kCASC;AAeD,8BAyFC;AA5JD,qCAAiC;AACjC,mEAA6D;AAC7D,yDAAiD;AACjD,mCAA2B;AAC3B,yCAAyC;AAEzC,uCAAkD;AAClD,2CAAuC;AAuBvC,SAAgB,cAAc;IAC5B,OAAO;QACL,MAAM,EAAE,IAAI;QACZ,mBAAmB,EAAE,IAAI;QACzB,QAAQ,EAAE,IAAI;QACd,OAAO,EAAE,IAAI;QACb,IAAI,EAAE,IAAI;QACV,SAAS,EAAE,IAAI;QACf,YAAY,EAAE,IAAI;QAClB,SAAS,EAAE,IAAI;KAChB,CAAC;AACJ,CAAC;AAED,SAAgB,WAAW,CAAC,MAAe;IACzC,MAAM,CAAC,MAAM,GAAG,IAAI,CAAC;IACrB,MAAM,CAAC,mBAAmB,GAAG,IAAI,CAAC;IAClC,MAAM,CAAC,QAAQ,GAAG,IAAI,CAAC;IACvB,MAAM,CAAC,OAAO,GAAG,IAAI,CAAC;IACtB,MAAM,CAAC,IAAI,GAAG,IAAI,CAAC;IACnB,MAAM,CAAC,SAAS,GAAG,IAAI,CAAC;IACxB,MAAM,CAAC,YAAY,GAAG,IAAI,CAAC;IAC3B,MAAM,CAAC,SAAS,GAAG,IAAI,CAAC;AAC1B,CAAC;AAeD,SAAgB,SAAS,CACvB,GAAW,EACX,IAAU,EACV,YAIS,EACT,cAAiC,EACjC,MAAe;IAEf,MAAM,OAAO,GAAa,eAAe,CAAC,IAAA,qBAAW,EAAC,cAAc,CAAC,CAAC;IAEtE,6EAA6E;IAC7E,wEAAwE;IACxE,wDAAwD;IACxD,IAAI,OAAO,GAAG,KAAK,QAAQ,EAAE,CAAC;QAC5B,OAAO,MAAM,CAAC;IAChB,CAAC;IAED,wEAAwE;IACxE,sEAAsE;IACtE,2EAA2E;IAC3E,kBAAkB;IAClB,EAAE;IACF,0EAA0E;IAC1E,yEAAyE;IACzE,qEAAqE;IACrE,wEAAwE;IACxE,mDAAmD;IACnD,IAAI,CAAC,OAAO,CAAC,eAAe,EAAE,CAAC;QAC7B,MAAM,CAAC,QAAQ,GAAG,GAAG,CAAC;IACxB,CAAC;SAAM,IAAI,OAAO,CAAC,WAAW,EAAE,CAAC;QAC/B,MAAM,CAAC,QAAQ,GAAG,IAAA,0BAAe,EAAC,GAAG,EAAE,IAAA,kBAAe,EAAC,GAAG,CAAC,CAAC,CAAC;IAC/D,CAAC;SAAM,CAAC;QACN,MAAM,CAAC,QAAQ,GAAG,IAAA,0BAAe,EAAC,GAAG,EAAE,KAAK,CAAC,CAAC;IAChD,CAAC;IAED,4CAA4C;IAC5C,IAAI,OAAO,CAAC,QAAQ,IAAI,MAAM,CAAC,QAAQ,KAAK,IAAI,EAAE,CAAC;QACjD,MAAM,CAAC,IAAI,GAAG,IAAA,eAAI,EAAC,MAAM,CAAC,QAAQ,CAAC,CAAC;QACpC,IAAI,MAAM,CAAC,IAAI,EAAE,CAAC;YAChB,OAAO,MAAM,CAAC;QAChB,CAAC;IACH,CAAC;IAED,+EAA+E;IAC/E,6EAA6E;IAC7E,2EAA2E;IAC3E,2CAA2C;IAC3C,IACE,OAAO,CAAC,gBAAgB;QACxB,OAAO,CAAC,eAAe;QACvB,MAAM,CAAC,QAAQ,KAAK,IAAI;QACxB,CAAC,IAAA,kBAAe,EAAC,MAAM,CAAC,QAAQ,CAAC,EACjC,CAAC;QACD,MAAM,CAAC,QAAQ,GAAG,IAAI,CAAC;QACvB,OAAO,MAAM,CAAC;IAChB,CAAC;IAED,IAAI,IAAI,0BAAkB,IAAI,MAAM,CAAC,QAAQ,KAAK,IAAI,EAAE,CAAC;QACvD,OAAO,MAAM,CAAC;IAChB,CAAC;IAED,wBAAwB;IACxB,YAAY,CAAC,MAAM,CAAC,QAAQ,EAAE,OAAO,EAAE,MAAM,CAAC,CAAC;IAC/C,IAAI,IAAI,+BAAuB,IAAI,MAAM,CAAC,YAAY,KAAK,IAAI,EAAE,CAAC;QAChE,OAAO,MAAM,CAAC;IAChB,CAAC;IAED,iBAAiB;IACjB,MAAM,CAAC,MAAM,GAAG,IAAA,gBAAS,EAAC,MAAM,CAAC,YAAY,EAAE,MAAM,CAAC,QAAQ,EAAE,OAAO,CAAC,CAAC;IACzE,IAAI,IAAI,wBAAgB,IAAI,MAAM,CAAC,MAAM,KAAK,IAAI,EAAE,CAAC;QACnD,OAAO,MAAM,CAAC;IAChB,CAAC;IAED,oBAAoB;IACpB,MAAM,CAAC,SAAS,GAAG,IAAA,mBAAY,EAAC,MAAM,CAAC,QAAQ,EAAE,MAAM,CAAC,MAAM,CAAC,CAAC;IAChE,IAAI,IAAI,4BAAoB,EAAE,CAAC;QAC7B,OAAO,MAAM,CAAC;IAChB,CAAC;IAED,gCAAgC;IAChC,MAAM,CAAC,mBAAmB,GAAG,IAAA,+BAAsB,EACjD,MAAM,CAAC,MAAM,EACb,MAAM,CAAC,YAAY,CACpB,CAAC;IAEF,OAAO,MAAM,CAAC;AAChB,CAAC"}
|
||||
+72
@@ -0,0 +1,72 @@
|
||||
"use strict";
|
||||
Object.defineProperty(exports, "__esModule", { value: true });
|
||||
exports.default = isIp;
|
||||
/**
|
||||
* Check if a hostname is an IP. You should be aware that this only works
|
||||
* because `hostname` is already garanteed to be a valid hostname!
|
||||
*/
|
||||
function isProbablyIpv4(hostname) {
|
||||
// Cannot be shorted than 1.1.1.1
|
||||
if (hostname.length < 7) {
|
||||
return false;
|
||||
}
|
||||
// Cannot be longer than: 255.255.255.255
|
||||
if (hostname.length > 15) {
|
||||
return false;
|
||||
}
|
||||
let numberOfDots = 0;
|
||||
for (let i = 0; i < hostname.length; i += 1) {
|
||||
const code = hostname.charCodeAt(i);
|
||||
if (code === 46 /* '.' */) {
|
||||
numberOfDots += 1;
|
||||
}
|
||||
else if (code < 48 /* '0' */ || code > 57 /* '9' */) {
|
||||
return false;
|
||||
}
|
||||
}
|
||||
return (numberOfDots === 3 &&
|
||||
hostname.charCodeAt(0) !== 46 /* '.' */ &&
|
||||
hostname.charCodeAt(hostname.length - 1) !== 46 /* '.' */);
|
||||
}
|
||||
/**
|
||||
* Similar to isProbablyIpv4.
|
||||
*/
|
||||
function isProbablyIpv6(hostname) {
|
||||
if (hostname.length < 3) {
|
||||
return false;
|
||||
}
|
||||
let start = hostname.startsWith('[') ? 1 : 0;
|
||||
let end = hostname.length;
|
||||
if (hostname[end - 1] === ']') {
|
||||
end -= 1;
|
||||
}
|
||||
// We only consider the maximum size of a normal IPV6. Note that this will
|
||||
// fail on so-called "IPv4 mapped IPv6 addresses" but this is a corner-case
|
||||
// and a proper validation library should be used for these.
|
||||
if (end - start > 39) {
|
||||
return false;
|
||||
}
|
||||
let hasColon = false;
|
||||
for (; start < end; start += 1) {
|
||||
const code = hostname.charCodeAt(start);
|
||||
if (code === 58 /* ':' */) {
|
||||
hasColon = true;
|
||||
}
|
||||
else if (!(((code >= 48 && code <= 57) || // 0-9
|
||||
(code >= 97 && code <= 102) || // a-f
|
||||
(code >= 65 && code <= 90)) // A-F
|
||||
)) {
|
||||
return false;
|
||||
}
|
||||
}
|
||||
return hasColon;
|
||||
}
|
||||
/**
|
||||
* Check if `hostname` is *probably* a valid ip addr (either ipv6 or ipv4).
|
||||
* This *will not* work on any string. We need `hostname` to be a valid
|
||||
* hostname.
|
||||
*/
|
||||
function isIp(hostname) {
|
||||
return isProbablyIpv6(hostname) || isProbablyIpv4(hostname);
|
||||
}
|
||||
//# sourceMappingURL=is-ip.js.map
|
||||
+1
@@ -0,0 +1 @@
|
||||
{"version":3,"file":"is-ip.js","sourceRoot":"","sources":["../../../src/is-ip.ts"],"names":[],"mappings":";;AAoFA,uBAEC;AAtFD;;;GAGG;AACH,SAAS,cAAc,CAAC,QAAgB;IACtC,iCAAiC;IACjC,IAAI,QAAQ,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;QACxB,OAAO,KAAK,CAAC;IACf,CAAC;IAED,yCAAyC;IACzC,IAAI,QAAQ,CAAC,MAAM,GAAG,EAAE,EAAE,CAAC;QACzB,OAAO,KAAK,CAAC;IACf,CAAC;IAED,IAAI,YAAY,GAAG,CAAC,CAAC;IAErB,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,QAAQ,CAAC,MAAM,EAAE,CAAC,IAAI,CAAC,EAAE,CAAC;QAC5C,MAAM,IAAI,GAAG,QAAQ,CAAC,UAAU,CAAC,CAAC,CAAC,CAAC;QAEpC,IAAI,IAAI,KAAK,EAAE,CAAC,SAAS,EAAE,CAAC;YAC1B,YAAY,IAAI,CAAC,CAAC;QACpB,CAAC;aAAM,IAAI,IAAI,GAAG,EAAE,CAAC,SAAS,IAAI,IAAI,GAAG,EAAE,CAAC,SAAS,EAAE,CAAC;YACtD,OAAO,KAAK,CAAC;QACf,CAAC;IACH,CAAC;IAED,OAAO,CACL,YAAY,KAAK,CAAC;QAClB,QAAQ,CAAC,UAAU,CAAC,CAAC,CAAC,KAAK,EAAE,CAAC,SAAS;QACvC,QAAQ,CAAC,UAAU,CAAC,QAAQ,CAAC,MAAM,GAAG,CAAC,CAAC,KAAK,EAAE,CAAC,SAAS,CAC1D,CAAC;AACJ,CAAC;AAED;;GAEG;AACH,SAAS,cAAc,CAAC,QAAgB;IACtC,IAAI,QAAQ,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;QACxB,OAAO,KAAK,CAAC;IACf,CAAC;IAED,IAAI,KAAK,GAAG,QAAQ,CAAC,UAAU,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;IAC7C,IAAI,GAAG,GAAG,QAAQ,CAAC,MAAM,CAAC;IAE1B,IAAI,QAAQ,CAAC,GAAG,GAAG,CAAC,CAAC,KAAK,GAAG,EAAE,CAAC;QAC9B,GAAG,IAAI,CAAC,CAAC;IACX,CAAC;IAED,0EAA0E;IAC1E,2EAA2E;IAC3E,4DAA4D;IAC5D,IAAI,GAAG,GAAG,KAAK,GAAG,EAAE,EAAE,CAAC;QACrB,OAAO,KAAK,CAAC;IACf,CAAC;IAED,IAAI,QAAQ,GAAG,KAAK,CAAC;IAErB,OAAO,KAAK,GAAG,GAAG,EAAE,KAAK,IAAI,CAAC,EAAE,CAAC;QAC/B,MAAM,IAAI,GAAG,QAAQ,CAAC,UAAU,CAAC,KAAK,CAAC,CAAC;QAExC,IAAI,IAAI,KAAK,EAAE,CAAC,SAAS,EAAE,CAAC;YAC1B,QAAQ,GAAG,IAAI,CAAC;QAClB,CAAC;aAAM,IACL,CAAC,CACC,CACE,CAAC,IAAI,IAAI,EAAE,IAAI,IAAI,IAAI,EAAE,CAAC,IAAI,MAAM;YACpC,CAAC,IAAI,IAAI,EAAE,IAAI,IAAI,IAAI,GAAG,CAAC,IAAI,MAAM;YACrC,CAAC,IAAI,IAAI,EAAE,IAAI,IAAI,IAAI,EAAE,CAAC,CAC3B,CAAC,MAAM;SACT,EACD,CAAC;YACD,OAAO,KAAK,CAAC;QACf,CAAC;IACH,CAAC;IAED,OAAO,QAAQ,CAAC;AAClB,CAAC;AAED;;;;GAIG;AACH,SAAwB,IAAI,CAAC,QAAgB;IAC3C,OAAO,cAAc,CAAC,QAAQ,CAAC,IAAI,cAAc,CAAC,QAAQ,CAAC,CAAC;AAC9D,CAAC"}
|
||||
+69
@@ -0,0 +1,69 @@
|
||||
"use strict";
|
||||
/**
|
||||
* Implements fast shallow verification of hostnames. This does not perform a
|
||||
* struct check on the content of labels (classes of Unicode characters, etc.)
|
||||
* but instead check that the structure is valid (number of labels, length of
|
||||
* labels, etc.).
|
||||
*
|
||||
* If you need stricter validation, consider using an external library.
|
||||
*/
|
||||
Object.defineProperty(exports, "__esModule", { value: true });
|
||||
exports.default = default_1;
|
||||
function isValidAscii(code) {
|
||||
return ((code >= 97 && code <= 122) || (code >= 48 && code <= 57) || code > 127);
|
||||
}
|
||||
/**
|
||||
* Check if a hostname string is valid. It's usually a preliminary check before
|
||||
* trying to use getDomain or anything else.
|
||||
*
|
||||
* Beware: it does not check if the TLD exists.
|
||||
*/
|
||||
function default_1(hostname) {
|
||||
if (hostname.length > 255) {
|
||||
return false;
|
||||
}
|
||||
if (hostname.length === 0) {
|
||||
return false;
|
||||
}
|
||||
if (
|
||||
/*@__INLINE__*/ !isValidAscii(hostname.charCodeAt(0)) &&
|
||||
hostname.charCodeAt(0) !== 46 && // '.' (dot)
|
||||
hostname.charCodeAt(0) !== 95 // '_' (underscore)
|
||||
) {
|
||||
return false;
|
||||
}
|
||||
// Validate hostname according to RFC
|
||||
let lastDotIndex = -1;
|
||||
let lastCharCode = -1;
|
||||
const len = hostname.length;
|
||||
for (let i = 0; i < len; i += 1) {
|
||||
const code = hostname.charCodeAt(i);
|
||||
if (code === 46 /* '.' */) {
|
||||
if (
|
||||
// Check that previous label is < 63 bytes long (64 = 63 + '.')
|
||||
i - lastDotIndex > 64 ||
|
||||
// Check that previous character was not already a '.'
|
||||
lastCharCode === 46 ||
|
||||
// Check that the previous label does not end with a '-' (dash)
|
||||
lastCharCode === 45 ||
|
||||
// Check that the previous label does not end with a '_' (underscore)
|
||||
lastCharCode === 95) {
|
||||
return false;
|
||||
}
|
||||
lastDotIndex = i;
|
||||
}
|
||||
else if (!( /*@__INLINE__*/(isValidAscii(code) || code === 45 || code === 95))) {
|
||||
// Check if there is a forbidden character in the label
|
||||
return false;
|
||||
}
|
||||
lastCharCode = code;
|
||||
}
|
||||
return (
|
||||
// Check that last label is shorter than 63 chars
|
||||
len - lastDotIndex - 1 <= 63 &&
|
||||
// Check that the last character is an allowed trailing label character.
|
||||
// Since we already checked that the char is a valid hostname character,
|
||||
// we only need to check that it's different from '-'.
|
||||
lastCharCode !== 45);
|
||||
}
|
||||
//# sourceMappingURL=is-valid.js.map
|
||||
+1
@@ -0,0 +1 @@
|
||||
{"version":3,"file":"is-valid.js","sourceRoot":"","sources":["../../../src/is-valid.ts"],"names":[],"mappings":";AAAA;;;;;;;GAOG;;AAcH,4BAyDC;AArED,SAAS,YAAY,CAAC,IAAY;IAChC,OAAO,CACL,CAAC,IAAI,IAAI,EAAE,IAAI,IAAI,IAAI,GAAG,CAAC,IAAI,CAAC,IAAI,IAAI,EAAE,IAAI,IAAI,IAAI,EAAE,CAAC,IAAI,IAAI,GAAG,GAAG,CACxE,CAAC;AACJ,CAAC;AAED;;;;;GAKG;AACH,mBAAyB,QAAgB;IACvC,IAAI,QAAQ,CAAC,MAAM,GAAG,GAAG,EAAE,CAAC;QAC1B,OAAO,KAAK,CAAC;IACf,CAAC;IAED,IAAI,QAAQ,CAAC,MAAM,KAAK,CAAC,EAAE,CAAC;QAC1B,OAAO,KAAK,CAAC;IACf,CAAC;IAED;IACE,eAAe,CAAC,CAAC,YAAY,CAAC,QAAQ,CAAC,UAAU,CAAC,CAAC,CAAC,CAAC;QACrD,QAAQ,CAAC,UAAU,CAAC,CAAC,CAAC,KAAK,EAAE,IAAI,YAAY;QAC7C,QAAQ,CAAC,UAAU,CAAC,CAAC,CAAC,KAAK,EAAE,CAAC,mBAAmB;MACjD,CAAC;QACD,OAAO,KAAK,CAAC;IACf,CAAC;IAED,qCAAqC;IACrC,IAAI,YAAY,GAAG,CAAC,CAAC,CAAC;IACtB,IAAI,YAAY,GAAG,CAAC,CAAC,CAAC;IACtB,MAAM,GAAG,GAAG,QAAQ,CAAC,MAAM,CAAC;IAE5B,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,GAAG,EAAE,CAAC,IAAI,CAAC,EAAE,CAAC;QAChC,MAAM,IAAI,GAAG,QAAQ,CAAC,UAAU,CAAC,CAAC,CAAC,CAAC;QACpC,IAAI,IAAI,KAAK,EAAE,CAAC,SAAS,EAAE,CAAC;YAC1B;YACE,+DAA+D;YAC/D,CAAC,GAAG,YAAY,GAAG,EAAE;gBACrB,sDAAsD;gBACtD,YAAY,KAAK,EAAE;gBACnB,+DAA+D;gBAC/D,YAAY,KAAK,EAAE;gBACnB,qEAAqE;gBACrE,YAAY,KAAK,EAAE,EACnB,CAAC;gBACD,OAAO,KAAK,CAAC;YACf,CAAC;YAED,YAAY,GAAG,CAAC,CAAC;QACnB,CAAC;aAAM,IACL,CAAC,EAAC,eAAgB,CAAC,YAAY,CAAC,IAAI,CAAC,IAAI,IAAI,KAAK,EAAE,IAAI,IAAI,KAAK,EAAE,CAAC,CAAC,EACrE,CAAC;YACD,uDAAuD;YACvD,OAAO,KAAK,CAAC;QACf,CAAC;QAED,YAAY,GAAG,IAAI,CAAC;IACtB,CAAC;IAED,OAAO;IACL,iDAAiD;IACjD,GAAG,GAAG,YAAY,GAAG,CAAC,IAAI,EAAE;QAC5B,wEAAwE;QACxE,wEAAwE;QACxE,sDAAsD;QACtD,YAAY,KAAK,EAAE,CACpB,CAAC;AACJ,CAAC"}
|
||||
+69
@@ -0,0 +1,69 @@
|
||||
"use strict";
|
||||
Object.defineProperty(exports, "__esModule", { value: true });
|
||||
exports.default = default_1;
|
||||
function default_1(hostname, options, out) {
|
||||
// Fast path for very popular suffixes; this allows to by-pass lookup
|
||||
// completely as well as any extra allocation or string manipulation.
|
||||
if (!options.allowPrivateDomains && hostname.length > 3) {
|
||||
const last = hostname.length - 1;
|
||||
const c3 = hostname.charCodeAt(last);
|
||||
const c2 = hostname.charCodeAt(last - 1);
|
||||
const c1 = hostname.charCodeAt(last - 2);
|
||||
const c0 = hostname.charCodeAt(last - 3);
|
||||
if (c3 === 109 /* 'm' */ &&
|
||||
c2 === 111 /* 'o' */ &&
|
||||
c1 === 99 /* 'c' */ &&
|
||||
c0 === 46 /* '.' */) {
|
||||
out.isIcann = true;
|
||||
out.isPrivate = false;
|
||||
out.publicSuffix = 'com';
|
||||
return true;
|
||||
}
|
||||
else if (c3 === 103 /* 'g' */ &&
|
||||
c2 === 114 /* 'r' */ &&
|
||||
c1 === 111 /* 'o' */ &&
|
||||
c0 === 46 /* '.' */) {
|
||||
out.isIcann = true;
|
||||
out.isPrivate = false;
|
||||
out.publicSuffix = 'org';
|
||||
return true;
|
||||
}
|
||||
else if (c3 === 117 /* 'u' */ &&
|
||||
c2 === 100 /* 'd' */ &&
|
||||
c1 === 101 /* 'e' */ &&
|
||||
c0 === 46 /* '.' */) {
|
||||
out.isIcann = true;
|
||||
out.isPrivate = false;
|
||||
out.publicSuffix = 'edu';
|
||||
return true;
|
||||
}
|
||||
else if (c3 === 118 /* 'v' */ &&
|
||||
c2 === 111 /* 'o' */ &&
|
||||
c1 === 103 /* 'g' */ &&
|
||||
c0 === 46 /* '.' */) {
|
||||
out.isIcann = true;
|
||||
out.isPrivate = false;
|
||||
out.publicSuffix = 'gov';
|
||||
return true;
|
||||
}
|
||||
else if (c3 === 116 /* 't' */ &&
|
||||
c2 === 101 /* 'e' */ &&
|
||||
c1 === 110 /* 'n' */ &&
|
||||
c0 === 46 /* '.' */) {
|
||||
out.isIcann = true;
|
||||
out.isPrivate = false;
|
||||
out.publicSuffix = 'net';
|
||||
return true;
|
||||
}
|
||||
else if (c3 === 101 /* 'e' */ &&
|
||||
c2 === 100 /* 'd' */ &&
|
||||
c1 === 46 /* '.' */) {
|
||||
out.isIcann = true;
|
||||
out.isPrivate = false;
|
||||
out.publicSuffix = 'de';
|
||||
return true;
|
||||
}
|
||||
}
|
||||
return false;
|
||||
}
|
||||
//# sourceMappingURL=fast-path.js.map
|
||||
+1
@@ -0,0 +1 @@
|
||||
{"version":3,"file":"fast-path.js","sourceRoot":"","sources":["../../../../src/lookup/fast-path.ts"],"names":[],"mappings":";;AAEA,4BA6EC;AA7ED,mBACE,QAAgB,EAChB,OAA6B,EAC7B,GAAkB;IAElB,qEAAqE;IACrE,qEAAqE;IACrE,IAAI,CAAC,OAAO,CAAC,mBAAmB,IAAI,QAAQ,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;QACxD,MAAM,IAAI,GAAW,QAAQ,CAAC,MAAM,GAAG,CAAC,CAAC;QACzC,MAAM,EAAE,GAAW,QAAQ,CAAC,UAAU,CAAC,IAAI,CAAC,CAAC;QAC7C,MAAM,EAAE,GAAW,QAAQ,CAAC,UAAU,CAAC,IAAI,GAAG,CAAC,CAAC,CAAC;QACjD,MAAM,EAAE,GAAW,QAAQ,CAAC,UAAU,CAAC,IAAI,GAAG,CAAC,CAAC,CAAC;QACjD,MAAM,EAAE,GAAW,QAAQ,CAAC,UAAU,CAAC,IAAI,GAAG,CAAC,CAAC,CAAC;QAEjD,IACE,EAAE,KAAK,GAAG,CAAC,SAAS;YACpB,EAAE,KAAK,GAAG,CAAC,SAAS;YACpB,EAAE,KAAK,EAAE,CAAC,SAAS;YACnB,EAAE,KAAK,EAAE,CAAC,SAAS,EACnB,CAAC;YACD,GAAG,CAAC,OAAO,GAAG,IAAI,CAAC;YACnB,GAAG,CAAC,SAAS,GAAG,KAAK,CAAC;YACtB,GAAG,CAAC,YAAY,GAAG,KAAK,CAAC;YACzB,OAAO,IAAI,CAAC;QACd,CAAC;aAAM,IACL,EAAE,KAAK,GAAG,CAAC,SAAS;YACpB,EAAE,KAAK,GAAG,CAAC,SAAS;YACpB,EAAE,KAAK,GAAG,CAAC,SAAS;YACpB,EAAE,KAAK,EAAE,CAAC,SAAS,EACnB,CAAC;YACD,GAAG,CAAC,OAAO,GAAG,IAAI,CAAC;YACnB,GAAG,CAAC,SAAS,GAAG,KAAK,CAAC;YACtB,GAAG,CAAC,YAAY,GAAG,KAAK,CAAC;YACzB,OAAO,IAAI,CAAC;QACd,CAAC;aAAM,IACL,EAAE,KAAK,GAAG,CAAC,SAAS;YACpB,EAAE,KAAK,GAAG,CAAC,SAAS;YACpB,EAAE,KAAK,GAAG,CAAC,SAAS;YACpB,EAAE,KAAK,EAAE,CAAC,SAAS,EACnB,CAAC;YACD,GAAG,CAAC,OAAO,GAAG,IAAI,CAAC;YACnB,GAAG,CAAC,SAAS,GAAG,KAAK,CAAC;YACtB,GAAG,CAAC,YAAY,GAAG,KAAK,CAAC;YACzB,OAAO,IAAI,CAAC;QACd,CAAC;aAAM,IACL,EAAE,KAAK,GAAG,CAAC,SAAS;YACpB,EAAE,KAAK,GAAG,CAAC,SAAS;YACpB,EAAE,KAAK,GAAG,CAAC,SAAS;YACpB,EAAE,KAAK,EAAE,CAAC,SAAS,EACnB,CAAC;YACD,GAAG,CAAC,OAAO,GAAG,IAAI,CAAC;YACnB,GAAG,CAAC,SAAS,GAAG,KAAK,CAAC;YACtB,GAAG,CAAC,YAAY,GAAG,KAAK,CAAC;YACzB,OAAO,IAAI,CAAC;QACd,CAAC;aAAM,IACL,EAAE,KAAK,GAAG,CAAC,SAAS;YACpB,EAAE,KAAK,GAAG,CAAC,SAAS;YACpB,EAAE,KAAK,GAAG,CAAC,SAAS;YACpB,EAAE,KAAK,EAAE,CAAC,SAAS,EACnB,CAAC;YACD,GAAG,CAAC,OAAO,GAAG,IAAI,CAAC;YACnB,GAAG,CAAC,SAAS,GAAG,KAAK,CAAC;YACtB,GAAG,CAAC,YAAY,GAAG,KAAK,CAAC;YACzB,OAAO,IAAI,CAAC;QACd,CAAC;aAAM,IACL,EAAE,KAAK,GAAG,CAAC,SAAS;YACpB,EAAE,KAAK,GAAG,CAAC,SAAS;YACpB,EAAE,KAAK,EAAE,CAAC,SAAS,EACnB,CAAC;YACD,GAAG,CAAC,OAAO,GAAG,IAAI,CAAC;YACnB,GAAG,CAAC,SAAS,GAAG,KAAK,CAAC;YACtB,GAAG,CAAC,YAAY,GAAG,IAAI,CAAC;YACxB,OAAO,IAAI,CAAC;QACd,CAAC;IACH,CAAC;IAED,OAAO,KAAK,CAAC;AACf,CAAC"}
|
||||
+3
@@ -0,0 +1,3 @@
|
||||
"use strict";
|
||||
Object.defineProperty(exports, "__esModule", { value: true });
|
||||
//# sourceMappingURL=interface.js.map
|
||||
+1
@@ -0,0 +1 @@
|
||||
{"version":3,"file":"interface.js","sourceRoot":"","sources":["../../../../src/lookup/interface.ts"],"names":[],"mappings":""}
|
||||
+22
@@ -0,0 +1,22 @@
|
||||
"use strict";
|
||||
Object.defineProperty(exports, "__esModule", { value: true });
|
||||
exports.setDefaults = setDefaults;
|
||||
function setDefaultsImpl({ allowIcannDomains = true, allowPrivateDomains = false, detectIp = true, extractHostname = true, mixedInputs = true, validHosts = null, validateHostname = true, }) {
|
||||
return {
|
||||
allowIcannDomains,
|
||||
allowPrivateDomains,
|
||||
detectIp,
|
||||
extractHostname,
|
||||
mixedInputs,
|
||||
validHosts,
|
||||
validateHostname,
|
||||
};
|
||||
}
|
||||
const DEFAULT_OPTIONS = /*@__INLINE__*/ setDefaultsImpl({});
|
||||
function setDefaults(options) {
|
||||
if (options === undefined) {
|
||||
return DEFAULT_OPTIONS;
|
||||
}
|
||||
return /*@__INLINE__*/ setDefaultsImpl(options);
|
||||
}
|
||||
//# sourceMappingURL=options.js.map
|
||||
+1
@@ -0,0 +1 @@
|
||||
{"version":3,"file":"options.js","sourceRoot":"","sources":["../../../src/options.ts"],"names":[],"mappings":";;AAgCA,kCAMC;AA5BD,SAAS,eAAe,CAAC,EACvB,iBAAiB,GAAG,IAAI,EACxB,mBAAmB,GAAG,KAAK,EAC3B,QAAQ,GAAG,IAAI,EACf,eAAe,GAAG,IAAI,EACtB,WAAW,GAAG,IAAI,EAClB,UAAU,GAAG,IAAI,EACjB,gBAAgB,GAAG,IAAI,GACL;IAClB,OAAO;QACL,iBAAiB;QACjB,mBAAmB;QACnB,QAAQ;QACR,eAAe;QACf,WAAW;QACX,UAAU;QACV,gBAAgB;KACjB,CAAC;AACJ,CAAC;AAED,MAAM,eAAe,GAAG,eAAe,CAAC,eAAe,CAAC,EAAE,CAAC,CAAC;AAE5D,SAAgB,WAAW,CAAC,OAA2B;IACrD,IAAI,OAAO,KAAK,SAAS,EAAE,CAAC;QAC1B,OAAO,eAAe,CAAC;IACzB,CAAC;IAED,OAAO,eAAe,CAAC,eAAe,CAAC,OAAO,CAAC,CAAC;AAClD,CAAC"}
|
||||
+14
@@ -0,0 +1,14 @@
|
||||
"use strict";
|
||||
Object.defineProperty(exports, "__esModule", { value: true });
|
||||
exports.default = getSubdomain;
|
||||
/**
|
||||
* Returns the subdomain of a hostname string
|
||||
*/
|
||||
function getSubdomain(hostname, domain) {
|
||||
// If `hostname` and `domain` are the same, then there is no sub-domain
|
||||
if (domain.length === hostname.length) {
|
||||
return '';
|
||||
}
|
||||
return hostname.slice(0, -domain.length - 1);
|
||||
}
|
||||
//# sourceMappingURL=subdomain.js.map
|
||||
+1
@@ -0,0 +1 @@
|
||||
{"version":3,"file":"subdomain.js","sourceRoot":"","sources":["../../../src/subdomain.ts"],"names":[],"mappings":";;AAGA,+BAOC;AAVD;;GAEG;AACH,SAAwB,YAAY,CAAC,QAAgB,EAAE,MAAc;IACnE,uEAAuE;IACvE,IAAI,MAAM,CAAC,MAAM,KAAK,QAAQ,CAAC,MAAM,EAAE,CAAC;QACtC,OAAO,EAAE,CAAC;IACZ,CAAC;IAED,OAAO,QAAQ,CAAC,KAAK,CAAC,CAAC,EAAE,CAAC,MAAM,CAAC,MAAM,GAAG,CAAC,CAAC,CAAC;AAC/C,CAAC"}
|
||||
+1
File diff suppressed because one or more lines are too long
+4
@@ -0,0 +1,4 @@
|
||||
export { parseImpl, getEmptyResult, resetResult, } from './src/factory';
|
||||
export { default as fastPathLookup } from './src/lookup/fast-path';
|
||||
export { setDefaults } from './src/options';
|
||||
//# sourceMappingURL=index.js.map
|
||||
+1
@@ -0,0 +1 @@
|
||||
{"version":3,"file":"index.js","sourceRoot":"","sources":["../../index.ts"],"names":[],"mappings":"AAAA,OAAO,EAEL,SAAS,EAET,cAAc,EACd,WAAW,GACZ,MAAM,eAAe,CAAC;AAEvB,OAAO,EAAE,OAAO,IAAI,cAAc,EAAE,MAAM,wBAAwB,CAAC;AACnE,OAAO,EAAY,WAAW,EAAE,MAAM,eAAe,CAAC"}
|
||||
+12
@@ -0,0 +1,12 @@
|
||||
/**
|
||||
* Return the part of domain without suffix.
|
||||
*
|
||||
* Example: for domain 'foo.com', the result would be 'foo'.
|
||||
*/
|
||||
export default function getDomainWithoutSuffix(domain, suffix) {
|
||||
// Note: here `domain` and `suffix` cannot have the same length because in
|
||||
// this case we set `domain` to `null` instead. It is thus safe to assume
|
||||
// that `suffix` is shorter than `domain`.
|
||||
return domain.slice(0, -suffix.length - 1);
|
||||
}
|
||||
//# sourceMappingURL=domain-without-suffix.js.map
|
||||
+1
@@ -0,0 +1 @@
|
||||
{"version":3,"file":"domain-without-suffix.js","sourceRoot":"","sources":["../../../src/domain-without-suffix.ts"],"names":[],"mappings":"AAAA;;;;GAIG;AACH,MAAM,CAAC,OAAO,UAAU,sBAAsB,CAC5C,MAAc,EACd,MAAc;IAEd,0EAA0E;IAC1E,yEAAyE;IACzE,0CAA0C;IAC1C,OAAO,MAAM,CAAC,KAAK,CAAC,CAAC,EAAE,CAAC,MAAM,CAAC,MAAM,GAAG,CAAC,CAAC,CAAC;AAC7C,CAAC"}
|
||||
+80
@@ -0,0 +1,80 @@
|
||||
/**
|
||||
* Check if `vhost` is a valid suffix of `hostname` (top-domain)
|
||||
*
|
||||
* It means that `vhost` needs to be a suffix of `hostname` and we then need to
|
||||
* make sure that: either they are equal, or the character preceding `vhost` in
|
||||
* `hostname` is a '.' (it should not be a partial label).
|
||||
*
|
||||
* * hostname = 'not.evil.com' and vhost = 'vil.com' => not ok
|
||||
* * hostname = 'not.evil.com' and vhost = 'evil.com' => ok
|
||||
* * hostname = 'not.evil.com' and vhost = 'not.evil.com' => ok
|
||||
*/
|
||||
function shareSameDomainSuffix(hostname, vhost) {
|
||||
if (hostname.endsWith(vhost)) {
|
||||
return (hostname.length === vhost.length ||
|
||||
hostname[hostname.length - vhost.length - 1] === '.');
|
||||
}
|
||||
return false;
|
||||
}
|
||||
/**
|
||||
* Given a hostname and its public suffix, extract the general domain.
|
||||
*/
|
||||
function extractDomainWithSuffix(hostname, publicSuffix) {
|
||||
// Locate the index of the last '.' in the part of the `hostname` preceding
|
||||
// the public suffix.
|
||||
//
|
||||
// examples:
|
||||
// 1. not.evil.co.uk => evil.co.uk
|
||||
// ^ ^
|
||||
// | | start of public suffix
|
||||
// | index of the last dot
|
||||
//
|
||||
// 2. example.co.uk => example.co.uk
|
||||
// ^ ^
|
||||
// | | start of public suffix
|
||||
// |
|
||||
// | (-1) no dot found before the public suffix
|
||||
const publicSuffixIndex = hostname.length - publicSuffix.length - 2;
|
||||
const lastDotBeforeSuffixIndex = hostname.lastIndexOf('.', publicSuffixIndex);
|
||||
// No '.' found, then `hostname` is the general domain (no sub-domain)
|
||||
if (lastDotBeforeSuffixIndex === -1) {
|
||||
return hostname;
|
||||
}
|
||||
// Extract the part between the last '.'
|
||||
return hostname.slice(lastDotBeforeSuffixIndex + 1);
|
||||
}
|
||||
/**
|
||||
* Detects the domain based on rules and upon and a host string
|
||||
*/
|
||||
export default function getDomain(suffix, hostname, options) {
|
||||
// Check if `hostname` ends with a member of `validHosts`.
|
||||
if (options.validHosts !== null) {
|
||||
const validHosts = options.validHosts;
|
||||
for (const vhost of validHosts) {
|
||||
if ( /*@__INLINE__*/shareSameDomainSuffix(hostname, vhost)) {
|
||||
return vhost;
|
||||
}
|
||||
}
|
||||
}
|
||||
let numberOfLeadingDots = 0;
|
||||
if (hostname.startsWith('.')) {
|
||||
while (numberOfLeadingDots < hostname.length &&
|
||||
hostname[numberOfLeadingDots] === '.') {
|
||||
numberOfLeadingDots += 1;
|
||||
}
|
||||
}
|
||||
// If `hostname` is a valid public suffix, then there is no domain to return.
|
||||
// Since we already know that `getPublicSuffix` returns a suffix of `hostname`
|
||||
// there is no need to perform a string comparison and we only compare the
|
||||
// size.
|
||||
if (suffix.length === hostname.length - numberOfLeadingDots) {
|
||||
return null;
|
||||
}
|
||||
// To extract the general domain, we start by identifying the public suffix
|
||||
// (if any), then consider the domain to be the public suffix with one added
|
||||
// level of depth. (e.g.: if hostname is `not.evil.co.uk` and public suffix:
|
||||
// `co.uk`, then we take one more level: `evil`, giving the final result:
|
||||
// `evil.co.uk`).
|
||||
return /*@__INLINE__*/ extractDomainWithSuffix(hostname, suffix);
|
||||
}
|
||||
//# sourceMappingURL=domain.js.map
|
||||
+1
@@ -0,0 +1 @@
|
||||
{"version":3,"file":"domain.js","sourceRoot":"","sources":["../../../src/domain.ts"],"names":[],"mappings":"AAEA;;;;;;;;;;GAUG;AACH,SAAS,qBAAqB,CAAC,QAAgB,EAAE,KAAa;IAC5D,IAAI,QAAQ,CAAC,QAAQ,CAAC,KAAK,CAAC,EAAE,CAAC;QAC7B,OAAO,CACL,QAAQ,CAAC,MAAM,KAAK,KAAK,CAAC,MAAM;YAChC,QAAQ,CAAC,QAAQ,CAAC,MAAM,GAAG,KAAK,CAAC,MAAM,GAAG,CAAC,CAAC,KAAK,GAAG,CACrD,CAAC;IACJ,CAAC;IAED,OAAO,KAAK,CAAC;AACf,CAAC;AAED;;GAEG;AACH,SAAS,uBAAuB,CAC9B,QAAgB,EAChB,YAAoB;IAEpB,2EAA2E;IAC3E,qBAAqB;IACrB,EAAE;IACF,YAAY;IACZ,qCAAqC;IACrC,iBAAiB;IACjB,wCAAwC;IACxC,kCAAkC;IAClC,EAAE;IACF,wCAAwC;IACxC,gBAAgB;IAChB,uCAAuC;IACvC,QAAQ;IACR,mDAAmD;IACnD,MAAM,iBAAiB,GAAG,QAAQ,CAAC,MAAM,GAAG,YAAY,CAAC,MAAM,GAAG,CAAC,CAAC;IACpE,MAAM,wBAAwB,GAAG,QAAQ,CAAC,WAAW,CAAC,GAAG,EAAE,iBAAiB,CAAC,CAAC;IAE9E,sEAAsE;IACtE,IAAI,wBAAwB,KAAK,CAAC,CAAC,EAAE,CAAC;QACpC,OAAO,QAAQ,CAAC;IAClB,CAAC;IAED,wCAAwC;IACxC,OAAO,QAAQ,CAAC,KAAK,CAAC,wBAAwB,GAAG,CAAC,CAAC,CAAC;AACtD,CAAC;AAED;;GAEG;AACH,MAAM,CAAC,OAAO,UAAU,SAAS,CAC/B,MAAc,EACd,QAAgB,EAChB,OAAiB;IAEjB,0DAA0D;IAC1D,IAAI,OAAO,CAAC,UAAU,KAAK,IAAI,EAAE,CAAC;QAChC,MAAM,UAAU,GAAG,OAAO,CAAC,UAAU,CAAC;QACtC,KAAK,MAAM,KAAK,IAAI,UAAU,EAAE,CAAC;YAC/B,KAAI,eAAgB,qBAAqB,CAAC,QAAQ,EAAE,KAAK,CAAC,EAAE,CAAC;gBAC3D,OAAO,KAAK,CAAC;YACf,CAAC;QACH,CAAC;IACH,CAAC;IAED,IAAI,mBAAmB,GAAG,CAAC,CAAC;IAC5B,IAAI,QAAQ,CAAC,UAAU,CAAC,GAAG,CAAC,EAAE,CAAC;QAC7B,OACE,mBAAmB,GAAG,QAAQ,CAAC,MAAM;YACrC,QAAQ,CAAC,mBAAmB,CAAC,KAAK,GAAG,EACrC,CAAC;YACD,mBAAmB,IAAI,CAAC,CAAC;QAC3B,CAAC;IACH,CAAC;IAED,6EAA6E;IAC7E,8EAA8E;IAC9E,0EAA0E;IAC1E,QAAQ;IACR,IAAI,MAAM,CAAC,MAAM,KAAK,QAAQ,CAAC,MAAM,GAAG,mBAAmB,EAAE,CAAC;QAC5D,OAAO,IAAI,CAAC;IACd,CAAC;IAED,2EAA2E;IAC3E,4EAA4E;IAC5E,4EAA4E;IAC5E,yEAAyE;IACzE,iBAAiB;IACjB,OAAO,eAAe,CAAC,uBAAuB,CAAC,QAAQ,EAAE,MAAM,CAAC,CAAC;AACnE,CAAC"}
|
||||
+146
@@ -0,0 +1,146 @@
|
||||
/**
|
||||
* @param url - URL we want to extract a hostname from.
|
||||
* @param urlIsValidHostname - hint from caller; true if `url` is already a valid hostname.
|
||||
*/
|
||||
export default function extractHostname(url, urlIsValidHostname) {
|
||||
let start = 0;
|
||||
let end = url.length;
|
||||
let hasUpper = false;
|
||||
// If url is not already a valid hostname, then try to extract hostname.
|
||||
if (!urlIsValidHostname) {
|
||||
// Special handling of data URLs
|
||||
if (url.startsWith('data:')) {
|
||||
return null;
|
||||
}
|
||||
// Trim leading spaces
|
||||
while (start < url.length && url.charCodeAt(start) <= 32) {
|
||||
start += 1;
|
||||
}
|
||||
// Trim trailing spaces
|
||||
while (end > start + 1 && url.charCodeAt(end - 1) <= 32) {
|
||||
end -= 1;
|
||||
}
|
||||
// Skip scheme.
|
||||
if (url.charCodeAt(start) === 47 /* '/' */ &&
|
||||
url.charCodeAt(start + 1) === 47 /* '/' */) {
|
||||
start += 2;
|
||||
}
|
||||
else {
|
||||
const indexOfProtocol = url.indexOf(':/', start);
|
||||
if (indexOfProtocol !== -1) {
|
||||
// Implement fast-path for common protocols. We expect most protocols
|
||||
// should be one of these 4 and thus we will not need to perform the
|
||||
// more expansive validity check most of the time.
|
||||
const protocolSize = indexOfProtocol - start;
|
||||
const c0 = url.charCodeAt(start);
|
||||
const c1 = url.charCodeAt(start + 1);
|
||||
const c2 = url.charCodeAt(start + 2);
|
||||
const c3 = url.charCodeAt(start + 3);
|
||||
const c4 = url.charCodeAt(start + 4);
|
||||
if (protocolSize === 5 &&
|
||||
c0 === 104 /* 'h' */ &&
|
||||
c1 === 116 /* 't' */ &&
|
||||
c2 === 116 /* 't' */ &&
|
||||
c3 === 112 /* 'p' */ &&
|
||||
c4 === 115 /* 's' */) {
|
||||
// https
|
||||
}
|
||||
else if (protocolSize === 4 &&
|
||||
c0 === 104 /* 'h' */ &&
|
||||
c1 === 116 /* 't' */ &&
|
||||
c2 === 116 /* 't' */ &&
|
||||
c3 === 112 /* 'p' */) {
|
||||
// http
|
||||
}
|
||||
else if (protocolSize === 3 &&
|
||||
c0 === 119 /* 'w' */ &&
|
||||
c1 === 115 /* 's' */ &&
|
||||
c2 === 115 /* 's' */) {
|
||||
// wss
|
||||
}
|
||||
else if (protocolSize === 2 &&
|
||||
c0 === 119 /* 'w' */ &&
|
||||
c1 === 115 /* 's' */) {
|
||||
// ws
|
||||
}
|
||||
else {
|
||||
// Check that scheme is valid
|
||||
for (let i = start; i < indexOfProtocol; i += 1) {
|
||||
const lowerCaseCode = url.charCodeAt(i) | 32;
|
||||
if (!(((lowerCaseCode >= 97 && lowerCaseCode <= 122) || // [a, z]
|
||||
(lowerCaseCode >= 48 && lowerCaseCode <= 57) || // [0, 9]
|
||||
lowerCaseCode === 46 || // '.'
|
||||
lowerCaseCode === 45 || // '-'
|
||||
lowerCaseCode === 43) // '+'
|
||||
)) {
|
||||
return null;
|
||||
}
|
||||
}
|
||||
}
|
||||
// Skip 0, 1 or more '/' after ':/'
|
||||
start = indexOfProtocol + 2;
|
||||
while (url.charCodeAt(start) === 47 /* '/' */) {
|
||||
start += 1;
|
||||
}
|
||||
}
|
||||
}
|
||||
// Detect first occurrence of '/', '?' or '#'. We also keep track of the
|
||||
// last occurrence of '@', ']' or ':' to speed-up subsequent parsing of
|
||||
// (respectively), identifier, ipv6 or port.
|
||||
let indexOfIdentifier = -1;
|
||||
let indexOfClosingBracket = -1;
|
||||
let indexOfPort = -1;
|
||||
for (let i = start; i < end; i += 1) {
|
||||
const code = url.charCodeAt(i);
|
||||
if (code === 35 || // '#'
|
||||
code === 47 || // '/'
|
||||
code === 63 // '?'
|
||||
) {
|
||||
end = i;
|
||||
break;
|
||||
}
|
||||
else if (code === 64) {
|
||||
// '@'
|
||||
indexOfIdentifier = i;
|
||||
}
|
||||
else if (code === 93) {
|
||||
// ']'
|
||||
indexOfClosingBracket = i;
|
||||
}
|
||||
else if (code === 58) {
|
||||
// ':'
|
||||
indexOfPort = i;
|
||||
}
|
||||
else if (code >= 65 && code <= 90) {
|
||||
hasUpper = true;
|
||||
}
|
||||
}
|
||||
// Detect identifier: '@'
|
||||
if (indexOfIdentifier !== -1 &&
|
||||
indexOfIdentifier > start &&
|
||||
indexOfIdentifier < end) {
|
||||
start = indexOfIdentifier + 1;
|
||||
}
|
||||
// Handle ipv6 addresses
|
||||
if (url.charCodeAt(start) === 91 /* '[' */) {
|
||||
if (indexOfClosingBracket !== -1) {
|
||||
return url.slice(start + 1, indexOfClosingBracket).toLowerCase();
|
||||
}
|
||||
return null;
|
||||
}
|
||||
else if (indexOfPort !== -1 && indexOfPort > start && indexOfPort < end) {
|
||||
// Detect port: ':'
|
||||
end = indexOfPort;
|
||||
}
|
||||
}
|
||||
// Trim trailing dots
|
||||
while (end > start + 1 && url.charCodeAt(end - 1) === 46 /* '.' */) {
|
||||
end -= 1;
|
||||
}
|
||||
const hostname = start !== 0 || end !== url.length ? url.slice(start, end) : url;
|
||||
if (hasUpper) {
|
||||
return hostname.toLowerCase();
|
||||
}
|
||||
return hostname;
|
||||
}
|
||||
//# sourceMappingURL=extract-hostname.js.map
|
||||
+1
@@ -0,0 +1 @@
|
||||
{"version":3,"file":"extract-hostname.js","sourceRoot":"","sources":["../../../src/extract-hostname.ts"],"names":[],"mappings":"AAAA;;;GAGG;AACH,MAAM,CAAC,OAAO,UAAU,eAAe,CACrC,GAAW,EACX,kBAA2B;IAE3B,IAAI,KAAK,GAAG,CAAC,CAAC;IACd,IAAI,GAAG,GAAW,GAAG,CAAC,MAAM,CAAC;IAC7B,IAAI,QAAQ,GAAG,KAAK,CAAC;IAErB,wEAAwE;IACxE,IAAI,CAAC,kBAAkB,EAAE,CAAC;QACxB,gCAAgC;QAChC,IAAI,GAAG,CAAC,UAAU,CAAC,OAAO,CAAC,EAAE,CAAC;YAC5B,OAAO,IAAI,CAAC;QACd,CAAC;QAED,sBAAsB;QACtB,OAAO,KAAK,GAAG,GAAG,CAAC,MAAM,IAAI,GAAG,CAAC,UAAU,CAAC,KAAK,CAAC,IAAI,EAAE,EAAE,CAAC;YACzD,KAAK,IAAI,CAAC,CAAC;QACb,CAAC;QAED,uBAAuB;QACvB,OAAO,GAAG,GAAG,KAAK,GAAG,CAAC,IAAI,GAAG,CAAC,UAAU,CAAC,GAAG,GAAG,CAAC,CAAC,IAAI,EAAE,EAAE,CAAC;YACxD,GAAG,IAAI,CAAC,CAAC;QACX,CAAC;QAED,eAAe;QACf,IACE,GAAG,CAAC,UAAU,CAAC,KAAK,CAAC,KAAK,EAAE,CAAC,SAAS;YACtC,GAAG,CAAC,UAAU,CAAC,KAAK,GAAG,CAAC,CAAC,KAAK,EAAE,CAAC,SAAS,EAC1C,CAAC;YACD,KAAK,IAAI,CAAC,CAAC;QACb,CAAC;aAAM,CAAC;YACN,MAAM,eAAe,GAAG,GAAG,CAAC,OAAO,CAAC,IAAI,EAAE,KAAK,CAAC,CAAC;YACjD,IAAI,eAAe,KAAK,CAAC,CAAC,EAAE,CAAC;gBAC3B,qEAAqE;gBACrE,oEAAoE;gBACpE,kDAAkD;gBAClD,MAAM,YAAY,GAAG,eAAe,GAAG,KAAK,CAAC;gBAC7C,MAAM,EAAE,GAAG,GAAG,CAAC,UAAU,CAAC,KAAK,CAAC,CAAC;gBACjC,MAAM,EAAE,GAAG,GAAG,CAAC,UAAU,CAAC,KAAK,GAAG,CAAC,CAAC,CAAC;gBACrC,MAAM,EAAE,GAAG,GAAG,CAAC,UAAU,CAAC,KAAK,GAAG,CAAC,CAAC,CAAC;gBACrC,MAAM,EAAE,GAAG,GAAG,CAAC,UAAU,CAAC,KAAK,GAAG,CAAC,CAAC,CAAC;gBACrC,MAAM,EAAE,GAAG,GAAG,CAAC,UAAU,CAAC,KAAK,GAAG,CAAC,CAAC,CAAC;gBAErC,IACE,YAAY,KAAK,CAAC;oBAClB,EAAE,KAAK,GAAG,CAAC,SAAS;oBACpB,EAAE,KAAK,GAAG,CAAC,SAAS;oBACpB,EAAE,KAAK,GAAG,CAAC,SAAS;oBACpB,EAAE,KAAK,GAAG,CAAC,SAAS;oBACpB,EAAE,KAAK,GAAG,CAAC,SAAS,EACpB,CAAC;oBACD,QAAQ;gBACV,CAAC;qBAAM,IACL,YAAY,KAAK,CAAC;oBAClB,EAAE,KAAK,GAAG,CAAC,SAAS;oBACpB,EAAE,KAAK,GAAG,CAAC,SAAS;oBACpB,EAAE,KAAK,GAAG,CAAC,SAAS;oBACpB,EAAE,KAAK,GAAG,CAAC,SAAS,EACpB,CAAC;oBACD,OAAO;gBACT,CAAC;qBAAM,IACL,YAAY,KAAK,CAAC;oBAClB,EAAE,KAAK,GAAG,CAAC,SAAS;oBACpB,EAAE,KAAK,GAAG,CAAC,SAAS;oBACpB,EAAE,KAAK,GAAG,CAAC,SAAS,EACpB,CAAC;oBACD,MAAM;gBACR,CAAC;qBAAM,IACL,YAAY,KAAK,CAAC;oBAClB,EAAE,KAAK,GAAG,CAAC,SAAS;oBACpB,EAAE,KAAK,GAAG,CAAC,SAAS,EACpB,CAAC;oBACD,KAAK;gBACP,CAAC;qBAAM,CAAC;oBACN,6BAA6B;oBAC7B,KAAK,IAAI,CAAC,GAAG,KAAK,EAAE,CAAC,GAAG,eAAe,EAAE,CAAC,IAAI,CAAC,EAAE,CAAC;wBAChD,MAAM,aAAa,GAAG,GAAG,CAAC,UAAU,CAAC,CAAC,CAAC,GAAG,EAAE,CAAC;wBAC7C,IACE,CAAC,CACC,CACE,CAAC,aAAa,IAAI,EAAE,IAAI,aAAa,IAAI,GAAG,CAAC,IAAI,SAAS;4BAC1D,CAAC,aAAa,IAAI,EAAE,IAAI,aAAa,IAAI,EAAE,CAAC,IAAI,SAAS;4BACzD,aAAa,KAAK,EAAE,IAAI,MAAM;4BAC9B,aAAa,KAAK,EAAE,IAAI,MAAM;4BAC9B,aAAa,KAAK,EAAE,CACrB,CAAC,MAAM;yBACT,EACD,CAAC;4BACD,OAAO,IAAI,CAAC;wBACd,CAAC;oBACH,CAAC;gBACH,CAAC;gBAED,mCAAmC;gBACnC,KAAK,GAAG,eAAe,GAAG,CAAC,CAAC;gBAC5B,OAAO,GAAG,CAAC,UAAU,CAAC,KAAK,CAAC,KAAK,EAAE,CAAC,SAAS,EAAE,CAAC;oBAC9C,KAAK,IAAI,CAAC,CAAC;gBACb,CAAC;YACH,CAAC;QACH,CAAC;QAED,wEAAwE;QACxE,uEAAuE;QACvE,4CAA4C;QAC5C,IAAI,iBAAiB,GAAG,CAAC,CAAC,CAAC;QAC3B,IAAI,qBAAqB,GAAG,CAAC,CAAC,CAAC;QAC/B,IAAI,WAAW,GAAG,CAAC,CAAC,CAAC;QACrB,KAAK,IAAI,CAAC,GAAG,KAAK,EAAE,CAAC,GAAG,GAAG,EAAE,CAAC,IAAI,CAAC,EAAE,CAAC;YACpC,MAAM,IAAI,GAAW,GAAG,CAAC,UAAU,CAAC,CAAC,CAAC,CAAC;YACvC,IACE,IAAI,KAAK,EAAE,IAAI,MAAM;gBACrB,IAAI,KAAK,EAAE,IAAI,MAAM;gBACrB,IAAI,KAAK,EAAE,CAAC,MAAM;cAClB,CAAC;gBACD,GAAG,GAAG,CAAC,CAAC;gBACR,MAAM;YACR,CAAC;iBAAM,IAAI,IAAI,KAAK,EAAE,EAAE,CAAC;gBACvB,MAAM;gBACN,iBAAiB,GAAG,CAAC,CAAC;YACxB,CAAC;iBAAM,IAAI,IAAI,KAAK,EAAE,EAAE,CAAC;gBACvB,MAAM;gBACN,qBAAqB,GAAG,CAAC,CAAC;YAC5B,CAAC;iBAAM,IAAI,IAAI,KAAK,EAAE,EAAE,CAAC;gBACvB,MAAM;gBACN,WAAW,GAAG,CAAC,CAAC;YAClB,CAAC;iBAAM,IAAI,IAAI,IAAI,EAAE,IAAI,IAAI,IAAI,EAAE,EAAE,CAAC;gBACpC,QAAQ,GAAG,IAAI,CAAC;YAClB,CAAC;QACH,CAAC;QAED,yBAAyB;QACzB,IACE,iBAAiB,KAAK,CAAC,CAAC;YACxB,iBAAiB,GAAG,KAAK;YACzB,iBAAiB,GAAG,GAAG,EACvB,CAAC;YACD,KAAK,GAAG,iBAAiB,GAAG,CAAC,CAAC;QAChC,CAAC;QAED,wBAAwB;QACxB,IAAI,GAAG,CAAC,UAAU,CAAC,KAAK,CAAC,KAAK,EAAE,CAAC,SAAS,EAAE,CAAC;YAC3C,IAAI,qBAAqB,KAAK,CAAC,CAAC,EAAE,CAAC;gBACjC,OAAO,GAAG,CAAC,KAAK,CAAC,KAAK,GAAG,CAAC,EAAE,qBAAqB,CAAC,CAAC,WAAW,EAAE,CAAC;YACnE,CAAC;YACD,OAAO,IAAI,CAAC;QACd,CAAC;aAAM,IAAI,WAAW,KAAK,CAAC,CAAC,IAAI,WAAW,GAAG,KAAK,IAAI,WAAW,GAAG,GAAG,EAAE,CAAC;YAC1E,mBAAmB;YACnB,GAAG,GAAG,WAAW,CAAC;QACpB,CAAC;IACH,CAAC;IAED,qBAAqB;IACrB,OAAO,GAAG,GAAG,KAAK,GAAG,CAAC,IAAI,GAAG,CAAC,UAAU,CAAC,GAAG,GAAG,CAAC,CAAC,KAAK,EAAE,CAAC,SAAS,EAAE,CAAC;QACnE,GAAG,IAAI,CAAC,CAAC;IACX,CAAC;IAED,MAAM,QAAQ,GACZ,KAAK,KAAK,CAAC,IAAI,GAAG,KAAK,GAAG,CAAC,MAAM,CAAC,CAAC,CAAC,GAAG,CAAC,KAAK,CAAC,KAAK,EAAE,GAAG,CAAC,CAAC,CAAC,CAAC,GAAG,CAAC;IAElE,IAAI,QAAQ,EAAE,CAAC;QACb,OAAO,QAAQ,CAAC,WAAW,EAAE,CAAC;IAChC,CAAC;IAED,OAAO,QAAQ,CAAC;AAClB,CAAC"}
|
||||
+102
@@ -0,0 +1,102 @@
|
||||
/**
|
||||
* Implement a factory allowing to plug different implementations of suffix
|
||||
* lookup (e.g.: using a trie or the packed hashes datastructures). This is used
|
||||
* and exposed in `tldts.ts` and `tldts-experimental.ts` bundle entrypoints.
|
||||
*/
|
||||
import getDomain from './domain';
|
||||
import getDomainWithoutSuffix from './domain-without-suffix';
|
||||
import extractHostname from './extract-hostname';
|
||||
import isIp from './is-ip';
|
||||
import isValidHostname from './is-valid';
|
||||
import { setDefaults } from './options';
|
||||
import getSubdomain from './subdomain';
|
||||
export function getEmptyResult() {
|
||||
return {
|
||||
domain: null,
|
||||
domainWithoutSuffix: null,
|
||||
hostname: null,
|
||||
isIcann: null,
|
||||
isIp: null,
|
||||
isPrivate: null,
|
||||
publicSuffix: null,
|
||||
subdomain: null,
|
||||
};
|
||||
}
|
||||
export function resetResult(result) {
|
||||
result.domain = null;
|
||||
result.domainWithoutSuffix = null;
|
||||
result.hostname = null;
|
||||
result.isIcann = null;
|
||||
result.isIp = null;
|
||||
result.isPrivate = null;
|
||||
result.publicSuffix = null;
|
||||
result.subdomain = null;
|
||||
}
|
||||
export function parseImpl(url, step, suffixLookup, partialOptions, result) {
|
||||
const options = /*@__INLINE__*/ setDefaults(partialOptions);
|
||||
// Very fast approximate check to make sure `url` is a string. This is needed
|
||||
// because the library will not necessarily be used in a typed setup and
|
||||
// values of arbitrary types might be given as argument.
|
||||
if (typeof url !== 'string') {
|
||||
return result;
|
||||
}
|
||||
// Extract hostname from `url` only if needed. This can be made optional
|
||||
// using `options.extractHostname`. This option will typically be used
|
||||
// whenever we are sure the inputs to `parse` are already hostnames and not
|
||||
// arbitrary URLs.
|
||||
//
|
||||
// `mixedInput` allows to specify if we expect a mix of URLs and hostnames
|
||||
// as input. If only hostnames are expected then `extractHostname` can be
|
||||
// set to `false` to speed-up parsing. If only URLs are expected then
|
||||
// `mixedInputs` can be set to `false`. The `mixedInputs` is only a hint
|
||||
// and will not change the behavior of the library.
|
||||
if (!options.extractHostname) {
|
||||
result.hostname = url;
|
||||
}
|
||||
else if (options.mixedInputs) {
|
||||
result.hostname = extractHostname(url, isValidHostname(url));
|
||||
}
|
||||
else {
|
||||
result.hostname = extractHostname(url, false);
|
||||
}
|
||||
// Check if `hostname` is a valid ip address
|
||||
if (options.detectIp && result.hostname !== null) {
|
||||
result.isIp = isIp(result.hostname);
|
||||
if (result.isIp) {
|
||||
return result;
|
||||
}
|
||||
}
|
||||
// Perform hostname validation if enabled. If hostname is not valid, no need to
|
||||
// go further as there will be no valid domain or sub-domain. This validation
|
||||
// is applied before any early returns to ensure consistent behavior across
|
||||
// all API methods including getHostname().
|
||||
if (options.validateHostname &&
|
||||
options.extractHostname &&
|
||||
result.hostname !== null &&
|
||||
!isValidHostname(result.hostname)) {
|
||||
result.hostname = null;
|
||||
return result;
|
||||
}
|
||||
if (step === 0 /* FLAG.HOSTNAME */ || result.hostname === null) {
|
||||
return result;
|
||||
}
|
||||
// Extract public suffix
|
||||
suffixLookup(result.hostname, options, result);
|
||||
if (step === 2 /* FLAG.PUBLIC_SUFFIX */ || result.publicSuffix === null) {
|
||||
return result;
|
||||
}
|
||||
// Extract domain
|
||||
result.domain = getDomain(result.publicSuffix, result.hostname, options);
|
||||
if (step === 3 /* FLAG.DOMAIN */ || result.domain === null) {
|
||||
return result;
|
||||
}
|
||||
// Extract subdomain
|
||||
result.subdomain = getSubdomain(result.hostname, result.domain);
|
||||
if (step === 4 /* FLAG.SUB_DOMAIN */) {
|
||||
return result;
|
||||
}
|
||||
// Extract domain without suffix
|
||||
result.domainWithoutSuffix = getDomainWithoutSuffix(result.domain, result.publicSuffix);
|
||||
return result;
|
||||
}
|
||||
//# sourceMappingURL=factory.js.map
|
||||
+1
@@ -0,0 +1 @@
|
||||
{"version":3,"file":"factory.js","sourceRoot":"","sources":["../../../src/factory.ts"],"names":[],"mappings":"AAAA;;;;GAIG;AAEH,OAAO,SAAS,MAAM,UAAU,CAAC;AACjC,OAAO,sBAAsB,MAAM,yBAAyB,CAAC;AAC7D,OAAO,eAAe,MAAM,oBAAoB,CAAC;AACjD,OAAO,IAAI,MAAM,SAAS,CAAC;AAC3B,OAAO,eAAe,MAAM,YAAY,CAAC;AAEzC,OAAO,EAAY,WAAW,EAAE,MAAM,WAAW,CAAC;AAClD,OAAO,YAAY,MAAM,aAAa,CAAC;AAuBvC,MAAM,UAAU,cAAc;IAC5B,OAAO;QACL,MAAM,EAAE,IAAI;QACZ,mBAAmB,EAAE,IAAI;QACzB,QAAQ,EAAE,IAAI;QACd,OAAO,EAAE,IAAI;QACb,IAAI,EAAE,IAAI;QACV,SAAS,EAAE,IAAI;QACf,YAAY,EAAE,IAAI;QAClB,SAAS,EAAE,IAAI;KAChB,CAAC;AACJ,CAAC;AAED,MAAM,UAAU,WAAW,CAAC,MAAe;IACzC,MAAM,CAAC,MAAM,GAAG,IAAI,CAAC;IACrB,MAAM,CAAC,mBAAmB,GAAG,IAAI,CAAC;IAClC,MAAM,CAAC,QAAQ,GAAG,IAAI,CAAC;IACvB,MAAM,CAAC,OAAO,GAAG,IAAI,CAAC;IACtB,MAAM,CAAC,IAAI,GAAG,IAAI,CAAC;IACnB,MAAM,CAAC,SAAS,GAAG,IAAI,CAAC;IACxB,MAAM,CAAC,YAAY,GAAG,IAAI,CAAC;IAC3B,MAAM,CAAC,SAAS,GAAG,IAAI,CAAC;AAC1B,CAAC;AAeD,MAAM,UAAU,SAAS,CACvB,GAAW,EACX,IAAU,EACV,YAIS,EACT,cAAiC,EACjC,MAAe;IAEf,MAAM,OAAO,GAAa,eAAe,CAAC,WAAW,CAAC,cAAc,CAAC,CAAC;IAEtE,6EAA6E;IAC7E,wEAAwE;IACxE,wDAAwD;IACxD,IAAI,OAAO,GAAG,KAAK,QAAQ,EAAE,CAAC;QAC5B,OAAO,MAAM,CAAC;IAChB,CAAC;IAED,wEAAwE;IACxE,sEAAsE;IACtE,2EAA2E;IAC3E,kBAAkB;IAClB,EAAE;IACF,0EAA0E;IAC1E,yEAAyE;IACzE,qEAAqE;IACrE,wEAAwE;IACxE,mDAAmD;IACnD,IAAI,CAAC,OAAO,CAAC,eAAe,EAAE,CAAC;QAC7B,MAAM,CAAC,QAAQ,GAAG,GAAG,CAAC;IACxB,CAAC;SAAM,IAAI,OAAO,CAAC,WAAW,EAAE,CAAC;QAC/B,MAAM,CAAC,QAAQ,GAAG,eAAe,CAAC,GAAG,EAAE,eAAe,CAAC,GAAG,CAAC,CAAC,CAAC;IAC/D,CAAC;SAAM,CAAC;QACN,MAAM,CAAC,QAAQ,GAAG,eAAe,CAAC,GAAG,EAAE,KAAK,CAAC,CAAC;IAChD,CAAC;IAED,4CAA4C;IAC5C,IAAI,OAAO,CAAC,QAAQ,IAAI,MAAM,CAAC,QAAQ,KAAK,IAAI,EAAE,CAAC;QACjD,MAAM,CAAC,IAAI,GAAG,IAAI,CAAC,MAAM,CAAC,QAAQ,CAAC,CAAC;QACpC,IAAI,MAAM,CAAC,IAAI,EAAE,CAAC;YAChB,OAAO,MAAM,CAAC;QAChB,CAAC;IACH,CAAC;IAED,+EAA+E;IAC/E,6EAA6E;IAC7E,2EAA2E;IAC3E,2CAA2C;IAC3C,IACE,OAAO,CAAC,gBAAgB;QACxB,OAAO,CAAC,eAAe;QACvB,MAAM,CAAC,QAAQ,KAAK,IAAI;QACxB,CAAC,eAAe,CAAC,MAAM,CAAC,QAAQ,CAAC,EACjC,CAAC;QACD,MAAM,CAAC,QAAQ,GAAG,IAAI,CAAC;QACvB,OAAO,MAAM,CAAC;IAChB,CAAC;IAED,IAAI,IAAI,0BAAkB,IAAI,MAAM,CAAC,QAAQ,KAAK,IAAI,EAAE,CAAC;QACvD,OAAO,MAAM,CAAC;IAChB,CAAC;IAED,wBAAwB;IACxB,YAAY,CAAC,MAAM,CAAC,QAAQ,EAAE,OAAO,EAAE,MAAM,CAAC,CAAC;IAC/C,IAAI,IAAI,+BAAuB,IAAI,MAAM,CAAC,YAAY,KAAK,IAAI,EAAE,CAAC;QAChE,OAAO,MAAM,CAAC;IAChB,CAAC;IAED,iBAAiB;IACjB,MAAM,CAAC,MAAM,GAAG,SAAS,CAAC,MAAM,CAAC,YAAY,EAAE,MAAM,CAAC,QAAQ,EAAE,OAAO,CAAC,CAAC;IACzE,IAAI,IAAI,wBAAgB,IAAI,MAAM,CAAC,MAAM,KAAK,IAAI,EAAE,CAAC;QACnD,OAAO,MAAM,CAAC;IAChB,CAAC;IAED,oBAAoB;IACpB,MAAM,CAAC,SAAS,GAAG,YAAY,CAAC,MAAM,CAAC,QAAQ,EAAE,MAAM,CAAC,MAAM,CAAC,CAAC;IAChE,IAAI,IAAI,4BAAoB,EAAE,CAAC;QAC7B,OAAO,MAAM,CAAC;IAChB,CAAC;IAED,gCAAgC;IAChC,MAAM,CAAC,mBAAmB,GAAG,sBAAsB,CACjD,MAAM,CAAC,MAAM,EACb,MAAM,CAAC,YAAY,CACpB,CAAC;IAEF,OAAO,MAAM,CAAC;AAChB,CAAC"}
|
||||
+69
@@ -0,0 +1,69 @@
|
||||
/**
|
||||
* Check if a hostname is an IP. You should be aware that this only works
|
||||
* because `hostname` is already garanteed to be a valid hostname!
|
||||
*/
|
||||
function isProbablyIpv4(hostname) {
|
||||
// Cannot be shorted than 1.1.1.1
|
||||
if (hostname.length < 7) {
|
||||
return false;
|
||||
}
|
||||
// Cannot be longer than: 255.255.255.255
|
||||
if (hostname.length > 15) {
|
||||
return false;
|
||||
}
|
||||
let numberOfDots = 0;
|
||||
for (let i = 0; i < hostname.length; i += 1) {
|
||||
const code = hostname.charCodeAt(i);
|
||||
if (code === 46 /* '.' */) {
|
||||
numberOfDots += 1;
|
||||
}
|
||||
else if (code < 48 /* '0' */ || code > 57 /* '9' */) {
|
||||
return false;
|
||||
}
|
||||
}
|
||||
return (numberOfDots === 3 &&
|
||||
hostname.charCodeAt(0) !== 46 /* '.' */ &&
|
||||
hostname.charCodeAt(hostname.length - 1) !== 46 /* '.' */);
|
||||
}
|
||||
/**
|
||||
* Similar to isProbablyIpv4.
|
||||
*/
|
||||
function isProbablyIpv6(hostname) {
|
||||
if (hostname.length < 3) {
|
||||
return false;
|
||||
}
|
||||
let start = hostname.startsWith('[') ? 1 : 0;
|
||||
let end = hostname.length;
|
||||
if (hostname[end - 1] === ']') {
|
||||
end -= 1;
|
||||
}
|
||||
// We only consider the maximum size of a normal IPV6. Note that this will
|
||||
// fail on so-called "IPv4 mapped IPv6 addresses" but this is a corner-case
|
||||
// and a proper validation library should be used for these.
|
||||
if (end - start > 39) {
|
||||
return false;
|
||||
}
|
||||
let hasColon = false;
|
||||
for (; start < end; start += 1) {
|
||||
const code = hostname.charCodeAt(start);
|
||||
if (code === 58 /* ':' */) {
|
||||
hasColon = true;
|
||||
}
|
||||
else if (!(((code >= 48 && code <= 57) || // 0-9
|
||||
(code >= 97 && code <= 102) || // a-f
|
||||
(code >= 65 && code <= 90)) // A-F
|
||||
)) {
|
||||
return false;
|
||||
}
|
||||
}
|
||||
return hasColon;
|
||||
}
|
||||
/**
|
||||
* Check if `hostname` is *probably* a valid ip addr (either ipv6 or ipv4).
|
||||
* This *will not* work on any string. We need `hostname` to be a valid
|
||||
* hostname.
|
||||
*/
|
||||
export default function isIp(hostname) {
|
||||
return isProbablyIpv6(hostname) || isProbablyIpv4(hostname);
|
||||
}
|
||||
//# sourceMappingURL=is-ip.js.map
|
||||
+1
@@ -0,0 +1 @@
|
||||
{"version":3,"file":"is-ip.js","sourceRoot":"","sources":["../../../src/is-ip.ts"],"names":[],"mappings":"AAAA;;;GAGG;AACH,SAAS,cAAc,CAAC,QAAgB;IACtC,iCAAiC;IACjC,IAAI,QAAQ,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;QACxB,OAAO,KAAK,CAAC;IACf,CAAC;IAED,yCAAyC;IACzC,IAAI,QAAQ,CAAC,MAAM,GAAG,EAAE,EAAE,CAAC;QACzB,OAAO,KAAK,CAAC;IACf,CAAC;IAED,IAAI,YAAY,GAAG,CAAC,CAAC;IAErB,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,QAAQ,CAAC,MAAM,EAAE,CAAC,IAAI,CAAC,EAAE,CAAC;QAC5C,MAAM,IAAI,GAAG,QAAQ,CAAC,UAAU,CAAC,CAAC,CAAC,CAAC;QAEpC,IAAI,IAAI,KAAK,EAAE,CAAC,SAAS,EAAE,CAAC;YAC1B,YAAY,IAAI,CAAC,CAAC;QACpB,CAAC;aAAM,IAAI,IAAI,GAAG,EAAE,CAAC,SAAS,IAAI,IAAI,GAAG,EAAE,CAAC,SAAS,EAAE,CAAC;YACtD,OAAO,KAAK,CAAC;QACf,CAAC;IACH,CAAC;IAED,OAAO,CACL,YAAY,KAAK,CAAC;QAClB,QAAQ,CAAC,UAAU,CAAC,CAAC,CAAC,KAAK,EAAE,CAAC,SAAS;QACvC,QAAQ,CAAC,UAAU,CAAC,QAAQ,CAAC,MAAM,GAAG,CAAC,CAAC,KAAK,EAAE,CAAC,SAAS,CAC1D,CAAC;AACJ,CAAC;AAED;;GAEG;AACH,SAAS,cAAc,CAAC,QAAgB;IACtC,IAAI,QAAQ,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;QACxB,OAAO,KAAK,CAAC;IACf,CAAC;IAED,IAAI,KAAK,GAAG,QAAQ,CAAC,UAAU,CAAC,GAAG,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC,CAAC;IAC7C,IAAI,GAAG,GAAG,QAAQ,CAAC,MAAM,CAAC;IAE1B,IAAI,QAAQ,CAAC,GAAG,GAAG,CAAC,CAAC,KAAK,GAAG,EAAE,CAAC;QAC9B,GAAG,IAAI,CAAC,CAAC;IACX,CAAC;IAED,0EAA0E;IAC1E,2EAA2E;IAC3E,4DAA4D;IAC5D,IAAI,GAAG,GAAG,KAAK,GAAG,EAAE,EAAE,CAAC;QACrB,OAAO,KAAK,CAAC;IACf,CAAC;IAED,IAAI,QAAQ,GAAG,KAAK,CAAC;IAErB,OAAO,KAAK,GAAG,GAAG,EAAE,KAAK,IAAI,CAAC,EAAE,CAAC;QAC/B,MAAM,IAAI,GAAG,QAAQ,CAAC,UAAU,CAAC,KAAK,CAAC,CAAC;QAExC,IAAI,IAAI,KAAK,EAAE,CAAC,SAAS,EAAE,CAAC;YAC1B,QAAQ,GAAG,IAAI,CAAC;QAClB,CAAC;aAAM,IACL,CAAC,CACC,CACE,CAAC,IAAI,IAAI,EAAE,IAAI,IAAI,IAAI,EAAE,CAAC,IAAI,MAAM;YACpC,CAAC,IAAI,IAAI,EAAE,IAAI,IAAI,IAAI,GAAG,CAAC,IAAI,MAAM;YACrC,CAAC,IAAI,IAAI,EAAE,IAAI,IAAI,IAAI,EAAE,CAAC,CAC3B,CAAC,MAAM;SACT,EACD,CAAC;YACD,OAAO,KAAK,CAAC;QACf,CAAC;IACH,CAAC;IAED,OAAO,QAAQ,CAAC;AAClB,CAAC;AAED;;;;GAIG;AACH,MAAM,CAAC,OAAO,UAAU,IAAI,CAAC,QAAgB;IAC3C,OAAO,cAAc,CAAC,QAAQ,CAAC,IAAI,cAAc,CAAC,QAAQ,CAAC,CAAC;AAC9D,CAAC"}
|
||||
+66
@@ -0,0 +1,66 @@
|
||||
/**
|
||||
* Implements fast shallow verification of hostnames. This does not perform a
|
||||
* struct check on the content of labels (classes of Unicode characters, etc.)
|
||||
* but instead check that the structure is valid (number of labels, length of
|
||||
* labels, etc.).
|
||||
*
|
||||
* If you need stricter validation, consider using an external library.
|
||||
*/
|
||||
function isValidAscii(code) {
|
||||
return ((code >= 97 && code <= 122) || (code >= 48 && code <= 57) || code > 127);
|
||||
}
|
||||
/**
|
||||
* Check if a hostname string is valid. It's usually a preliminary check before
|
||||
* trying to use getDomain or anything else.
|
||||
*
|
||||
* Beware: it does not check if the TLD exists.
|
||||
*/
|
||||
export default function (hostname) {
|
||||
if (hostname.length > 255) {
|
||||
return false;
|
||||
}
|
||||
if (hostname.length === 0) {
|
||||
return false;
|
||||
}
|
||||
if (
|
||||
/*@__INLINE__*/ !isValidAscii(hostname.charCodeAt(0)) &&
|
||||
hostname.charCodeAt(0) !== 46 && // '.' (dot)
|
||||
hostname.charCodeAt(0) !== 95 // '_' (underscore)
|
||||
) {
|
||||
return false;
|
||||
}
|
||||
// Validate hostname according to RFC
|
||||
let lastDotIndex = -1;
|
||||
let lastCharCode = -1;
|
||||
const len = hostname.length;
|
||||
for (let i = 0; i < len; i += 1) {
|
||||
const code = hostname.charCodeAt(i);
|
||||
if (code === 46 /* '.' */) {
|
||||
if (
|
||||
// Check that previous label is < 63 bytes long (64 = 63 + '.')
|
||||
i - lastDotIndex > 64 ||
|
||||
// Check that previous character was not already a '.'
|
||||
lastCharCode === 46 ||
|
||||
// Check that the previous label does not end with a '-' (dash)
|
||||
lastCharCode === 45 ||
|
||||
// Check that the previous label does not end with a '_' (underscore)
|
||||
lastCharCode === 95) {
|
||||
return false;
|
||||
}
|
||||
lastDotIndex = i;
|
||||
}
|
||||
else if (!( /*@__INLINE__*/(isValidAscii(code) || code === 45 || code === 95))) {
|
||||
// Check if there is a forbidden character in the label
|
||||
return false;
|
||||
}
|
||||
lastCharCode = code;
|
||||
}
|
||||
return (
|
||||
// Check that last label is shorter than 63 chars
|
||||
len - lastDotIndex - 1 <= 63 &&
|
||||
// Check that the last character is an allowed trailing label character.
|
||||
// Since we already checked that the char is a valid hostname character,
|
||||
// we only need to check that it's different from '-'.
|
||||
lastCharCode !== 45);
|
||||
}
|
||||
//# sourceMappingURL=is-valid.js.map
|
||||
+1
@@ -0,0 +1 @@
|
||||
{"version":3,"file":"is-valid.js","sourceRoot":"","sources":["../../../src/is-valid.ts"],"names":[],"mappings":"AAAA;;;;;;;GAOG;AAEH,SAAS,YAAY,CAAC,IAAY;IAChC,OAAO,CACL,CAAC,IAAI,IAAI,EAAE,IAAI,IAAI,IAAI,GAAG,CAAC,IAAI,CAAC,IAAI,IAAI,EAAE,IAAI,IAAI,IAAI,EAAE,CAAC,IAAI,IAAI,GAAG,GAAG,CACxE,CAAC;AACJ,CAAC;AAED;;;;;GAKG;AACH,MAAM,CAAC,OAAO,WAAW,QAAgB;IACvC,IAAI,QAAQ,CAAC,MAAM,GAAG,GAAG,EAAE,CAAC;QAC1B,OAAO,KAAK,CAAC;IACf,CAAC;IAED,IAAI,QAAQ,CAAC,MAAM,KAAK,CAAC,EAAE,CAAC;QAC1B,OAAO,KAAK,CAAC;IACf,CAAC;IAED;IACE,eAAe,CAAC,CAAC,YAAY,CAAC,QAAQ,CAAC,UAAU,CAAC,CAAC,CAAC,CAAC;QACrD,QAAQ,CAAC,UAAU,CAAC,CAAC,CAAC,KAAK,EAAE,IAAI,YAAY;QAC7C,QAAQ,CAAC,UAAU,CAAC,CAAC,CAAC,KAAK,EAAE,CAAC,mBAAmB;MACjD,CAAC;QACD,OAAO,KAAK,CAAC;IACf,CAAC;IAED,qCAAqC;IACrC,IAAI,YAAY,GAAG,CAAC,CAAC,CAAC;IACtB,IAAI,YAAY,GAAG,CAAC,CAAC,CAAC;IACtB,MAAM,GAAG,GAAG,QAAQ,CAAC,MAAM,CAAC;IAE5B,KAAK,IAAI,CAAC,GAAG,CAAC,EAAE,CAAC,GAAG,GAAG,EAAE,CAAC,IAAI,CAAC,EAAE,CAAC;QAChC,MAAM,IAAI,GAAG,QAAQ,CAAC,UAAU,CAAC,CAAC,CAAC,CAAC;QACpC,IAAI,IAAI,KAAK,EAAE,CAAC,SAAS,EAAE,CAAC;YAC1B;YACE,+DAA+D;YAC/D,CAAC,GAAG,YAAY,GAAG,EAAE;gBACrB,sDAAsD;gBACtD,YAAY,KAAK,EAAE;gBACnB,+DAA+D;gBAC/D,YAAY,KAAK,EAAE;gBACnB,qEAAqE;gBACrE,YAAY,KAAK,EAAE,EACnB,CAAC;gBACD,OAAO,KAAK,CAAC;YACf,CAAC;YAED,YAAY,GAAG,CAAC,CAAC;QACnB,CAAC;aAAM,IACL,CAAC,EAAC,eAAgB,CAAC,YAAY,CAAC,IAAI,CAAC,IAAI,IAAI,KAAK,EAAE,IAAI,IAAI,KAAK,EAAE,CAAC,CAAC,EACrE,CAAC;YACD,uDAAuD;YACvD,OAAO,KAAK,CAAC;QACf,CAAC;QAED,YAAY,GAAG,IAAI,CAAC;IACtB,CAAC;IAED,OAAO;IACL,iDAAiD;IACjD,GAAG,GAAG,YAAY,GAAG,CAAC,IAAI,EAAE;QAC5B,wEAAwE;QACxE,wEAAwE;QACxE,sDAAsD;QACtD,YAAY,KAAK,EAAE,CACpB,CAAC;AACJ,CAAC"}
|
||||
+66
@@ -0,0 +1,66 @@
|
||||
export default function (hostname, options, out) {
|
||||
// Fast path for very popular suffixes; this allows to by-pass lookup
|
||||
// completely as well as any extra allocation or string manipulation.
|
||||
if (!options.allowPrivateDomains && hostname.length > 3) {
|
||||
const last = hostname.length - 1;
|
||||
const c3 = hostname.charCodeAt(last);
|
||||
const c2 = hostname.charCodeAt(last - 1);
|
||||
const c1 = hostname.charCodeAt(last - 2);
|
||||
const c0 = hostname.charCodeAt(last - 3);
|
||||
if (c3 === 109 /* 'm' */ &&
|
||||
c2 === 111 /* 'o' */ &&
|
||||
c1 === 99 /* 'c' */ &&
|
||||
c0 === 46 /* '.' */) {
|
||||
out.isIcann = true;
|
||||
out.isPrivate = false;
|
||||
out.publicSuffix = 'com';
|
||||
return true;
|
||||
}
|
||||
else if (c3 === 103 /* 'g' */ &&
|
||||
c2 === 114 /* 'r' */ &&
|
||||
c1 === 111 /* 'o' */ &&
|
||||
c0 === 46 /* '.' */) {
|
||||
out.isIcann = true;
|
||||
out.isPrivate = false;
|
||||
out.publicSuffix = 'org';
|
||||
return true;
|
||||
}
|
||||
else if (c3 === 117 /* 'u' */ &&
|
||||
c2 === 100 /* 'd' */ &&
|
||||
c1 === 101 /* 'e' */ &&
|
||||
c0 === 46 /* '.' */) {
|
||||
out.isIcann = true;
|
||||
out.isPrivate = false;
|
||||
out.publicSuffix = 'edu';
|
||||
return true;
|
||||
}
|
||||
else if (c3 === 118 /* 'v' */ &&
|
||||
c2 === 111 /* 'o' */ &&
|
||||
c1 === 103 /* 'g' */ &&
|
||||
c0 === 46 /* '.' */) {
|
||||
out.isIcann = true;
|
||||
out.isPrivate = false;
|
||||
out.publicSuffix = 'gov';
|
||||
return true;
|
||||
}
|
||||
else if (c3 === 116 /* 't' */ &&
|
||||
c2 === 101 /* 'e' */ &&
|
||||
c1 === 110 /* 'n' */ &&
|
||||
c0 === 46 /* '.' */) {
|
||||
out.isIcann = true;
|
||||
out.isPrivate = false;
|
||||
out.publicSuffix = 'net';
|
||||
return true;
|
||||
}
|
||||
else if (c3 === 101 /* 'e' */ &&
|
||||
c2 === 100 /* 'd' */ &&
|
||||
c1 === 46 /* '.' */) {
|
||||
out.isIcann = true;
|
||||
out.isPrivate = false;
|
||||
out.publicSuffix = 'de';
|
||||
return true;
|
||||
}
|
||||
}
|
||||
return false;
|
||||
}
|
||||
//# sourceMappingURL=fast-path.js.map
|
||||
+1
@@ -0,0 +1 @@
|
||||
{"version":3,"file":"fast-path.js","sourceRoot":"","sources":["../../../../src/lookup/fast-path.ts"],"names":[],"mappings":"AAEA,MAAM,CAAC,OAAO,WACZ,QAAgB,EAChB,OAA6B,EAC7B,GAAkB;IAElB,qEAAqE;IACrE,qEAAqE;IACrE,IAAI,CAAC,OAAO,CAAC,mBAAmB,IAAI,QAAQ,CAAC,MAAM,GAAG,CAAC,EAAE,CAAC;QACxD,MAAM,IAAI,GAAW,QAAQ,CAAC,MAAM,GAAG,CAAC,CAAC;QACzC,MAAM,EAAE,GAAW,QAAQ,CAAC,UAAU,CAAC,IAAI,CAAC,CAAC;QAC7C,MAAM,EAAE,GAAW,QAAQ,CAAC,UAAU,CAAC,IAAI,GAAG,CAAC,CAAC,CAAC;QACjD,MAAM,EAAE,GAAW,QAAQ,CAAC,UAAU,CAAC,IAAI,GAAG,CAAC,CAAC,CAAC;QACjD,MAAM,EAAE,GAAW,QAAQ,CAAC,UAAU,CAAC,IAAI,GAAG,CAAC,CAAC,CAAC;QAEjD,IACE,EAAE,KAAK,GAAG,CAAC,SAAS;YACpB,EAAE,KAAK,GAAG,CAAC,SAAS;YACpB,EAAE,KAAK,EAAE,CAAC,SAAS;YACnB,EAAE,KAAK,EAAE,CAAC,SAAS,EACnB,CAAC;YACD,GAAG,CAAC,OAAO,GAAG,IAAI,CAAC;YACnB,GAAG,CAAC,SAAS,GAAG,KAAK,CAAC;YACtB,GAAG,CAAC,YAAY,GAAG,KAAK,CAAC;YACzB,OAAO,IAAI,CAAC;QACd,CAAC;aAAM,IACL,EAAE,KAAK,GAAG,CAAC,SAAS;YACpB,EAAE,KAAK,GAAG,CAAC,SAAS;YACpB,EAAE,KAAK,GAAG,CAAC,SAAS;YACpB,EAAE,KAAK,EAAE,CAAC,SAAS,EACnB,CAAC;YACD,GAAG,CAAC,OAAO,GAAG,IAAI,CAAC;YACnB,GAAG,CAAC,SAAS,GAAG,KAAK,CAAC;YACtB,GAAG,CAAC,YAAY,GAAG,KAAK,CAAC;YACzB,OAAO,IAAI,CAAC;QACd,CAAC;aAAM,IACL,EAAE,KAAK,GAAG,CAAC,SAAS;YACpB,EAAE,KAAK,GAAG,CAAC,SAAS;YACpB,EAAE,KAAK,GAAG,CAAC,SAAS;YACpB,EAAE,KAAK,EAAE,CAAC,SAAS,EACnB,CAAC;YACD,GAAG,CAAC,OAAO,GAAG,IAAI,CAAC;YACnB,GAAG,CAAC,SAAS,GAAG,KAAK,CAAC;YACtB,GAAG,CAAC,YAAY,GAAG,KAAK,CAAC;YACzB,OAAO,IAAI,CAAC;QACd,CAAC;aAAM,IACL,EAAE,KAAK,GAAG,CAAC,SAAS;YACpB,EAAE,KAAK,GAAG,CAAC,SAAS;YACpB,EAAE,KAAK,GAAG,CAAC,SAAS;YACpB,EAAE,KAAK,EAAE,CAAC,SAAS,EACnB,CAAC;YACD,GAAG,CAAC,OAAO,GAAG,IAAI,CAAC;YACnB,GAAG,CAAC,SAAS,GAAG,KAAK,CAAC;YACtB,GAAG,CAAC,YAAY,GAAG,KAAK,CAAC;YACzB,OAAO,IAAI,CAAC;QACd,CAAC;aAAM,IACL,EAAE,KAAK,GAAG,CAAC,SAAS;YACpB,EAAE,KAAK,GAAG,CAAC,SAAS;YACpB,EAAE,KAAK,GAAG,CAAC,SAAS;YACpB,EAAE,KAAK,EAAE,CAAC,SAAS,EACnB,CAAC;YACD,GAAG,CAAC,OAAO,GAAG,IAAI,CAAC;YACnB,GAAG,CAAC,SAAS,GAAG,KAAK,CAAC;YACtB,GAAG,CAAC,YAAY,GAAG,KAAK,CAAC;YACzB,OAAO,IAAI,CAAC;QACd,CAAC;aAAM,IACL,EAAE,KAAK,GAAG,CAAC,SAAS;YACpB,EAAE,KAAK,GAAG,CAAC,SAAS;YACpB,EAAE,KAAK,EAAE,CAAC,SAAS,EACnB,CAAC;YACD,GAAG,CAAC,OAAO,GAAG,IAAI,CAAC;YACnB,GAAG,CAAC,SAAS,GAAG,KAAK,CAAC;YACtB,GAAG,CAAC,YAAY,GAAG,IAAI,CAAC;YACxB,OAAO,IAAI,CAAC;QACd,CAAC;IACH,CAAC;IAED,OAAO,KAAK,CAAC;AACf,CAAC"}
|
||||
+2
@@ -0,0 +1,2 @@
|
||||
export {};
|
||||
//# sourceMappingURL=interface.js.map
|
||||
+1
@@ -0,0 +1 @@
|
||||
{"version":3,"file":"interface.js","sourceRoot":"","sources":["../../../../src/lookup/interface.ts"],"names":[],"mappings":""}
|
||||
+19
@@ -0,0 +1,19 @@
|
||||
function setDefaultsImpl({ allowIcannDomains = true, allowPrivateDomains = false, detectIp = true, extractHostname = true, mixedInputs = true, validHosts = null, validateHostname = true, }) {
|
||||
return {
|
||||
allowIcannDomains,
|
||||
allowPrivateDomains,
|
||||
detectIp,
|
||||
extractHostname,
|
||||
mixedInputs,
|
||||
validHosts,
|
||||
validateHostname,
|
||||
};
|
||||
}
|
||||
const DEFAULT_OPTIONS = /*@__INLINE__*/ setDefaultsImpl({});
|
||||
export function setDefaults(options) {
|
||||
if (options === undefined) {
|
||||
return DEFAULT_OPTIONS;
|
||||
}
|
||||
return /*@__INLINE__*/ setDefaultsImpl(options);
|
||||
}
|
||||
//# sourceMappingURL=options.js.map
|
||||
+1
@@ -0,0 +1 @@
|
||||
{"version":3,"file":"options.js","sourceRoot":"","sources":["../../../src/options.ts"],"names":[],"mappings":"AAUA,SAAS,eAAe,CAAC,EACvB,iBAAiB,GAAG,IAAI,EACxB,mBAAmB,GAAG,KAAK,EAC3B,QAAQ,GAAG,IAAI,EACf,eAAe,GAAG,IAAI,EACtB,WAAW,GAAG,IAAI,EAClB,UAAU,GAAG,IAAI,EACjB,gBAAgB,GAAG,IAAI,GACL;IAClB,OAAO;QACL,iBAAiB;QACjB,mBAAmB;QACnB,QAAQ;QACR,eAAe;QACf,WAAW;QACX,UAAU;QACV,gBAAgB;KACjB,CAAC;AACJ,CAAC;AAED,MAAM,eAAe,GAAG,eAAe,CAAC,eAAe,CAAC,EAAE,CAAC,CAAC;AAE5D,MAAM,UAAU,WAAW,CAAC,OAA2B;IACrD,IAAI,OAAO,KAAK,SAAS,EAAE,CAAC;QAC1B,OAAO,eAAe,CAAC;IACzB,CAAC;IAED,OAAO,eAAe,CAAC,eAAe,CAAC,OAAO,CAAC,CAAC;AAClD,CAAC"}
|
||||
+11
@@ -0,0 +1,11 @@
|
||||
/**
|
||||
* Returns the subdomain of a hostname string
|
||||
*/
|
||||
export default function getSubdomain(hostname, domain) {
|
||||
// If `hostname` and `domain` are the same, then there is no sub-domain
|
||||
if (domain.length === hostname.length) {
|
||||
return '';
|
||||
}
|
||||
return hostname.slice(0, -domain.length - 1);
|
||||
}
|
||||
//# sourceMappingURL=subdomain.js.map
|
||||
+1
@@ -0,0 +1 @@
|
||||
{"version":3,"file":"subdomain.js","sourceRoot":"","sources":["../../../src/subdomain.ts"],"names":[],"mappings":"AAAA;;GAEG;AACH,MAAM,CAAC,OAAO,UAAU,YAAY,CAAC,QAAgB,EAAE,MAAc;IACnE,uEAAuE;IACvE,IAAI,MAAM,CAAC,MAAM,KAAK,QAAQ,CAAC,MAAM,EAAE,CAAC;QACtC,OAAO,EAAE,CAAC;IACZ,CAAC;IAED,OAAO,QAAQ,CAAC,KAAK,CAAC,CAAC,EAAE,CAAC,MAAM,CAAC,MAAM,GAAG,CAAC,CAAC,CAAC;AAC/C,CAAC"}
|
||||
+1
File diff suppressed because one or more lines are too long
+4
@@ -0,0 +1,4 @@
|
||||
export { FLAG, parseImpl, IResult, getEmptyResult, resetResult, } from './src/factory';
|
||||
export { IPublicSuffix, ISuffixLookupOptions } from './src/lookup/interface';
|
||||
export { default as fastPathLookup } from './src/lookup/fast-path';
|
||||
export { IOptions, setDefaults } from './src/options';
|
||||
+6
@@ -0,0 +1,6 @@
|
||||
/**
|
||||
* Return the part of domain without suffix.
|
||||
*
|
||||
* Example: for domain 'foo.com', the result would be 'foo'.
|
||||
*/
|
||||
export default function getDomainWithoutSuffix(domain: string, suffix: string): string;
|
||||
+5
@@ -0,0 +1,5 @@
|
||||
import { IOptions } from './options';
|
||||
/**
|
||||
* Detects the domain based on rules and upon and a host string
|
||||
*/
|
||||
export default function getDomain(suffix: string, hostname: string, options: IOptions): string | null;
|
||||
+5
@@ -0,0 +1,5 @@
|
||||
/**
|
||||
* @param url - URL we want to extract a hostname from.
|
||||
* @param urlIsValidHostname - hint from caller; true if `url` is already a valid hostname.
|
||||
*/
|
||||
export default function extractHostname(url: string, urlIsValidHostname: boolean): string | null;
|
||||
+28
@@ -0,0 +1,28 @@
|
||||
/**
|
||||
* Implement a factory allowing to plug different implementations of suffix
|
||||
* lookup (e.g.: using a trie or the packed hashes datastructures). This is used
|
||||
* and exposed in `tldts.ts` and `tldts-experimental.ts` bundle entrypoints.
|
||||
*/
|
||||
import { IPublicSuffix, ISuffixLookupOptions } from './lookup/interface';
|
||||
import { IOptions } from './options';
|
||||
export interface IResult {
|
||||
hostname: string | null;
|
||||
isIp: boolean | null;
|
||||
subdomain: string | null;
|
||||
domain: string | null;
|
||||
publicSuffix: string | null;
|
||||
domainWithoutSuffix: string | null;
|
||||
isIcann: boolean | null;
|
||||
isPrivate: boolean | null;
|
||||
}
|
||||
export declare function getEmptyResult(): IResult;
|
||||
export declare function resetResult(result: IResult): void;
|
||||
export declare const enum FLAG {
|
||||
HOSTNAME = 0,
|
||||
IS_VALID = 1,
|
||||
PUBLIC_SUFFIX = 2,
|
||||
DOMAIN = 3,
|
||||
SUB_DOMAIN = 4,
|
||||
ALL = 5
|
||||
}
|
||||
export declare function parseImpl(url: string, step: FLAG, suffixLookup: (_1: string, _2: ISuffixLookupOptions, _3: IPublicSuffix) => void, partialOptions: Partial<IOptions>, result: IResult): IResult;
|
||||
+6
@@ -0,0 +1,6 @@
|
||||
/**
|
||||
* Check if `hostname` is *probably* a valid ip addr (either ipv6 or ipv4).
|
||||
* This *will not* work on any string. We need `hostname` to be a valid
|
||||
* hostname.
|
||||
*/
|
||||
export default function isIp(hostname: string): boolean;
|
||||
+15
@@ -0,0 +1,15 @@
|
||||
/**
|
||||
* Implements fast shallow verification of hostnames. This does not perform a
|
||||
* struct check on the content of labels (classes of Unicode characters, etc.)
|
||||
* but instead check that the structure is valid (number of labels, length of
|
||||
* labels, etc.).
|
||||
*
|
||||
* If you need stricter validation, consider using an external library.
|
||||
*/
|
||||
/**
|
||||
* Check if a hostname string is valid. It's usually a preliminary check before
|
||||
* trying to use getDomain or anything else.
|
||||
*
|
||||
* Beware: it does not check if the TLD exists.
|
||||
*/
|
||||
export default function (hostname: string): boolean;
|
||||
+2
@@ -0,0 +1,2 @@
|
||||
import { IPublicSuffix, ISuffixLookupOptions } from './interface';
|
||||
export default function (hostname: string, options: ISuffixLookupOptions, out: IPublicSuffix): boolean;
|
||||
+9
@@ -0,0 +1,9 @@
|
||||
export interface IPublicSuffix {
|
||||
isIcann: boolean | null;
|
||||
isPrivate: boolean | null;
|
||||
publicSuffix: string | null;
|
||||
}
|
||||
export interface ISuffixLookupOptions {
|
||||
allowIcannDomains: boolean;
|
||||
allowPrivateDomains: boolean;
|
||||
}
|
||||
+10
@@ -0,0 +1,10 @@
|
||||
export interface IOptions {
|
||||
allowIcannDomains: boolean;
|
||||
allowPrivateDomains: boolean;
|
||||
detectIp: boolean;
|
||||
extractHostname: boolean;
|
||||
mixedInputs: boolean;
|
||||
validHosts: string[] | null;
|
||||
validateHostname: boolean;
|
||||
}
|
||||
export declare function setDefaults(options?: Partial<IOptions>): IOptions;
|
||||
+4
@@ -0,0 +1,4 @@
|
||||
/**
|
||||
* Returns the subdomain of a hostname string
|
||||
*/
|
||||
export default function getSubdomain(hostname: string, domain: string): string;
|
||||
+10
@@ -0,0 +1,10 @@
|
||||
export {
|
||||
FLAG,
|
||||
parseImpl,
|
||||
IResult,
|
||||
getEmptyResult,
|
||||
resetResult,
|
||||
} from './src/factory';
|
||||
export { IPublicSuffix, ISuffixLookupOptions } from './src/lookup/interface';
|
||||
export { default as fastPathLookup } from './src/lookup/fast-path';
|
||||
export { IOptions, setDefaults } from './src/options';
|
||||
+68
@@ -0,0 +1,68 @@
|
||||
{
|
||||
"name": "tldts-core",
|
||||
"version": "7.0.18",
|
||||
"description": "tldts core primitives (internal module)",
|
||||
"author": {
|
||||
"name": "Rémi Berson"
|
||||
},
|
||||
"contributors": [
|
||||
"Alexei <alexeiatyahoodotcom@gmail.com>",
|
||||
"Alexey <kureev-mail@ya.ru>",
|
||||
"Andrew <chefandrew@seomoz.org>",
|
||||
"Johannes Ewald <johannes.ewald@peerigon.com>",
|
||||
"Jérôme Desboeufs <jerome.desboeufs@gmail.com>",
|
||||
"Kelly Campbell <kelly.a.campbell@gmail.com>",
|
||||
"Kiko Beats <josefrancisco.verdu@gmail.com>",
|
||||
"Kris Reeves <krisreeves@searchfanatics.com>",
|
||||
"Krzysztof Jan Modras <chrmod@chrmod.net>",
|
||||
"Olivier Melcher <olivier.melcher@gmail.com>",
|
||||
"Rémi Berson <remi.berson@pm.me>",
|
||||
"Saad Rashid <srashid@lendinghome.com>",
|
||||
"Thomas Parisot <hi@oncletom.io>",
|
||||
"Timo Tijhof <krinklemail@gmail.com>",
|
||||
"Xavier Damman <xdamman@gmail.com>",
|
||||
"Yehezkiel Syamsuhadi <yehezkielbs@gmail.com>"
|
||||
],
|
||||
"publishConfig": {
|
||||
"access": "public"
|
||||
},
|
||||
"license": "MIT",
|
||||
"homepage": "https://github.com/remusao/tldts#readme",
|
||||
"bugs": {
|
||||
"url": "https://github.com/remusao/tldts/issues"
|
||||
},
|
||||
"repository": {
|
||||
"type": "git",
|
||||
"url": "git+ssh://git@github.com/remusao/tldts.git"
|
||||
},
|
||||
"main": "dist/cjs/index.js",
|
||||
"module": "dist/es6/index.js",
|
||||
"types": "dist/types/index.d.ts",
|
||||
"files": [
|
||||
"dist",
|
||||
"src",
|
||||
"index.ts"
|
||||
],
|
||||
"scripts": {
|
||||
"clean": "rimraf dist",
|
||||
"build": "tsc --build ./tsconfig.json",
|
||||
"bundle": "tsc --build ./tsconfig.bundle.json && rollup --config ./rollup.config.ts --configPlugin typescript",
|
||||
"prepack": "yarn run bundle",
|
||||
"test": "nyc mocha --config ../../.mocharc.cjs"
|
||||
},
|
||||
"devDependencies": {
|
||||
"@rollup/plugin-node-resolve": "^16.0.0",
|
||||
"@rollup/plugin-typescript": "^12.1.0",
|
||||
"@types/chai": "^4.2.18",
|
||||
"@types/mocha": "^10.0.0",
|
||||
"@types/node": "^24.3.1",
|
||||
"chai": "^4.4.1",
|
||||
"mocha": "^11.0.1",
|
||||
"nyc": "^17.0.0",
|
||||
"rimraf": "^5.0.1",
|
||||
"rollup": "^4.1.0",
|
||||
"rollup-plugin-sourcemaps": "^0.6.1",
|
||||
"typescript": "^5.0.4"
|
||||
},
|
||||
"gitHead": "17dbd3feec774960ed4fe88592f90237aaba7936"
|
||||
}
|
||||
+14
@@ -0,0 +1,14 @@
|
||||
/**
|
||||
* Return the part of domain without suffix.
|
||||
*
|
||||
* Example: for domain 'foo.com', the result would be 'foo'.
|
||||
*/
|
||||
export default function getDomainWithoutSuffix(
|
||||
domain: string,
|
||||
suffix: string,
|
||||
): string {
|
||||
// Note: here `domain` and `suffix` cannot have the same length because in
|
||||
// this case we set `domain` to `null` instead. It is thus safe to assume
|
||||
// that `suffix` is shorter than `domain`.
|
||||
return domain.slice(0, -suffix.length - 1);
|
||||
}
|
||||
+100
@@ -0,0 +1,100 @@
|
||||
import { IOptions } from './options';
|
||||
|
||||
/**
|
||||
* Check if `vhost` is a valid suffix of `hostname` (top-domain)
|
||||
*
|
||||
* It means that `vhost` needs to be a suffix of `hostname` and we then need to
|
||||
* make sure that: either they are equal, or the character preceding `vhost` in
|
||||
* `hostname` is a '.' (it should not be a partial label).
|
||||
*
|
||||
* * hostname = 'not.evil.com' and vhost = 'vil.com' => not ok
|
||||
* * hostname = 'not.evil.com' and vhost = 'evil.com' => ok
|
||||
* * hostname = 'not.evil.com' and vhost = 'not.evil.com' => ok
|
||||
*/
|
||||
function shareSameDomainSuffix(hostname: string, vhost: string): boolean {
|
||||
if (hostname.endsWith(vhost)) {
|
||||
return (
|
||||
hostname.length === vhost.length ||
|
||||
hostname[hostname.length - vhost.length - 1] === '.'
|
||||
);
|
||||
}
|
||||
|
||||
return false;
|
||||
}
|
||||
|
||||
/**
|
||||
* Given a hostname and its public suffix, extract the general domain.
|
||||
*/
|
||||
function extractDomainWithSuffix(
|
||||
hostname: string,
|
||||
publicSuffix: string,
|
||||
): string {
|
||||
// Locate the index of the last '.' in the part of the `hostname` preceding
|
||||
// the public suffix.
|
||||
//
|
||||
// examples:
|
||||
// 1. not.evil.co.uk => evil.co.uk
|
||||
// ^ ^
|
||||
// | | start of public suffix
|
||||
// | index of the last dot
|
||||
//
|
||||
// 2. example.co.uk => example.co.uk
|
||||
// ^ ^
|
||||
// | | start of public suffix
|
||||
// |
|
||||
// | (-1) no dot found before the public suffix
|
||||
const publicSuffixIndex = hostname.length - publicSuffix.length - 2;
|
||||
const lastDotBeforeSuffixIndex = hostname.lastIndexOf('.', publicSuffixIndex);
|
||||
|
||||
// No '.' found, then `hostname` is the general domain (no sub-domain)
|
||||
if (lastDotBeforeSuffixIndex === -1) {
|
||||
return hostname;
|
||||
}
|
||||
|
||||
// Extract the part between the last '.'
|
||||
return hostname.slice(lastDotBeforeSuffixIndex + 1);
|
||||
}
|
||||
|
||||
/**
|
||||
* Detects the domain based on rules and upon and a host string
|
||||
*/
|
||||
export default function getDomain(
|
||||
suffix: string,
|
||||
hostname: string,
|
||||
options: IOptions,
|
||||
): string | null {
|
||||
// Check if `hostname` ends with a member of `validHosts`.
|
||||
if (options.validHosts !== null) {
|
||||
const validHosts = options.validHosts;
|
||||
for (const vhost of validHosts) {
|
||||
if (/*@__INLINE__*/ shareSameDomainSuffix(hostname, vhost)) {
|
||||
return vhost;
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
let numberOfLeadingDots = 0;
|
||||
if (hostname.startsWith('.')) {
|
||||
while (
|
||||
numberOfLeadingDots < hostname.length &&
|
||||
hostname[numberOfLeadingDots] === '.'
|
||||
) {
|
||||
numberOfLeadingDots += 1;
|
||||
}
|
||||
}
|
||||
|
||||
// If `hostname` is a valid public suffix, then there is no domain to return.
|
||||
// Since we already know that `getPublicSuffix` returns a suffix of `hostname`
|
||||
// there is no need to perform a string comparison and we only compare the
|
||||
// size.
|
||||
if (suffix.length === hostname.length - numberOfLeadingDots) {
|
||||
return null;
|
||||
}
|
||||
|
||||
// To extract the general domain, we start by identifying the public suffix
|
||||
// (if any), then consider the domain to be the public suffix with one added
|
||||
// level of depth. (e.g.: if hostname is `not.evil.co.uk` and public suffix:
|
||||
// `co.uk`, then we take one more level: `evil`, giving the final result:
|
||||
// `evil.co.uk`).
|
||||
return /*@__INLINE__*/ extractDomainWithSuffix(hostname, suffix);
|
||||
}
|
||||
+170
@@ -0,0 +1,170 @@
|
||||
/**
|
||||
* @param url - URL we want to extract a hostname from.
|
||||
* @param urlIsValidHostname - hint from caller; true if `url` is already a valid hostname.
|
||||
*/
|
||||
export default function extractHostname(
|
||||
url: string,
|
||||
urlIsValidHostname: boolean,
|
||||
): string | null {
|
||||
let start = 0;
|
||||
let end: number = url.length;
|
||||
let hasUpper = false;
|
||||
|
||||
// If url is not already a valid hostname, then try to extract hostname.
|
||||
if (!urlIsValidHostname) {
|
||||
// Special handling of data URLs
|
||||
if (url.startsWith('data:')) {
|
||||
return null;
|
||||
}
|
||||
|
||||
// Trim leading spaces
|
||||
while (start < url.length && url.charCodeAt(start) <= 32) {
|
||||
start += 1;
|
||||
}
|
||||
|
||||
// Trim trailing spaces
|
||||
while (end > start + 1 && url.charCodeAt(end - 1) <= 32) {
|
||||
end -= 1;
|
||||
}
|
||||
|
||||
// Skip scheme.
|
||||
if (
|
||||
url.charCodeAt(start) === 47 /* '/' */ &&
|
||||
url.charCodeAt(start + 1) === 47 /* '/' */
|
||||
) {
|
||||
start += 2;
|
||||
} else {
|
||||
const indexOfProtocol = url.indexOf(':/', start);
|
||||
if (indexOfProtocol !== -1) {
|
||||
// Implement fast-path for common protocols. We expect most protocols
|
||||
// should be one of these 4 and thus we will not need to perform the
|
||||
// more expansive validity check most of the time.
|
||||
const protocolSize = indexOfProtocol - start;
|
||||
const c0 = url.charCodeAt(start);
|
||||
const c1 = url.charCodeAt(start + 1);
|
||||
const c2 = url.charCodeAt(start + 2);
|
||||
const c3 = url.charCodeAt(start + 3);
|
||||
const c4 = url.charCodeAt(start + 4);
|
||||
|
||||
if (
|
||||
protocolSize === 5 &&
|
||||
c0 === 104 /* 'h' */ &&
|
||||
c1 === 116 /* 't' */ &&
|
||||
c2 === 116 /* 't' */ &&
|
||||
c3 === 112 /* 'p' */ &&
|
||||
c4 === 115 /* 's' */
|
||||
) {
|
||||
// https
|
||||
} else if (
|
||||
protocolSize === 4 &&
|
||||
c0 === 104 /* 'h' */ &&
|
||||
c1 === 116 /* 't' */ &&
|
||||
c2 === 116 /* 't' */ &&
|
||||
c3 === 112 /* 'p' */
|
||||
) {
|
||||
// http
|
||||
} else if (
|
||||
protocolSize === 3 &&
|
||||
c0 === 119 /* 'w' */ &&
|
||||
c1 === 115 /* 's' */ &&
|
||||
c2 === 115 /* 's' */
|
||||
) {
|
||||
// wss
|
||||
} else if (
|
||||
protocolSize === 2 &&
|
||||
c0 === 119 /* 'w' */ &&
|
||||
c1 === 115 /* 's' */
|
||||
) {
|
||||
// ws
|
||||
} else {
|
||||
// Check that scheme is valid
|
||||
for (let i = start; i < indexOfProtocol; i += 1) {
|
||||
const lowerCaseCode = url.charCodeAt(i) | 32;
|
||||
if (
|
||||
!(
|
||||
(
|
||||
(lowerCaseCode >= 97 && lowerCaseCode <= 122) || // [a, z]
|
||||
(lowerCaseCode >= 48 && lowerCaseCode <= 57) || // [0, 9]
|
||||
lowerCaseCode === 46 || // '.'
|
||||
lowerCaseCode === 45 || // '-'
|
||||
lowerCaseCode === 43
|
||||
) // '+'
|
||||
)
|
||||
) {
|
||||
return null;
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
// Skip 0, 1 or more '/' after ':/'
|
||||
start = indexOfProtocol + 2;
|
||||
while (url.charCodeAt(start) === 47 /* '/' */) {
|
||||
start += 1;
|
||||
}
|
||||
}
|
||||
}
|
||||
|
||||
// Detect first occurrence of '/', '?' or '#'. We also keep track of the
|
||||
// last occurrence of '@', ']' or ':' to speed-up subsequent parsing of
|
||||
// (respectively), identifier, ipv6 or port.
|
||||
let indexOfIdentifier = -1;
|
||||
let indexOfClosingBracket = -1;
|
||||
let indexOfPort = -1;
|
||||
for (let i = start; i < end; i += 1) {
|
||||
const code: number = url.charCodeAt(i);
|
||||
if (
|
||||
code === 35 || // '#'
|
||||
code === 47 || // '/'
|
||||
code === 63 // '?'
|
||||
) {
|
||||
end = i;
|
||||
break;
|
||||
} else if (code === 64) {
|
||||
// '@'
|
||||
indexOfIdentifier = i;
|
||||
} else if (code === 93) {
|
||||
// ']'
|
||||
indexOfClosingBracket = i;
|
||||
} else if (code === 58) {
|
||||
// ':'
|
||||
indexOfPort = i;
|
||||
} else if (code >= 65 && code <= 90) {
|
||||
hasUpper = true;
|
||||
}
|
||||
}
|
||||
|
||||
// Detect identifier: '@'
|
||||
if (
|
||||
indexOfIdentifier !== -1 &&
|
||||
indexOfIdentifier > start &&
|
||||
indexOfIdentifier < end
|
||||
) {
|
||||
start = indexOfIdentifier + 1;
|
||||
}
|
||||
|
||||
// Handle ipv6 addresses
|
||||
if (url.charCodeAt(start) === 91 /* '[' */) {
|
||||
if (indexOfClosingBracket !== -1) {
|
||||
return url.slice(start + 1, indexOfClosingBracket).toLowerCase();
|
||||
}
|
||||
return null;
|
||||
} else if (indexOfPort !== -1 && indexOfPort > start && indexOfPort < end) {
|
||||
// Detect port: ':'
|
||||
end = indexOfPort;
|
||||
}
|
||||
}
|
||||
|
||||
// Trim trailing dots
|
||||
while (end > start + 1 && url.charCodeAt(end - 1) === 46 /* '.' */) {
|
||||
end -= 1;
|
||||
}
|
||||
|
||||
const hostname: string =
|
||||
start !== 0 || end !== url.length ? url.slice(start, end) : url;
|
||||
|
||||
if (hasUpper) {
|
||||
return hostname.toLowerCase();
|
||||
}
|
||||
|
||||
return hostname;
|
||||
}
|
||||
+163
@@ -0,0 +1,163 @@
|
||||
/**
|
||||
* Implement a factory allowing to plug different implementations of suffix
|
||||
* lookup (e.g.: using a trie or the packed hashes datastructures). This is used
|
||||
* and exposed in `tldts.ts` and `tldts-experimental.ts` bundle entrypoints.
|
||||
*/
|
||||
|
||||
import getDomain from './domain';
|
||||
import getDomainWithoutSuffix from './domain-without-suffix';
|
||||
import extractHostname from './extract-hostname';
|
||||
import isIp from './is-ip';
|
||||
import isValidHostname from './is-valid';
|
||||
import { IPublicSuffix, ISuffixLookupOptions } from './lookup/interface';
|
||||
import { IOptions, setDefaults } from './options';
|
||||
import getSubdomain from './subdomain';
|
||||
|
||||
export interface IResult {
|
||||
// `hostname` is either a registered name (including but not limited to a
|
||||
// hostname), or an IP address. IPv4 addresses must be in dot-decimal
|
||||
// notation, and IPv6 addresses must be enclosed in brackets ([]). This is
|
||||
// directly extracted from the input URL.
|
||||
hostname: string | null;
|
||||
|
||||
// Is `hostname` an IP? (IPv4 or IPv6)
|
||||
isIp: boolean | null;
|
||||
|
||||
// `hostname` split between subdomain, domain and its public suffix (if any)
|
||||
subdomain: string | null;
|
||||
domain: string | null;
|
||||
publicSuffix: string | null;
|
||||
domainWithoutSuffix: string | null;
|
||||
|
||||
// Specifies if `publicSuffix` comes from the ICANN or PRIVATE section of the list
|
||||
isIcann: boolean | null;
|
||||
isPrivate: boolean | null;
|
||||
}
|
||||
|
||||
export function getEmptyResult(): IResult {
|
||||
return {
|
||||
domain: null,
|
||||
domainWithoutSuffix: null,
|
||||
hostname: null,
|
||||
isIcann: null,
|
||||
isIp: null,
|
||||
isPrivate: null,
|
||||
publicSuffix: null,
|
||||
subdomain: null,
|
||||
};
|
||||
}
|
||||
|
||||
export function resetResult(result: IResult): void {
|
||||
result.domain = null;
|
||||
result.domainWithoutSuffix = null;
|
||||
result.hostname = null;
|
||||
result.isIcann = null;
|
||||
result.isIp = null;
|
||||
result.isPrivate = null;
|
||||
result.publicSuffix = null;
|
||||
result.subdomain = null;
|
||||
}
|
||||
|
||||
// Flags representing steps in the `parse` function. They are used to implement
|
||||
// an early stop mechanism (simulating some form of laziness) to avoid doing
|
||||
// more work than necessary to perform a given action (e.g.: we don't need to
|
||||
// extract the domain and subdomain if we are only interested in public suffix).
|
||||
export const enum FLAG {
|
||||
HOSTNAME,
|
||||
IS_VALID,
|
||||
PUBLIC_SUFFIX,
|
||||
DOMAIN,
|
||||
SUB_DOMAIN,
|
||||
ALL,
|
||||
}
|
||||
|
||||
export function parseImpl(
|
||||
url: string,
|
||||
step: FLAG,
|
||||
suffixLookup: (
|
||||
_1: string,
|
||||
_2: ISuffixLookupOptions,
|
||||
_3: IPublicSuffix,
|
||||
) => void,
|
||||
partialOptions: Partial<IOptions>,
|
||||
result: IResult,
|
||||
): IResult {
|
||||
const options: IOptions = /*@__INLINE__*/ setDefaults(partialOptions);
|
||||
|
||||
// Very fast approximate check to make sure `url` is a string. This is needed
|
||||
// because the library will not necessarily be used in a typed setup and
|
||||
// values of arbitrary types might be given as argument.
|
||||
if (typeof url !== 'string') {
|
||||
return result;
|
||||
}
|
||||
|
||||
// Extract hostname from `url` only if needed. This can be made optional
|
||||
// using `options.extractHostname`. This option will typically be used
|
||||
// whenever we are sure the inputs to `parse` are already hostnames and not
|
||||
// arbitrary URLs.
|
||||
//
|
||||
// `mixedInput` allows to specify if we expect a mix of URLs and hostnames
|
||||
// as input. If only hostnames are expected then `extractHostname` can be
|
||||
// set to `false` to speed-up parsing. If only URLs are expected then
|
||||
// `mixedInputs` can be set to `false`. The `mixedInputs` is only a hint
|
||||
// and will not change the behavior of the library.
|
||||
if (!options.extractHostname) {
|
||||
result.hostname = url;
|
||||
} else if (options.mixedInputs) {
|
||||
result.hostname = extractHostname(url, isValidHostname(url));
|
||||
} else {
|
||||
result.hostname = extractHostname(url, false);
|
||||
}
|
||||
|
||||
// Check if `hostname` is a valid ip address
|
||||
if (options.detectIp && result.hostname !== null) {
|
||||
result.isIp = isIp(result.hostname);
|
||||
if (result.isIp) {
|
||||
return result;
|
||||
}
|
||||
}
|
||||
|
||||
// Perform hostname validation if enabled. If hostname is not valid, no need to
|
||||
// go further as there will be no valid domain or sub-domain. This validation
|
||||
// is applied before any early returns to ensure consistent behavior across
|
||||
// all API methods including getHostname().
|
||||
if (
|
||||
options.validateHostname &&
|
||||
options.extractHostname &&
|
||||
result.hostname !== null &&
|
||||
!isValidHostname(result.hostname)
|
||||
) {
|
||||
result.hostname = null;
|
||||
return result;
|
||||
}
|
||||
|
||||
if (step === FLAG.HOSTNAME || result.hostname === null) {
|
||||
return result;
|
||||
}
|
||||
|
||||
// Extract public suffix
|
||||
suffixLookup(result.hostname, options, result);
|
||||
if (step === FLAG.PUBLIC_SUFFIX || result.publicSuffix === null) {
|
||||
return result;
|
||||
}
|
||||
|
||||
// Extract domain
|
||||
result.domain = getDomain(result.publicSuffix, result.hostname, options);
|
||||
if (step === FLAG.DOMAIN || result.domain === null) {
|
||||
return result;
|
||||
}
|
||||
|
||||
// Extract subdomain
|
||||
result.subdomain = getSubdomain(result.hostname, result.domain);
|
||||
if (step === FLAG.SUB_DOMAIN) {
|
||||
return result;
|
||||
}
|
||||
|
||||
// Extract domain without suffix
|
||||
result.domainWithoutSuffix = getDomainWithoutSuffix(
|
||||
result.domain,
|
||||
result.publicSuffix,
|
||||
);
|
||||
|
||||
return result;
|
||||
}
|
||||
+87
@@ -0,0 +1,87 @@
|
||||
/**
|
||||
* Check if a hostname is an IP. You should be aware that this only works
|
||||
* because `hostname` is already garanteed to be a valid hostname!
|
||||
*/
|
||||
function isProbablyIpv4(hostname: string): boolean {
|
||||
// Cannot be shorted than 1.1.1.1
|
||||
if (hostname.length < 7) {
|
||||
return false;
|
||||
}
|
||||
|
||||
// Cannot be longer than: 255.255.255.255
|
||||
if (hostname.length > 15) {
|
||||
return false;
|
||||
}
|
||||
|
||||
let numberOfDots = 0;
|
||||
|
||||
for (let i = 0; i < hostname.length; i += 1) {
|
||||
const code = hostname.charCodeAt(i);
|
||||
|
||||
if (code === 46 /* '.' */) {
|
||||
numberOfDots += 1;
|
||||
} else if (code < 48 /* '0' */ || code > 57 /* '9' */) {
|
||||
return false;
|
||||
}
|
||||
}
|
||||
|
||||
return (
|
||||
numberOfDots === 3 &&
|
||||
hostname.charCodeAt(0) !== 46 /* '.' */ &&
|
||||
hostname.charCodeAt(hostname.length - 1) !== 46 /* '.' */
|
||||
);
|
||||
}
|
||||
|
||||
/**
|
||||
* Similar to isProbablyIpv4.
|
||||
*/
|
||||
function isProbablyIpv6(hostname: string): boolean {
|
||||
if (hostname.length < 3) {
|
||||
return false;
|
||||
}
|
||||
|
||||
let start = hostname.startsWith('[') ? 1 : 0;
|
||||
let end = hostname.length;
|
||||
|
||||
if (hostname[end - 1] === ']') {
|
||||
end -= 1;
|
||||
}
|
||||
|
||||
// We only consider the maximum size of a normal IPV6. Note that this will
|
||||
// fail on so-called "IPv4 mapped IPv6 addresses" but this is a corner-case
|
||||
// and a proper validation library should be used for these.
|
||||
if (end - start > 39) {
|
||||
return false;
|
||||
}
|
||||
|
||||
let hasColon = false;
|
||||
|
||||
for (; start < end; start += 1) {
|
||||
const code = hostname.charCodeAt(start);
|
||||
|
||||
if (code === 58 /* ':' */) {
|
||||
hasColon = true;
|
||||
} else if (
|
||||
!(
|
||||
(
|
||||
(code >= 48 && code <= 57) || // 0-9
|
||||
(code >= 97 && code <= 102) || // a-f
|
||||
(code >= 65 && code <= 90)
|
||||
) // A-F
|
||||
)
|
||||
) {
|
||||
return false;
|
||||
}
|
||||
}
|
||||
|
||||
return hasColon;
|
||||
}
|
||||
|
||||
/**
|
||||
* Check if `hostname` is *probably* a valid ip addr (either ipv6 or ipv4).
|
||||
* This *will not* work on any string. We need `hostname` to be a valid
|
||||
* hostname.
|
||||
*/
|
||||
export default function isIp(hostname: string): boolean {
|
||||
return isProbablyIpv6(hostname) || isProbablyIpv4(hostname);
|
||||
}
|
||||
+79
@@ -0,0 +1,79 @@
|
||||
/**
|
||||
* Implements fast shallow verification of hostnames. This does not perform a
|
||||
* struct check on the content of labels (classes of Unicode characters, etc.)
|
||||
* but instead check that the structure is valid (number of labels, length of
|
||||
* labels, etc.).
|
||||
*
|
||||
* If you need stricter validation, consider using an external library.
|
||||
*/
|
||||
|
||||
function isValidAscii(code: number): boolean {
|
||||
return (
|
||||
(code >= 97 && code <= 122) || (code >= 48 && code <= 57) || code > 127
|
||||
);
|
||||
}
|
||||
|
||||
/**
|
||||
* Check if a hostname string is valid. It's usually a preliminary check before
|
||||
* trying to use getDomain or anything else.
|
||||
*
|
||||
* Beware: it does not check if the TLD exists.
|
||||
*/
|
||||
export default function (hostname: string): boolean {
|
||||
if (hostname.length > 255) {
|
||||
return false;
|
||||
}
|
||||
|
||||
if (hostname.length === 0) {
|
||||
return false;
|
||||
}
|
||||
|
||||
if (
|
||||
/*@__INLINE__*/ !isValidAscii(hostname.charCodeAt(0)) &&
|
||||
hostname.charCodeAt(0) !== 46 && // '.' (dot)
|
||||
hostname.charCodeAt(0) !== 95 // '_' (underscore)
|
||||
) {
|
||||
return false;
|
||||
}
|
||||
|
||||
// Validate hostname according to RFC
|
||||
let lastDotIndex = -1;
|
||||
let lastCharCode = -1;
|
||||
const len = hostname.length;
|
||||
|
||||
for (let i = 0; i < len; i += 1) {
|
||||
const code = hostname.charCodeAt(i);
|
||||
if (code === 46 /* '.' */) {
|
||||
if (
|
||||
// Check that previous label is < 63 bytes long (64 = 63 + '.')
|
||||
i - lastDotIndex > 64 ||
|
||||
// Check that previous character was not already a '.'
|
||||
lastCharCode === 46 ||
|
||||
// Check that the previous label does not end with a '-' (dash)
|
||||
lastCharCode === 45 ||
|
||||
// Check that the previous label does not end with a '_' (underscore)
|
||||
lastCharCode === 95
|
||||
) {
|
||||
return false;
|
||||
}
|
||||
|
||||
lastDotIndex = i;
|
||||
} else if (
|
||||
!(/*@__INLINE__*/ (isValidAscii(code) || code === 45 || code === 95))
|
||||
) {
|
||||
// Check if there is a forbidden character in the label
|
||||
return false;
|
||||
}
|
||||
|
||||
lastCharCode = code;
|
||||
}
|
||||
|
||||
return (
|
||||
// Check that last label is shorter than 63 chars
|
||||
len - lastDotIndex - 1 <= 63 &&
|
||||
// Check that the last character is an allowed trailing label character.
|
||||
// Since we already checked that the char is a valid hostname character,
|
||||
// we only need to check that it's different from '-'.
|
||||
lastCharCode !== 45
|
||||
);
|
||||
}
|
||||
+80
@@ -0,0 +1,80 @@
|
||||
import { IPublicSuffix, ISuffixLookupOptions } from './interface';
|
||||
|
||||
export default function (
|
||||
hostname: string,
|
||||
options: ISuffixLookupOptions,
|
||||
out: IPublicSuffix,
|
||||
): boolean {
|
||||
// Fast path for very popular suffixes; this allows to by-pass lookup
|
||||
// completely as well as any extra allocation or string manipulation.
|
||||
if (!options.allowPrivateDomains && hostname.length > 3) {
|
||||
const last: number = hostname.length - 1;
|
||||
const c3: number = hostname.charCodeAt(last);
|
||||
const c2: number = hostname.charCodeAt(last - 1);
|
||||
const c1: number = hostname.charCodeAt(last - 2);
|
||||
const c0: number = hostname.charCodeAt(last - 3);
|
||||
|
||||
if (
|
||||
c3 === 109 /* 'm' */ &&
|
||||
c2 === 111 /* 'o' */ &&
|
||||
c1 === 99 /* 'c' */ &&
|
||||
c0 === 46 /* '.' */
|
||||
) {
|
||||
out.isIcann = true;
|
||||
out.isPrivate = false;
|
||||
out.publicSuffix = 'com';
|
||||
return true;
|
||||
} else if (
|
||||
c3 === 103 /* 'g' */ &&
|
||||
c2 === 114 /* 'r' */ &&
|
||||
c1 === 111 /* 'o' */ &&
|
||||
c0 === 46 /* '.' */
|
||||
) {
|
||||
out.isIcann = true;
|
||||
out.isPrivate = false;
|
||||
out.publicSuffix = 'org';
|
||||
return true;
|
||||
} else if (
|
||||
c3 === 117 /* 'u' */ &&
|
||||
c2 === 100 /* 'd' */ &&
|
||||
c1 === 101 /* 'e' */ &&
|
||||
c0 === 46 /* '.' */
|
||||
) {
|
||||
out.isIcann = true;
|
||||
out.isPrivate = false;
|
||||
out.publicSuffix = 'edu';
|
||||
return true;
|
||||
} else if (
|
||||
c3 === 118 /* 'v' */ &&
|
||||
c2 === 111 /* 'o' */ &&
|
||||
c1 === 103 /* 'g' */ &&
|
||||
c0 === 46 /* '.' */
|
||||
) {
|
||||
out.isIcann = true;
|
||||
out.isPrivate = false;
|
||||
out.publicSuffix = 'gov';
|
||||
return true;
|
||||
} else if (
|
||||
c3 === 116 /* 't' */ &&
|
||||
c2 === 101 /* 'e' */ &&
|
||||
c1 === 110 /* 'n' */ &&
|
||||
c0 === 46 /* '.' */
|
||||
) {
|
||||
out.isIcann = true;
|
||||
out.isPrivate = false;
|
||||
out.publicSuffix = 'net';
|
||||
return true;
|
||||
} else if (
|
||||
c3 === 101 /* 'e' */ &&
|
||||
c2 === 100 /* 'd' */ &&
|
||||
c1 === 46 /* '.' */
|
||||
) {
|
||||
out.isIcann = true;
|
||||
out.isPrivate = false;
|
||||
out.publicSuffix = 'de';
|
||||
return true;
|
||||
}
|
||||
}
|
||||
|
||||
return false;
|
||||
}
|
||||
+10
@@ -0,0 +1,10 @@
|
||||
export interface IPublicSuffix {
|
||||
isIcann: boolean | null;
|
||||
isPrivate: boolean | null;
|
||||
publicSuffix: string | null;
|
||||
}
|
||||
|
||||
export interface ISuffixLookupOptions {
|
||||
allowIcannDomains: boolean;
|
||||
allowPrivateDomains: boolean;
|
||||
}
|
||||
+39
@@ -0,0 +1,39 @@
|
||||
export interface IOptions {
|
||||
allowIcannDomains: boolean;
|
||||
allowPrivateDomains: boolean;
|
||||
detectIp: boolean;
|
||||
extractHostname: boolean;
|
||||
mixedInputs: boolean;
|
||||
validHosts: string[] | null;
|
||||
validateHostname: boolean;
|
||||
}
|
||||
|
||||
function setDefaultsImpl({
|
||||
allowIcannDomains = true,
|
||||
allowPrivateDomains = false,
|
||||
detectIp = true,
|
||||
extractHostname = true,
|
||||
mixedInputs = true,
|
||||
validHosts = null,
|
||||
validateHostname = true,
|
||||
}: Partial<IOptions>): IOptions {
|
||||
return {
|
||||
allowIcannDomains,
|
||||
allowPrivateDomains,
|
||||
detectIp,
|
||||
extractHostname,
|
||||
mixedInputs,
|
||||
validHosts,
|
||||
validateHostname,
|
||||
};
|
||||
}
|
||||
|
||||
const DEFAULT_OPTIONS = /*@__INLINE__*/ setDefaultsImpl({});
|
||||
|
||||
export function setDefaults(options?: Partial<IOptions>): IOptions {
|
||||
if (options === undefined) {
|
||||
return DEFAULT_OPTIONS;
|
||||
}
|
||||
|
||||
return /*@__INLINE__*/ setDefaultsImpl(options);
|
||||
}
|
||||
+11
@@ -0,0 +1,11 @@
|
||||
/**
|
||||
* Returns the subdomain of a hostname string
|
||||
*/
|
||||
export default function getSubdomain(hostname: string, domain: string): string {
|
||||
// If `hostname` and `domain` are the same, then there is no sub-domain
|
||||
if (domain.length === hostname.length) {
|
||||
return '';
|
||||
}
|
||||
|
||||
return hostname.slice(0, -domain.length - 1);
|
||||
}
|
||||
+13
@@ -0,0 +1,13 @@
|
||||
Copyright (c) 2017 Thomas Parisot, 2018 Rémi Berson
|
||||
|
||||
Permission is hereby granted, free of charge, to any person obtaining a copy of this software and
|
||||
associated documentation files (the "Software"), to deal in the Software without restriction,
|
||||
including without limitation the rights to use, copy, modify, merge, publish, distribute, sublicense,
|
||||
and/or sell copies of the Software, and to permit persons to whom the Software is furnished to do so,
|
||||
subject to the following conditions:
|
||||
|
||||
The above copyright notice and this permission notice shall be included in all copies or substantial portions of the Software.
|
||||
|
||||
THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
|
||||
FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER LIABILITY,
|
||||
WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER DEALINGS IN THE SOFTWARE.
|
||||
+327
@@ -0,0 +1,327 @@
|
||||
# tldts - Blazing Fast URL Parsing
|
||||
|
||||
`tldts` is a JavaScript library to extract hostnames, domains, public suffixes, top-level domains and subdomains from URLs.
|
||||
|
||||
**Features**:
|
||||
|
||||
1. Tuned for **performance** (order of 0.1 to 1 μs per input)
|
||||
2. Handles both URLs and hostnames
|
||||
3. Full Unicode/IDNA support
|
||||
4. Support parsing email addresses
|
||||
5. Detect IPv4 and IPv6 addresses
|
||||
6. Continuously updated version of the public suffix list
|
||||
7. **TypeScript**, ships with `umd`, `esm`, `cjs` bundles and _type definitions_
|
||||
8. Small bundles and small memory footprint
|
||||
9. Battle tested: full test coverage and production use
|
||||
|
||||
# Install
|
||||
|
||||
```bash
|
||||
npm install --save tldts
|
||||
```
|
||||
|
||||
# Usage
|
||||
|
||||
Using the command-line interface:
|
||||
|
||||
```js
|
||||
$ npx tldts 'http://www.writethedocs.org/conf/eu/2017/'
|
||||
{
|
||||
"domain": "writethedocs.org",
|
||||
"domainWithoutSuffix": "writethedocs",
|
||||
"hostname": "www.writethedocs.org",
|
||||
"isIcann": true,
|
||||
"isIp": false,
|
||||
"isPrivate": false,
|
||||
"publicSuffix": "org",
|
||||
"subdomain": "www"
|
||||
}
|
||||
```
|
||||
|
||||
Programmatically:
|
||||
|
||||
```js
|
||||
const { parse } = require('tldts');
|
||||
|
||||
// Retrieving hostname related informations of a given URL
|
||||
parse('http://www.writethedocs.org/conf/eu/2017/');
|
||||
// { domain: 'writethedocs.org',
|
||||
// domainWithoutSuffix: 'writethedocs',
|
||||
// hostname: 'www.writethedocs.org',
|
||||
// isIcann: true,
|
||||
// isIp: false,
|
||||
// isPrivate: false,
|
||||
// publicSuffix: 'org',
|
||||
// subdomain: 'www' }
|
||||
```
|
||||
|
||||
Modern _ES6 modules import_ is also supported:
|
||||
|
||||
```js
|
||||
import { parse } from 'tldts';
|
||||
```
|
||||
|
||||
Alternatively, you can try it _directly in your browser_ here: https://npm.runkit.com/tldts
|
||||
|
||||
# API
|
||||
|
||||
- `tldts.parse(url | hostname, options)`
|
||||
- `tldts.getHostname(url | hostname, options)`
|
||||
- `tldts.getDomain(url | hostname, options)`
|
||||
- `tldts.getPublicSuffix(url | hostname, options)`
|
||||
- `tldts.getSubdomain(url, | hostname, options)`
|
||||
- `tldts.getDomainWithoutSuffix(url | hostname, options)`
|
||||
|
||||
The behavior of `tldts` can be customized using an `options` argument for all
|
||||
the functions exposed as part of the public API. This is useful to both change
|
||||
the behavior of the library as well as fine-tune the performance depending on
|
||||
your inputs.
|
||||
|
||||
```js
|
||||
{
|
||||
// Use suffixes from ICANN section (default: true)
|
||||
allowIcannDomains: boolean;
|
||||
// Use suffixes from Private section (default: false)
|
||||
allowPrivateDomains: boolean;
|
||||
// Extract and validate hostname (default: true)
|
||||
// When set to `false`, inputs will be considered valid hostnames.
|
||||
extractHostname: boolean;
|
||||
// Validate hostnames after parsing (default: true)
|
||||
// If a hostname is not valid, not further processing is performed. When set
|
||||
// to `false`, inputs to the library will be considered valid and parsing will
|
||||
// proceed regardless.
|
||||
validateHostname: boolean;
|
||||
// Perform IP address detection (default: true).
|
||||
detectIp: boolean;
|
||||
// Assume that both URLs and hostnames can be given as input (default: true)
|
||||
// If set to `false` we assume only URLs will be given as input, which
|
||||
// speed-ups processing.
|
||||
mixedInputs: boolean;
|
||||
// Specifies extra valid suffixes (default: null)
|
||||
validHosts: string[] | null;
|
||||
}
|
||||
```
|
||||
|
||||
The `parse` method returns handy **properties about a URL or a hostname**.
|
||||
|
||||
```js
|
||||
const tldts = require('tldts');
|
||||
|
||||
tldts.parse('https://spark-public.s3.amazonaws.com/dataanalysis/loansData.csv');
|
||||
// { domain: 'amazonaws.com',
|
||||
// domainWithoutSuffix: 'amazonaws',
|
||||
// hostname: 'spark-public.s3.amazonaws.com',
|
||||
// isIcann: true,
|
||||
// isIp: false,
|
||||
// isPrivate: false,
|
||||
// publicSuffix: 'com',
|
||||
// subdomain: 'spark-public.s3' }
|
||||
|
||||
tldts.parse(
|
||||
'https://spark-public.s3.amazonaws.com/dataanalysis/loansData.csv',
|
||||
{ allowPrivateDomains: true },
|
||||
);
|
||||
// { domain: 'spark-public.s3.amazonaws.com',
|
||||
// domainWithoutSuffix: 'spark-public',
|
||||
// hostname: 'spark-public.s3.amazonaws.com',
|
||||
// isIcann: false,
|
||||
// isIp: false,
|
||||
// isPrivate: true,
|
||||
// publicSuffix: 's3.amazonaws.com',
|
||||
// subdomain: '' }
|
||||
|
||||
tldts.parse('gopher://domain.unknown/');
|
||||
// { domain: 'domain.unknown',
|
||||
// domainWithoutSuffix: 'domain',
|
||||
// hostname: 'domain.unknown',
|
||||
// isIcann: false,
|
||||
// isIp: false,
|
||||
// isPrivate: false,
|
||||
// publicSuffix: 'unknown',
|
||||
// subdomain: '' }
|
||||
|
||||
tldts.parse('https://192.168.0.0'); // IPv4
|
||||
// { domain: null,
|
||||
// domainWithoutSuffix: null,
|
||||
// hostname: '192.168.0.0',
|
||||
// isIcann: null,
|
||||
// isIp: true,
|
||||
// isPrivate: null,
|
||||
// publicSuffix: null,
|
||||
// subdomain: null }
|
||||
|
||||
tldts.parse('https://[::1]'); // IPv6
|
||||
// { domain: null,
|
||||
// domainWithoutSuffix: null,
|
||||
// hostname: '::1',
|
||||
// isIcann: null,
|
||||
// isIp: true,
|
||||
// isPrivate: null,
|
||||
// publicSuffix: null,
|
||||
// subdomain: null }
|
||||
|
||||
tldts.parse('tldts@emailprovider.co.uk'); // email
|
||||
// { domain: 'emailprovider.co.uk',
|
||||
// domainWithoutSuffix: 'emailprovider',
|
||||
// hostname: 'emailprovider.co.uk',
|
||||
// isIcann: true,
|
||||
// isIp: false,
|
||||
// isPrivate: false,
|
||||
// publicSuffix: 'co.uk',
|
||||
// subdomain: '' }
|
||||
```
|
||||
|
||||
| Property Name | Type | Description |
|
||||
| :-------------------- | :----- | :---------------------------------------------- |
|
||||
| `hostname` | `str` | `hostname` of the input extracted automatically |
|
||||
| `domain` | `str` | Domain (tld + sld) |
|
||||
| `domainWithoutSuffix` | `str` | Domain without public suffix |
|
||||
| `subdomain` | `str` | Sub domain (what comes after `domain`) |
|
||||
| `publicSuffix` | `str` | Public Suffix (tld) of `hostname` |
|
||||
| `isIcann` | `bool` | Does TLD come from ICANN part of the list |
|
||||
| `isPrivate` | `bool` | Does TLD come from Private part of the list |
|
||||
| `isIP` | `bool` | Is `hostname` an IP address? |
|
||||
|
||||
## Single purpose methods
|
||||
|
||||
These methods are shorthands if you want to retrieve only a single value (and
|
||||
will perform better than `parse` because less work will be needed).
|
||||
|
||||
### getHostname(url | hostname, options?)
|
||||
|
||||
Returns the hostname from a given string.
|
||||
|
||||
```javascript
|
||||
const { getHostname } = require('tldts');
|
||||
|
||||
getHostname('google.com'); // returns `google.com`
|
||||
getHostname('fr.google.com'); // returns `fr.google.com`
|
||||
getHostname('fr.google.google'); // returns `fr.google.google`
|
||||
getHostname('foo.google.co.uk'); // returns `foo.google.co.uk`
|
||||
getHostname('t.co'); // returns `t.co`
|
||||
getHostname('fr.t.co'); // returns `fr.t.co`
|
||||
getHostname(
|
||||
'https://user:password@example.co.uk:8080/some/path?and&query#hash',
|
||||
); // returns `example.co.uk`
|
||||
```
|
||||
|
||||
### getDomain(url | hostname, options?)
|
||||
|
||||
Returns the fully qualified domain from a given string.
|
||||
|
||||
```javascript
|
||||
const { getDomain } = require('tldts');
|
||||
|
||||
getDomain('google.com'); // returns `google.com`
|
||||
getDomain('fr.google.com'); // returns `google.com`
|
||||
getDomain('fr.google.google'); // returns `google.google`
|
||||
getDomain('foo.google.co.uk'); // returns `google.co.uk`
|
||||
getDomain('t.co'); // returns `t.co`
|
||||
getDomain('fr.t.co'); // returns `t.co`
|
||||
getDomain('https://user:password@example.co.uk:8080/some/path?and&query#hash'); // returns `example.co.uk`
|
||||
```
|
||||
|
||||
### getDomainWithoutSuffix(url | hostname, options?)
|
||||
|
||||
Returns the domain (as returned by `getDomain(...)`) without the public suffix part.
|
||||
|
||||
```javascript
|
||||
const { getDomainWithoutSuffix } = require('tldts');
|
||||
|
||||
getDomainWithoutSuffix('google.com'); // returns `google`
|
||||
getDomainWithoutSuffix('fr.google.com'); // returns `google`
|
||||
getDomainWithoutSuffix('fr.google.google'); // returns `google`
|
||||
getDomainWithoutSuffix('foo.google.co.uk'); // returns `google`
|
||||
getDomainWithoutSuffix('t.co'); // returns `t`
|
||||
getDomainWithoutSuffix('fr.t.co'); // returns `t`
|
||||
getDomainWithoutSuffix(
|
||||
'https://user:password@example.co.uk:8080/some/path?and&query#hash',
|
||||
); // returns `example`
|
||||
```
|
||||
|
||||
### getSubdomain(url | hostname, options?)
|
||||
|
||||
Returns the complete subdomain for a given string.
|
||||
|
||||
```javascript
|
||||
const { getSubdomain } = require('tldts');
|
||||
|
||||
getSubdomain('google.com'); // returns ``
|
||||
getSubdomain('fr.google.com'); // returns `fr`
|
||||
getSubdomain('google.co.uk'); // returns ``
|
||||
getSubdomain('foo.google.co.uk'); // returns `foo`
|
||||
getSubdomain('moar.foo.google.co.uk'); // returns `moar.foo`
|
||||
getSubdomain('t.co'); // returns ``
|
||||
getSubdomain('fr.t.co'); // returns `fr`
|
||||
getSubdomain(
|
||||
'https://user:password@secure.example.co.uk:443/some/path?and&query#hash',
|
||||
); // returns `secure`
|
||||
```
|
||||
|
||||
### getPublicSuffix(url | hostname, options?)
|
||||
|
||||
Returns the [public suffix][] for a given string.
|
||||
|
||||
```javascript
|
||||
const { getPublicSuffix } = require('tldts');
|
||||
|
||||
getPublicSuffix('google.com'); // returns `com`
|
||||
getPublicSuffix('fr.google.com'); // returns `com`
|
||||
getPublicSuffix('google.co.uk'); // returns `co.uk`
|
||||
getPublicSuffix('s3.amazonaws.com'); // returns `com`
|
||||
getPublicSuffix('s3.amazonaws.com', { allowPrivateDomains: true }); // returns `s3.amazonaws.com`
|
||||
getPublicSuffix('tld.is.unknown'); // returns `unknown`
|
||||
```
|
||||
|
||||
# Troubleshooting
|
||||
|
||||
## Retrieving subdomain of `localhost` and custom hostnames
|
||||
|
||||
`tldts` methods `getDomain` and `getSubdomain` are designed to **work only with _known and valid_ TLDs**.
|
||||
This way, you can trust what a domain is.
|
||||
|
||||
`localhost` is a valid hostname but not a TLD. You can pass additional options to each method exposed by `tldts`:
|
||||
|
||||
```js
|
||||
const tldts = require('tldts');
|
||||
|
||||
tldts.getDomain('localhost'); // returns null
|
||||
tldts.getSubdomain('vhost.localhost'); // returns null
|
||||
|
||||
tldts.getDomain('localhost', { validHosts: ['localhost'] }); // returns 'localhost'
|
||||
tldts.getSubdomain('vhost.localhost', { validHosts: ['localhost'] }); // returns 'vhost'
|
||||
```
|
||||
|
||||
## Updating the TLDs List
|
||||
|
||||
`tldts` made the opinionated choice of shipping with a list of suffixes directly
|
||||
in its bundle. There is currently no mechanism to update the lists yourself, but
|
||||
we make sure that the version shipped is always up-to-date.
|
||||
|
||||
If you keep `tldts` updated, the lists should be up-to-date as well!
|
||||
|
||||
# Performance
|
||||
|
||||
`tldts` is the _fastest JavaScript library_ available for parsing hostnames. It is able to parse _millions of inputs per second_ (typically 2-3M depending on your hardware and inputs). It also offers granular options to fine-tune the behavior and performance of the library depending on the kind of inputs you are dealing with (e.g.: if you know you only manipulate valid hostnames you can disable the hostname extraction step with `{ extractHostname: false }`).
|
||||
|
||||
Please see [this detailed comparison](./comparison/comparison.md) with other available libraries.
|
||||
|
||||
## Contributors
|
||||
|
||||
`tldts` is based upon the excellent `tld.js` library and would not exist without
|
||||
the many contributors who worked on the project:
|
||||
<a href="graphs/contributors"><img src="https://opencollective.com/tldjs/contributors.svg?width=890" /></a>
|
||||
|
||||
This project would not be possible without the amazing Mozilla's
|
||||
[public suffix list][]. Thank you for your hard work!
|
||||
|
||||
# License
|
||||
|
||||
[MIT License](LICENSE).
|
||||
|
||||
[badge-ci]: https://secure.travis-ci.org/remusao/tldts.svg?branch=master
|
||||
[badge-downloads]: https://img.shields.io/npm/dm/tldts.svg
|
||||
[public suffix list]: https://publicsuffix.org/list/
|
||||
[list the recent changes]: https://github.com/publicsuffix/list/commits/master
|
||||
[changes Atom Feed]: https://github.com/publicsuffix/list/commits/master.atom
|
||||
[public suffix]: https://publicsuffix.org/learn/
|
||||
+21
@@ -0,0 +1,21 @@
|
||||
#!/usr/bin/env node
|
||||
|
||||
'use strict';
|
||||
|
||||
const { parse } = require('..');
|
||||
const readline = require('readline');
|
||||
|
||||
if (process.argv.length > 2) {
|
||||
// URL(s) was specified in the command arguments
|
||||
console.log(
|
||||
JSON.stringify(parse(process.argv[process.argv.length - 1]), null, 2),
|
||||
);
|
||||
} else {
|
||||
// No arguments were specified, read URLs from each line of STDIN
|
||||
const rlInterface = readline.createInterface({
|
||||
input: process.stdin,
|
||||
});
|
||||
rlInterface.on('line', function (line) {
|
||||
console.log(JSON.stringify(parse(line), null, 2));
|
||||
});
|
||||
}
|
||||
+669
File diff suppressed because one or more lines are too long
+1
File diff suppressed because one or more lines are too long
+14
File diff suppressed because one or more lines are too long
+1
File diff suppressed because one or more lines are too long
+67
@@ -0,0 +1,67 @@
|
||||
"use strict";
|
||||
Object.defineProperty(exports, "__esModule", { value: true });
|
||||
exports.default = suffixLookup;
|
||||
const tldts_core_1 = require("tldts-core");
|
||||
const trie_1 = require("./data/trie");
|
||||
/**
|
||||
* Lookup parts of domain in Trie
|
||||
*/
|
||||
function lookupInTrie(parts, trie, index, allowedMask) {
|
||||
let result = null;
|
||||
let node = trie;
|
||||
while (node !== undefined) {
|
||||
// We have a match!
|
||||
if ((node[0] & allowedMask) !== 0) {
|
||||
result = {
|
||||
index: index + 1,
|
||||
isIcann: node[0] === 1 /* RULE_TYPE.ICANN */,
|
||||
isPrivate: node[0] === 2 /* RULE_TYPE.PRIVATE */,
|
||||
};
|
||||
}
|
||||
// No more `parts` to look for
|
||||
if (index === -1) {
|
||||
break;
|
||||
}
|
||||
const succ = node[1];
|
||||
node = Object.prototype.hasOwnProperty.call(succ, parts[index])
|
||||
? succ[parts[index]]
|
||||
: succ['*'];
|
||||
index -= 1;
|
||||
}
|
||||
return result;
|
||||
}
|
||||
/**
|
||||
* Check if `hostname` has a valid public suffix in `trie`.
|
||||
*/
|
||||
function suffixLookup(hostname, options, out) {
|
||||
var _a;
|
||||
if ((0, tldts_core_1.fastPathLookup)(hostname, options, out)) {
|
||||
return;
|
||||
}
|
||||
const hostnameParts = hostname.split('.');
|
||||
const allowedMask = (options.allowPrivateDomains ? 2 /* RULE_TYPE.PRIVATE */ : 0) |
|
||||
(options.allowIcannDomains ? 1 /* RULE_TYPE.ICANN */ : 0);
|
||||
// Look for exceptions
|
||||
const exceptionMatch = lookupInTrie(hostnameParts, trie_1.exceptions, hostnameParts.length - 1, allowedMask);
|
||||
if (exceptionMatch !== null) {
|
||||
out.isIcann = exceptionMatch.isIcann;
|
||||
out.isPrivate = exceptionMatch.isPrivate;
|
||||
out.publicSuffix = hostnameParts.slice(exceptionMatch.index + 1).join('.');
|
||||
return;
|
||||
}
|
||||
// Look for a match in rules
|
||||
const rulesMatch = lookupInTrie(hostnameParts, trie_1.rules, hostnameParts.length - 1, allowedMask);
|
||||
if (rulesMatch !== null) {
|
||||
out.isIcann = rulesMatch.isIcann;
|
||||
out.isPrivate = rulesMatch.isPrivate;
|
||||
out.publicSuffix = hostnameParts.slice(rulesMatch.index).join('.');
|
||||
return;
|
||||
}
|
||||
// No match found...
|
||||
// Prevailing rule is '*' so we consider the top-level domain to be the
|
||||
// public suffix of `hostname` (e.g.: 'example.org' => 'org').
|
||||
out.isIcann = false;
|
||||
out.isPrivate = false;
|
||||
out.publicSuffix = (_a = hostnameParts[hostnameParts.length - 1]) !== null && _a !== void 0 ? _a : null;
|
||||
}
|
||||
//# sourceMappingURL=suffix-trie.js.map
|
||||
+1
@@ -0,0 +1 @@
|
||||
{"version":3,"file":"suffix-trie.js","sourceRoot":"","sources":["../../../src/suffix-trie.ts"],"names":[],"mappings":";;AA0DA,+BAmDC;AA7GD,2CAIoB;AACpB,sCAAuD;AAcvD;;GAEG;AACH,SAAS,YAAY,CACnB,KAAe,EACf,IAAW,EACX,KAAa,EACb,WAAmB;IAEnB,IAAI,MAAM,GAAkB,IAAI,CAAC;IACjC,IAAI,IAAI,GAAsB,IAAI,CAAC;IACnC,OAAO,IAAI,KAAK,SAAS,EAAE,CAAC;QAC1B,mBAAmB;QACnB,IAAI,CAAC,IAAI,CAAC,CAAC,CAAC,GAAG,WAAW,CAAC,KAAK,CAAC,EAAE,CAAC;YAClC,MAAM,GAAG;gBACP,KAAK,EAAE,KAAK,GAAG,CAAC;gBAChB,OAAO,EAAE,IAAI,CAAC,CAAC,CAAC,4BAAoB;gBACpC,SAAS,EAAE,IAAI,CAAC,CAAC,CAAC,8BAAsB;aACzC,CAAC;QACJ,CAAC;QAED,8BAA8B;QAC9B,IAAI,KAAK,KAAK,CAAC,CAAC,EAAE,CAAC;YACjB,MAAM;QACR,CAAC;QAED,MAAM,IAAI,GAA+B,IAAI,CAAC,CAAC,CAAC,CAAC;QACjD,IAAI,GAAG,MAAM,CAAC,SAAS,CAAC,cAAc,CAAC,IAAI,CAAC,IAAI,EAAE,KAAK,CAAC,KAAK,CAAE,CAAC;YAC9D,CAAC,CAAC,IAAI,CAAC,KAAK,CAAC,KAAK,CAAE,CAAC;YACrB,CAAC,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC;QACd,KAAK,IAAI,CAAC,CAAC;IACb,CAAC;IAED,OAAO,MAAM,CAAC;AAChB,CAAC;AAED;;GAEG;AACH,SAAwB,YAAY,CAClC,QAAgB,EAChB,OAA6B,EAC7B,GAAkB;;IAElB,IAAI,IAAA,2BAAc,EAAC,QAAQ,EAAE,OAAO,EAAE,GAAG,CAAC,EAAE,CAAC;QAC3C,OAAO;IACT,CAAC;IAED,MAAM,aAAa,GAAG,QAAQ,CAAC,KAAK,CAAC,GAAG,CAAC,CAAC;IAE1C,MAAM,WAAW,GACf,CAAC,OAAO,CAAC,mBAAmB,CAAC,CAAC,2BAAmB,CAAC,CAAC,CAAC,CAAC;QACrD,CAAC,OAAO,CAAC,iBAAiB,CAAC,CAAC,yBAAiB,CAAC,CAAC,CAAC,CAAC,CAAC;IAEpD,sBAAsB;IACtB,MAAM,cAAc,GAAG,YAAY,CACjC,aAAa,EACb,iBAAU,EACV,aAAa,CAAC,MAAM,GAAG,CAAC,EACxB,WAAW,CACZ,CAAC;IAEF,IAAI,cAAc,KAAK,IAAI,EAAE,CAAC;QAC5B,GAAG,CAAC,OAAO,GAAG,cAAc,CAAC,OAAO,CAAC;QACrC,GAAG,CAAC,SAAS,GAAG,cAAc,CAAC,SAAS,CAAC;QACzC,GAAG,CAAC,YAAY,GAAG,aAAa,CAAC,KAAK,CAAC,cAAc,CAAC,KAAK,GAAG,CAAC,CAAC,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC;QAC3E,OAAO;IACT,CAAC;IAED,4BAA4B;IAC5B,MAAM,UAAU,GAAG,YAAY,CAC7B,aAAa,EACb,YAAK,EACL,aAAa,CAAC,MAAM,GAAG,CAAC,EACxB,WAAW,CACZ,CAAC;IAEF,IAAI,UAAU,KAAK,IAAI,EAAE,CAAC;QACxB,GAAG,CAAC,OAAO,GAAG,UAAU,CAAC,OAAO,CAAC;QACjC,GAAG,CAAC,SAAS,GAAG,UAAU,CAAC,SAAS,CAAC;QACrC,GAAG,CAAC,YAAY,GAAG,aAAa,CAAC,KAAK,CAAC,UAAU,CAAC,KAAK,CAAC,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC;QACnE,OAAO;IACT,CAAC;IAED,oBAAoB;IACpB,uEAAuE;IACvE,8DAA8D;IAC9D,GAAG,CAAC,OAAO,GAAG,KAAK,CAAC;IACpB,GAAG,CAAC,SAAS,GAAG,KAAK,CAAC;IACtB,GAAG,CAAC,YAAY,GAAG,MAAA,aAAa,CAAC,aAAa,CAAC,MAAM,GAAG,CAAC,CAAC,mCAAI,IAAI,CAAC;AACrE,CAAC"}
|
||||
+1
File diff suppressed because one or more lines are too long
+33
@@ -0,0 +1,33 @@
|
||||
import { getEmptyResult, parseImpl, resetResult, } from 'tldts-core';
|
||||
import suffixLookup from './src/suffix-trie';
|
||||
// For all methods but 'parse', it does not make sense to allocate an object
|
||||
// every single time to only return the value of a specific attribute. To avoid
|
||||
// this un-necessary allocation, we use a global object which is re-used.
|
||||
const RESULT = getEmptyResult();
|
||||
export function parse(url, options = {}) {
|
||||
return parseImpl(url, 5 /* FLAG.ALL */, suffixLookup, options, getEmptyResult());
|
||||
}
|
||||
export function getHostname(url, options = {}) {
|
||||
/*@__INLINE__*/ resetResult(RESULT);
|
||||
return parseImpl(url, 0 /* FLAG.HOSTNAME */, suffixLookup, options, RESULT).hostname;
|
||||
}
|
||||
export function getPublicSuffix(url, options = {}) {
|
||||
/*@__INLINE__*/ resetResult(RESULT);
|
||||
return parseImpl(url, 2 /* FLAG.PUBLIC_SUFFIX */, suffixLookup, options, RESULT)
|
||||
.publicSuffix;
|
||||
}
|
||||
export function getDomain(url, options = {}) {
|
||||
/*@__INLINE__*/ resetResult(RESULT);
|
||||
return parseImpl(url, 3 /* FLAG.DOMAIN */, suffixLookup, options, RESULT).domain;
|
||||
}
|
||||
export function getSubdomain(url, options = {}) {
|
||||
/*@__INLINE__*/ resetResult(RESULT);
|
||||
return parseImpl(url, 4 /* FLAG.SUB_DOMAIN */, suffixLookup, options, RESULT)
|
||||
.subdomain;
|
||||
}
|
||||
export function getDomainWithoutSuffix(url, options = {}) {
|
||||
/*@__INLINE__*/ resetResult(RESULT);
|
||||
return parseImpl(url, 5 /* FLAG.ALL */, suffixLookup, options, RESULT)
|
||||
.domainWithoutSuffix;
|
||||
}
|
||||
//# sourceMappingURL=index.js.map
|
||||
+1
@@ -0,0 +1 @@
|
||||
{"version":3,"file":"index.js","sourceRoot":"","sources":["../../index.ts"],"names":[],"mappings":"AAAA,OAAO,EAEL,cAAc,EAGd,SAAS,EACT,WAAW,GACZ,MAAM,YAAY,CAAC;AAEpB,OAAO,YAAY,MAAM,mBAAmB,CAAC;AAE7C,4EAA4E;AAC5E,+EAA+E;AAC/E,yEAAyE;AACzE,MAAM,MAAM,GAAY,cAAc,EAAE,CAAC;AAEzC,MAAM,UAAU,KAAK,CAAC,GAAW,EAAE,UAA6B,EAAE;IAChE,OAAO,SAAS,CAAC,GAAG,oBAAY,YAAY,EAAE,OAAO,EAAE,cAAc,EAAE,CAAC,CAAC;AAC3E,CAAC;AAED,MAAM,UAAU,WAAW,CACzB,GAAW,EACX,UAA6B,EAAE;IAE/B,eAAe,CAAC,WAAW,CAAC,MAAM,CAAC,CAAC;IACpC,OAAO,SAAS,CAAC,GAAG,yBAAiB,YAAY,EAAE,OAAO,EAAE,MAAM,CAAC,CAAC,QAAQ,CAAC;AAC/E,CAAC;AAED,MAAM,UAAU,eAAe,CAC7B,GAAW,EACX,UAA6B,EAAE;IAE/B,eAAe,CAAC,WAAW,CAAC,MAAM,CAAC,CAAC;IACpC,OAAO,SAAS,CAAC,GAAG,8BAAsB,YAAY,EAAE,OAAO,EAAE,MAAM,CAAC;SACrE,YAAY,CAAC;AAClB,CAAC;AAED,MAAM,UAAU,SAAS,CACvB,GAAW,EACX,UAA6B,EAAE;IAE/B,eAAe,CAAC,WAAW,CAAC,MAAM,CAAC,CAAC;IACpC,OAAO,SAAS,CAAC,GAAG,uBAAe,YAAY,EAAE,OAAO,EAAE,MAAM,CAAC,CAAC,MAAM,CAAC;AAC3E,CAAC;AAED,MAAM,UAAU,YAAY,CAC1B,GAAW,EACX,UAA6B,EAAE;IAE/B,eAAe,CAAC,WAAW,CAAC,MAAM,CAAC,CAAC;IACpC,OAAO,SAAS,CAAC,GAAG,2BAAmB,YAAY,EAAE,OAAO,EAAE,MAAM,CAAC;SAClE,SAAS,CAAC;AACf,CAAC;AAED,MAAM,UAAU,sBAAsB,CACpC,GAAW,EACX,UAA6B,EAAE;IAE/B,eAAe,CAAC,WAAW,CAAC,MAAM,CAAC,CAAC;IACpC,OAAO,SAAS,CAAC,GAAG,oBAAY,YAAY,EAAE,OAAO,EAAE,MAAM,CAAC;SAC3D,mBAAmB,CAAC;AACzB,CAAC"}
|
||||
+11
File diff suppressed because one or more lines are too long
+1
File diff suppressed because one or more lines are too long
+64
@@ -0,0 +1,64 @@
|
||||
import { fastPathLookup, } from 'tldts-core';
|
||||
import { exceptions, rules } from './data/trie';
|
||||
/**
|
||||
* Lookup parts of domain in Trie
|
||||
*/
|
||||
function lookupInTrie(parts, trie, index, allowedMask) {
|
||||
let result = null;
|
||||
let node = trie;
|
||||
while (node !== undefined) {
|
||||
// We have a match!
|
||||
if ((node[0] & allowedMask) !== 0) {
|
||||
result = {
|
||||
index: index + 1,
|
||||
isIcann: node[0] === 1 /* RULE_TYPE.ICANN */,
|
||||
isPrivate: node[0] === 2 /* RULE_TYPE.PRIVATE */,
|
||||
};
|
||||
}
|
||||
// No more `parts` to look for
|
||||
if (index === -1) {
|
||||
break;
|
||||
}
|
||||
const succ = node[1];
|
||||
node = Object.prototype.hasOwnProperty.call(succ, parts[index])
|
||||
? succ[parts[index]]
|
||||
: succ['*'];
|
||||
index -= 1;
|
||||
}
|
||||
return result;
|
||||
}
|
||||
/**
|
||||
* Check if `hostname` has a valid public suffix in `trie`.
|
||||
*/
|
||||
export default function suffixLookup(hostname, options, out) {
|
||||
var _a;
|
||||
if (fastPathLookup(hostname, options, out)) {
|
||||
return;
|
||||
}
|
||||
const hostnameParts = hostname.split('.');
|
||||
const allowedMask = (options.allowPrivateDomains ? 2 /* RULE_TYPE.PRIVATE */ : 0) |
|
||||
(options.allowIcannDomains ? 1 /* RULE_TYPE.ICANN */ : 0);
|
||||
// Look for exceptions
|
||||
const exceptionMatch = lookupInTrie(hostnameParts, exceptions, hostnameParts.length - 1, allowedMask);
|
||||
if (exceptionMatch !== null) {
|
||||
out.isIcann = exceptionMatch.isIcann;
|
||||
out.isPrivate = exceptionMatch.isPrivate;
|
||||
out.publicSuffix = hostnameParts.slice(exceptionMatch.index + 1).join('.');
|
||||
return;
|
||||
}
|
||||
// Look for a match in rules
|
||||
const rulesMatch = lookupInTrie(hostnameParts, rules, hostnameParts.length - 1, allowedMask);
|
||||
if (rulesMatch !== null) {
|
||||
out.isIcann = rulesMatch.isIcann;
|
||||
out.isPrivate = rulesMatch.isPrivate;
|
||||
out.publicSuffix = hostnameParts.slice(rulesMatch.index).join('.');
|
||||
return;
|
||||
}
|
||||
// No match found...
|
||||
// Prevailing rule is '*' so we consider the top-level domain to be the
|
||||
// public suffix of `hostname` (e.g.: 'example.org' => 'org').
|
||||
out.isIcann = false;
|
||||
out.isPrivate = false;
|
||||
out.publicSuffix = (_a = hostnameParts[hostnameParts.length - 1]) !== null && _a !== void 0 ? _a : null;
|
||||
}
|
||||
//# sourceMappingURL=suffix-trie.js.map
|
||||
+1
@@ -0,0 +1 @@
|
||||
{"version":3,"file":"suffix-trie.js","sourceRoot":"","sources":["../../../src/suffix-trie.ts"],"names":[],"mappings":"AAAA,OAAO,EACL,cAAc,GAGf,MAAM,YAAY,CAAC;AACpB,OAAO,EAAE,UAAU,EAAS,KAAK,EAAE,MAAM,aAAa,CAAC;AAcvD;;GAEG;AACH,SAAS,YAAY,CACnB,KAAe,EACf,IAAW,EACX,KAAa,EACb,WAAmB;IAEnB,IAAI,MAAM,GAAkB,IAAI,CAAC;IACjC,IAAI,IAAI,GAAsB,IAAI,CAAC;IACnC,OAAO,IAAI,KAAK,SAAS,EAAE,CAAC;QAC1B,mBAAmB;QACnB,IAAI,CAAC,IAAI,CAAC,CAAC,CAAC,GAAG,WAAW,CAAC,KAAK,CAAC,EAAE,CAAC;YAClC,MAAM,GAAG;gBACP,KAAK,EAAE,KAAK,GAAG,CAAC;gBAChB,OAAO,EAAE,IAAI,CAAC,CAAC,CAAC,4BAAoB;gBACpC,SAAS,EAAE,IAAI,CAAC,CAAC,CAAC,8BAAsB;aACzC,CAAC;QACJ,CAAC;QAED,8BAA8B;QAC9B,IAAI,KAAK,KAAK,CAAC,CAAC,EAAE,CAAC;YACjB,MAAM;QACR,CAAC;QAED,MAAM,IAAI,GAA+B,IAAI,CAAC,CAAC,CAAC,CAAC;QACjD,IAAI,GAAG,MAAM,CAAC,SAAS,CAAC,cAAc,CAAC,IAAI,CAAC,IAAI,EAAE,KAAK,CAAC,KAAK,CAAE,CAAC;YAC9D,CAAC,CAAC,IAAI,CAAC,KAAK,CAAC,KAAK,CAAE,CAAC;YACrB,CAAC,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC;QACd,KAAK,IAAI,CAAC,CAAC;IACb,CAAC;IAED,OAAO,MAAM,CAAC;AAChB,CAAC;AAED;;GAEG;AACH,MAAM,CAAC,OAAO,UAAU,YAAY,CAClC,QAAgB,EAChB,OAA6B,EAC7B,GAAkB;;IAElB,IAAI,cAAc,CAAC,QAAQ,EAAE,OAAO,EAAE,GAAG,CAAC,EAAE,CAAC;QAC3C,OAAO;IACT,CAAC;IAED,MAAM,aAAa,GAAG,QAAQ,CAAC,KAAK,CAAC,GAAG,CAAC,CAAC;IAE1C,MAAM,WAAW,GACf,CAAC,OAAO,CAAC,mBAAmB,CAAC,CAAC,2BAAmB,CAAC,CAAC,CAAC,CAAC;QACrD,CAAC,OAAO,CAAC,iBAAiB,CAAC,CAAC,yBAAiB,CAAC,CAAC,CAAC,CAAC,CAAC;IAEpD,sBAAsB;IACtB,MAAM,cAAc,GAAG,YAAY,CACjC,aAAa,EACb,UAAU,EACV,aAAa,CAAC,MAAM,GAAG,CAAC,EACxB,WAAW,CACZ,CAAC;IAEF,IAAI,cAAc,KAAK,IAAI,EAAE,CAAC;QAC5B,GAAG,CAAC,OAAO,GAAG,cAAc,CAAC,OAAO,CAAC;QACrC,GAAG,CAAC,SAAS,GAAG,cAAc,CAAC,SAAS,CAAC;QACzC,GAAG,CAAC,YAAY,GAAG,aAAa,CAAC,KAAK,CAAC,cAAc,CAAC,KAAK,GAAG,CAAC,CAAC,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC;QAC3E,OAAO;IACT,CAAC;IAED,4BAA4B;IAC5B,MAAM,UAAU,GAAG,YAAY,CAC7B,aAAa,EACb,KAAK,EACL,aAAa,CAAC,MAAM,GAAG,CAAC,EACxB,WAAW,CACZ,CAAC;IAEF,IAAI,UAAU,KAAK,IAAI,EAAE,CAAC;QACxB,GAAG,CAAC,OAAO,GAAG,UAAU,CAAC,OAAO,CAAC;QACjC,GAAG,CAAC,SAAS,GAAG,UAAU,CAAC,SAAS,CAAC;QACrC,GAAG,CAAC,YAAY,GAAG,aAAa,CAAC,KAAK,CAAC,UAAU,CAAC,KAAK,CAAC,CAAC,IAAI,CAAC,GAAG,CAAC,CAAC;QACnE,OAAO;IACT,CAAC;IAED,oBAAoB;IACpB,uEAAuE;IACvE,8DAA8D;IAC9D,GAAG,CAAC,OAAO,GAAG,KAAK,CAAC;IACpB,GAAG,CAAC,SAAS,GAAG,KAAK,CAAC;IACtB,GAAG,CAAC,YAAY,GAAG,MAAA,aAAa,CAAC,aAAa,CAAC,MAAM,GAAG,CAAC,CAAC,mCAAI,IAAI,CAAC;AACrE,CAAC"}
|
||||
+1
File diff suppressed because one or more lines are too long
+2
File diff suppressed because one or more lines are too long
+1
File diff suppressed because one or more lines are too long
+2
File diff suppressed because one or more lines are too long
+1
File diff suppressed because one or more lines are too long
+2
File diff suppressed because one or more lines are too long
+1
File diff suppressed because one or more lines are too long
+7
@@ -0,0 +1,7 @@
|
||||
import { IOptions, IResult } from 'tldts-core';
|
||||
export declare function parse(url: string, options?: Partial<IOptions>): IResult;
|
||||
export declare function getHostname(url: string, options?: Partial<IOptions>): string | null;
|
||||
export declare function getPublicSuffix(url: string, options?: Partial<IOptions>): string | null;
|
||||
export declare function getDomain(url: string, options?: Partial<IOptions>): string | null;
|
||||
export declare function getSubdomain(url: string, options?: Partial<IOptions>): string | null;
|
||||
export declare function getDomainWithoutSuffix(url: string, options?: Partial<IOptions>): string | null;
|
||||
+5
@@ -0,0 +1,5 @@
|
||||
export type ITrie = [0 | 1 | 2, {
|
||||
[label: string]: ITrie;
|
||||
}];
|
||||
export declare const exceptions: ITrie;
|
||||
export declare const rules: ITrie;
|
||||
+5
@@ -0,0 +1,5 @@
|
||||
import { IPublicSuffix, ISuffixLookupOptions } from 'tldts-core';
|
||||
/**
|
||||
* Check if `hostname` has a valid public suffix in `trie`.
|
||||
*/
|
||||
export default function suffixLookup(hostname: string, options: ISuffixLookupOptions, out: IPublicSuffix): void;
|
||||
+62
@@ -0,0 +1,62 @@
|
||||
import {
|
||||
FLAG,
|
||||
getEmptyResult,
|
||||
IOptions,
|
||||
IResult,
|
||||
parseImpl,
|
||||
resetResult,
|
||||
} from 'tldts-core';
|
||||
|
||||
import suffixLookup from './src/suffix-trie';
|
||||
|
||||
// For all methods but 'parse', it does not make sense to allocate an object
|
||||
// every single time to only return the value of a specific attribute. To avoid
|
||||
// this un-necessary allocation, we use a global object which is re-used.
|
||||
const RESULT: IResult = getEmptyResult();
|
||||
|
||||
export function parse(url: string, options: Partial<IOptions> = {}): IResult {
|
||||
return parseImpl(url, FLAG.ALL, suffixLookup, options, getEmptyResult());
|
||||
}
|
||||
|
||||
export function getHostname(
|
||||
url: string,
|
||||
options: Partial<IOptions> = {},
|
||||
): string | null {
|
||||
/*@__INLINE__*/ resetResult(RESULT);
|
||||
return parseImpl(url, FLAG.HOSTNAME, suffixLookup, options, RESULT).hostname;
|
||||
}
|
||||
|
||||
export function getPublicSuffix(
|
||||
url: string,
|
||||
options: Partial<IOptions> = {},
|
||||
): string | null {
|
||||
/*@__INLINE__*/ resetResult(RESULT);
|
||||
return parseImpl(url, FLAG.PUBLIC_SUFFIX, suffixLookup, options, RESULT)
|
||||
.publicSuffix;
|
||||
}
|
||||
|
||||
export function getDomain(
|
||||
url: string,
|
||||
options: Partial<IOptions> = {},
|
||||
): string | null {
|
||||
/*@__INLINE__*/ resetResult(RESULT);
|
||||
return parseImpl(url, FLAG.DOMAIN, suffixLookup, options, RESULT).domain;
|
||||
}
|
||||
|
||||
export function getSubdomain(
|
||||
url: string,
|
||||
options: Partial<IOptions> = {},
|
||||
): string | null {
|
||||
/*@__INLINE__*/ resetResult(RESULT);
|
||||
return parseImpl(url, FLAG.SUB_DOMAIN, suffixLookup, options, RESULT)
|
||||
.subdomain;
|
||||
}
|
||||
|
||||
export function getDomainWithoutSuffix(
|
||||
url: string,
|
||||
options: Partial<IOptions> = {},
|
||||
): string | null {
|
||||
/*@__INLINE__*/ resetResult(RESULT);
|
||||
return parseImpl(url, FLAG.ALL, suffixLookup, options, RESULT)
|
||||
.domainWithoutSuffix;
|
||||
}
|
||||
Some files were not shown because too many files have changed in this diff Show More
Reference in New Issue
Block a user