gradio / node_modules /tldts /src /suffix-trie.ts
reisarod's picture
Upload folder using huggingface_hub
5fae594 verified
import {
fastPathLookup,
IPublicSuffix,
ISuffixLookupOptions,
} from 'tldts-core';
import { exceptions, ITrie, rules } from './data/trie';
// Flags used to know if a rule is ICANN or Private
const enum RULE_TYPE {
ICANN = 1,
PRIVATE = 2,
}
interface IMatch {
index: number;
isIcann: boolean;
isPrivate: boolean;
}
/**
* Lookup parts of domain in Trie
*/
function lookupInTrie(
parts: string[],
trie: ITrie,
index: number,
allowedMask: number,
): IMatch | null {
let result: IMatch | null = null;
let node: ITrie | undefined = trie;
while (node !== undefined) {
// We have a match!
if ((node[0] & allowedMask) !== 0) {
result = {
index: index + 1,
isIcann: node[0] === RULE_TYPE.ICANN,
isPrivate: node[0] === RULE_TYPE.PRIVATE,
};
}
// No more `parts` to look for
if (index === -1) {
break;
}
const succ: { [label: string]: ITrie } = node[1];
node = Object.prototype.hasOwnProperty.call(succ, parts[index]!)
? succ[parts[index]!]
: succ['*'];
index -= 1;
}
return result;
}
/**
* Check if `hostname` has a valid public suffix in `trie`.
*/
export default function suffixLookup(
hostname: string,
options: ISuffixLookupOptions,
out: IPublicSuffix,
): void {
if (fastPathLookup(hostname, options, out)) {
return;
}
const hostnameParts = hostname.split('.');
const allowedMask =
(options.allowPrivateDomains ? RULE_TYPE.PRIVATE : 0) |
(options.allowIcannDomains ? RULE_TYPE.ICANN : 0);
// Look for exceptions
const exceptionMatch = lookupInTrie(
hostnameParts,
exceptions,
hostnameParts.length - 1,
allowedMask,
);
if (exceptionMatch !== null) {
out.isIcann = exceptionMatch.isIcann;
out.isPrivate = exceptionMatch.isPrivate;
out.publicSuffix = hostnameParts.slice(exceptionMatch.index + 1).join('.');
return;
}
// Look for a match in rules
const rulesMatch = lookupInTrie(
hostnameParts,
rules,
hostnameParts.length - 1,
allowedMask,
);
if (rulesMatch !== null) {
out.isIcann = rulesMatch.isIcann;
out.isPrivate = rulesMatch.isPrivate;
out.publicSuffix = hostnameParts.slice(rulesMatch.index).join('.');
return;
}
// No match found...
// Prevailing rule is '*' so we consider the top-level domain to be the
// public suffix of `hostname` (e.g.: 'example.org' => 'org').
out.isIcann = false;
out.isPrivate = false;
out.publicSuffix = hostnameParts[hostnameParts.length - 1] ?? null;
}