Frontend/25_01_07/mai/node_modules/psl/index.js
szabomarton 7f4a15b9c3 asd
2025-01-28 11:38:27 +01:00

248 lines
5.6 KiB
JavaScript

import punycode from 'punycode/punycode.js';
import rules from './data/rules.js';
//
// Parse rules from file.
//
// Lookup table of every public-suffix rule, keyed by the ASCII (punycode)
// form of the rule's suffix. Built once when the module is evaluated; a
// second rule resolving to an already-registered key aborts the load.
const rulesByPunySuffix = new Map();
rules.forEach((rule) => {
  // Strip the leading wildcard ("*.") or exception ("!") marker, if any.
  const bareSuffix = rule.replace(/^(\*\.|\!)/, '');
  const asciiSuffix = punycode.toASCII(bareSuffix);
  const marker = rule.charAt(0);

  if (rulesByPunySuffix.has(asciiSuffix)) {
    throw new Error(`Multiple rules found for ${rule} (${asciiSuffix})`);
  }

  rulesByPunySuffix.set(asciiSuffix, {
    rule,
    suffix: bareSuffix,
    punySuffix: asciiSuffix,
    wildcard: marker === '*',
    exception: marker === '!',
  });
});
//
// Find rule for a given domain.
//
/**
 * Look up the rule entry whose suffix matches the end of `domain`.
 *
 * The domain is converted to ASCII with `punycode.toASCII`, then candidate
 * suffixes are tried from the full name down to the last label alone; the
 * first candidate present in `rulesByPunySuffix` wins.
 *
 * @param {string} domain - Domain name to look up.
 * @returns {object|null} The stored rule entry, or `null` when no candidate
 *   suffix is present in the table.
 */
const findRule = (domain) => {
  let remaining = punycode.toASCII(domain).split('.');

  while (remaining.length > 0) {
    const entry = rulesByPunySuffix.get(remaining.join('.'));
    if (entry) {
      return entry;
    }
    // Drop the left-most label and retry with the shorter suffix.
    remaining = remaining.slice(1);
  }

  return null;
};
//
// Error codes and messages.
//
// Maps each validation error code to its human-readable message. The keys
// are the codes returned by `validate`; `parse` copies both the code and the
// message into the `error` object it returns.
export const errorCodes = {
  // Whole-name length checks.
  DOMAIN_TOO_SHORT: 'Domain name too short.',
  DOMAIN_TOO_LONG: 'Domain name too long. It should be no more than 255 chars.',

  // Per-label checks.
  LABEL_STARTS_WITH_DASH: 'Domain name label can not start with a dash.',
  LABEL_ENDS_WITH_DASH: 'Domain name label can not end with a dash.',
  LABEL_TOO_LONG: 'Domain name label should be at most 63 chars long.',
  LABEL_TOO_SHORT: 'Domain name label should be at least 1 character long.',
  LABEL_INVALID_CHARS: 'Domain name label can only contain alphanumeric characters or dashes.',
};
//
// Validate domain name and throw if not valid.
//
// From Wikipedia:
//
// Hostnames are composed of series of labels concatenated with dots, as are all
// domain names. Each label must be between 1 and 63 characters long, and the
// entire hostname (including the delimiting dots) has a maximum of 255 chars.
//
// Allowed chars:
//
// * `a-z`
// * `0-9`
// * `-` but not as a starting or ending character
// * `.` as a separator for the textual portions of a domain name
//
// * http://en.wikipedia.org/wiki/Domain_name
// * http://en.wikipedia.org/wiki/Hostname
//
/**
 * Check a domain name and report the first problem found.
 *
 * The name is first converted to ASCII with `punycode.toASCII`; all length
 * and character checks run against that converted form. Labels may contain
 * lowercase `a-z`, digits, `-` and `_`, and may not start or end with `-`.
 *
 * @param {string} input - Domain name to check.
 * @returns {string|undefined} An error code (a key of `errorCodes`), or
 *   `undefined` when every check passes.
 */
const validate = (input) => {
  // IDNs with unicode chars must be converted before anything is measured.
  const asciiName = punycode.toASCII(input);

  if (asciiName.length < 1) {
    return 'DOMAIN_TOO_SHORT';
  }
  if (asciiName.length > 255) {
    return 'DOMAIN_TOO_LONG';
  }

  // Inspect every dot-separated label; the first failing check decides.
  for (const part of asciiName.split('.')) {
    if (part.length === 0) {
      return 'LABEL_TOO_SHORT';
    }
    if (part.length > 63) {
      return 'LABEL_TOO_LONG';
    }
    if (part.startsWith('-')) {
      return 'LABEL_STARTS_WITH_DASH';
    }
    if (part.endsWith('-')) {
      return 'LABEL_ENDS_WITH_DASH';
    }
    if (!/^[a-z0-9\-_]+$/.test(part)) {
      return 'LABEL_INVALID_CHARS';
    }
  }

  return undefined;
};
//
// Public API
//
//
// Parse domain.
//
/**
 * Split a domain name into its public-suffix components.
 *
 * The input is lowercased and one trailing dot (FQDN form) is removed before
 * validation. On a validation failure the result is
 * `{ input, error: { message, code } }`. Otherwise the result always has the
 * shape `{ input, tld, sld, domain, subdomain, listed }`, where parts that
 * could not be determined are `null` and `listed` says whether a rule from
 * the suffix table matched.
 *
 * @param {string} input - Domain name to parse.
 * @returns {object} Parsed components, or an object carrying `error`.
 * @throws {TypeError} When `input` is not a string.
 */
export const parse = (input) => {
  if (typeof input !== 'string') {
    throw new TypeError('Domain name must be a string.');
  }

  // Force domain to lowercase.
  let domain = input.slice(0).toLowerCase();

  // Handle FQDN.
  // TODO: Simply remove trailing dot?
  if (domain.charAt(domain.length - 1) === '.') {
    domain = domain.slice(0, domain.length - 1);
  }

  // Validate and sanitise input.
  const error = validate(domain);
  if (error) {
    return {
      input: input,
      error: {
        message: errorCodes[error],
        code: error
      }
    };
  }

  const parsed = {
    input: input,
    tld: null,
    sld: null,
    domain: null,
    subdomain: null,
    listed: false
  };

  const domainParts = domain.split('.');

  // Non-Internet TLD: names ending in "local" are returned with every part
  // left as null.
  if (domainParts[domainParts.length - 1] === 'local') {
    return parsed;
  }

  // When the (normalised) input contains an "xn--" label, report `domain`
  // and `subdomain` in ASCII form as well; otherwise return `parsed` as is.
  const handlePunycode = () => {
    if (!/xn--/.test(domain)) {
      return parsed;
    }
    if (parsed.domain) {
      parsed.domain = punycode.toASCII(parsed.domain);
    }
    if (parsed.subdomain) {
      parsed.subdomain = punycode.toASCII(parsed.subdomain);
    }
    return parsed;
  };

  const rule = findRule(domain);

  // Unlisted tld: treat the last label as the tld and the one before it as
  // the sld.
  if (!rule) {
    if (domainParts.length < 2) {
      return parsed;
    }
    parsed.tld = domainParts.pop();
    parsed.sld = domainParts.pop();
    parsed.domain = [parsed.sld, parsed.tld].join('.');
    if (domainParts.length) {
      // Keep ALL remaining labels, matching the listed branch below; taking
      // only the last one would silently drop deeper subdomain levels.
      parsed.subdomain = domainParts.join('.');
    }
    return handlePunycode();
  }

  // At this point we know the public suffix is listed.
  parsed.listed = true;

  const tldParts = rule.suffix.split('.');
  const privateParts = domainParts.slice(0, domainParts.length - tldParts.length);

  // Exception rule: the left-most label of the rule's suffix is moved from
  // the public suffix to the private part.
  if (rule.exception) {
    privateParts.push(tldParts.shift());
  }

  parsed.tld = tldParts.join('.');

  if (!privateParts.length) {
    return handlePunycode();
  }

  // Wildcard rule: the label directly left of the suffix is moved into the
  // public suffix.
  if (rule.wildcard) {
    tldParts.unshift(privateParts.pop());
    parsed.tld = tldParts.join('.');
  }

  if (!privateParts.length) {
    return handlePunycode();
  }

  parsed.sld = privateParts.pop();
  parsed.domain = [parsed.sld, parsed.tld].join('.');

  if (privateParts.length) {
    parsed.subdomain = privateParts.join('.');
  }

  return handlePunycode();
};
//
// Get domain.
//
/**
 * Return the `domain` field that `parse` computes for the given name.
 *
 * @param {string} domain - Domain name to inspect.
 * @returns {string|null} The parsed `domain` value, or `null` when the
 *   argument is falsy or `parse` produced no `domain`.
 */
export const get = (domain) => {
  if (domain) {
    const { domain: registrable } = parse(domain);
    return registrable || null;
  }
  // Falsy input never reaches `parse`.
  return null;
};
//
// Check whether domain belongs to a known public suffix.
//
/**
 * Report whether `parse` yields both a `domain` and a matched (listed)
 * suffix rule for the given name.
 *
 * @param {string} domain - Domain name to check.
 * @returns {boolean} `true` only when the parsed result has a truthy
 *   `domain` and a truthy `listed` flag.
 */
export const isValid = (domain) => {
  const { domain: registrable, listed } = parse(domain);
  return Boolean(registrable) && Boolean(listed);
};
// Default export: the three public functions bundled into a single object.
const publicApi = { parse, get, isValid };
export default publicApi;