|
|
|
@ -25,6 +25,12 @@ const dot_confusables = '.\u002e\u0660\u06f0\u0701\u0702\u2024\ua4f8\ua60e\u10a5
|
|
|
|
|
|
|
|
|
|
const linkRegex = new RegExp(`^\\s*(([${h_confusables}][${t_confusables}][${t_confusables}][${p_confusables}][${s_confusables}]?[${column_confusables}][${slash_confusables}][${slash_confusables}]))?[^:/\\n ]+([${dot_confusables}][^:/\\n ]+)+`);
|
|
|
|
|
|
|
|
|
|
const textMatchesTarget = (text, origin, host) => {
|
|
|
|
|
return (text === origin || text === host
|
|
|
|
|
|| text.startsWith(origin + '/') || text.startsWith(host + '/')
|
|
|
|
|
|| 'www.' + text === host || ('www.' + text).startsWith(host + '/'));
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|
// If `checkUrlLike` is true, consider only URL-like link texts to be misleading
|
|
|
|
|
const isLinkMisleading = (link, checkUrlLike = true) => {
|
|
|
|
|
let linkTextParts = [];
|
|
|
|
@ -54,7 +60,7 @@ const isLinkMisleading = (link, checkUrlLike = true) => {
|
|
|
|
|
const targetURL = new URL(link.href);
|
|
|
|
|
|
|
|
|
|
// The following may not work with international domain names
|
|
|
|
|
if (linkText === targetURL.origin || linkText === targetURL.host || 'www.' + linkText === targetURL.host || linkText.startsWith(targetURL.origin + '/') || linkText.startsWith(targetURL.host + '/') || ('www.' + linkText).startsWith(targetURL.host + '/')) {
|
|
|
|
|
if (textMatchesTarget(linkText, targetURL.origin, targetURL.host) || textMatchesTarget(linkText.toLowerCase(), targetURL.origin, targetURL.host)) {
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
@ -62,7 +68,7 @@ const isLinkMisleading = (link, checkUrlLike = true) => {
|
|
|
|
|
const hostname = decodeIDNA(targetURL.hostname);
|
|
|
|
|
const host = targetURL.host.replace(targetURL.hostname, hostname);
|
|
|
|
|
const origin = targetURL.origin.replace(targetURL.host, host);
|
|
|
|
|
if (linkText === origin || linkText === host || 'www.' + linkText === host || linkText.startsWith(origin + '/') || linkText.startsWith(host + '/') || ('www.' + linkText).startsWith(host + '/')) {
|
|
|
|
|
if (textMatchesTarget(linkText, origin, host)) {
|
|
|
|
|
return false;
|
|
|
|
|
}
|
|
|
|
|
|
|
|
|
|