Context Navigation

← Previous Revision
Next Revision →
Blame
Revision Log

source: node_modules/autolinker/dist/commonjs/matcher/url-match-validator.js

main

Last change on this file was d24f17c, checked in by Aleksandar Panovski <apano77@…>, 15 months ago
Initial commit
Property mode set to `100644`
File size: 7.9 KB

Line
1	"use strict";
2	Object.defineProperty(exports, "__esModule", { value: true });
3	exports.UrlMatchValidator = void 0;
4	var regex_lib_1 = require("../regex-lib");
5	/**
6	* @private
7	* @class Autolinker.matcher.UrlMatchValidator
8	* @singleton
9	*
10	* Used by Autolinker to filter out false URL positives from the
11	* {@link Autolinker.matcher.Url UrlMatcher}.
12	*
13	* Due to the limitations of regular expressions (including the missing feature
14	* of look-behinds in JS regular expressions), we cannot always determine the
15	* validity of a given match. This class applies a bit of additional logic to
16	* filter out any false positives that have been matched by the
17	* {@link Autolinker.matcher.Url UrlMatcher}.
18	*/
var UrlMatchValidator = /** @class */ (function () {
    /**
     * All members of this class are static; the constructor is intentionally
     * empty.
     */
    function UrlMatchValidator() {
    }
    /**
     * Determines if a given URL match found by the {@link Autolinker.matcher.Url UrlMatcher}
     * is valid. Will return `false` for:
     *
     * 1) URL matches whose URI scheme is 'javascript:' or 'vbscript:'.
     * 2) URL matches which do not have at least one period ('.') in the
     *    domain name (effectively skipping over matches like "abc:def").
     *    However, URL matches with a full protocol will be allowed
     *    (ex: 'http://localhost')
     * 3) URL matches which do not have at least one word character in the
     *    domain name (effectively skipping over matches like "git:1.0"),
     *    unless {@link #isValidIpAddress} accepts the match.
     *    However, URL matches with a full protocol will be allowed
     *    (ex: 'intra-net://271219.76')
     * 4) URL matches whose host part (the text before the first '/')
     *    contains two consecutive dots ('..').
     *
     * Otherwise, returns `true`.
     *
     * @param {String} urlMatch The matched URL, if there was one. Will be an
     *   empty string if the match is not a URL match.
     * @param {String} protocolUrlMatch The match URL string for a protocol
     *   match. Ex: 'http://yahoo.com'. This is used to match something like
     *   'http://localhost', where we won't double check that the domain name
     *   has at least one '.' in it.
     * @return {Boolean} `true` if the match given is valid and should be
     *   processed, or `false` if the match is invalid and/or should just not be
     *   processed.
     */
    UrlMatchValidator.isValid = function (urlMatch, protocolUrlMatch) {
        // Never autolink script-executing schemes.
        if (protocolUrlMatch && !this.isValidUriScheme(protocolUrlMatch)) {
            return false;
        }
        // At least one period ('.') must exist in the URL match for us to
        // consider it an actual URL, unless it was a full protocol match
        // (like 'http://localhost').
        if (this.urlMatchDoesNotHaveProtocolOrDot(urlMatch, protocolUrlMatch)) {
            return false;
        }
        // At least one letter character must exist in the domain name after a
        // protocol match (ex: skip over something like "git:1.0"), except if
        // it's an IP address.
        if (this.urlMatchDoesNotHaveAtLeastOneWordChar(urlMatch, protocolUrlMatch) &&
            !this.isValidIpAddress(urlMatch)) {
            return false;
        }
        // A host part such as 'example..com' is not a real domain name.
        return !this.containsMultipleDots(urlMatch);
    };
    /**
     * Determines if the given match is a full-protocol URL whose remainder is
     * a dotted-quad IP address, optionally followed by a port and a single
     * trailing slash. Ex: 'http://192.168.0.1:8080/'.
     *
     * Each octet is only checked to be 1-3 digits long; its numeric range is
     * not validated. A missing (`null`/`undefined`) argument yields `false`.
     *
     * @private
     * @param {String} uriSchemeMatch The URL match string to check.
     * @return {Boolean} `true` if the string is a full-protocol IP address
     *   URL, `false` otherwise.
     */
    UrlMatchValidator.isValidIpAddress = function (uriSchemeMatch) {
        // The combined regex is precompiled once (see `fullProtocolIpRegex`)
        // rather than being rebuilt on every call.
        return this.fullProtocolIpRegex.test(uriSchemeMatch);
    };
    /**
     * Determines if the host part of the URL match contains two consecutive
     * dots ('..'). The host part is the text before the first '/', taken
     * after the '://' separator when the match starts with a full protocol.
     *
     * @private
     * @param {String} urlMatch The matched URL, if there was one. Will be an
     *   empty string if the match is not a URL match.
     * @return {Boolean} `true` if the host part contains '..', `false`
     *   otherwise (including when there is no URL match at all).
     */
    UrlMatchValidator.containsMultipleDots = function (urlMatch) {
        // No match (empty string, null or undefined) means there is nothing
        // to reject; guarding here avoids calling `.split()` on a non-string.
        if (!urlMatch) {
            return false;
        }
        var stringBeforeSlash = urlMatch;
        if (this.hasFullProtocolRegex.test(urlMatch)) {
            stringBeforeSlash = urlMatch.split('://')[1];
        }
        return stringBeforeSlash.split('/')[0].indexOf('..') > -1;
    };
    /**
     * Determines if the URI scheme is a valid scheme to be autolinked. Returns
     * `false` if the scheme is 'javascript:' or 'vbscript:' (compared
     * case-insensitively). A string with no recognizable scheme is treated as
     * valid.
     *
     * @private
     * @param {String} uriSchemeMatch The match URL string for a full URI scheme
     *   match. Ex: 'http://yahoo.com' or 'mailto:a@a.com'.
     * @return {Boolean} `true` if the scheme is a valid one, `false` otherwise.
     */
    UrlMatchValidator.isValidUriScheme = function (uriSchemeMatch) {
        var uriSchemeMatchArr = uriSchemeMatch.match(this.uriSchemeRegex);
        var uriScheme = uriSchemeMatchArr && uriSchemeMatchArr[0].toLowerCase();
        return uriScheme !== 'javascript:' && uriScheme !== 'vbscript:';
    };
    /**
     * Determines if a URL match does not have either:
     *
     * a) a full protocol (i.e. 'http://'), or
     * b) at least one dot ('.') in the domain name (for a non-full-protocol
     *    match).
     *
     * Either situation is considered an invalid URL (ex: 'git:d' does not have
     * either the '://' part, or at least one dot in the domain name. If the
     * match was 'git:abc.com', we would consider this valid.)
     *
     * @private
     * @param {String} urlMatch The matched URL, if there was one. Will be an
     *   empty string if the match is not a URL match.
     * @param {String} protocolUrlMatch The match URL string for a protocol
     *   match. Ex: 'http://yahoo.com'. This is used to match something like
     *   'http://localhost', where we won't double check that the domain name
     *   has at least one '.' in it.
     * @return {Boolean} `true` if the URL match does not have a full protocol,
     *   or at least one dot ('.') in a non-full-protocol match.
     */
    UrlMatchValidator.urlMatchDoesNotHaveProtocolOrDot = function (urlMatch, protocolUrlMatch) {
        return (!!urlMatch &&
            (!protocolUrlMatch || !this.hasFullProtocolRegex.test(protocolUrlMatch)) &&
            urlMatch.indexOf('.') === -1);
    };
    /**
     * Determines if a URL match does not have either:
     *
     * a) a full protocol (i.e. 'http://'), or
     * b) at least one word character after the protocol (i.e. in the domain name)
     *
     * At least one letter character must exist in the domain name after a
     * protocol match. Ex: skip over something like "git:1.0"
     *
     * @private
     * @param {String} urlMatch The matched URL, if there was one. Will be an
     *   empty string if the match is not a URL match.
     * @param {String} protocolUrlMatch The match URL string for a protocol
     *   match. Ex: 'http://yahoo.com'. This is used to know whether or not we
     *   have a protocol in the URL string, in order to check for a word
     *   character after the protocol separator (':').
     * @return {Boolean} `true` if the URL match does not have a full protocol, or
     *   at least one word character in it, `false` otherwise.
     */
    UrlMatchValidator.urlMatchDoesNotHaveAtLeastOneWordChar = function (urlMatch, protocolUrlMatch) {
        // The check only applies when both a URL match and a protocol match
        // are present.
        if (!urlMatch || !protocolUrlMatch) {
            return false;
        }
        return (!this.hasFullProtocolRegex.test(protocolUrlMatch) &&
            !this.hasWordCharAfterProtocolRegex.test(urlMatch));
    };
    /**
     * Regex to test for a full protocol, with the two trailing slashes. Ex: 'http://'
     *
     * @private
     * @property {RegExp} hasFullProtocolRegex
     */
    UrlMatchValidator.hasFullProtocolRegex = /^[A-Za-z][-.+A-Za-z0-9]*:\/\//;
    /**
     * Regex to find the URI scheme, such as 'mailto:'.
     *
     * This is used to filter out 'javascript:' and 'vbscript:' schemes.
     *
     * @private
     * @property {RegExp} uriSchemeRegex
     */
    UrlMatchValidator.uriSchemeRegex = /^[A-Za-z][-.+A-Za-z0-9]*:/;
    /**
     * Regex to determine if at least one word char exists after the protocol (i.e. after the ':')
     *
     * The set of accepted characters comes from `alphaCharsStr` in the
     * regex-lib module.
     *
     * @private
     * @property {RegExp} hasWordCharAfterProtocolRegex
     */
    UrlMatchValidator.hasWordCharAfterProtocolRegex = new RegExp(':[^\\s]*?[' + regex_lib_1.alphaCharsStr + ']');
    /**
     * Regex to determine if the string is a valid IP address
     *
     * Matches four dot-separated groups of 1-3 digits, an optional ':' plus
     * digits, and an optional trailing '/', anchored to the end of the string.
     *
     * @private
     * @property {RegExp} ipRegex
     */
    UrlMatchValidator.ipRegex = /[0-9][0-9]?[0-9]?\.[0-9][0-9]?[0-9]?\.[0-9][0-9]?[0-9]?\.[0-9][0-9]?[0-9]?(:[0-9]*)?\/?$/;
    /**
     * Regex for a full protocol immediately followed by an IP address: the
     * concatenation of {@link #hasFullProtocolRegex} and {@link #ipRegex}.
     * Precompiled once here so that {@link #isValidIpAddress} does not have
     * to construct it on each call.
     *
     * @private
     * @property {RegExp} fullProtocolIpRegex
     */
    UrlMatchValidator.fullProtocolIpRegex = new RegExp(UrlMatchValidator.hasFullProtocolRegex.source + UrlMatchValidator.ipRegex.source);
    return UrlMatchValidator;
}());
169	exports.UrlMatchValidator = UrlMatchValidator;
170	//# sourceMappingURL=url-match-validator.js.map

Note: See TracBrowser for help on using the repository browser.

Download in other formats: