source: node_modules/autolinker/dist/commonjs/matcher/url-match-validator.js

main
Last change on this file was d24f17c, checked in by Aleksandar Panovski <apano77@…>, 15 months ago

Initial commit

  • Property mode set to 100644
File size: 7.9 KB
Line 
1"use strict";
2Object.defineProperty(exports, "__esModule", { value: true });
3exports.UrlMatchValidator = void 0;
4var regex_lib_1 = require("../regex-lib");
/**
 * @private
 * @class Autolinker.matcher.UrlMatchValidator
 * @singleton
 *
 * Used by Autolinker to filter out false URL positives from the
 * {@link Autolinker.matcher.Url UrlMatcher}.
 *
 * Due to the limitations of regular expressions (including the missing feature
 * of look-behinds in JS regular expressions), we cannot always determine the
 * validity of a given match. This class applies a bit of additional logic to
 * filter out any false positives that have been matched by the
 * {@link Autolinker.matcher.Url UrlMatcher}.
 */
var UrlMatchValidator = /** @class */ (function () {
    function UrlMatchValidator() {
    }
    /**
     * Determines if a given URL match found by the {@link Autolinker.matcher.Url UrlMatcher}
     * is valid. Returns `false` for:
     *
     * 1) Matches whose URI scheme is 'javascript:' or 'vbscript:'
     *    (see {@link #isValidUriScheme}).
     * 2) URL matches which do not have at least one period ('.') in them
     *    (effectively skipping over matches like "abc:def"). However, URL
     *    matches with a full protocol are allowed (ex: 'http://localhost').
     * 3) URL matches with a scheme but no '://' which do not have at least
     *    one letter character after the ':' (effectively skipping over
     *    matches like "git:1.0"), unless the match is a full-protocol URL
     *    whose host is an IP address (see {@link #isValidIpAddress}).
     * 4) URL matches whose host part contains two consecutive dots ('..').
     *
     * Otherwise, returns `true`.
     *
     * @param {String} urlMatch The matched URL, if there was one. Will be an
     *   empty string if the match is not a URL match.
     * @param {String} protocolUrlMatch The match URL string for a protocol
     *   match. Ex: 'http://yahoo.com'. This is used to match something like
     *   'http://localhost', where we won't double check that the domain name
     *   has at least one '.' in it.
     * @return {Boolean} `true` if the match given is valid and should be
     *   processed, or `false` if the match is invalid and/or should just not be
     *   processed.
     */
    UrlMatchValidator.isValid = function (urlMatch, protocolUrlMatch) {
        // Never autolink script-executing schemes.
        if (protocolUrlMatch && !this.isValidUriScheme(protocolUrlMatch)) {
            return false;
        }
        // At least one period ('.') must exist in the URL match for us to
        // consider it an actual URL, *unless* it was a full protocol match
        // (like 'http://localhost').
        if (this.urlMatchDoesNotHaveProtocolOrDot(urlMatch, protocolUrlMatch)) {
            return false;
        }
        // At least one letter character must exist after a protocol match
        // (ex: skip over something like "git:1.0"), except if it's an IP address.
        if (this.urlMatchDoesNotHaveAtLeastOneWordChar(urlMatch, protocolUrlMatch) &&
            !this.isValidIpAddress(urlMatch)) {
            return false;
        }
        return !this.containsMultipleDots(urlMatch);
    };
    /**
     * Determines if the given string is, in its entirety, a full-protocol URL
     * whose host is a dotted-quad of 1-3 digit groups, optionally followed by
     * a ':port' and/or a trailing slash. Ex: 'http://127.0.0.1:8080/'.
     *
     * Note: the digit groups are not range-checked, so '999.999.999.999' is
     * accepted as well.
     *
     * @private
     * @param {String} uriSchemeMatch The string to test.
     * @return {Boolean} `true` if the string matches the pattern described
     *   above, `false` otherwise.
     */
    UrlMatchValidator.isValidIpAddress = function (uriSchemeMatch) {
        // Uses the regex compiled once at class definition time rather than
        // rebuilding it from the two `.source` strings on every call.
        return this.ipWithFullProtocolRegex.test(uriSchemeMatch);
    };
    /**
     * Determines if the host part of the URL match contains two consecutive
     * dots ('..'). The host part is taken to be everything up to the first
     * '/', after the leading 'scheme://' has been removed (when present).
     *
     * @private
     * @param {String} urlMatch The matched URL.
     * @return {Boolean} `true` if '..' appears in the host part, `false`
     *   otherwise.
     */
    UrlMatchValidator.containsMultipleDots = function (urlMatch) {
        var stringBeforeSlash = urlMatch;
        if (this.hasFullProtocolRegex.test(urlMatch)) {
            stringBeforeSlash = urlMatch.split('://')[1];
        }
        return stringBeforeSlash.split('/')[0].indexOf('..') > -1;
    };
    /**
     * Determines if the URI scheme is a valid scheme to be autolinked. Returns
     * `false` if the scheme is 'javascript:' or 'vbscript:' (compared
     * case-insensitively).
     *
     * @private
     * @param {String} uriSchemeMatch The match URL string for a full URI scheme
     *   match. Ex: 'http://yahoo.com' or 'mailto:a@a.com'.
     * @return {Boolean} `true` if the scheme is a valid one, `false` otherwise.
     */
    UrlMatchValidator.isValidUriScheme = function (uriSchemeMatch) {
        var uriSchemeMatchArr = uriSchemeMatch.match(this.uriSchemeRegex);
        // `null` when the string does not start with a scheme at all; such a
        // string is not one of the blocked schemes, so it is considered valid.
        var uriScheme = uriSchemeMatchArr && uriSchemeMatchArr[0].toLowerCase();
        return uriScheme !== 'javascript:' && uriScheme !== 'vbscript:';
    };
    /**
     * Determines if a URL match does not have either:
     *
     * a) a full protocol (i.e. 'http://'), or
     * b) at least one dot ('.') in the match (for a non-full-protocol
     *    match).
     *
     * Either situation is considered an invalid URL (ex: 'git:d' does not have
     * either the '://' part, or at least one dot in the domain name. If the
     * match was 'git:abc.com', we would consider this valid.)
     *
     * @private
     * @param {String} urlMatch The matched URL, if there was one. Will be an
     *   empty string if the match is not a URL match.
     * @param {String} protocolUrlMatch The match URL string for a protocol
     *   match. Ex: 'http://yahoo.com'. This is used to match something like
     *   'http://localhost', where we won't double check that the domain name
     *   has at least one '.' in it.
     * @return {Boolean} `true` if the URL match has neither a full protocol
     *   nor a dot ('.') in it, `false` otherwise.
     */
    UrlMatchValidator.urlMatchDoesNotHaveProtocolOrDot = function (urlMatch, protocolUrlMatch) {
        return (!!urlMatch &&
            (!protocolUrlMatch || !this.hasFullProtocolRegex.test(protocolUrlMatch)) &&
            urlMatch.indexOf('.') === -1);
    };
    /**
     * Determines if a URL match has neither:
     *
     * a) a full protocol (i.e. 'http://'), nor
     * b) at least one letter character after the protocol separator (':')
     *
     * At least one letter character must exist in the domain name after a
     * protocol match. Ex: skip over something like "git:1.0"
     *
     * @private
     * @param {String} urlMatch The matched URL, if there was one. Will be an
     *   empty string if the match is not a URL match.
     * @param {String} protocolUrlMatch The match URL string for a protocol
     *   match. Ex: 'http://yahoo.com'. This is used to know whether or not we
     *   have a protocol in the URL string, in order to check for a letter
     *   character after the protocol separator (':').
     * @return {Boolean} `true` if both arguments are non-empty, the protocol
     *   match has no '://', and the URL match has no letter character after
     *   the ':'; `false` otherwise.
     */
    UrlMatchValidator.urlMatchDoesNotHaveAtLeastOneWordChar = function (urlMatch, protocolUrlMatch) {
        if (!urlMatch || !protocolUrlMatch) {
            return false;
        }
        return (!this.hasFullProtocolRegex.test(protocolUrlMatch) &&
            !this.hasWordCharAfterProtocolRegex.test(urlMatch));
    };
    /**
     * Regex to test for a full protocol, with the two trailing slashes. Ex: 'http://'
     *
     * @private
     * @property {RegExp} hasFullProtocolRegex
     */
    UrlMatchValidator.hasFullProtocolRegex = /^[A-Za-z][-.+A-Za-z0-9]*:\/\//;
    /**
     * Regex to find the URI scheme, such as 'mailto:'.
     *
     * This is used to filter out 'javascript:' and 'vbscript:' schemes.
     *
     * @private
     * @property {RegExp} uriSchemeRegex
     */
    UrlMatchValidator.uriSchemeRegex = /^[A-Za-z][-.+A-Za-z0-9]*:/;
    /**
     * Regex to determine if at least one character from the `alphaCharsStr`
     * character set (provided by '../regex-lib') exists after the protocol
     * (i.e. after the ':').
     *
     * @private
     * @property {RegExp} hasWordCharAfterProtocolRegex
     */
    UrlMatchValidator.hasWordCharAfterProtocolRegex = new RegExp(':[^\\s]*?[' + regex_lib_1.alphaCharsStr + ']');
    /**
     * Regex to determine if the string ends with a dotted-quad of 1-3 digit
     * groups, optionally followed by a ':port' and/or a trailing slash.
     *
     * The digit groups are not checked to be in the 0-255 range.
     *
     * @private
     * @property {RegExp} ipRegex
     */
    UrlMatchValidator.ipRegex = /[0-9][0-9]?[0-9]?\.[0-9][0-9]?[0-9]?\.[0-9][0-9]?[0-9]?\.[0-9][0-9]?[0-9]?(:[0-9]*)?\/?$/;
    /**
     * Regex to determine if the whole string is a full protocol ('scheme://')
     * immediately followed by an IP address, as described by
     * {@link #hasFullProtocolRegex} and {@link #ipRegex}.
     *
     * Built once here from the two source patterns so that
     * {@link #isValidIpAddress} does not need to compile it on every call.
     *
     * @private
     * @property {RegExp} ipWithFullProtocolRegex
     */
    UrlMatchValidator.ipWithFullProtocolRegex = new RegExp(UrlMatchValidator.hasFullProtocolRegex.source + UrlMatchValidator.ipRegex.source);
    return UrlMatchValidator;
}());
169exports.UrlMatchValidator = UrlMatchValidator;
170//# sourceMappingURL=url-match-validator.js.map
Note: See TracBrowser for help on using the repository browser.