| OLD | NEW |
| 1 /* | 1 /* |
| 2 * This file is part of Adblock Plus <https://adblockplus.org/>, | 2 * This file is part of Adblock Plus <https://adblockplus.org/>, |
| 3 * Copyright (C) 2006-present eyeo GmbH | 3 * Copyright (C) 2006-present eyeo GmbH |
| 4 * | 4 * |
| 5 * Adblock Plus is free software: you can redistribute it and/or modify | 5 * Adblock Plus is free software: you can redistribute it and/or modify |
| 6 * it under the terms of the GNU General Public License version 3 as | 6 * it under the terms of the GNU General Public License version 3 as |
| 7 * published by the Free Software Foundation. | 7 * published by the Free Software Foundation. |
| 8 * | 8 * |
| 9 * Adblock Plus is distributed in the hope that it will be useful, | 9 * Adblock Plus is distributed in the hope that it will be useful, |
| 10 * but WITHOUT ANY WARRANTY; without even the implied warranty of | 10 * but WITHOUT ANY WARRANTY; without even the implied warranty of |
| (...skipping 40 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... |
| 51 /** | 51 /** |
| 52 * Blacklist/whitelist filter matching | 52 * Blacklist/whitelist filter matching |
| 53 */ | 53 */ |
| 54 class Matcher | 54 class Matcher |
| 55 { | 55 { |
| 56 constructor() | 56 constructor() |
| 57 { | 57 { |
| 58 /** | 58 /** |
| 59 * Lookup table for filters by their associated keyword | 59 * Lookup table for filters by their associated keyword |
| 60 * @type {Map.<string,(Filter|Set.<Filter>)>} | 60 * @type {Map.<string,(Filter|Set.<Filter>)>} |
| 61 * @private |
| 61 */ | 62 */ |
| 62 this.filterByKeyword = new Map(); | 63 this._filterByKeyword = new Map(); |
| 63 } | 64 } |
| 64 | 65 |
| 65 /** | 66 /** |
| 66 * Removes all known filters | 67 * Removes all known filters |
| 67 */ | 68 */ |
| 68 clear() | 69 clear() |
| 69 { | 70 { |
| 70 this.filterByKeyword.clear(); | 71 this._filterByKeyword.clear(); |
| 71 } | 72 } |
| 72 | 73 |
| 73 /** | 74 /** |
| 74 * Adds a filter to the matcher | 75 * Adds a filter to the matcher |
| 75 * @param {RegExpFilter} filter | 76 * @param {RegExpFilter} filter |
| 76 */ | 77 */ |
| 77 add(filter) | 78 add(filter) |
| 78 { | 79 { |
| 79 // Look for a suitable keyword | 80 // Look for a suitable keyword |
| 80 let keyword = this.findKeyword(filter); | 81 let keyword = this.findKeyword(filter); |
| 81 let set = this.filterByKeyword.get(keyword); | 82 let set = this._filterByKeyword.get(keyword); |
| 82 if (typeof set == "undefined") | 83 if (typeof set == "undefined") |
| 83 { | 84 { |
| 84 this.filterByKeyword.set(keyword, filter); | 85 this._filterByKeyword.set(keyword, filter); |
| 85 } | 86 } |
| 86 else if (set.size == 1) | 87 else if (set.size == 1) |
| 87 { | 88 { |
| 88 if (filter != set) | 89 if (filter != set) |
| 89 this.filterByKeyword.set(keyword, new Set([set, filter])); | 90 this._filterByKeyword.set(keyword, new Set([set, filter])); |
| 90 } | 91 } |
| 91 else | 92 else |
| 92 { | 93 { |
| 93 set.add(filter); | 94 set.add(filter); |
| 94 } | 95 } |
| 95 } | 96 } |
| 96 | 97 |
| 97 /** | 98 /** |
| 98 * Removes a filter from the matcher | 99 * Removes a filter from the matcher |
| 99 * @param {RegExpFilter} filter | 100 * @param {RegExpFilter} filter |
| 100 */ | 101 */ |
| 101 remove(filter) | 102 remove(filter) |
| 102 { | 103 { |
| 103 let keyword = this.findKeyword(filter); | 104 let keyword = this.findKeyword(filter); |
| 104 let set = this.filterByKeyword.get(keyword); | 105 let set = this._filterByKeyword.get(keyword); |
| 105 if (typeof set == "undefined") | 106 if (typeof set == "undefined") |
| 106 return; | 107 return; |
| 107 | 108 |
| 108 if (set.size == 1) | 109 if (set.size == 1) |
| 109 { | 110 { |
| 110 if (filter == set) | 111 if (filter == set) |
| 111 this.filterByKeyword.delete(keyword); | 112 this._filterByKeyword.delete(keyword); |
| 112 } | 113 } |
| 113 else | 114 else |
| 114 { | 115 { |
| 115 set.delete(filter); | 116 set.delete(filter); |
| 116 | 117 |
| 117 if (set.size == 1) | 118 if (set.size == 1) |
| 118 this.filterByKeyword.set(keyword, [...set][0]); | 119 this._filterByKeyword.set(keyword, [...set][0]); |
| 119 } | 120 } |
| 120 } | 121 } |
| 121 | 122 |
| 122 /** | 123 /** |
| 123 * Chooses a keyword to be associated with the filter | 124 * Chooses a keyword to be associated with the filter |
| 124 * @param {Filter} filter | 125 * @param {Filter} filter |
| 125 * @returns {string} keyword or an empty string if no keyword could be found | 126 * @returns {string} keyword or an empty string if no keyword could be found |
| 127 * @protected |
| 126 */ | 128 */ |
| 127 findKeyword(filter) | 129 findKeyword(filter) |
| 128 { | 130 { |
| 129 let result = ""; | 131 let result = ""; |
| 130 let {pattern} = filter; | 132 let {pattern} = filter; |
| 131 if (pattern == null) | 133 if (pattern == null) |
| 132 return result; | 134 return result; |
| 133 | 135 |
| 134 let candidates = pattern.toLowerCase().match(allKeywordsRegExp); | 136 let candidates = pattern.toLowerCase().match(allKeywordsRegExp); |
| 135 if (!candidates) | 137 if (!candidates) |
| 136 return result; | 138 return result; |
| 137 | 139 |
| 138 let hash = this.filterByKeyword; | 140 let hash = this._filterByKeyword; |
| 139 let resultCount = 0xFFFFFF; | 141 let resultCount = 0xFFFFFF; |
| 140 let resultLength = 0; | 142 let resultLength = 0; |
| 141 for (let i = 0, l = candidates.length; i < l; i++) | 143 for (let i = 0, l = candidates.length; i < l; i++) |
| 142 { | 144 { |
| 143 let candidate = candidates[i].substr(1); | 145 let candidate = candidates[i].substr(1); |
| 144 let filters = hash.get(candidate); | 146 let filters = hash.get(candidate); |
| 145 let count = typeof filters != "undefined" ? filters.size : 0; | 147 let count = typeof filters != "undefined" ? filters.size : 0; |
| 146 if (count < resultCount || | 148 if (count < resultCount || |
| 147 (count == resultCount && candidate.length > resultLength)) | 149 (count == resultCount && candidate.length > resultLength)) |
| 148 { | 150 { |
| 149 result = candidate; | 151 result = candidate; |
| 150 resultCount = count; | 152 resultCount = count; |
| 151 resultLength = candidate.length; | 153 resultLength = candidate.length; |
| 152 } | 154 } |
| 153 } | 155 } |
| 154 return result; | 156 return result; |
| 155 } | 157 } |
| 156 | 158 |
| 157 /** | 159 /** |
| 158 * Checks whether the entries for a particular keyword match a URL | 160 * Checks whether the entries for a particular keyword match a URL |
| 159 * @param {string} keyword | 161 * @param {string} keyword |
| 160 * @param {string} location | 162 * @param {string} location |
| 161 * @param {number} typeMask | 163 * @param {number} typeMask |
| 162 * @param {string} [docDomain] | 164 * @param {string} [docDomain] |
| 163 * @param {boolean} [thirdParty] | 165 * @param {boolean} [thirdParty] |
| 164 * @param {string} [sitekey] | 166 * @param {string} [sitekey] |
| 165 * @param {boolean} [specificOnly] | 167 * @param {boolean} [specificOnly] |
| 166 * @returns {?Filter} | 168 * @returns {?Filter} |
| 169 * @protected |
| 167 */ | 170 */ |
| 168 _checkEntryMatch(keyword, location, typeMask, docDomain, thirdParty, sitekey, | 171 checkEntryMatch(keyword, location, typeMask, docDomain, thirdParty, sitekey, |
| 169 specificOnly) | 172 specificOnly) |
| 170 { | 173 { |
| 171 let set = this.filterByKeyword.get(keyword); | 174 let set = this._filterByKeyword.get(keyword); |
| 172 if (typeof set == "undefined") | 175 if (typeof set == "undefined") |
| 173 return null; | 176 return null; |
| 174 | 177 |
| 175 for (let filter of set) | 178 for (let filter of set) |
| 176 { | 179 { |
| 177 if (specificOnly && filter.isGeneric() && | 180 if (specificOnly && filter.isGeneric() && |
| 178 !(filter instanceof WhitelistFilter)) | 181 !(filter instanceof WhitelistFilter)) |
| 179 continue; | 182 continue; |
| 180 | 183 |
| 181 if (filter.matches(location, typeMask, docDomain, thirdParty, sitekey)) | 184 if (filter.matches(location, typeMask, docDomain, thirdParty, sitekey)) |
| (...skipping 20 matching lines...) Expand all Loading... |
| 202 * matching filter or <code>null</code> | 205 * matching filter or <code>null</code> |
| 203 */ | 206 */ |
| 204 matchesAny(location, typeMask, docDomain, thirdParty, sitekey, specificOnly) | 207 matchesAny(location, typeMask, docDomain, thirdParty, sitekey, specificOnly) |
| 205 { | 208 { |
| 206 let candidates = location.toLowerCase().match(/[a-z0-9%]{3,}/g); | 209 let candidates = location.toLowerCase().match(/[a-z0-9%]{3,}/g); |
| 207 if (candidates === null) | 210 if (candidates === null) |
| 208 candidates = []; | 211 candidates = []; |
| 209 candidates.push(""); | 212 candidates.push(""); |
| 210 for (let i = 0, l = candidates.length; i < l; i++) | 213 for (let i = 0, l = candidates.length; i < l; i++) |
| 211 { | 214 { |
| 212 let result = this._checkEntryMatch(candidates[i], location, typeMask, | 215 let result = this.checkEntryMatch(candidates[i], location, typeMask, |
| 213 docDomain, thirdParty, sitekey, | 216 docDomain, thirdParty, sitekey, |
| 214 specificOnly); | 217 specificOnly); |
| 215 if (result) | 218 if (result) |
| 216 return result; | 219 return result; |
| 217 } | 220 } |
| 218 | 221 |
| 219 return null; | 222 return null; |
| 220 } | 223 } |
| 221 } | 224 } |
| 222 | 225 |
| 223 exports.Matcher = Matcher; | 226 exports.Matcher = Matcher; |
| 224 | 227 |
| 225 /** | 228 /** |
| 226 * Combines a matcher for blocking and exception rules, automatically sorts | 229 * Combines a matcher for blocking and exception rules, automatically sorts |
| 227 * rules into two {@link Matcher} instances. | 230 * rules into two {@link Matcher} instances. |
| 228 */ | 231 */ |
| 229 class CombinedMatcher | 232 class CombinedMatcher |
| 230 { | 233 { |
| 231 constructor() | 234 constructor() |
| 232 { | 235 { |
| 233 /** | 236 /** |
| 234 * Maximal number of matching cache entries to be kept | 237 * Maximal number of matching cache entries to be kept |
| 235 * @type {number} | 238 * @type {number} |
| 236 */ | 239 */ |
| 237 this.maxCacheEntries = 1000; | 240 this.maxCacheEntries = 1000; |
| 238 | 241 |
| 239 /** | 242 /** |
| 240 * Matcher for blocking rules. | 243 * Matcher for blocking rules. |
| 241 * @type {Matcher} | 244 * @type {Matcher} |
| 245 * @protected |
| 242 */ | 246 */ |
| 243 this.blacklist = new Matcher(); | 247 this.blacklist = new Matcher(); |
| 244 | 248 |
| 245 /** | 249 /** |
| 246 * Matcher for exception rules. | 250 * Matcher for exception rules. |
| 247 * @type {Matcher} | 251 * @type {Matcher} |
| 252 * @protected |
| 248 */ | 253 */ |
| 249 this.whitelist = new Matcher(); | 254 this.whitelist = new Matcher(); |
| 250 | 255 |
| 251 /** | 256 /** |
| 252 * Lookup table of previous {@link Matcher#matchesAny} results | 257 * Lookup table of previous {@link Matcher#matchesAny} results |
| 253 * @type {Map.<string,Filter>} | 258 * @type {Map.<string,Filter>} |
| 259 * @private |
| 254 */ | 260 */ |
| 255 this.resultCache = new Map(); | 261 this._resultCache = new Map(); |
| 256 } | 262 } |
| 257 | 263 |
| 258 /** | 264 /** |
| 259 * @see Matcher#clear | 265 * @see Matcher#clear |
| 260 */ | 266 */ |
| 261 clear() | 267 clear() |
| 262 { | 268 { |
| 263 this.blacklist.clear(); | 269 this.blacklist.clear(); |
| 264 this.whitelist.clear(); | 270 this.whitelist.clear(); |
| 265 this.resultCache.clear(); | 271 this._resultCache.clear(); |
| 266 } | 272 } |
| 267 | 273 |
| 268 /** | 274 /** |
| 269 * @see Matcher#add | 275 * @see Matcher#add |
| 270 * @param {Filter} filter | 276 * @param {Filter} filter |
| 271 */ | 277 */ |
| 272 add(filter) | 278 add(filter) |
| 273 { | 279 { |
| 274 if (filter instanceof WhitelistFilter) | 280 if (filter instanceof WhitelistFilter) |
| 275 this.whitelist.add(filter); | 281 this.whitelist.add(filter); |
| 276 else | 282 else |
| 277 this.blacklist.add(filter); | 283 this.blacklist.add(filter); |
| 278 | 284 |
| 279 this.resultCache.clear(); | 285 this._resultCache.clear(); |
| 280 } | 286 } |
| 281 | 287 |
| 282 /** | 288 /** |
| 283 * @see Matcher#remove | 289 * @see Matcher#remove |
| 284 * @param {Filter} filter | 290 * @param {Filter} filter |
| 285 */ | 291 */ |
| 286 remove(filter) | 292 remove(filter) |
| 287 { | 293 { |
| 288 if (filter instanceof WhitelistFilter) | 294 if (filter instanceof WhitelistFilter) |
| 289 this.whitelist.remove(filter); | 295 this.whitelist.remove(filter); |
| 290 else | 296 else |
| 291 this.blacklist.remove(filter); | 297 this.blacklist.remove(filter); |
| 292 | 298 |
| 293 this.resultCache.clear(); | 299 this._resultCache.clear(); |
| 294 } | 300 } |
| 295 | 301 |
| 296 /** | 302 /** |
| 297 * @see Matcher#findKeyword | 303 * @see Matcher#findKeyword |
| 298 * @param {Filter} filter | 304 * @param {Filter} filter |
| 299 * @returns {string} keyword | 305 * @returns {string} keyword |
| 306 * @protected |
| 300 */ | 307 */ |
| 301 findKeyword(filter) | 308 findKeyword(filter) |
| 302 { | 309 { |
| 303 if (filter instanceof WhitelistFilter) | 310 if (filter instanceof WhitelistFilter) |
| 304 return this.whitelist.findKeyword(filter); | 311 return this.whitelist.findKeyword(filter); |
| 305 return this.blacklist.findKeyword(filter); | 312 return this.blacklist.findKeyword(filter); |
| 306 } | 313 } |
| 307 | 314 |
| 308 /** | 315 /** |
| 309 * Optimized filter matching testing both whitelist and blacklist matchers | 316 * Optimized filter matching testing both whitelist and blacklist matchers |
| 310 * simultaneously. For parameters see | 317 * simultaneously. For parameters see |
| 311 {@link Matcher#matchesAny Matcher.matchesAny()}. | 318 {@link Matcher#matchesAny Matcher.matchesAny()}. |
| 312 * @see Matcher#matchesAny | 319 * @see Matcher#matchesAny |
| 313 * @inheritdoc | 320 * @inheritdoc |
| 321 * @private |
| 314 */ | 322 */ |
| 315 matchesAnyInternal(location, typeMask, docDomain, thirdParty, sitekey, | 323 _matchesAnyInternal(location, typeMask, docDomain, thirdParty, sitekey, |
| 316 specificOnly) | 324 specificOnly) |
| 317 { | 325 { |
| 318 let candidates = location.toLowerCase().match(/[a-z0-9%]{3,}/g); | 326 let candidates = location.toLowerCase().match(/[a-z0-9%]{3,}/g); |
| 319 if (candidates === null) | 327 if (candidates === null) |
| 320 candidates = []; | 328 candidates = []; |
| 321 candidates.push(""); | 329 candidates.push(""); |
| 322 | 330 |
| 323 let blacklistHit = null; | 331 let blacklistHit = null; |
| 324 for (let i = 0, l = candidates.length; i < l; i++) | 332 for (let i = 0, l = candidates.length; i < l; i++) |
| 325 { | 333 { |
| 326 let substr = candidates[i]; | 334 let substr = candidates[i]; |
| 327 let result = this.whitelist._checkEntryMatch( | 335 let result = this.whitelist.checkEntryMatch( |
| 328 substr, location, typeMask, docDomain, thirdParty, sitekey | 336 substr, location, typeMask, docDomain, thirdParty, sitekey |
| 329 ); | 337 ); |
| 330 if (result) | 338 if (result) |
| 331 return result; | 339 return result; |
| 332 if (blacklistHit === null) | 340 if (blacklistHit === null) |
| 333 { | 341 { |
| 334 blacklistHit = this.blacklist._checkEntryMatch( | 342 blacklistHit = this.blacklist.checkEntryMatch( |
| 335 substr, location, typeMask, docDomain, thirdParty, sitekey, | 343 substr, location, typeMask, docDomain, thirdParty, sitekey, |
| 336 specificOnly | 344 specificOnly |
| 337 ); | 345 ); |
| 338 } | 346 } |
| 339 } | 347 } |
| 340 return blacklistHit; | 348 return blacklistHit; |
| 341 } | 349 } |
| 342 | 350 |
| 343 /** | 351 /** |
| 344 * @see Matcher#matchesAny | 352 * @see Matcher#matchesAny |
| 345 * @inheritdoc | 353 * @inheritdoc |
| 346 */ | 354 */ |
| 347 matchesAny(location, typeMask, docDomain, thirdParty, sitekey, specificOnly) | 355 matchesAny(location, typeMask, docDomain, thirdParty, sitekey, specificOnly) |
| 348 { | 356 { |
| 349 let key = location + " " + typeMask + " " + docDomain + " " + thirdParty + | 357 let key = location + " " + typeMask + " " + docDomain + " " + thirdParty + |
| 350 " " + sitekey + " " + specificOnly; | 358 " " + sitekey + " " + specificOnly; |
| 351 | 359 |
| 352 let result = this.resultCache.get(key); | 360 let result = this._resultCache.get(key); |
| 353 if (typeof result != "undefined") | 361 if (typeof result != "undefined") |
| 354 return result; | 362 return result; |
| 355 | 363 |
| 356 result = this.matchesAnyInternal(location, typeMask, docDomain, | 364 result = this._matchesAnyInternal(location, typeMask, docDomain, |
| 357 thirdParty, sitekey, specificOnly); | 365 thirdParty, sitekey, specificOnly); |
| 358 | 366 |
| 359 if (this.resultCache.size >= this.maxCacheEntries) | 367 if (this._resultCache.size >= this.maxCacheEntries) |
| 360 this.resultCache.clear(); | 368 this._resultCache.clear(); |
| 361 | 369 |
| 362 this.resultCache.set(key, result); | 370 this._resultCache.set(key, result); |
| 363 | 371 |
| 364 return result; | 372 return result; |
| 365 } | 373 } |
| 366 } | 374 } |
| 367 | 375 |
| 368 exports.CombinedMatcher = CombinedMatcher; | 376 exports.CombinedMatcher = CombinedMatcher; |
| 369 | 377 |
| 370 /** | 378 /** |
| 371 * Shared {@link CombinedMatcher} instance that should usually be used. | 379 * Shared {@link CombinedMatcher} instance that should usually be used. |
| 372 * @type {CombinedMatcher} | 380 * @type {CombinedMatcher} |
| 373 */ | 381 */ |
| 374 let defaultMatcher = new CombinedMatcher(); | 382 let defaultMatcher = new CombinedMatcher(); |
| 375 | 383 |
| 376 exports.defaultMatcher = defaultMatcher; | 384 exports.defaultMatcher = defaultMatcher; |
| OLD | NEW |