| Index: test/matcher.js |
| =================================================================== |
| new file mode 100644 |
| --- /dev/null |
| +++ b/test/matcher.js |
| @@ -0,0 +1,248 @@ |
| +/* |
| + * This file is part of Adblock Plus <https://adblockplus.org/>, |
| + * Copyright (C) 2006-present eyeo GmbH |
| + * |
| + * Adblock Plus is free software: you can redistribute it and/or modify |
| + * it under the terms of the GNU General Public License version 3 as |
| + * published by the Free Software Foundation. |
| + * |
| + * Adblock Plus is distributed in the hope that it will be useful, |
| + * but WITHOUT ANY WARRANTY; without even the implied warranty of |
| + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the |
| + * GNU General Public License for more details. |
| + * |
| + * You should have received a copy of the GNU General Public License |
| + * along with Adblock Plus. If not, see <http://www.gnu.org/licenses/>. |
| + */ |
| + |
| +"use strict"; |
| + |
| +const {createSandbox} = require("./_common"); |
| + |
| +let Filter = null; |
| +let RegExpFilter = null; |
| +let CombinedMatcher = null; |
| +let defaultMatcher = null; |
| +let Matcher = null; |
| + |
| +exports.setUp = function(callback) |
| +{ |
| + let sandboxedRequire = createSandbox(); |
| + ( |
| + {Filter, RegExpFilter} = sandboxedRequire("../lib/filterClasses"), |
| + {CombinedMatcher, defaultMatcher, Matcher} = sandboxedRequire("../lib/matcher") |
| + ); |
| + |
| + callback(); |
| +}; |
| + |
| +function compareKeywords(test, text, expected) |
| +{ |
| + for (let filter of [Filter.fromText(text), Filter.fromText("@@" + text)]) |
| + { |
| + let matcher = new Matcher(); |
| + let result = []; |
| + for (let i = 0; i < expected.length; i++) |
| + { |
| + let keyword = matcher.findKeyword(filter); |
| + result.push(keyword); |
| + if (keyword) |
| + { |
| + let dummyFilter = Filter.fromText("^" + keyword + "^"); |
| + dummyFilter.filterCount = Infinity; |
| + matcher.add(dummyFilter); |
| + } |
| + } |
| + |
| + test.equal(result.join(", "), expected.join(", "), "Keyword candidates for " + filter.text); |
| + } |
| +} |
| + |
| +function checkMatch(test, filters, location, contentType, docDomain, thirdParty, sitekey, specificOnly, expected) |
| +{ |
| + let matcher = new Matcher(); |
| + for (let filter of filters) |
| + matcher.add(Filter.fromText(filter)); |
| + |
| + let result = matcher.matchesAny(location, RegExpFilter.typeMap[contentType], docDomain, thirdParty, sitekey, specificOnly); |
| + if (result) |
| + result = result.text; |
| + |
| + test.equal(result, expected, "match(" + location + ", " + contentType + ", " + docDomain + ", " + (thirdParty ? "third-party" : "first-party") + ", " + (sitekey || "no-sitekey") + ", " + (specificOnly ? "specificOnly" : "not-specificOnly") + ") with:\n" + filters.join("\n")); |
| + |
| + let combinedMatcher = new CombinedMatcher(); |
| + for (let i = 0; i < 2; i++) |
| + { |
| + for (let filter of filters) |
| + combinedMatcher.add(Filter.fromText(filter)); |
| + |
| + result = combinedMatcher.matchesAny(location, RegExpFilter.typeMap[contentType], docDomain, thirdParty, sitekey, specificOnly); |
| + if (result) |
| + result = result.text; |
| + |
| + test.equal(result, expected, "combinedMatch(" + location + ", " + contentType + ", " + docDomain + ", " + (thirdParty ? "third-party" : "first-party") + ", " + (sitekey || "no-sitekey") + ", " + (specificOnly ? "specificOnly" : "not-specificOnly") + ") with:\n" + filters.join("\n")); |
| + |
| + // Generic whitelisting rules can match for specificOnly searches, so we |
| + // can't easily know which rule will match for these whitelisting tests |
| + if (specificOnly) |
| + continue; |
| + |
| + // For next run: add whitelisting filters for filters that aren't already |
| + filters = filters.map(text => text.substr(0, 2) == "@@" ? text : "@@" + text); |
| + if (expected && expected.substr(0, 2) != "@@") |
| + expected = "@@" + expected; |
| + } |
| +} |
| + |
| +function cacheCheck(test, matcher, location, contentType, docDomain, thirdParty, expected) |
| +{ |
| + let result = matcher.matchesAny(location, RegExpFilter.typeMap[contentType], docDomain, thirdParty); |
| + if (result) |
| + result = result.text; |
| + |
| + test.equal(result, expected, "match(" + location + ", " + contentType + ", " + docDomain + ", " + (thirdParty ? "third-party" : "first-party") + ") with static filters"); |
| +} |
| + |
| +exports.testMatcherClassDefinitions = function(test) |
| +{ |
| + test.equal(typeof Matcher, "function", "typeof Matcher"); |
| + test.equal(typeof CombinedMatcher, "function", "typeof CombinedMatcher"); |
| + test.equal(typeof defaultMatcher, "object", "typeof defaultMatcher"); |
| + test.ok(defaultMatcher instanceof CombinedMatcher, "defaultMatcher is a CombinedMatcher instance"); |
| + |
| + test.done(); |
| +}; |
| + |
| +exports.testKeywordExtraction = function(test) |
| +{ |
| + compareKeywords(test, "*", []); |
| + compareKeywords(test, "asdf", []); |
| + compareKeywords(test, "/asdf/", []); |
| + compareKeywords(test, "/asdf1234", []); |
| + compareKeywords(test, "/asdf/1234", ["asdf"]); |
| + compareKeywords(test, "/asdf/1234^", ["asdf", "1234"]); |
| + compareKeywords(test, "/asdf/123456^", ["123456", "asdf"]); |
| + compareKeywords(test, "^asdf^1234^56as^", ["asdf", "1234", "56as"]); |
| + compareKeywords(test, "*asdf/1234^", ["1234"]); |
| + compareKeywords(test, "|asdf,1234*", ["asdf"]); |
| + compareKeywords(test, "||domain.example^", ["example", "domain"]); |
| + compareKeywords(test, "&asdf=1234|", ["asdf", "1234"]); |
| + compareKeywords(test, "^foo%2Ebar^", ["foo%2ebar"]); |
| + compareKeywords(test, "^aSdF^1234", ["asdf"]); |
| + compareKeywords(test, "_asdf_1234_", ["asdf", "1234"]); |
| + compareKeywords(test, "+asdf-1234=", ["asdf", "1234"]); |
| + compareKeywords(test, "/123^ad2&ad&", ["123", "ad2"]); |
| + compareKeywords(test, "/123^ad2&ad$script,domain=example.com", ["123", "ad2"]); |
| + |
| + test.done(); |
| +}; |
| + |
| +exports.testFilterMatching = function(test) |
| +{ |
| + checkMatch(test, [], "http://abc/def", "IMAGE", null, false, null, false, null); |
| + checkMatch(test, ["abc"], "http://abc/def", "IMAGE", null, false, null, false, "abc"); |
| + checkMatch(test, ["abc", "ddd"], "http://abc/def", "IMAGE", null, false, null, false, "abc"); |
| + checkMatch(test, ["ddd", "abc"], "http://abc/def", "IMAGE", null, false, null, false, "abc"); |
| + checkMatch(test, ["ddd", "abd"], "http://abc/def", "IMAGE", null, false, null, false, null); |
| + checkMatch(test, ["abc", "://abc/d"], "http://abc/def", "IMAGE", null, false, null, false, "://abc/d"); |
| + checkMatch(test, ["://abc/d", "abc"], "http://abc/def", "IMAGE", null, false, null, false, "://abc/d"); |
| + checkMatch(test, ["|http://"], "http://abc/def", "IMAGE", null, false, null, false, "|http://"); |
| + checkMatch(test, ["|http://abc"], "http://abc/def", "IMAGE", null, false, null, false, "|http://abc"); |
| + checkMatch(test, ["|abc"], "http://abc/def", "IMAGE", null, false, null, false, null); |
| + checkMatch(test, ["|/abc/def"], "http://abc/def", "IMAGE", null, false, null, false, null); |
| + checkMatch(test, ["/def|"], "http://abc/def", "IMAGE", null, false, null, false, "/def|"); |
| + checkMatch(test, ["/abc/def|"], "http://abc/def", "IMAGE", null, false, null, false, "/abc/def|"); |
| + checkMatch(test, ["/abc/|"], "http://abc/def", "IMAGE", null, false, null, false, null); |
| + checkMatch(test, ["http://abc/|"], "http://abc/def", "IMAGE", null, false, null, false, null); |
| + checkMatch(test, ["|http://abc/def|"], "http://abc/def", "IMAGE", null, false, null, false, "|http://abc/def|"); |
| + checkMatch(test, ["|/abc/def|"], "http://abc/def", "IMAGE", null, false, null, false, null); |
| + checkMatch(test, ["|http://abc/|"], "http://abc/def", "IMAGE", null, false, null, false, null); |
| + checkMatch(test, ["|/abc/|"], "http://abc/def", "IMAGE", null, false, null, false, null); |
| + checkMatch(test, ["||example.com/abc"], "http://example.com/abc/def", "IMAGE", null, false, null, false, "||example.com/abc"); |
| + checkMatch(test, ["||com/abc/def"], "http://example.com/abc/def", "IMAGE", null, false, null, false, "||com/abc/def"); |
| + checkMatch(test, ["||com/abc"], "http://example.com/abc/def", "IMAGE", null, false, null, false, "||com/abc"); |
| + checkMatch(test, ["||mple.com/abc"], "http://example.com/abc/def", "IMAGE", null, false, null, false, null); |
| + checkMatch(test, ["||.com/abc/def"], "http://example.com/abc/def", "IMAGE", null, false, null, false, null); |
| + checkMatch(test, ["||http://example.com/"], "http://example.com/abc/def", "IMAGE", null, false, null, false, null); |
| + checkMatch(test, ["||example.com/abc/def|"], "http://example.com/abc/def", "IMAGE", null, false, null, false, "||example.com/abc/def|"); |
| + checkMatch(test, ["||com/abc/def|"], "http://example.com/abc/def", "IMAGE", null, false, null, false, "||com/abc/def|"); |
| + checkMatch(test, ["||example.com/abc|"], "http://example.com/abc/def", "IMAGE", null, false, null, false, null); |
| + checkMatch(test, ["abc", "://abc/d", "asdf1234"], "http://abc/def", "IMAGE", null, false, null, false, "://abc/d"); |
| + checkMatch(test, ["foo*://abc/d", "foo*//abc/de", "://abc/de", "asdf1234"], "http://abc/def", "IMAGE", null, false, null, false, "://abc/de"); |
| + checkMatch(test, ["abc$third-party", "abc$~third-party", "ddd"], "http://abc/def", "IMAGE", null, false, null, false, "abc$~third-party"); |
| + checkMatch(test, ["abc$third-party", "abc$~third-party", "ddd"], "http://abc/def", "IMAGE", null, true, null, false, "abc$third-party"); |
| + checkMatch(test, ["//abc/def$third-party", "//abc/def$~third-party", "//abc_def"], "http://abc/def", "IMAGE", null, false, null, false, "//abc/def$~third-party"); |
| + checkMatch(test, ["//abc/def$third-party", "//abc/def$~third-party", "//abc_def"], "http://abc/def", "IMAGE", null, true, null, false, "//abc/def$third-party"); |
| + checkMatch(test, ["abc$third-party", "abc$~third-party", "//abc/def"], "http://abc/def", "IMAGE", null, true, null, false, "//abc/def"); |
| + checkMatch(test, ["//abc/def", "abc$third-party", "abc$~third-party"], "http://abc/def", "IMAGE", null, true, null, false, "//abc/def"); |
| + checkMatch(test, ["abc$third-party", "abc$~third-party", "//abc/def$third-party"], "http://abc/def", "IMAGE", null, true, null, false, "//abc/def$third-party"); |
| + checkMatch(test, ["abc$third-party", "abc$~third-party", "//abc/def$third-party"], "http://abc/def", "IMAGE", null, false, null, false, "abc$~third-party"); |
| + checkMatch(test, ["abc$third-party", "abc$~third-party", "//abc/def$~third-party"], "http://abc/def", "IMAGE", null, true, null, false, "abc$third-party"); |
| + checkMatch(test, ["abc$image", "abc$script", "abc$~image"], "http://abc/def", "IMAGE", null, false, null, false, "abc$image"); |
| + checkMatch(test, ["abc$image", "abc$script", "abc$~script"], "http://abc/def", "SCRIPT", null, false, null, false, "abc$script"); |
| + checkMatch(test, ["abc$image", "abc$script", "abc$~image"], "http://abc/def", "OTHER", null, false, null, false, "abc$~image"); |
| + checkMatch(test, ["//abc/def$image", "//abc/def$script", "//abc/def$~image"], "http://abc/def", "IMAGE", null, false, null, false, "//abc/def$image"); |
| + checkMatch(test, ["//abc/def$image", "//abc/def$script", "//abc/def$~script"], "http://abc/def", "SCRIPT", null, false, null, false, "//abc/def$script"); |
| + checkMatch(test, ["//abc/def$image", "//abc/def$script", "//abc/def$~image"], "http://abc/def", "OTHER", null, false, null, false, "//abc/def$~image"); |
| + checkMatch(test, ["abc$image", "abc$~image", "//abc/def"], "http://abc/def", "IMAGE", null, false, null, false, "//abc/def"); |
| + checkMatch(test, ["//abc/def", "abc$image", "abc$~image"], "http://abc/def", "IMAGE", null, false, null, false, "//abc/def"); |
| + checkMatch(test, ["abc$image", "abc$~image", "//abc/def$image"], "http://abc/def", "IMAGE", null, false, null, false, "//abc/def$image"); |
| + checkMatch(test, ["abc$image", "abc$~image", "//abc/def$script"], "http://abc/def", "IMAGE", null, false, null, false, "abc$image"); |
| + checkMatch(test, ["abc$domain=foo.com", "abc$domain=bar.com", "abc$domain=~foo.com|~bar.com"], "http://abc/def", "IMAGE", "foo.com", false, null, false, "abc$domain=foo.com"); |
| + checkMatch(test, ["abc$domain=foo.com", "abc$domain=bar.com", "abc$domain=~foo.com|~bar.com"], "http://abc/def", "IMAGE", "bar.com", false, null, false, "abc$domain=bar.com"); |
| + checkMatch(test, ["abc$domain=foo.com", "abc$domain=bar.com", "abc$domain=~foo.com|~bar.com"], "http://abc/def", "IMAGE", "baz.com", false, null, false, "abc$domain=~foo.com|~bar.com"); |
| + checkMatch(test, ["abc$domain=foo.com", "cba$domain=bar.com", "ccc$domain=~foo.com|~bar.com"], "http://abc/def", "IMAGE", "foo.com", false, null, false, "abc$domain=foo.com"); |
| + checkMatch(test, ["abc$domain=foo.com", "cba$domain=bar.com", "ccc$domain=~foo.com|~bar.com"], "http://abc/def", "IMAGE", "bar.com", false, null, false, null); |
| + checkMatch(test, ["abc$domain=foo.com", "cba$domain=bar.com", "ccc$domain=~foo.com|~bar.com"], "http://abc/def", "IMAGE", "baz.com", false, null, false, null); |
| + checkMatch(test, ["abc$domain=foo.com", "cba$domain=bar.com", "ccc$domain=~foo.com|~bar.com"], "http://ccc/def", "IMAGE", "baz.com", false, null, false, "ccc$domain=~foo.com|~bar.com"); |
| + checkMatch(test, ["abc$sitekey=foo-publickey", "abc$sitekey=bar-publickey"], "http://abc/def", "IMAGE", "foo.com", false, "foo-publickey", false, "abc$sitekey=foo-publickey"); |
| + checkMatch(test, ["abc$sitekey=foo-publickey", "abc$sitekey=bar-publickey"], "http://abc/def", "IMAGE", "bar.com", false, "bar-publickey", false, "abc$sitekey=bar-publickey"); |
| + checkMatch(test, ["abc$sitekey=foo-publickey", "cba$sitekey=bar-publickey"], "http://abc/def", "IMAGE", "bar.com", false, "bar-publickey", false, null); |
| + checkMatch(test, ["abc$sitekey=foo-publickey", "cba$sitekey=bar-publickey"], "http://abc/def", "IMAGE", "baz.com", false, null, false, null); |
| + checkMatch(test, ["abc$sitekey=foo-publickey,domain=foo.com", "abc$sitekey=bar-publickey,domain=bar.com"], "http://abc/def", "IMAGE", "foo.com", false, "foo-publickey", false, "abc$sitekey=foo-publickey,domain=foo.com"); |
| + checkMatch(test, ["abc$sitekey=foo-publickey,domain=foo.com", "abc$sitekey=bar-publickey,domain=bar.com"], "http://abc/def", "IMAGE", "foo.com", false, "bar-publickey", false, null); |
| + checkMatch(test, ["abc$sitekey=foo-publickey,domain=foo.com", "abc$sitekey=bar-publickey,domain=bar.com"], "http://abc/def", "IMAGE", "bar.com", false, "foo-publickey", false, null); |
| + checkMatch(test, ["abc$sitekey=foo-publickey,domain=foo.com", "abc$sitekey=bar-publickey,domain=bar.com"], "http://abc/def", "IMAGE", "bar.com", false, "bar-publickey", false, "abc$sitekey=bar-publickey,domain=bar.com"); |
| + checkMatch(test, ["@@foo.com$generichide"], "http://foo.com/bar", "GENERICHIDE", "foo.com", false, null, false, "@@foo.com$generichide"); |
| + checkMatch(test, ["@@foo.com$genericblock"], "http://foo.com/bar", "GENERICBLOCK", "foo.com", false, null, false, "@@foo.com$genericblock"); |
| + checkMatch(test, ["@@bar.com$generichide"], "http://foo.com/bar", "GENERICHIDE", "foo.com", false, null, false, null); |
| + checkMatch(test, ["@@bar.com$genericblock"], "http://foo.com/bar", "GENERICBLOCK", "foo.com", false, null, false, null); |
| + checkMatch(test, ["/bar"], "http://foo.com/bar", "IMAGE", "foo.com", false, null, true, null); |
| + checkMatch(test, ["/bar$domain=foo.com"], "http://foo.com/bar", "IMAGE", "foo.com", false, null, true, "/bar$domain=foo.com"); |
| + |
| + test.done(); |
| +}; |
| + |
| +exports.testResultCacheChecks = function(test) |
| +{ |
| + let matcher = new CombinedMatcher(); |
| + matcher.add(Filter.fromText("abc$image")); |
| + matcher.add(Filter.fromText("abc$script")); |
| + matcher.add(Filter.fromText("abc$~image,~script,~media,~ping")); |
| + matcher.add(Filter.fromText("cba$third-party")); |
| + matcher.add(Filter.fromText("cba$~third-party,~script")); |
| + matcher.add(Filter.fromText("http://def$image")); |
| + matcher.add(Filter.fromText("http://def$script")); |
| + matcher.add(Filter.fromText("http://def$~image,~script,~media,~ping")); |
| + matcher.add(Filter.fromText("http://fed$third-party")); |
| + matcher.add(Filter.fromText("http://fed$~third-party,~script")); |
| + |
| + cacheCheck(test, matcher, "http://abc", "IMAGE", null, false, "abc$image"); |
| + cacheCheck(test, matcher, "http://abc", "SCRIPT", null, false, "abc$script"); |
| + cacheCheck(test, matcher, "http://abc", "OTHER", null, false, "abc$~image,~script,~media,~ping"); |
| + cacheCheck(test, matcher, "http://cba", "IMAGE", null, false, "cba$~third-party,~script"); |
| + cacheCheck(test, matcher, "http://cba", "IMAGE", null, true, "cba$third-party"); |
| + cacheCheck(test, matcher, "http://def", "IMAGE", null, false, "http://def$image"); |
| + cacheCheck(test, matcher, "http://def", "SCRIPT", null, false, "http://def$script"); |
| + cacheCheck(test, matcher, "http://def", "OTHER", null, false, "http://def$~image,~script,~media,~ping"); |
| + cacheCheck(test, matcher, "http://fed", "IMAGE", null, false, "http://fed$~third-party,~script"); |
| + cacheCheck(test, matcher, "http://fed", "IMAGE", null, true, "http://fed$third-party"); |
| + cacheCheck(test, matcher, "http://abc_cba", "MEDIA", null, false, "cba$~third-party,~script"); |
| + cacheCheck(test, matcher, "http://abc_cba", "MEDIA", null, true, "cba$third-party"); |
| + cacheCheck(test, matcher, "http://abc_cba", "SCRIPT", null, false, "abc$script"); |
| + cacheCheck(test, matcher, "http://def?http://fed", "MEDIA", null, false, "http://fed$~third-party,~script"); |
| + cacheCheck(test, matcher, "http://def?http://fed", "MEDIA", null, true, "http://fed$third-party"); |
| + cacheCheck(test, matcher, "http://def?http://fed", "SCRIPT", null, false, "http://def$script"); |
| + |
| + test.done(); |
| +}; |