Left: | ||
Right: |
LEFT | RIGHT |
---|---|
1 /* | 1 /* |
2 * This file is part of Adblock Plus <https://adblockplus.org/>, | 2 * This file is part of Adblock Plus <https://adblockplus.org/>, |
3 * Copyright (C) 2006-present eyeo GmbH | 3 * Copyright (C) 2006-present eyeo GmbH |
4 * | 4 * |
5 * Adblock Plus is free software: you can redistribute it and/or modify | 5 * Adblock Plus is free software: you can redistribute it and/or modify |
6 * it under the terms of the GNU General Public License version 3 as | 6 * it under the terms of the GNU General Public License version 3 as |
7 * published by the Free Software Foundation. | 7 * published by the Free Software Foundation. |
8 * | 8 * |
9 * Adblock Plus is distributed in the hope that it will be useful, | 9 * Adblock Plus is distributed in the hope that it will be useful, |
10 * but WITHOUT ANY WARRANTY; without even the implied warranty of | 10 * but WITHOUT ANY WARRANTY; without even the implied warranty of |
(...skipping 80 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... | |
91 /** | 91 /** |
92 * Regular expression that RegExp filters specified as RegExps should match | 92 * Regular expression that RegExp filters specified as RegExps should match |
93 * @type {RegExp} | 93 * @type {RegExp} |
94 */ | 94 */ |
95 Filter.regexpRegExp = /^(@@)?\/.*\/(?:\$~?[\w-]+(?:=[^,\s]+)?(?:,~?[\w-]+(?:=[^,\s]+)?)*)?$/; | 95 Filter.regexpRegExp = /^(@@)?\/.*\/(?:\$~?[\w-]+(?:=[^,\s]+)?(?:,~?[\w-]+(?:=[^,\s]+)?)*)?$/; |
96 /** | 96 /** |
97 * Regular expression that options on a RegExp filter should match | 97 * Regular expression that options on a RegExp filter should match |
98 * @type {RegExp} | 98 * @type {RegExp} |
99 */ | 99 */ |
100 Filter.optionsRegExp = /\$(~?[\w-]+(?:=[^,]+)?(?:,~?[\w-]+(?:=[^,]+)?)*)$/; | 100 Filter.optionsRegExp = /\$(~?[\w-]+(?:=[^,]+)?(?:,~?[\w-]+(?:=[^,]+)?)*)$/; |
101 /** | |
102 * Regular expression that matches an invalid Content Security Policy | |
103 * @type {RegExp} | |
104 */ | |
105 Filter.invalidCSPRegExp = /(;|^) ?(base-uri|referrer|report-to|report-uri|upgrade-insecure-requests)\b/i; | |
101 | 106 |
102 /** | 107 /** |
103 * Creates a filter of correct type from its text representation - does the | 108 * Creates a filter of correct type from its text representation - does the |
104 * basic parsing and calls the right constructor then. | 109 * basic parsing and calls the right constructor then. |
105 * | 110 * |
106 * @param {string} text as in Filter() | 111 * @param {string} text as in Filter() |
107 * @return {Filter} | 112 * @return {Filter} |
108 */ | 113 */ |
109 Filter.fromText = function(text) | 114 Filter.fromText = function(text) |
110 { | 115 { |
(...skipping 54 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... | |
165 * Removes unnecessary whitespaces from filter text, will only return null if | 170 * Removes unnecessary whitespaces from filter text, will only return null if |
166 * the input parameter is null. | 171 * the input parameter is null. |
167 * @param {string} text | 172 * @param {string} text |
168 * @return {string} | 173 * @return {string} |
169 */ | 174 */ |
170 Filter.normalize = function(text) | 175 Filter.normalize = function(text) |
171 { | 176 { |
172 if (!text) | 177 if (!text) |
173 return text; | 178 return text; |
174 | 179 |
175 // Remove line breaks and such | 180 // Remove line breaks, tabs etc |
176 text = text.replace(/[^\S ]/g, ""); | 181 text = text.replace(/[^\S ]+/g, ""); |
177 | 182 |
178 // Don't remove spaces inside comments | 183 // Don't remove spaces inside comments |
179 if (/^\s*!/.test(text)) | 184 if (/^ *!/.test(text)) |
180 return text.trim(); | 185 return text.trim(); |
181 | 186 |
182 // Special treatment for element hiding filters, right side is allowed to | 187 // Special treatment for element hiding filters, right side is allowed to |
183 // contain spaces | 188 // contain spaces |
184 if (Filter.elemhideRegExp.test(text)) | 189 if (Filter.elemhideRegExp.test(text)) |
185 { | 190 { |
186 let [, domain, separator, selector] = /^(.*?)(#@?#?)(.*)$/.exec(text); | 191 let [, domain, separator, selector] = /^(.*?)(#@?#?)(.*)$/.exec(text); |
187 return domain.replace(/\s/g, "") + separator + selector.trim(); | 192 return domain.replace(/ +/g, "") + separator + selector.trim(); |
188 } | 193 } |
189 | 194 |
190 // For most regexp filters we strip all whitespace, but the values of $csp | 195 // For most regexp filters we strip all spaces, but $csp filter options |
Manish Jethani
2018/03/12 18:53:59
So this doesn't work for the following cases:
1.
Sebastian Noack
2018/03/12 23:19:01
Splitting the options list into an array (for ever
Manish Jethani
2018/03/13 06:59:30
You mean in terms of memory consumption? I ran a t
Manish Jethani
2018/03/13 07:35:00
OK, so I inlined that bit, now this seems to perfo
kzar
2018/03/14 13:54:37
Well spotted, I've added some unit tests for those
Sebastian Noack
2018/03/14 20:59:20
Any reason, why this suggestion was ignored, witho
kzar
2018/03/15 10:26:24
I ignored that since it assumed the first '$' was
Manish Jethani
2018/03/15 10:42:41
I think Sebastian is referring to the rest of the
kzar
2018/03/15 11:38:50
So instead of splitting the options string by ","
Manish Jethani
2018/03/15 12:00:11
Yes, it just turned out to be faster.
Sebastian Noack
2018/03/15 17:25:41
I guess, if it's only in the code path hit for $cs
| |
191 // filter options are allowed to contain single (non trailing) spaces. | 196 // are allowed to contain single (non trailing) spaces. |
192 let strippedText = text.replace(/\s/g, ""); | 197 let strippedText = text.replace(/ +/g, ""); |
Manish Jethani
2018/03/12 16:34:53
Since we have already stripped out all non-space w
kzar
2018/03/14 13:54:38
I think you're right, Done.
| |
193 if (!/csp=/i.test(strippedText)) | 198 if (!strippedText.includes("$") || !/\bcsp=/i.test(strippedText)) |
194 return strippedText; | 199 return strippedText; |
195 | 200 |
196 let optionsMatch = Filter.optionsRegExp.exec(strippedText); | 201 let optionsMatch = Filter.optionsRegExp.exec(strippedText); |
Manish Jethani
2018/03/12 16:34:53
We can just look for "$" here and if none is prese
kzar
2018/03/14 13:54:38
No, that's not good enough unfortunately. There ca
Manish Jethani
2018/03/14 18:10:49
OK, but I wonder if we shouldn't just look for a "
| |
197 if (!optionsMatch) | 202 if (!optionsMatch) |
198 return strippedText; | 203 return strippedText; |
199 | 204 |
200 // We know where the options part starts in the filter text that's stripped | 205 // For $csp filters we must first separate out the options part of the |
201 // of whitespace, next we must find the corresponding position in the original | 206 // text, being careful to preserve its spaces. |
202 // filter text. | 207 let beforeOptions = strippedText.substring(0, optionsMatch.index); |
203 let optionsPosition = 0; | 208 let strippedDollarIndex = -1; |
Manish Jethani
2018/03/12 16:34:53
This part is not being used at all.
kzar
2018/03/14 13:54:38
Whoops, you're right. I've fixed that now.
| |
204 let offset = 0; | 209 let dollarIndex = -1; |
205 while (offset > -1) | 210 do |
206 { | 211 { |
207 optionsPosition = text.substring(optionsPosition).indexOf("$"); | 212 strippedDollarIndex = beforeOptions.indexOf("$", strippedDollarIndex + 1); |
208 offset = strippedText.substring(offset, optionsPosition).indexOf("$"); | 213 dollarIndex = text.indexOf("$", dollarIndex + 1); |
209 } | 214 } |
210 | 215 while (strippedDollarIndex != -1); |
211 // Finally with that we can generally strip whitespace, being careful to not | 216 let optionsText = text.substr(dollarIndex + 1); |
212 // to for $csp filter values. | 217 |
213 let parts = []; | 218 // Then we can normalize spaces in the options part safely |
214 let position = 0; | 219 let options = optionsText.split(","); |
215 let cspRegexp = /(c\s*s\s*p\s*=)([^,]+)/ig; | 220 for (let i = 0; i < options.length; i++) |
216 let cspMatch; | 221 { |
217 while (cspMatch = cspRegexp.exec(text)) | 222 let option = options[i]; |
218 { | 223 let cspMatch = /^ *c *s *p *=/i.exec(option); |
219 parts.push( | 224 if (cspMatch) |
Manish Jethani
2018/03/12 16:34:53
We've already stripped whitespace once, now we're
kzar
2018/03/14 13:54:37
No because we're expecting thousands of non-csp fi
| |
220 text.substring(position, cspMatch.index + cspMatch[1].length) | 225 { |
221 .replace(/\s/g, "") | 226 options[i] = cspMatch[0].replace(/ +/g, "") + |
222 ); | 227 option.substr(cspMatch[0].length).trim().replace(/ +/g, " "); |
223 parts.push( | 228 } |
224 text.substr(cspMatch.index + cspMatch[1].length, cspMatch[2].length) | 229 else |
225 .replace(/\s+/g, " ") | 230 options[i] = option.replace(/ +/g, ""); |
226 .trim() | 231 } |
227 ); | 232 |
228 position = cspMatch.index + cspMatch[0].length; | 233 return beforeOptions + "$" + options.join(); |
229 } | |
230 parts.push(text.substr(position).replace(/\s/g, "")); | |
231 return parts.join(""); | |
232 }; | 234 }; |
233 | 235 |
234 /** | 236 /** |
235 * @see filterToRegExp | 237 * @see filterToRegExp |
236 */ | 238 */ |
237 Filter.toRegExp = filterToRegExp; | 239 Filter.toRegExp = filterToRegExp; |
238 | 240 |
239 /** | 241 /** |
240 * Class for invalid filters | 242 * Class for invalid filters |
241 * @param {string} text see Filter() | 243 * @param {string} text see Filter() |
(...skipping 533 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... | |
775 { | 777 { |
776 options = match[1].split(","); | 778 options = match[1].split(","); |
777 text = match.input.substr(0, match.index); | 779 text = match.input.substr(0, match.index); |
778 for (let option of options) | 780 for (let option of options) |
779 { | 781 { |
780 let value = null; | 782 let value = null; |
781 let separatorIndex = option.indexOf("="); | 783 let separatorIndex = option.indexOf("="); |
782 if (separatorIndex >= 0) | 784 if (separatorIndex >= 0) |
783 { | 785 { |
784 value = option.substr(separatorIndex + 1); | 786 value = option.substr(separatorIndex + 1); |
785 option = option.substr(0, separatorIndex).toUpperCase(); | 787 option = option.substr(0, separatorIndex); |
786 | |
787 if (option == "CSP") | |
788 value = value.trim(); | |
789 else | |
790 value = value.replace(/\s/g, ""); | |
791 } | 788 } |
792 else | 789 option = option.replace(/-/, "_").toUpperCase(); |
793 option = option.toUpperCase(); | |
794 | |
795 option = option.replace(/-/, "_"); | |
796 | |
797 if (option in RegExpFilter.typeMap) | 790 if (option in RegExpFilter.typeMap) |
798 { | 791 { |
799 if (contentType == null) | 792 if (contentType == null) |
800 contentType = 0; | 793 contentType = 0; |
801 contentType |= RegExpFilter.typeMap[option]; | 794 contentType |= RegExpFilter.typeMap[option]; |
802 | 795 |
803 if (option == "CSP" && typeof value != "undefined") | 796 if (option == "CSP" && typeof value != "undefined") |
804 { | 797 csp = value; |
805 if (csp) | |
806 csp.push(value); | |
807 else | |
808 csp = [value]; | |
809 } | |
810 } | 798 } |
811 else if (option[0] == "~" && option.substr(1) in RegExpFilter.typeMap) | 799 else if (option[0] == "~" && option.substr(1) in RegExpFilter.typeMap) |
812 { | 800 { |
813 if (contentType == null) | 801 if (contentType == null) |
814 ({contentType} = RegExpFilter.prototype); | 802 ({contentType} = RegExpFilter.prototype); |
815 contentType &= ~RegExpFilter.typeMap[option.substr(1)]; | 803 contentType &= ~RegExpFilter.typeMap[option.substr(1)]; |
816 } | 804 } |
817 else if (option == "MATCH_CASE") | 805 else if (option == "MATCH_CASE") |
818 matchCase = true; | 806 matchCase = true; |
819 else if (option == "~MATCH_CASE") | 807 else if (option == "~MATCH_CASE") |
820 matchCase = false; | 808 matchCase = false; |
821 else if (option == "DOMAIN" && typeof value != "undefined") | 809 else if (option == "DOMAIN" && typeof value != "undefined") |
822 domains = value.toUpperCase(); | 810 domains = value.toUpperCase(); |
823 else if (option == "THIRD_PARTY") | 811 else if (option == "THIRD_PARTY") |
824 thirdParty = true; | 812 thirdParty = true; |
825 else if (option == "~THIRD_PARTY") | 813 else if (option == "~THIRD_PARTY") |
826 thirdParty = false; | 814 thirdParty = false; |
827 else if (option == "COLLAPSE") | 815 else if (option == "COLLAPSE") |
828 collapse = true; | 816 collapse = true; |
829 else if (option == "~COLLAPSE") | 817 else if (option == "~COLLAPSE") |
830 collapse = false; | 818 collapse = false; |
831 else if (option == "SITEKEY" && typeof value != "undefined") | 819 else if (option == "SITEKEY" && typeof value != "undefined") |
832 sitekeys = value.toUpperCase(); | 820 sitekeys = value.toUpperCase(); |
833 else | 821 else |
834 return new InvalidFilter(origText, "filter_unknown_option"); | 822 return new InvalidFilter(origText, "filter_unknown_option"); |
835 } | 823 } |
836 } | 824 } |
837 text = text.replace(/\s/g, ""); | |
838 | 825 |
839 try | 826 try |
840 { | 827 { |
841 if (blocking) | 828 if (blocking) |
842 { | 829 { |
843 if (csp) | 830 if (csp && Filter.invalidCSPRegExp.test(csp)) |
844 { | 831 return new InvalidFilter(origText, "filter_invalid_csp"); |
845 csp = csp.join("; ").toLowerCase(); | |
846 | |
847 // Prevent filters from injecting report-uri or report-to directives | |
848 // since they are a privacy concern. Regexp based upon reBadCSP[1]. | |
849 // [1] - https://github.com/gorhill/uBlock/blob/67e06f53b4d73df6179f6d320553a55da4ead40e/src/js/static-net-filtering.js#L1362 | |
850 if (/(;|^)\s*report-(to|uri)\b/.test(csp)) | |
851 return new InvalidFilter(origText, "filter_invalid_csp"); | |
852 } | |
853 | 832 |
854 return new BlockingFilter(origText, text, contentType, matchCase, domains, | 833 return new BlockingFilter(origText, text, contentType, matchCase, domains, |
855 thirdParty, sitekeys, collapse, csp); | 834 thirdParty, sitekeys, collapse, csp); |
856 } | 835 } |
857 return new WhitelistFilter(origText, text, contentType, matchCase, domains, | 836 return new WhitelistFilter(origText, text, contentType, matchCase, domains, |
858 thirdParty, sitekeys); | 837 thirdParty, sitekeys); |
859 } | 838 } |
860 catch (e) | 839 catch (e) |
861 { | 840 { |
862 return new InvalidFilter(origText, "filter_invalid_regexp"); | 841 return new InvalidFilter(origText, "filter_invalid_regexp"); |
(...skipping 238 matching lines...) Expand 10 before | Expand all | Expand 10 after Loading... | |
1101 */ | 1080 */ |
1102 function ElemHideEmulationFilter(text, domains, selector) | 1081 function ElemHideEmulationFilter(text, domains, selector) |
1103 { | 1082 { |
1104 ElemHideBase.call(this, text, domains, selector); | 1083 ElemHideBase.call(this, text, domains, selector); |
1105 } | 1084 } |
1106 exports.ElemHideEmulationFilter = ElemHideEmulationFilter; | 1085 exports.ElemHideEmulationFilter = ElemHideEmulationFilter; |
1107 | 1086 |
1108 ElemHideEmulationFilter.prototype = extend(ElemHideBase, { | 1087 ElemHideEmulationFilter.prototype = extend(ElemHideBase, { |
1109 type: "elemhideemulation" | 1088 type: "elemhideemulation" |
1110 }); | 1089 }); |
LEFT | RIGHT |