Rietveld Code Review Tool
Help | Bug tracker | Discussion group | Source code

Delta Between Two Patch Sets: abp2blocklist.js

Issue 29336525: Issue 3584 - Work around WebKit uppercase ID matching bug (Closed)
Left Patch Set: Don't forget IDs at the end of the string Created Feb. 17, 2016, 2:06 p.m.
Right Patch Set: Addressed further feedback Created Feb. 17, 2016, 3:33 p.m.
Left:
Right:
Use n/p to move between diff chunks; N/P to move between comments.
Jump to:
Left: Side by side diff | Download
Right: Side by side diff | Download
« no previous file with change/comment | « no previous file | no next file » | no next file with change/comment »
Toggle Intra-line Diffs ('i') | Expand Comments ('e') | Collapse Comments ('c') | Show Comments Hide Comments ('s')
LEFT | RIGHT
1 "use strict"; 1 "use strict";
2 2
3 let readline = require("readline"); 3 let readline = require("readline");
4 let punycode = require("punycode"); 4 let punycode = require("punycode");
5 let tldjs = require("tldjs"); 5 let tldjs = require("tldjs");
6 let filterClasses = require("./adblockplus.js"); 6 let filterClasses = require("./adblockplus.js");
7 7
8 let typeMap = filterClasses.RegExpFilter.typeMap; 8 let typeMap = filterClasses.RegExpFilter.typeMap;
9 9
10 const selectorLimit = 5000; 10 const selectorLimit = 5000;
(...skipping 236 matching lines...) Expand 10 before | Expand all | Expand 10 after
247 return true; 247 return true;
248 248
249 for (let name of Object.getOwnPropertyNames(obj)) 249 for (let name of Object.getOwnPropertyNames(obj))
250 if (hasNonASCI(obj[name])) 250 if (hasNonASCI(obj[name]))
251 return true; 251 return true;
252 } 252 }
253 253
254 return false; 254 return false;
255 } 255 }
256 256
257 function attributeSyntaxForIDs(selector) 257 function convertIDSelectorsToAttributeSelectors(selector)
Sebastian Noack 2016/02/17 14:40:59 Perhaps a better name for this function: convertID
kzar 2016/02/17 15:13:52 Done.
258 { 258 {
259 if (selector.indexOf("#") == -1)
Sebastian Noack 2016/02/17 14:22:19 Does this optimization have any measurable impact o
kzar 2016/02/17 15:13:52 No, removed.
260 return selector;
261
262 // First we figure out where all the IDs are 259 // First we figure out where all the IDs are
263 let sep = ""; 260 let sep = "";
264 let IDstart = null; 261 let start = null;
Sebastian Noack 2016/02/17 14:40:59 Nit: Since we only have one kind of start value an
kzar 2016/02/17 15:13:52 Done.
265 let IDpositions = []; 262 let positions = [];
266 for (let i = 0; i < selector.length; i++) 263 for (let i = 0; i < selector.length; i++)
267 { 264 {
268 let chr = selector[i]; 265 let chr = selector[i];
269 266
270 if (chr == "\\") // ignore escaped characters 267 if (chr == "\\") // ignore escaped characters
271 i++; 268 i++;
272 else if (chr == sep) // don't split within quoted text 269 else if (chr == sep) // don't match IDs within quoted text
273 sep = ""; // e.g. [attr=","] 270 sep = ""; // e.g. [attr="#Hello"]
274 else if (sep == "") 271 else if (sep == "")
275 { 272 {
276 if (chr == '"' || chr == "'") 273 if (chr == '"' || chr == "'")
277 sep = chr; 274 sep = chr;
278 else if (IDstart == null) // look for the start of an ID 275 else if (start == null) // look for the start of an ID
279 { 276 {
280 if (chr == "#") 277 if (chr == "#")
281 IDstart = i; 278 start = i;
282 } 279 }
283 else if (chr < "0" && chr != "-" || 280 else if (chr != "-" && chr != "_" &&
284 chr > "9" && chr < "A" || 281 (chr < "0" ||
285 chr > "Z" && chr != "_" && chr < "a" || 282 chr > "9" && chr < "A" ||
286 chr > "z" && chr < "\x80") // look for the end of the ID 283 chr > "Z" && chr < "a" ||
284 chr > "z" && chr < "\x80")) // look for the end of the ID
287 { 285 {
288 IDpositions.push({start: IDstart, end: i}); 286 positions.push({start: start, end: i});
Sebastian Noack 2016/02/17 14:22:19 I wonder if we should do the replace inline: selecto
Sebastian Noack 2016/02/17 14:41:00 Here is an example of how that could look: fu
kzar 2016/02/17 15:13:52 Mind if I leave this as is? It works fine and I fi
289 IDstart = null; 287 start = null;
290 } 288 }
291 } 289 }
292 } 290 }
293 if (IDstart != null) 291 if (start != null)
294 IDpositions.push({start: IDstart, end: selector.length}); 292 positions.push({start: start, end: selector.length});
295
296 if (IDpositions.length == 0)
Sebastian Noack 2016/02/17 14:22:20 Does this optimization have any measurable impact o
kzar 2016/02/17 15:13:52 No, removed.
297 return selector;
298 293
299 // Now replace them all with the [id="someID"] form 294 // Now replace them all with the [id="someID"] form
300 let newSelector = ""; 295 let newSelector = [];
301 let position = 0; 296 let i = 0;
302 for (let ID of IDpositions) 297 for (let pos of positions)
303 { 298 {
304 newSelector += selector.substring(position, ID.start); 299 newSelector.push(selector.substring(i, pos.start));
305 newSelector += '[id="' + selector.substring(ID.start + 1, ID.end) + '"]'; 300 newSelector.push('[id=' + selector.substring(pos.start + 1, pos.end) + ']');
Sebastian Noack 2016/02/17 14:22:19 The quotes are actually redundant, as we copy an u
kzar 2016/02/17 15:13:52 Acknowledged.
306 position = ID.end; 301 i = pos.end;
307 } 302 }
308 newSelector += selector.substring(position); 303 newSelector.push(selector.substring(i));
309 304
310 return newSelector; 305 return newSelector.join("");
311 } 306 }
312 307
313 function logRules() 308 function logRules()
314 { 309 {
315 let rules = []; 310 let rules = [];
316 311
317 function addRule(rule) 312 function addRule(rule)
318 { 313 {
319 if (!hasNonASCI(rule)) 314 if (!hasNonASCI(rule))
320 rules.push(rule); 315 rules.push(rule);
(...skipping 18 matching lines...) Expand all
339 } 334 }
340 335
341 groupedElemhideFilters.forEach((selectors, matchDomain) => 336 groupedElemhideFilters.forEach((selectors, matchDomain) =>
342 { 337 {
343 while (selectors.length) 338 while (selectors.length)
344 { 339 {
345 let selector = selectors.splice(0, selectorLimit).join(", "); 340 let selector = selectors.splice(0, selectorLimit).join(", ");
346 341
347 // As of Safari 9.0 element IDs are matched as lowercase. We work around 342 // As of Safari 9.0 element IDs are matched as lowercase. We work around
348 // this by converting to the attribute format [id="elementID"] 343 // this by converting to the attribute format [id="elementID"]
349 selector = attributeSyntaxForIDs(selector); 344 selector = convertIDSelectorsToAttributeSelectors(selector);
350 345
351 addRule({ 346 addRule({
352 trigger: {"url-filter": matchDomain}, 347 trigger: {"url-filter": matchDomain},
353 action: {type: "css-display-none", 348 action: {type: "css-display-none",
354 selector: selector} 349 selector: selector}
355 }); 350 });
356 } 351 }
357 }); 352 });
358 353
359 for (let filter of elemhideExceptions) 354 for (let filter of elemhideExceptions)
360 addRule(convertFilter(filter, "ignore-previous-rules", false)); 355 addRule(convertFilter(filter, "ignore-previous-rules", false));
361 356
362 for (let filter of requestFilters) 357 for (let filter of requestFilters)
363 addRule(convertFilter(filter, "block", true)); 358 addRule(convertFilter(filter, "block", true));
364 for (let filter of requestExceptions) 359 for (let filter of requestExceptions)
365 addRule(convertFilter(filter, "ignore-previous-rules", true)); 360 addRule(convertFilter(filter, "ignore-previous-rules", true));
366 361
367 console.log(JSON.stringify(rules, null, "\t")); 362 console.log(JSON.stringify(rules, null, "\t"));
368 } 363 }
369 364
370 let rl = readline.createInterface({input: process.stdin, terminal: false}); 365 let rl = readline.createInterface({input: process.stdin, terminal: false});
371 rl.on("line", parseFilter); 366 rl.on("line", parseFilter);
372 rl.on("close", logRules); 367 rl.on("close", logRules);
LEFT | RIGHT
« no previous file | no next file » | Toggle Intra-line Diffs ('i') | Expand Comments ('e') | Collapse Comments ('c') | Toggle Comments ('s')

Powered by Google App Engine
This is Rietveld