uBlock/src/js/cosmetic-filtering.js

1473 lines
50 KiB
JavaScript
Raw Normal View History

2014-06-24 00:42:43 +02:00
/*******************************************************************************
uBlock Origin - a browser extension to block requests.
2017-03-13 18:03:51 +01:00
Copyright (C) 2014-2017 Raymond Hill
2014-06-24 00:42:43 +02:00
This program is free software: you can redistribute it and/or modify
it under the terms of the GNU General Public License as published by
the Free Software Foundation, either version 3 of the License, or
(at your option) any later version.
This program is distributed in the hope that it will be useful,
but WITHOUT ANY WARRANTY; without even the implied warranty of
MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
GNU General Public License for more details.
You should have received a copy of the GNU General Public License
along with this program. If not, see {http://www.gnu.org/licenses/}.
Home: https://github.com/gorhill/uBlock
*/
'use strict';
2014-06-24 00:42:43 +02:00
/******************************************************************************/
2014-09-08 23:46:58 +02:00
µBlock.cosmeticFilteringEngine = (function(){
2014-06-24 00:42:43 +02:00
/******************************************************************************/
var µb = µBlock;
var cosmeticSurveyingMissCountMax = parseInt(vAPI.localStorage.getItem('cosmeticSurveyingMissCountMax'), 10) || 15;
2014-06-24 00:42:43 +02:00
/******************************************************************************/
/*
var histogram = function(label, buckets) {
var h = [],
bucket;
for ( var k in buckets ) {
if ( buckets.hasOwnProperty(k) === false ) {
continue;
}
bucket = buckets[k];
h.push({
k: k,
n: bucket instanceof FilterBucket ? bucket.filters.length : 1
});
}
console.log('Histogram %s', label);
var total = h.length;
h.sort(function(a, b) { return b.n - a.n; });
// Find indices of entries of interest
var target = 3;
for ( var i = 0; i < total; i++ ) {
if ( h[i].n === target ) {
console.log('\tEntries with only %d filter(s) start at index %s (key = "%s")', target, i, h[i].k);
target -= 1;
}
}
h = h.slice(0, 50);
h.forEach(function(v) {
console.log('\tkey="%s" count=%d', v.k, v.n);
});
console.log('\tTotal buckets count: %d', total);
};
*/
/*******************************************************************************
2014-06-24 00:42:43 +02:00
Each filter class will register itself in the map.
2014-06-24 00:42:43 +02:00
IMPORTANT: any change which modifies the mapping will have to be
reflected with µBlock.systemSettings.compiledMagic.
2014-06-24 00:42:43 +02:00
**/
2014-06-24 00:42:43 +02:00
var filterClasses = [];
2014-09-08 23:46:58 +02:00
var registerFilterClass = function(ctor) {
filterClasses[ctor.prototype.fid] = ctor;
2014-09-08 23:46:58 +02:00
};
var filterFromCompiledData = function(args) {
return filterClasses[args[0]].load(args);
2014-09-08 23:46:58 +02:00
};
/******************************************************************************/
2014-06-24 00:42:43 +02:00
// Any selector specific to a hostname
// Examples:
// search.snapdo.com###ABottomD
// facebook.com##.-cx-PRIVATE-fbAdUnit__root
// sltrib.com###BLContainer + div[style="height:90px;"]
// myps3.com.au##.Boxer[style="height: 250px;"]
// lindaikeji.blogspot.com##a > img[height="600"]
// japantimes.co.jp##table[align="right"][width="250"]
// mobilephonetalk.com##[align="center"] > b > a[href^="http://tinyurl.com/"]
var FilterHostname = function(s, hostname) {
this.s = s;
this.hostname = hostname;
};
FilterHostname.prototype.fid = 8;
2014-07-13 08:36:38 +02:00
FilterHostname.prototype.retrieve = function(hostname, out) {
2018-01-20 15:10:23 +01:00
if ( hostname.endsWith(this.hostname) === false ) { return; }
var i = hostname.length - this.hostname.length;
if ( i === 0 || hostname.charCodeAt(i-1) === 0x2E /* '.' */ ) {
2017-10-21 19:43:46 +02:00
out.add(this.s);
2014-07-13 08:36:38 +02:00
}
};
FilterHostname.prototype.compile = function() {
return [ this.fid, this.s, this.hostname ];
2014-09-08 23:46:58 +02:00
};
FilterHostname.load = function(data) {
return new FilterHostname(data[1], data[2]);
2014-09-08 23:46:58 +02:00
};
registerFilterClass(FilterHostname);
/******************************************************************************/
var FilterBucket = function(a, b) {
this.f = null;
this.filters = [];
if ( a !== undefined ) {
this.filters[0] = a;
this.filters[1] = b;
}
};
FilterBucket.prototype.fid = 10;
FilterBucket.prototype.add = function(a) {
this.filters.push(a);
};
FilterBucket.prototype.retrieve = function(s, out) {
var i = this.filters.length;
while ( i-- ) {
this.filters[i].retrieve(s, out);
}
};
FilterBucket.prototype.compile = function() {
var out = [],
filters = this.filters;
for ( var i = 0, n = filters.length; i < n; i++ ) {
out[i] = filters[i].compile();
}
return [ this.fid, out ];
};
FilterBucket.load = function(data) {
var bucket = new FilterBucket(),
entries = data[1];
for ( var i = 0, n = entries.length; i < n; i++ ) {
bucket.filters[i] = filterFromCompiledData(entries[i]);
}
return bucket;
};
registerFilterClass(FilterBucket);
2014-06-24 00:42:43 +02:00
/******************************************************************************/
/******************************************************************************/
2014-08-14 02:03:55 +02:00
var SelectorCacheEntry = function() {
2014-12-26 21:26:44 +01:00
this.reset();
};
/******************************************************************************/
SelectorCacheEntry.junkyard = [];
SelectorCacheEntry.factory = function() {
var entry = SelectorCacheEntry.junkyard.pop();
if ( entry ) {
return entry.reset();
}
return new SelectorCacheEntry();
};
/******************************************************************************/
2017-10-22 14:59:29 +02:00
var netSelectorCacheLowWaterMark = 20;
var netSelectorCacheHighWaterMark = 30;
2014-12-26 21:26:44 +01:00
/******************************************************************************/
SelectorCacheEntry.prototype.reset = function() {
2017-10-21 19:43:46 +02:00
this.cosmetic = new Set();
this.cosmeticSurveyingMissCount = 0;
2017-10-21 19:43:46 +02:00
this.net = new Map();
2014-08-14 02:03:55 +02:00
this.lastAccessTime = Date.now();
2014-12-26 21:26:44 +01:00
return this;
2014-08-14 02:03:55 +02:00
};
2014-12-26 21:26:44 +01:00
/******************************************************************************/
SelectorCacheEntry.prototype.dispose = function() {
this.cosmetic = this.net = null;
if ( SelectorCacheEntry.junkyard.length < 25 ) {
SelectorCacheEntry.junkyard.push(this);
}
};
/******************************************************************************/
SelectorCacheEntry.prototype.addCosmetic = function(details) {
var selectors = details.selectors,
i = selectors.length || 0;
// https://github.com/gorhill/uBlock/issues/2011
// Avoiding seemingly pointless surveys only if they appear costly.
if ( details.first && i === 0 ) {
if ( (details.cost || 0) >= 80 ) {
this.cosmeticSurveyingMissCount += 1;
}
return;
}
this.cosmeticSurveyingMissCount = 0;
while ( i-- ) {
2017-10-21 19:43:46 +02:00
this.cosmetic.add(selectors[i]);
}
};
2014-12-26 21:26:44 +01:00
/******************************************************************************/
2017-10-22 14:59:29 +02:00
SelectorCacheEntry.prototype.addNet = function(selectors) {
2014-08-15 16:34:13 +02:00
if ( typeof selectors === 'string' ) {
this.addNetOne(selectors, Date.now());
} else {
this.addNetMany(selectors, Date.now());
}
// Net request-derived selectors: I limit the number of cached selectors,
// as I expect cases where the blocked net-requests are never the
// exact same URL.
2017-10-21 19:43:46 +02:00
if ( this.net.size < netSelectorCacheHighWaterMark ) { return; }
2014-08-15 16:34:13 +02:00
var dict = this.net;
2017-10-21 19:43:46 +02:00
var keys = µb.arrayFrom(dict.keys()).sort(function(a, b) {
return dict.get(b) - dict.get(a);
}).slice(netSelectorCacheLowWaterMark);
2014-08-15 16:34:13 +02:00
var i = keys.length;
while ( i-- ) {
2017-10-21 19:43:46 +02:00
dict.delete(keys[i]);
2014-08-15 16:34:13 +02:00
}
};
2014-12-26 21:26:44 +01:00
/******************************************************************************/
2014-08-15 16:34:13 +02:00
SelectorCacheEntry.prototype.addNetOne = function(selector, now) {
2017-10-21 19:43:46 +02:00
this.net.set(selector, now);
2014-08-15 16:34:13 +02:00
};
2014-12-26 21:26:44 +01:00
/******************************************************************************/
2014-08-15 16:34:13 +02:00
SelectorCacheEntry.prototype.addNetMany = function(selectors, now) {
var i = selectors.length || 0;
while ( i-- ) {
2017-10-21 19:43:46 +02:00
this.net.set(selectors[i], now);
}
};
2014-12-26 21:26:44 +01:00
/******************************************************************************/
SelectorCacheEntry.prototype.add = function(details) {
2014-08-14 02:03:55 +02:00
this.lastAccessTime = Date.now();
if ( details.type === 'cosmetic' ) {
this.addCosmetic(details);
} else {
this.addNet(details.selectors);
}
2014-08-14 02:03:55 +02:00
};
2014-12-26 21:26:44 +01:00
/******************************************************************************/
2015-04-07 03:26:05 +02:00
// https://github.com/chrisaljoudi/uBlock/issues/420
2014-12-17 16:32:50 +01:00
SelectorCacheEntry.prototype.remove = function(type) {
this.lastAccessTime = Date.now();
2015-02-11 23:28:19 +01:00
if ( type === undefined || type === 'cosmetic' ) {
2017-10-21 19:43:46 +02:00
this.cosmetic.clear();
this.cosmeticSurveyingMissCount = 0;
2015-02-11 23:28:19 +01:00
}
if ( type === undefined || type === 'net' ) {
2017-10-21 19:43:46 +02:00
this.net.clear();
2014-12-17 16:32:50 +01:00
}
};
2014-12-26 21:26:44 +01:00
/******************************************************************************/
2017-10-22 14:59:29 +02:00
SelectorCacheEntry.prototype.retrieveToArray = function(iterator, out) {
for ( var selector of iterator ) {
out.push(selector);
}
};
SelectorCacheEntry.prototype.retrieveToSet = function(iterator, out) {
for ( var selector of iterator ) {
out.add(selector);
}
};
SelectorCacheEntry.prototype.retrieve = function(type, out) {
2014-08-14 02:03:55 +02:00
this.lastAccessTime = Date.now();
2017-10-22 14:59:29 +02:00
var iterator = type === 'cosmetic' ? this.cosmetic : this.net.keys();
if ( Array.isArray(out) ) {
this.retrieveToArray(iterator, out);
} else {
this.retrieveToSet(iterator, out);
2014-08-14 02:03:55 +02:00
}
};
/******************************************************************************/
/******************************************************************************/
// 0000HHHHHHHHHHHH
// |
// |
// |
// +-- bit 11-0 of FNV
2014-06-24 00:42:43 +02:00
var makeHash = function(token) {
// Ref: Given a URL, returns a unique 4-character long hash string
// Based on: FNV32a
// http://www.isthe.com/chongo/tech/comp/fnv/index.html#FNV-reference-source
// The rest is custom, suited for uBlock.
var i1 = token.length;
var i2 = i1 >> 1;
var i4 = i1 >> 2;
var i8 = i1 >> 3;
var hval = (0x811c9dc5 ^ token.charCodeAt(0)) >>> 0;
hval += (hval<<1) + (hval<<4) + (hval<<7) + (hval<<8) + (hval<<24);
hval >>>= 0;
hval ^= token.charCodeAt(i8);
hval += (hval<<1) + (hval<<4) + (hval<<7) + (hval<<8) + (hval<<24);
hval >>>= 0;
hval ^= token.charCodeAt(i4);
hval += (hval<<1) + (hval<<4) + (hval<<7) + (hval<<8) + (hval<<24);
hval >>>= 0;
hval ^= token.charCodeAt(i4+i8);
hval += (hval<<1) + (hval<<4) + (hval<<7) + (hval<<8) + (hval<<24);
hval >>>= 0;
hval ^= token.charCodeAt(i2);
hval += (hval<<1) + (hval<<4) + (hval<<7) + (hval<<8) + (hval<<24);
hval >>>= 0;
hval ^= token.charCodeAt(i2+i8);
hval += (hval<<1) + (hval<<4) + (hval<<7) + (hval<<8) + (hval<<24);
hval >>>= 0;
hval ^= token.charCodeAt(i2+i4);
hval += (hval<<1) + (hval<<4) + (hval<<7) + (hval<<8) + (hval<<24);
hval >>>= 0;
hval ^= token.charCodeAt(i1-1);
hval += (hval<<1) + (hval<<4) + (hval<<7) + (hval<<8) + (hval<<24);
hval >>>= 0;
hval &= 0x0FFF; // 12 bits
2015-02-24 00:31:29 +01:00
return hval.toString(36);
2014-06-24 00:42:43 +02:00
};
/******************************************************************************/
/******************************************************************************/
// Cosmetic filter family tree:
//
// Generic
// Low generic simple: class or id only
// Low generic complex: class or id + extra stuff after
// High generic:
// High-low generic: [alt="..."],[title="..."]
// High-medium generic: [href^="..."]
// High-high generic: everything else
// Specific
// Specfic hostname
// Specific entity
// Generic filters can only be enforced once the main document is loaded.
// Specific filers can be enforced before the main document is loaded.
2014-06-24 00:42:43 +02:00
var FilterContainer = function() {
this.noDomainHash = '-';
this.reHasUnicode = /[^\x00-\x7F]/;
2016-10-30 20:19:58 +01:00
this.rePlainSelector = /^[#.][\w\\-]+/;
this.rePlainSelectorEscaped = /^[#.](?:\\[0-9A-Fa-f]+ |\\.|\w|-)+/;
2017-10-21 19:43:46 +02:00
this.rePlainSelectorEx = /^[^#.\[(]+([#.][\w-]+)|([#.][\w-]+)$/;
2016-10-30 20:19:58 +01:00
this.reEscapeSequence = /\\([0-9A-Fa-f]+ |.)/g;
2017-10-21 19:43:46 +02:00
this.reSimpleHighGeneric1 = /^[a-z]*\[[^[]+]$/;
this.reHighMedium = /^\[href\^="https?:\/\/([^"]{8})[^"]*"\]$/;
this.reNeedHostname = new RegExp([
'^',
'(?:',
[
'.+?:has',
'.+?:has-text',
'.+?:if',
'.+?:if-not',
'.+?:matches-css(?:-before|-after)?',
'.*?:xpath',
2018-01-12 15:33:01 +01:00
'.+?:style',
'.+?:-abp-contains', // ABP-specific for `:has-text`
'.+?:-abp-has', // ABP-specific for `:if`
'.+?:contains' // Adguard-specific for `:has-text`
].join('|'),
')',
'\\(.+\\)',
'$'
].join(''));
2017-10-21 19:43:46 +02:00
this.selectorCache = new Map();
this.selectorCachePruneDelay = 10 * 60 * 1000; // 10 minutes
this.selectorCacheAgeMax = 120 * 60 * 1000; // 120 minutes
this.selectorCacheCountMin = 25;
this.netSelectorCacheCountMax = netSelectorCacheHighWaterMark;
this.selectorCacheTimer = null;
this.supportsUserStylesheets = vAPI.supportsUserStylesheets;
2017-10-21 19:43:46 +02:00
// generic exception filters
this.genericDonthideSet = new Set();
// TODO: Think about reusing µb.staticExtFilteringEngine.HostnameBasedDB
// for both specific and procedural filters. This would require some
// refactoring.
2017-10-21 19:43:46 +02:00
// hostname, entity-based filters
this.specificFilters = new Map();
this.proceduralFilters = new Map();
// low generic cosmetic filters, organized by id/class then simple/complex.
this.lowlyGeneric = Object.create(null);
this.lowlyGeneric.id = {
canonical: 'ids',
prefix: '#',
simple: new Set(),
complex: new Map()
};
this.lowlyGeneric.cl = {
canonical: 'classes',
prefix: '.',
simple: new Set(),
complex: new Map()
};
// highly generic selectors sets
this.highlyGeneric = Object.create(null);
this.highlyGeneric.simple = {
canonical: 'highGenericHideSimple',
dict: new Set(),
str: '',
mru: new µb.MRUCache(16)
};
this.highlyGeneric.complex = {
canonical: 'highGenericHideComplex',
dict: new Set(),
str: '',
mru: new µb.MRUCache(16)
};
2017-10-21 19:43:46 +02:00
// Short-lived: content is valid only during one function call. These
// is to prevent repeated allocation/deallocation overheads -- the
// constructors/destructors of javascript Set/Map is assumed to be costlier
// than just calling clear() on these.
this.setRegister0 = new Set();
this.setRegister1 = new Set();
this.setRegister2 = new Set();
2017-12-17 14:09:47 +01:00
this.mapRegister0 = new Map();
2017-10-21 19:43:46 +02:00
this.reset();
2014-06-24 00:42:43 +02:00
};
/******************************************************************************/
// Reset all, thus reducing to a minimum memory footprint of the context.
FilterContainer.prototype.reset = function() {
2015-02-24 00:31:29 +01:00
this.µburi = µb.URI;
2014-07-20 21:00:26 +02:00
this.frozen = false;
2014-06-24 00:42:43 +02:00
this.acceptedCount = 0;
2016-03-17 18:56:21 +01:00
this.discardedCount = 0;
this.duplicateBuster = new Set();
2017-10-21 19:43:46 +02:00
this.selectorCache.clear();
if ( this.selectorCacheTimer !== null ) {
clearTimeout(this.selectorCacheTimer);
this.selectorCacheTimer = null;
}
2014-08-14 02:03:55 +02:00
2016-08-13 22:42:58 +02:00
// generic filters
this.hasGenericHide = false;
2017-10-21 19:43:46 +02:00
// generic exception filters
this.genericDonthideSet.clear();
2017-10-21 19:43:46 +02:00
// hostname, entity-based filters
this.specificFilters.clear();
this.proceduralFilters.clear();
2017-10-21 19:43:46 +02:00
// low generic cosmetic filters, organized by id/class then simple/complex.
this.lowlyGeneric.id.simple.clear();
this.lowlyGeneric.id.complex.clear();
this.lowlyGeneric.cl.simple.clear();
this.lowlyGeneric.cl.complex.clear();
2017-10-21 19:43:46 +02:00
// highly generic selectors sets
this.highlyGeneric.simple.dict.clear();
this.highlyGeneric.simple.str = '';
this.highlyGeneric.simple.mru.reset();
this.highlyGeneric.complex.dict.clear();
this.highlyGeneric.complex.str = '';
this.highlyGeneric.complex.mru.reset();
2014-06-24 00:42:43 +02:00
};
/******************************************************************************/
2016-08-13 22:42:58 +02:00
FilterContainer.prototype.freeze = function() {
this.duplicateBuster = new Set();
2016-08-13 22:42:58 +02:00
2017-10-21 19:43:46 +02:00
this.hasGenericHide =
this.lowlyGeneric.id.simple.size !== 0 ||
this.lowlyGeneric.id.complex.size !== 0 ||
this.lowlyGeneric.cl.simple.size !== 0 ||
this.lowlyGeneric.cl.complex.size !== 0 ||
this.highlyGeneric.simple.dict.size !== 0 ||
this.highlyGeneric.complex.dict.size !== 0;
2017-10-21 19:43:46 +02:00
if ( this.genericDonthideSet.size !== 0 ) {
for ( var selector of this.genericDonthideSet ) {
var type = selector.charCodeAt(0);
if ( type === 0x23 /* '#' */ ) {
this.lowlyGeneric.id.simple.delete(selector.slice(1));
} else if ( type === 0x2E /* '.' */ ) {
this.lowlyGeneric.cl.simple.delete(selector.slice(1));
}
// TODO:
// this.lowlyGeneric.id.complex.delete(selector);
// this.lowlyGeneric.cl.complex.delete(selector);
this.highlyGeneric.simple.dict.delete(selector);
this.highlyGeneric.complex.dict.delete(selector);
2017-10-21 19:43:46 +02:00
}
2016-08-13 22:42:58 +02:00
}
this.highlyGeneric.simple.str = µb.arrayFrom(this.highlyGeneric.simple.dict).join(',\n');
this.highlyGeneric.complex.str = µb.arrayFrom(this.highlyGeneric.complex.dict).join(',\n');
2016-08-13 22:42:58 +02:00
this.frozen = true;
};
/******************************************************************************/
2016-10-30 20:19:58 +01:00
// https://github.com/gorhill/uBlock/issues/1668
// The key must be literal: unescape escaped CSS before extracting key.
// It's an uncommon case, so it's best to unescape only when needed.
FilterContainer.prototype.keyFromSelector = function(selector) {
var matches = this.rePlainSelector.exec(selector);
if ( matches === null ) { return; }
var key = matches[0];
if ( key.indexOf('\\') === -1 ) {
return key;
}
key = '';
matches = this.rePlainSelectorEscaped.exec(selector);
if ( matches === null ) { return; }
var escaped = matches[0],
beg = 0;
this.reEscapeSequence.lastIndex = 0;
for (;;) {
matches = this.reEscapeSequence.exec(escaped);
if ( matches === null ) {
return key + escaped.slice(beg);
}
key += escaped.slice(beg, matches.index);
beg = this.reEscapeSequence.lastIndex;
if ( matches[1].length === 1 ) {
key += matches[1];
} else {
key += String.fromCharCode(parseInt(matches[1], 16));
}
}
};
/******************************************************************************/
FilterContainer.prototype.compile = function(parsed, writer) {
// 1000 = cosmetic filtering
writer.select(1000);
2014-06-24 00:42:43 +02:00
var hostnames = parsed.hostnames,
i = hostnames.length;
if ( i === 0 ) {
this.compileGenericSelector(parsed, writer);
2015-02-24 05:25:14 +01:00
return true;
}
2015-04-07 03:26:05 +02:00
// https://github.com/chrisaljoudi/uBlock/issues/151
2015-02-24 05:25:14 +01:00
// Negated hostname means the filter applies to all non-negated hostnames
// of same filter OR globally if there is no non-negated hostnames.
var applyGlobally = true;
while ( i-- ) {
var hostname = hostnames[i];
if ( hostname.startsWith('~') === false ) {
2015-02-24 05:25:14 +01:00
applyGlobally = false;
}
this.compileHostnameSelector(hostname, parsed, writer);
2014-08-13 02:25:11 +02:00
}
2015-02-24 05:25:14 +01:00
if ( applyGlobally ) {
this.compileGenericSelector(parsed, writer);
2015-02-24 05:25:14 +01:00
}
2015-02-24 00:31:29 +01:00
return true;
};
2014-06-24 00:42:43 +02:00
/******************************************************************************/
2014-06-24 00:42:43 +02:00
FilterContainer.prototype.compileGenericSelector = function(parsed, writer) {
if ( parsed.exception === false ) {
this.compileGenericHideSelector(parsed, writer);
} else {
this.compileGenericUnhideSelector(parsed, writer);
2015-03-13 17:26:54 +01:00
}
};
/******************************************************************************/
2015-03-13 17:26:54 +01:00
FilterContainer.prototype.compileGenericHideSelector = function(parsed, writer) {
2018-01-12 15:33:01 +01:00
var selector = parsed.suffix;
// For some selectors, it is mandatory to have a hostname or entity:
// ##.foo:-abp-contains(...)
// ##.foo:-abp-has(...)
// ##.foo:contains(...)
// ##.foo:has(...)
// ##.foo:has-text(...)
// ##.foo:if(...)
// ##.foo:if-not(...)
// ##.foo:matches-css(...)
// ##.foo:matches-css-after(...)
// ##.foo:matches-css-before(...)
// ##:xpath(...)
2018-01-12 15:33:01 +01:00
// ##.foo:style(...)
if ( this.reNeedHostname.test(selector) ) {
µb.logger.writeOne(
'',
'error',
'Cosmetic filtering invalid generic filter: ##' + selector
);
return;
}
2018-01-12 15:33:01 +01:00
var type = selector.charCodeAt(0),
2017-10-21 19:43:46 +02:00
key;
2015-02-24 00:31:29 +01:00
2017-10-21 19:43:46 +02:00
if ( type === 0x23 /* '#' */ ) {
2016-10-30 20:19:58 +01:00
key = this.keyFromSelector(selector);
if ( key === undefined ) { return; }
2017-10-21 19:43:46 +02:00
// Simple selector-based CSS rule: no need to test for whether the
// selector is valid, the regex took care of this. Most generic
// selector falls into that category.
2016-10-30 20:19:58 +01:00
if ( key === selector ) {
2017-10-21 19:43:46 +02:00
writer.push([ 0 /* lg */, key.slice(1) ]);
return;
}
2017-10-21 19:43:46 +02:00
// Complex selector-based CSS rule.
if ( µb.staticExtFilteringEngine.compileSelector(selector) !== undefined ) {
2017-10-21 19:43:46 +02:00
writer.push([ 1 /* lg+ */, key.slice(1), selector ]);
}
return;
}
if ( type === 0x2E /* '.' */ ) {
key = this.keyFromSelector(selector);
if ( key === undefined ) { return; }
// Simple selector-based CSS rule: no need to test for whether the
// selector is valid, the regex took care of this. Most generic
// selector falls into that category.
if ( key === selector ) {
writer.push([ 2 /* lg */, key.slice(1) ]);
return;
}
// Complex selector-based CSS rule.
if ( µb.staticExtFilteringEngine.compileSelector(selector) !== undefined ) {
2017-10-21 19:43:46 +02:00
writer.push([ 3 /* lg+ */, key.slice(1), selector ]);
}
2015-02-24 00:31:29 +01:00
return;
}
2015-02-24 00:31:29 +01:00
var compiled = µb.staticExtFilteringEngine.compileSelector(selector);
if ( compiled === undefined ) { return; }
// TODO: Detect and error on procedural cosmetic filters.
2015-11-19 15:36:15 +01:00
2017-10-21 19:43:46 +02:00
// https://github.com/gorhill/uBlock/issues/909
// Anything which contains a plain id/class selector can be classified
// as a low generic cosmetic filter.
var matches = this.rePlainSelectorEx.exec(selector);
if ( matches !== null ) {
key = matches[1] || matches[2];
type = key.charCodeAt(0);
writer.push([
type === 0x23 ? 1 : 3 /* lg+ */,
key.slice(1),
selector
]);
2015-02-24 00:31:29 +01:00
return;
}
2017-10-21 19:43:46 +02:00
// Pass this point, we are dealing with highly-generic cosmetic filters.
//
// For efficiency purpose, we will distinguish between simple and complex
// selectors.
2015-02-24 00:31:29 +01:00
2017-10-21 19:43:46 +02:00
if ( this.reSimpleHighGeneric1.test(selector) ) {
writer.push([ 4 /* simple */, selector ]);
2015-11-19 15:36:15 +01:00
return;
}
2015-11-19 15:36:15 +01:00
if ( selector.indexOf(' ') === -1 ) {
2017-10-21 19:43:46 +02:00
writer.push([ 4 /* simple */, selector ]);
} else {
2017-10-21 19:43:46 +02:00
writer.push([ 5 /* complex */, selector ]);
}
};
2014-08-06 17:34:59 +02:00
/******************************************************************************/
FilterContainer.prototype.compileGenericUnhideSelector = function(
parsed,
writer
) {
// Procedural cosmetic filters are acceptable as generic exception filters.
var compiled = µb.staticExtFilteringEngine.compileSelector(parsed.suffix);
if ( compiled === undefined ) { return; }
// https://github.com/chrisaljoudi/uBlock/issues/497
// All generic exception filters are put in the same bucket: they are
// expected to be very rare.
writer.push([ 7 /* g1 */, compiled ]);
};
2015-02-24 00:31:29 +01:00
/******************************************************************************/
FilterContainer.prototype.compileHostnameSelector = function(
hostname,
parsed,
writer
) {
2015-04-07 03:26:05 +02:00
// https://github.com/chrisaljoudi/uBlock/issues/145
var unhide = parsed.exception ? 1 : 0;
if ( hostname.startsWith('~') ) {
hostname = hostname.slice(1);
unhide ^= 1;
2014-06-24 00:42:43 +02:00
}
var compiled = µb.staticExtFilteringEngine.compileSelector(parsed.suffix);
if ( compiled === undefined ) { return; }
var domain = this.µburi.domainFromHostname(hostname),
hash;
2015-04-07 03:26:05 +02:00
// https://github.com/chrisaljoudi/uBlock/issues/188
2015-02-24 00:31:29 +01:00
// If not a real domain as per PSL, assign a synthetic one
if ( hostname.endsWith('.*') === false ) {
hash = domain !== '' ? makeHash(domain) : this.noDomainHash;
} else {
hash = makeHash(hostname);
}
if ( unhide === 1 ) {
hash = '!' + hash;
}
// h, hash, example.com, .promoted-tweet
// h, hash, example.*, .promoted-tweet
2017-10-21 19:43:46 +02:00
// 8 = declarative, 9 = procedural
writer.push([
compiled.charCodeAt(0) !== 0x7B /* '{' */ ? 8 : 9,
hash,
hostname,
compiled
]);
};
/******************************************************************************/
FilterContainer.prototype.fromCompiledContent = function(reader, options) {
if ( options.skipCosmetic ) {
this.skipCompiledContent(reader);
2016-08-13 22:42:58 +02:00
return;
}
if ( options.skipGenericCosmetic ) {
this.skipGenericCompiledContent(reader);
2016-08-13 22:42:58 +02:00
return;
}
2017-10-21 19:43:46 +02:00
var fingerprint, args, db, filter, bucket;
2014-08-06 17:34:59 +02:00
// 1000 = cosmetic filtering
reader.select(1000);
while ( reader.next() ) {
2015-02-24 00:31:29 +01:00
this.acceptedCount += 1;
fingerprint = reader.fingerprint();
if ( this.duplicateBuster.has(fingerprint) ) {
2016-03-17 18:56:21 +01:00
this.discardedCount += 1;
continue;
}
this.duplicateBuster.add(fingerprint);
2014-07-04 22:47:34 +02:00
args = reader.args();
switch ( args[0] ) {
2017-10-21 19:43:46 +02:00
// low generic, simple
case 0: // #AdBanner
case 2: // .largeAd
db = args[0] === 0 ? this.lowlyGeneric.id : this.lowlyGeneric.cl;
bucket = db.complex.get(args[1]);
2015-02-24 00:31:29 +01:00
if ( bucket === undefined ) {
2017-10-21 19:43:46 +02:00
db.simple.add(args[1]);
} else if ( Array.isArray(bucket) ) {
bucket.push(args[1]);
2015-02-24 00:31:29 +01:00
} else {
2017-10-21 19:43:46 +02:00
db.complex.set(args[1], [ bucket, args[1] ]);
2015-02-24 00:31:29 +01:00
}
break;
2014-09-25 21:44:58 +02:00
2017-10-21 19:43:46 +02:00
// low generic, complex
case 1: // #tads + div + .c
case 3: // .Mpopup + #Mad > #MadZone
2017-11-05 04:51:44 +01:00
db = args[0] === 1 ? this.lowlyGeneric.id : this.lowlyGeneric.cl;
2017-10-21 19:43:46 +02:00
bucket = db.complex.get(args[1]);
2015-02-24 00:31:29 +01:00
if ( bucket === undefined ) {
2017-10-21 19:43:46 +02:00
if ( db.simple.has(args[1]) ) {
db.complex.set(args[1], [ args[1], args[2] ]);
} else {
2017-10-21 19:43:46 +02:00
db.complex.set(args[1], args[2]);
db.simple.add(args[1]);
}
} else if ( Array.isArray(bucket) ) {
bucket.push(args[2]);
2015-02-24 00:31:29 +01:00
} else {
2017-10-21 19:43:46 +02:00
db.complex.set(args[1], [ bucket, args[2] ]);
2015-02-24 00:31:29 +01:00
}
break;
2015-02-24 00:31:29 +01:00
// High-high generic hide/simple selectors
// div[id^="allo"]
case 4:
this.highlyGeneric.simple.dict.add(args[1]);
break;
// High-high generic hide/complex selectors
// div[id^="allo"] > span
case 5:
this.highlyGeneric.complex.dict.add(args[1]);
break;
2015-02-24 00:31:29 +01:00
2015-04-07 03:26:05 +02:00
// https://github.com/chrisaljoudi/uBlock/issues/497
2015-03-13 17:26:54 +01:00
// Generic exception filters: expected to be a rare occurrence.
// #@#.tweet
case 7:
2017-10-21 19:43:46 +02:00
this.genericDonthideSet.add(args[1]);
break;
2016-08-13 22:42:58 +02:00
// h, hash, example.com, .promoted-tweet
// h, hash, example.*, .promoted-tweet
case 8:
2017-10-21 19:43:46 +02:00
case 9:
db = args[0] === 8 ? this.specificFilters : this.proceduralFilters;
filter = new FilterHostname(args[3], args[2]);
2017-10-21 19:43:46 +02:00
bucket = db.get(args[1]);
if ( bucket === undefined ) {
2017-10-21 19:43:46 +02:00
db.set(args[1], filter);
} else if ( bucket instanceof FilterBucket ) {
bucket.add(filter);
} else {
2017-10-21 19:43:46 +02:00
db.set(args[1], new FilterBucket(bucket, filter));
}
break;
default:
this.discardedCount += 1;
break;
}
2014-06-24 00:42:43 +02:00
}
2015-02-24 00:31:29 +01:00
};
/******************************************************************************/
2014-09-25 21:44:58 +02:00
FilterContainer.prototype.skipGenericCompiledContent = function(reader) {
2017-10-21 19:43:46 +02:00
var fingerprint, args, db, filter, bucket;
2016-08-13 22:42:58 +02:00
// 1000 = cosmetic filtering
reader.select(1000);
while ( reader.next() ) {
2016-08-13 22:42:58 +02:00
this.acceptedCount += 1;
fingerprint = reader.fingerprint();
if ( this.duplicateBuster.has(fingerprint) ) {
2016-08-13 22:42:58 +02:00
this.discardedCount += 1;
continue;
}
args = reader.args();
switch ( args[0] ) {
// https://github.com/chrisaljoudi/uBlock/issues/497
// Generic exception filters: expected to be a rare occurrence.
case 7:
this.duplicateBuster.add(fingerprint);
2017-10-21 19:43:46 +02:00
this.genericDonthideSet.add(args[1]);
break;
// h, hash, example.com, .promoted-tweet
// h, hash, example.*, .promoted-tweet
case 8:
2017-10-21 19:43:46 +02:00
case 9:
db = args[0] === 8 ? this.specificFilters : this.proceduralFilters;
this.duplicateBuster.add(fingerprint);
filter = new FilterHostname(args[3], args[2]);
2017-10-21 19:43:46 +02:00
bucket = db.get(args[1]);
2016-08-13 22:42:58 +02:00
if ( bucket === undefined ) {
2017-10-21 19:43:46 +02:00
db.set(args[1], filter);
2016-08-13 22:42:58 +02:00
} else if ( bucket instanceof FilterBucket ) {
bucket.add(filter);
} else {
2017-10-21 19:43:46 +02:00
db.set(args[1], new FilterBucket(bucket, filter));
2016-08-13 22:42:58 +02:00
}
break;
2014-09-25 21:44:58 +02:00
default:
this.discardedCount += 1;
break;
2015-02-24 00:31:29 +01:00
}
2016-08-13 22:42:58 +02:00
}
};
/******************************************************************************/
FilterContainer.prototype.skipCompiledContent = function(reader) {
// 1000 = cosmetic filtering
reader.select(1000);
2016-08-13 22:42:58 +02:00
while ( reader.next() ) {
2016-03-17 18:56:21 +01:00
this.acceptedCount += 1;
this.discardedCount += 1;
2015-02-24 00:31:29 +01:00
}
2014-06-24 00:42:43 +02:00
};
/******************************************************************************/
2014-09-08 23:46:58 +02:00
FilterContainer.prototype.toSelfie = function() {
var selfieFromMap = function(map) {
var selfie = [];
// Note: destructuring assignment not supported before Chromium 49.
for ( var entry of map ) {
selfie.push([ entry[0], entry[1].compile() ]);
2014-09-08 23:46:58 +02:00
}
return JSON.stringify(selfie);
2014-09-08 23:46:58 +02:00
};
return {
acceptedCount: this.acceptedCount,
2016-03-17 18:56:21 +01:00
discardedCount: this.discardedCount,
specificFilters: selfieFromMap(this.specificFilters),
2017-10-21 19:43:46 +02:00
proceduralFilters: selfieFromMap(this.proceduralFilters),
2016-08-13 22:42:58 +02:00
hasGenericHide: this.hasGenericHide,
2017-10-21 19:43:46 +02:00
lowlyGenericSID: µb.arrayFrom(this.lowlyGeneric.id.simple),
lowlyGenericCID: µb.arrayFrom(this.lowlyGeneric.id.complex),
lowlyGenericSCL: µb.arrayFrom(this.lowlyGeneric.cl.simple),
lowlyGenericCCL: µb.arrayFrom(this.lowlyGeneric.cl.complex),
highSimpleGenericHideArray: µb.arrayFrom(this.highlyGeneric.simple.dict),
highComplexGenericHideArray: µb.arrayFrom(this.highlyGeneric.complex.dict),
genericDonthideArray: µb.arrayFrom(this.genericDonthideSet)
2014-09-08 23:46:58 +02:00
};
};
/******************************************************************************/
FilterContainer.prototype.fromSelfie = function(selfie) {
var mapFromSelfie = function(selfie) {
var entries = JSON.parse(selfie),
out = new Map(),
entry;
for ( var i = 0, n = entries.length; i < n; i++ ) {
entry = entries[i];
out.set(entry[0], filterFromCompiledData(entry[1]));
}
return out;
2014-09-08 23:46:58 +02:00
};
this.acceptedCount = selfie.acceptedCount;
2016-03-17 18:56:21 +01:00
this.discardedCount = selfie.discardedCount;
this.specificFilters = mapFromSelfie(selfie.specificFilters);
2017-10-21 19:43:46 +02:00
this.proceduralFilters = mapFromSelfie(selfie.proceduralFilters);
2016-08-13 22:42:58 +02:00
this.hasGenericHide = selfie.hasGenericHide;
2017-10-21 19:43:46 +02:00
this.lowlyGeneric.id.simple = new Set(selfie.lowlyGenericSID);
this.lowlyGeneric.id.complex = new Map(selfie.lowlyGenericCID);
this.lowlyGeneric.cl.simple = new Set(selfie.lowlyGenericSCL);
this.lowlyGeneric.cl.complex = new Map(selfie.lowlyGenericCCL);
this.highlyGeneric.simple.dict = new Set(selfie.highSimpleGenericHideArray);
this.highlyGeneric.simple.str = selfie.highSimpleGenericHideArray.join(',\n');
this.highlyGeneric.complex.dict = new Set(selfie.highComplexGenericHideArray);
this.highlyGeneric.complex.str = selfie.highComplexGenericHideArray.join(',\n');
2017-10-21 19:43:46 +02:00
this.genericDonthideSet = new Set(selfie.genericDonthideArray);
2015-01-23 21:02:47 +01:00
this.frozen = true;
2014-09-08 23:46:58 +02:00
};
/******************************************************************************/
2014-12-26 21:26:44 +01:00
FilterContainer.prototype.triggerSelectorCachePruner = function() {
// Of interest: http://fitzgeraldnick.com/weblog/40/
// http://googlecode.blogspot.ca/2009/07/gmail-for-mobile-html5-series-using.html
2017-10-21 19:43:46 +02:00
if ( this.selectorCacheTimer === null ) {
this.selectorCacheTimer = vAPI.setTimeout(
this.pruneSelectorCacheAsync.bind(this),
this.selectorCachePruneDelay
);
}
2014-12-26 21:26:44 +01:00
};
/******************************************************************************/
FilterContainer.prototype.addToSelectorCache = function(details) {
var hostname = details.hostname;
2017-10-21 19:43:46 +02:00
if ( typeof hostname !== 'string' || hostname === '' ) { return; }
var selectors = details.selectors;
2017-10-21 19:43:46 +02:00
if ( Array.isArray(selectors) === false ) { return; }
var entry = this.selectorCache.get(hostname);
2014-08-14 02:03:55 +02:00
if ( entry === undefined ) {
2017-10-21 19:43:46 +02:00
entry = SelectorCacheEntry.factory();
this.selectorCache.set(hostname, entry);
if ( this.selectorCache.size > this.selectorCacheCountMin ) {
this.triggerSelectorCachePruner();
}
2014-08-14 02:03:55 +02:00
}
entry.add(details);
2014-08-14 02:03:55 +02:00
};
/******************************************************************************/
2017-10-21 19:43:46 +02:00
FilterContainer.prototype.removeFromSelectorCache = function(
targetHostname,
type
) {
var targetHostnameLength = targetHostname.length,
hostname, item;
for ( var entry of this.selectorCache ) {
hostname = entry[0];
item = entry[1];
if ( targetHostname !== '*' ) {
2017-10-21 19:43:46 +02:00
if ( hostname.endsWith(targetHostname) === false ) { continue; }
if (
hostname.length !== targetHostnameLength &&
hostname.charAt(hostname.length - targetHostnameLength - 1) !== '.'
) {
continue;
}
}
2017-10-21 19:43:46 +02:00
item.remove(type);
2014-12-17 16:32:50 +01:00
}
};
/******************************************************************************/
2017-10-21 19:43:46 +02:00
FilterContainer.prototype.retrieveFromSelectorCache = function(
hostname,
type,
out
) {
var entry = this.selectorCache.get(hostname);
if ( entry !== undefined ) {
entry.retrieve(type, out);
2014-08-14 02:03:55 +02:00
}
};
/******************************************************************************/
2014-12-26 21:26:44 +01:00
FilterContainer.prototype.pruneSelectorCacheAsync = function() {
this.selectorCacheTimer = null;
2017-10-21 19:43:46 +02:00
if ( this.selectorCache.size <= this.selectorCacheCountMin ) { return; }
2014-08-14 02:03:55 +02:00
var cache = this.selectorCache;
2014-12-26 21:26:44 +01:00
// Sorted from most-recently-used to least-recently-used, because
// we loop beginning at the end below.
// We can't avoid sorting because we have to keep a minimum number of
// entries, and these entries should always be the most-recently-used.
2017-10-21 19:43:46 +02:00
var hostnames = µb.arrayFrom(cache.keys())
.sort(function(a, b) {
return cache.get(b).lastAccessTime -
cache.get(a).lastAccessTime;
})
.slice(this.selectorCacheCountMin);
var obsolete = Date.now() - this.selectorCacheAgeMax,
hostname, entry,
i = hostnames.length;
2014-08-14 02:03:55 +02:00
while ( i-- ) {
2014-12-26 21:26:44 +01:00
hostname = hostnames[i];
2017-10-21 19:43:46 +02:00
entry = cache.get(hostname);
if ( entry.lastAccessTime > obsolete ) { break; }
2014-12-26 21:26:44 +01:00
// console.debug('pruneSelectorCacheAsync: flushing "%s"', hostname);
entry.dispose();
2017-10-21 19:43:46 +02:00
cache.delete(hostname);
}
if ( cache.size > this.selectorCacheCountMin ) {
this.triggerSelectorCachePruner();
2014-08-14 02:03:55 +02:00
}
};
/******************************************************************************/
FilterContainer.prototype.randomAlphaToken = function() {
return String.fromCharCode(Date.now() % 26 + 97) +
Math.floor(Math.random() * 982451653 + 982451653).toString(36);
};
/******************************************************************************/
2017-12-17 14:09:47 +01:00
FilterContainer.prototype.retrieveGenericSelectors = function(request) {
2017-10-21 19:43:46 +02:00
if ( this.acceptedCount === 0 ) { return; }
if ( !request.ids && !request.classes ) { return; }
//console.time('cosmeticFilteringEngine.retrieveGenericSelectors');
2017-10-21 19:43:46 +02:00
var simpleSelectors = this.setRegister0,
complexSelectors = this.setRegister1;
var entry, selectors,
strEnd, sliceBeg, sliceEnd,
selector, bucket;
var cacheEntry = this.selectorCache.get(request.hostname),
previousHits = cacheEntry && cacheEntry.cosmetic || this.setRegister2;
2017-10-21 19:43:46 +02:00
for ( var type in this.lowlyGeneric ) {
entry = this.lowlyGeneric[type];
selectors = request[entry.canonical];
if ( typeof selectors !== 'string' ) { continue; }
strEnd = selectors.length;
sliceBeg = 0;
do {
sliceEnd = selectors.indexOf('\n', sliceBeg);
if ( sliceEnd === -1 ) { sliceEnd = strEnd; }
selector = selectors.slice(sliceBeg, sliceEnd);
sliceBeg = sliceEnd + 1;
if ( entry.simple.has(selector) === false ) { continue; }
if ( (bucket = entry.complex.get(selector)) !== undefined ) {
if ( Array.isArray(bucket) ) {
for ( selector of bucket ) {
if ( previousHits.has(selector) === false ) {
complexSelectors.add(selector);
}
2017-10-21 19:43:46 +02:00
}
} else if ( previousHits.has(bucket) === false ) {
2017-10-21 19:43:46 +02:00
complexSelectors.add(bucket);
}
} else {
selector = entry.prefix + selector;
if ( previousHits.has(selector) === false ) {
simpleSelectors.add(selector);
}
2017-10-21 19:43:46 +02:00
}
} while ( sliceBeg < strEnd );
2014-06-24 00:42:43 +02:00
}
2017-10-21 19:43:46 +02:00
// Apply exceptions: it is the responsibility of the caller to provide
// the exceptions to be applied.
if ( Array.isArray(request.exceptions) ) {
for ( var exception of request.exceptions ) {
simpleSelectors.delete(exception);
complexSelectors.delete(exception);
}
}
2014-06-24 00:42:43 +02:00
if ( simpleSelectors.size === 0 && complexSelectors.size === 0 ) {
return;
}
2017-10-21 19:43:46 +02:00
var out = {
simple: µb.arrayFrom(simpleSelectors),
complex: µb.arrayFrom(complexSelectors),
injected: ''
2014-06-24 00:42:43 +02:00
};
// Cache and inject (if user stylesheets supported) looked-up low generic
// cosmetic filters.
if ( typeof request.hostname === 'string' && request.hostname !== '' ) {
this.addToSelectorCache({
cost: request.surveyCost || 0,
hostname: request.hostname,
injectedHideFilters: '',
selectors: out.simple.concat(out.complex),
type: 'cosmetic'
});
}
// If user stylesheets are supported in the current process, inject the
// cosmetic filters now.
if (
this.supportsUserStylesheets &&
2017-12-17 14:09:47 +01:00
request.tabId !== undefined &&
request.frameId !== undefined
) {
var injected = [];
if ( out.simple.length !== 0 ) {
injected.push(out.simple.join(',\n'));
out.simple = [];
}
if ( out.complex.length !== 0 ) {
injected.push(out.complex.join(',\n'));
out.complex = [];
}
out.injected = injected.join(',\n');
2017-12-17 14:09:47 +01:00
vAPI.insertCSS(request.tabId, {
code: out.injected + '\n{display:none!important;}',
cssOrigin: 'user',
2017-12-17 14:09:47 +01:00
frameId: request.frameId,
runAt: 'document_start'
});
2014-06-24 00:42:43 +02:00
}
2017-10-21 19:43:46 +02:00
// Important: always clear used registers before leaving.
this.setRegister0.clear();
this.setRegister1.clear();
2014-06-24 00:42:43 +02:00
//console.timeEnd('cosmeticFilteringEngine.retrieveGenericSelectors');
2017-10-21 19:43:46 +02:00
return out;
2014-06-24 00:42:43 +02:00
};
/******************************************************************************/
2017-10-21 19:43:46 +02:00
FilterContainer.prototype.retrieveDomainSelectors = function(
request,
options
) {
//console.time('cosmeticFilteringEngine.retrieveDomainSelectors');
2014-06-24 00:42:43 +02:00
var hostname = request.hostname,
entity = request.entity,
2017-12-17 14:09:47 +01:00
cacheEntry = this.selectorCache.get(hostname),
entry;
2015-04-07 03:26:05 +02:00
// https://github.com/chrisaljoudi/uBlock/issues/587
// out.ready will tell the content script the cosmetic filtering engine is
2015-01-23 21:02:47 +01:00
// up and ready.
// https://github.com/chrisaljoudi/uBlock/issues/497
// Generic exception filters are to be applied on all pages.
var out = {
2015-01-23 21:02:47 +01:00
ready: this.frozen,
hostname: hostname,
domain: request.domain,
2017-10-21 19:43:46 +02:00
declarativeFilters: [],
exceptionFilters: [],
hideNodeAttr: this.randomAlphaToken(),
hideNodeStyleSheetInjected: false,
highGenericHideSimple: '',
highGenericHideComplex: '',
injectedHideFilters: '',
networkFilters: '',
noDOMSurveying: this.hasGenericHide === false,
proceduralFilters: []
2014-06-24 00:42:43 +02:00
};
2014-06-24 01:23:36 +02:00
2017-10-21 19:43:46 +02:00
if ( options.noCosmeticFiltering !== true ) {
var domainHash = makeHash(request.domain),
2017-10-21 19:43:46 +02:00
entityHash = entity !== '' ? makeHash(entity) : undefined,
exception, bucket;
2017-10-21 19:43:46 +02:00
// Exception cosmetic filters: prime with generic exception filters.
var exceptionSet = this.setRegister0;
// Genetic exceptions (should be extremely rare).
for ( exception of this.genericDonthideSet ) {
exceptionSet.add(exception);
}
// Specific exception cosmetic filters.
2017-10-21 19:43:46 +02:00
if ( (bucket = this.specificFilters.get('!' + domainHash)) ) {
bucket.retrieve(hostname, exceptionSet);
}
if ( (bucket = this.proceduralFilters.get('!' + domainHash)) ) {
bucket.retrieve(hostname, exceptionSet);
}
2017-10-21 19:43:46 +02:00
// Specific entity-based exception cosmetic filters.
if ( entityHash !== undefined ) {
if ( (bucket = this.specificFilters.get('!' + entityHash)) ) {
bucket.retrieve(entity, exceptionSet);
}
if ( (bucket = this.proceduralFilters.get('!' + entityHash)) ) {
bucket.retrieve(entity, exceptionSet);
}
}
// Special bucket for those filters without a valid
// domain name as per PSL.
if ( (bucket = this.specificFilters.get('!' + this.noDomainHash)) ) {
bucket.retrieve(hostname, exceptionSet);
}
if ( (bucket = this.proceduralFilters.get('!' + this.noDomainHash)) ) {
bucket.retrieve(hostname, exceptionSet);
}
2017-10-21 19:43:46 +02:00
if ( exceptionSet.size !== 0 ) {
out.exceptionFilters = µb.arrayFrom(exceptionSet);
}
2017-10-21 19:43:46 +02:00
// Declarative cosmetic filters.
// TODO: Should I go one step further and store specific simple and
// specific complex in different collections? This could simplify
// slightly content script code.
var specificSet = this.setRegister1;
// Specific cosmetic filters.
if ( (bucket = this.specificFilters.get(domainHash)) ) {
bucket.retrieve(hostname, specificSet);
}
// Specific entity-based cosmetic filters.
2017-10-21 19:43:46 +02:00
if ( entityHash !== undefined ) {
if ( (bucket = this.specificFilters.get(entityHash)) ) {
bucket.retrieve(entity, specificSet);
}
}
// https://github.com/chrisaljoudi/uBlock/issues/188
// Special bucket for those filters without a valid domain name as per PSL
if ( (bucket = this.specificFilters.get(this.noDomainHash)) ) {
2017-10-21 19:43:46 +02:00
bucket.retrieve(hostname, specificSet);
}
2017-10-21 19:43:46 +02:00
// Cached cosmetic filters: these are always declarative.
if ( cacheEntry !== undefined ) {
cacheEntry.retrieve('cosmetic', specificSet);
if ( out.noDOMSurveying === false ) {
out.noDOMSurveying = cacheEntry.cosmeticSurveyingMissCount >
2017-10-21 19:43:46 +02:00
cosmeticSurveyingMissCountMax;
}
}
2015-02-24 00:31:29 +01:00
2017-10-21 19:43:46 +02:00
// Procedural cosmetic filters.
var proceduralSet = this.setRegister2;
// Specific cosmetic filters.
if ( (bucket = this.proceduralFilters.get(domainHash)) ) {
bucket.retrieve(hostname, proceduralSet);
}
// Specific entity-based cosmetic filters.
if ( entityHash !== undefined ) {
if ( (bucket = this.proceduralFilters.get(entityHash)) ) {
bucket.retrieve(entity, proceduralSet);
2016-08-13 22:42:58 +02:00
}
}
2017-10-21 19:43:46 +02:00
// https://github.com/chrisaljoudi/uBlock/issues/188
// Special bucket for those filters without a valid domain name as per PSL
if ( (bucket = this.proceduralFilters.get(this.noDomainHash)) ) {
bucket.retrieve(hostname, proceduralSet);
}
// Apply exceptions.
for ( exception of exceptionSet ) {
specificSet.delete(exception);
proceduralSet.delete(exception);
}
if ( specificSet.size !== 0 ) {
out.declarativeFilters = µb.arrayFrom(specificSet);
2017-10-21 19:43:46 +02:00
}
if ( proceduralSet.size !== 0 ) {
out.proceduralFilters = µb.arrayFrom(proceduralSet);
2017-10-21 19:43:46 +02:00
}
// Highly generic cosmetic filters: sent once along with specific ones.
// A most-recent-used cache is used to skip computing the resulting set
// of high generics for a given set of exceptions.
// The resulting set of high generics is stored as a string, ready to
// be used as-is by the content script. The string is stored
// indirectly in the mru cache: this is to prevent duplication of the
// string in memory, which I have observed occurs when the string is
// stored directly as a value in a Map.
2017-10-21 19:43:46 +02:00
if ( options.noGenericCosmeticFiltering !== true ) {
var exceptionHash = out.exceptionFilters.join();
for ( var type in this.highlyGeneric ) {
2017-12-17 14:09:47 +01:00
entry = this.highlyGeneric[type];
var str = entry.mru.lookup(exceptionHash);
if ( str === undefined ) {
str = { s: entry.str };
var genericSet = entry.dict;
var hit = false;
for ( exception of exceptionSet ) {
if ( (hit = genericSet.has(exception)) ) { break; }
}
if ( hit ) {
genericSet = new Set(entry.dict);
for ( exception of exceptionSet ) {
genericSet.delete(exception);
}
str.s = µb.arrayFrom(genericSet).join(',\n');
}
entry.mru.add(exceptionHash, str);
2017-10-21 19:43:46 +02:00
}
out[entry.canonical] = str.s;
2017-10-21 19:43:46 +02:00
}
}
// Important: always clear used registers before leaving.
this.setRegister0.clear();
this.setRegister1.clear();
this.setRegister2.clear();
2014-08-27 19:50:18 +02:00
}
2014-06-24 00:42:43 +02:00
2017-12-17 14:09:47 +01:00
// CSS selectors for collapsible blocked elements
2017-10-22 14:59:29 +02:00
if ( cacheEntry ) {
var networkFilters = [];
cacheEntry.retrieve('net', networkFilters);
out.networkFilters = networkFilters.join(',\n');
2017-10-22 14:59:29 +02:00
}
2014-08-14 02:03:55 +02:00
// https://github.com/gorhill/uBlock/issues/3160
// If user stylesheets are supported in the current process, inject the
// cosmetic filters now.
if (
this.supportsUserStylesheets &&
2017-12-17 14:09:47 +01:00
request.tabId !== undefined &&
request.frameId !== undefined
) {
var injectedHideFilters = [];
if ( out.declarativeFilters.length !== 0 ) {
injectedHideFilters.push(out.declarativeFilters.join(',\n'));
out.declarativeFilters = [];
}
if ( out.proceduralFilters.length !== 0 ) {
injectedHideFilters.push('[' + out.hideNodeAttr + ']');
out.hideNodeStyleSheetInjected = true;
}
if ( out.highGenericHideSimple.length !== 0 ) {
injectedHideFilters.push(out.highGenericHideSimple);
out.highGenericHideSimple = '';
}
if ( out.highGenericHideComplex.length !== 0 ) {
injectedHideFilters.push(out.highGenericHideComplex);
out.highGenericHideComplex = '';
}
out.injectedHideFilters = injectedHideFilters.join(',\n');
var details = {
code: '',
cssOrigin: 'user',
2017-12-17 14:09:47 +01:00
frameId: request.frameId,
runAt: 'document_start'
};
if ( out.injectedHideFilters.length !== 0 ) {
details.code = out.injectedHideFilters + '\n{display:none!important;}';
2017-12-17 14:09:47 +01:00
vAPI.insertCSS(request.tabId, details);
}
if ( out.networkFilters.length !== 0 ) {
details.code = out.networkFilters + '\n{display:none!important;}';
2017-12-17 14:09:47 +01:00
vAPI.insertCSS(request.tabId, details);
out.networkFilters = '';
}
}
//console.timeEnd('cosmeticFilteringEngine.retrieveDomainSelectors');
2014-06-24 00:42:43 +02:00
return out;
2014-06-24 00:42:43 +02:00
};
/******************************************************************************/
FilterContainer.prototype.getFilterCount = function() {
2016-03-17 18:56:21 +01:00
return this.acceptedCount - this.discardedCount;
2014-06-24 00:42:43 +02:00
};
/******************************************************************************/
return new FilterContainer();
/******************************************************************************/
})();
/******************************************************************************/